- 论坛徽章:
- 0
|
这是我以前写的代码,如果你要做 gzip 检测,可以用到它:
- #coding:utf-8
-
- import urllib2
- import StringIO,gzip,re
- from time import ctime
# Loose shape check for an absolute HTTP URL: "http://" followed by at least
# three dot-separated parts (e.g. http://www.example.com).  Kept as a raw
# string so the regex escape "\." is never interpreted as a string escape.
MANZZBD_PPURLGF = r'http://.+?\..+?\..+'
# Scheme prefix that is prepended to addresses lacking it.
URLXFPE_RAWORDV = "http://"
# Scheme plus "www." host prefix that is prepended to addresses lacking it.
WORSPA_SOZGVERT = "http://www."
# Module-wide opener used for every request this script makes.  The handler
# is created with debuglevel=1, which switches on its debug output.
urlroot = urllib2.HTTPHandler(debuglevel=1)
opener = urllib2.build_opener(urlroot)
-
class VaurlpathzxcrError(Exception):
    """Base error of this script; raised when a link fails the gzip check.

    Derives from ``Exception`` rather than ``BaseException`` so that ordinary
    ``except Exception`` handlers see it, which is the documented convention
    for user-defined exceptions.
    """


class MrhandirzkanrError(VaurlpathzxcrError):
    """Raised when a URL does not have the required ``http://a.b.c`` shape."""
class URLrOotavrManroot:
    """Fetch a URL with gzip requested and check that the body was compressed.

    Constructing an instance runs the whole check immediately: the page is
    downloaded, gunzipped, and the raw and decompressed sizes are compared.

    Attributes:
        lower: the URL being checked.
        cgix:  raw response body as received (``False`` until fetched).
        pack:  the same raw body, as handed to the gzip reader
               (``False`` until decompression starts).
        data:  the decompressed body (``False`` until decompressed).
    """

    def __init__(self, lower):
        """Run the full gzip check against the URL ``lower``.

        Raises:
            VaurlpathzxcrError: if the decompressed body has the same size as
                the raw body.
        """
        self.lower = lower
        self.pack = False
        self.data = False
        self.cgix = False
        self.inurlSpcltGagdg()
        self.sooRrootManseek()
        self.vuiBichuHworldn()

    def inurlSpcltGagdg(self):
        """Send a request that accepts gzip and keep the raw body in ``cgix``."""
        valchar = urllib2.Request(self.lower,
                                  headers={'Accept-encoding': 'gzip'})
        response = opener.open(valchar)
        try:
            self.cgix = response.read()
        finally:
            # Release the connection even if reading the body fails.
            response.close()

    def sooRrootManseek(self):
        """Gunzip the downloaded body into ``data``."""
        # NOTE(review): if the body is not gzip data, GzipFile.read() raises
        # (IOError on Python 2) before the size comparison ever runs --
        # confirm whether that case should surface as VaurlpathzxcrError.
        self.pack = self.cgix
        passdir = StringIO.StringIO(self.pack)
        gzipper = gzip.GzipFile(fileobj=passdir)
        self.data = gzipper.read()

    def vuiBichuHworldn(self):
        """Compare the sizes before and after decompression.

        Raises:
            VaurlpathzxcrError: if both sizes are equal.
        """
        # Compare by value.  "is" tests object identity, which for integers
        # only happens to hold for small cached values, so equal sizes of
        # larger bodies would otherwise go undetected.
        if len(self.data) == len(self.cgix):
            raise VaurlpathzxcrError("Don't support the link")
        # Single parenthesised argument: prints the same text whether print
        # is a statement or a function.
        print("The current time %s" % ctime())
-
class URLcossNoruermoher:
    """Complete a user-supplied address into a URL and run the gzip check.

    Attributes:
        seek: the ``URLrOotavrManroot`` instance created for the final URL.
    """

    def __init__(self, hasrrt):
        """Normalise ``hasrrt``, validate it and start the gzip check.

        An address without a scheme is completed: ``gov.cn`` becomes
        ``http://www.gov.cn`` and ``www.gov.cn`` becomes
        ``http://www.gov.cn``.  An address that already carries a scheme is
        left untouched, so a second ``http://`` is never stacked in front of
        an existing one.

        Raises:
            MrhandirzkanrError: if the resulting URL does not match
                ``MANZZBD_PPURLGF``.
        """
        # Only addresses lacking a leading "scheme://" need completing.
        if not re.match(r'[A-Za-z][A-Za-z0-9+.-]*://', hasrrt):
            # The host prefix is whatever WORSPA_SOZGVERT adds on top of the
            # bare scheme ("www." with the constants defined in this file).
            www_prefix = WORSPA_SOZGVERT[len(URLXFPE_RAWORDV):]
            if hasrrt.startswith(www_prefix):
                hasrrt = URLXFPE_RAWORDV + hasrrt
            else:
                hasrrt = WORSPA_SOZGVERT + hasrrt
        # Unanchored search: valid as soon as the pattern occurs anywhere.
        if not re.search(MANZZBD_PPURLGF, hasrrt):
            raise MrhandirzkanrError('url requirements specification')
        self.seek = URLrOotavrManroot(hasrrt)
-
-
def main():
    """Script entry point: run the gzip check against a sample site."""
    target = 'http://www.gov.cn/'
    URLcossNoruermoher(target)


if __name__ == "__main__":
    main()
-
-
复制代码 |
|