- 论坛徽章:
- 0
|
#tp.py
from HTMLParser import HTMLParser
import sys
class titleParser(HTMLParser):
def __init__(self):
self.title='..'
print self.title
self.key=0
HTMLParser.__init__(self)
print 'cc'
def handle_starttag(self,tag,attrs):
if tag=='title':
self.key=1
print self.key
print 'ok'
def handle_data(self,data):
self.title+=data
def handle_endtag(self,tag,attrs):
self.key=0
def gettitle(self):
#print 'haha'
print self.title
return self.title
fd=open(sys.argv[1])
print 'aa'
tp=titleParser()
print'bb'
print fd.read()
tp.feed(fd.read())
print 'bb'
print 'title is',tp.gettitle()
这个是源程序,打印网页的title 为什么打印不出来呢? |
|