- 论坛徽章:
- 0
|
#! /usr/bin/env python
#coding=utf-8
"""Print the ``data-field`` attribute of every <div> in a sample HTML snippet.

This is a Python 2 script: it relies on ``reload(sys)`` and on the
BeautifulSoup 3 package (``from BeautifulSoup import ...``).
"""
import sys

# Python 2 only: ``site.py`` deletes ``sys.setdefaultencoding`` at startup, so
# the module has to be reloaded before the function can be called again.
# NOTE(review): presumably gb2312 is chosen so that the non-ASCII attribute
# text can be printed on a Chinese-locale Windows console -- confirm.
reload(sys)
sys.setdefaultencoding('gb2312')

from BeautifulSoup import BeautifulSoup

# Sample markup. Only the last <div> carries a ``data-field`` attribute.
# NOTE: its value is not valid JSON as written (``is_private"`` lacks the
# opening quote); the script prints the raw attribute text and never parses it.
content = '''
<span class="pipe">|</span>
<div id="ADV_13039"></div>
<div class="ppost" data-field='{"author":{"id":281340474,"name":"是无户",is_private":false,"outer_id":"141251325"},"content":{"id":17628581128,"is_anonym":false,"open_id":"tieba","open_type":"","date":"2012-03-02 20:38","vote_crypt":"","floor":1,"type":"00"}}'></div>'
'''

soup = BeautifulSoup(content)

# Calling the soup object is shorthand for findAll(): collect every <div>.
for div in soup('div'):
    # Tag.get() returns None when the attribute is absent, so one lookup
    # replaces the original "key in dict(div.attrs)" test plus indexing.
    field = div.get('data-field')
    if field is not None:
        print(field)
输出:
> "C:\Python27\python.exe" -u "E:\script\Untitled 1.py"
{"author":{"id":281340474,"name":"是无户",is_private":false,"outer_id":"141251325"},"content":{"id":17628581128,"is_anonym":false,"open_id":"tieba","open_type":"","date":"2012-03-02 20:38","vote_crypt":"","floor":1,"type":"00"}}
|
|