yyyyyyyyyyyyyyyyyyyy

博客园 首页 新随笔 联系 订阅 管理
复制代码
from lxml import etree

import codecs
import sys
from lxml import etree

def parser(p):
    """Print the text content of every ``BlueTable`` row in page *p*.

    Reads the file ``<p>.html`` (path relative to the current working
    directory), selects every ``<tr>`` located under a
    ``<div class="BlueTable">``, and prints one list of text nodes per row.

    Args:
        p: Page identifier; ``str(p)`` is used as the file name stem.

    Raises:
        OSError: If ``<p>.html`` cannot be opened.
    """
    # Use a context manager so the file handle is released immediately
    # instead of lingering until garbage collection on every call.
    with open(str(p) + '.html', 'r') as page_file:
        markup = page_file.read()

    tree = etree.HTML(markup)
    rows = tree.xpath("//div[@class='BlueTable']//tr")
    for row in rows:
        # Serialize the row and re-parse it as a standalone document so
        # that the "//text()" query only sees text belonging to this row.
        row_html = etree.tostring(row, method="html")
        print(etree.HTML(row_html).xpath("//text()"))

# Process the saved pages 1.html through 210.html in order.
for page_number in range(1, 211):
    parser(page_number)
复制代码

 

posted on   xxxxxxxx1x2xxxxxxx  阅读(432)  评论(0)  编辑  收藏  举报
努力加载评论中...
点击右上角即可分享
微信分享提示