随笔分类 - 黑科技
摘要:
#-*- coding:utf-8 -*-
# -*- coding: utf-8 -*-
#encoding:utf-8
import urllib
import urllib2
import cookielib
import re


class SDU:

    def __init__(self):
        ...
阅读全文
摘要:
#encoding:utf-8
# -*- coding: utf-8 -*-
# coding:utf-8
import urllib
import urllib2
import re
#处理页面标签类

class Tool:
    #去除img标签,7位长空格
    removeImg = re.compile('| {...
阅读全文
摘要:
# -*- coding:utf-8 -*-
import urllib2
import re
for page in range(1,5):
    url = 'http://www.qiushibaike.com/hot/page/' + str(page)
    user_agent = 'Mozilla/4.0 (compatible; MSIE ...
阅读全文