Python 爬取简书评论

import json

import  requests
from lxml import etree
from time import sleep


# Fetch the first page (up to 100 entries, newest first) of comments for one
# Jianshu note through the site's JSON comments endpoint and print each
# comment's content.
url = "https://www.jianshu.com/shakespeare/notes/60479187/comments?page=1&count=100&author_only=false&order_by=desc"
headers = {
    # Browser-like User-Agent; presumably needed so the site does not reject
    # the default python-requests client -- TODO confirm.
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.88 Safari/537.36",
    # The standard HTTP header name is "Referer"; the previous key "Refer"
    # is not a recognised header, so no referer was effectively being sent.
    "Referer": "https://www.jianshu.com",
}

# Without a timeout, requests waits forever on an unresponsive server.
resp = requests.get(url, headers=headers, timeout=10)
# Fail fast on 4xx/5xx responses instead of trying to parse an error page as
# JSON further down.
resp.raise_for_status()

content = resp.content.decode('utf-8')
res = json.loads(content)
# The payload is expected to carry the list of comments under "comments".
data = res['comments']

for item in data:
    # NOTE(review): "compiled_content" looks like the rendered comment body
    # (possibly containing HTML markup) -- verify against the API response.
    print(item['compiled_content'])

 

posted @ 2020-03-14 11:35  brady-wang  阅读(293)  评论(0)  编辑  收藏  举报