bs4解析基础

#!/usr/bin/python

from bs4 import BeautifulSoup
if __name__ == "__main__":
    # Load the local HTML document into a BeautifulSoup object. The file is
    # opened with a context manager so the handle is released right after
    # parsing instead of staying open for the rest of the script.
    with open('./test.html', 'r', encoding='utf-8') as fp:
        soup = BeautifulSoup(fp, 'lxml')

    # soup.tagName returns the first occurrence of that tag in the document.
    print(soup.a)    # first <a> tag
    print(soup.div)  # first <div> tag

    # find('tagName') is equivalent to soup.tagName: first matching tag only.
    print(soup.find('div'))
    # Filter by class attribute (class_ because `class` is a Python keyword),
    # then read the text of the matched tag via .string.
    # NOTE(review): this raises AttributeError if no <div class="song">
    # exists in test.html -- confirm the fixture always contains one.
    print(soup.find('div', class_='song').string)
    # find_all returns every matching tag, not just the first.
    print(soup.find_all('a'))

    # select() takes a CSS selector and returns a list of matching tags.
    print(soup.select('.tang'))
    # '>' is the child combinator: each step descends exactly one level.
    print(soup.select('.tang > ul > li > a')[0])
    # A space is the descendant combinator: <a> may be nested at any depth
    # under the <ul>. .text gives the text content of the selected tag.
    print(soup.select('.tang > ul a')[0].text)


posted @ 2020-07-28 08:37  一只小白呀  阅读(145)  评论(0)  编辑  收藏  举报