天天看点

Python百度百科爬虫

import sys
from urllib.parse import quote

import requests
from bs4 import BeautifulSoup
# Base URL of a Baidu Baike entry page; the entry name is appended as a path segment.
BAIKE_ITEM_URL = "https://baike.baidu.com/item/"

# Browser-like headers sent with every request.
REQUEST_HEADERS = {"user-agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.89 Safari/537.36 SLBrowser/7.0.0.5211 SLBChan/11"}

# Seconds to wait for the server before giving up, so a stalled
# connection cannot hang the interactive loop forever.
REQUEST_TIMEOUT = 10


def build_url(name: str) -> str:
    """Return the Baidu Baike URL for the entry called *name*.

    The name is percent-encoded as a single path segment. Without this,
    characters such as ``#``, ``?`` or ``/`` would be interpreted as URL
    syntax (e.g. ``C#`` would request the entry ``C``).
    """
    return BAIKE_ITEM_URL + quote(name, safe="") + "?fr=aladdin"


def fetch_summary(name: str):
    """Fetch the entry page for *name* and return its first ``para`` text.

    Returns the text of the first element whose CSS class is ``para``
    (presumably the entry's lead paragraph -- depends on the site's
    markup), or ``None`` when the page has no such element.

    Raises:
        requests.RequestException: on connection errors or timeouts.
    """
    res = requests.get(
        build_url(name),
        headers=REQUEST_HEADERS,
        timeout=REQUEST_TIMEOUT,
    )
    soup = BeautifulSoup(res.text, 'html.parser')
    para = soup.find(class_="para")
    return None if para is None else para.text


def read_names():
    """Yield entry names typed on stdin until an empty line or end of input."""
    while True:
        try:
            name = input()
        except EOFError:
            # stdin was closed or piped input ran out: stop cleanly
            # instead of dying with a traceback.
            return
        if name == '':
            return
        yield name


def main() -> None:
    """Look up each name read from stdin and print the text found for it."""
    for name in read_names():
        try:
            summary = fetch_summary(name)
        except requests.RequestException as err:
            # One failed lookup should not end the whole session; report
            # on stderr so stdout still carries only entry text.
            print("request failed for %r: %s" % (name, err), file=sys.stderr)
            continue
        # Entries without a matching paragraph are skipped silently,
        # as the original script did.
        if summary is not None:
            print(summary)


if __name__ == "__main__":
    main()

           
Python百度百科爬虫