python 单页面爬取数据
python 单页面爬取数据
python
# Single-page scraper: fetch one page with requests and extract its text with BeautifulSoup (no XPath involved)
from bs4 import BeautifulSoup
import requests
# Fetch one HTML page, reduce it to its plain text, drop ASCII spaces, and
# print the result to the terminal in bold yellow.
url = "https://www.zhonghuadiancang.com/foxuebaodian/dazhidulun/140376.html"

# requests has no default timeout; without one a stalled server would hang
# the script indefinitely.
response = requests.get(url, timeout=10)
# Fail loudly on 4xx/5xx instead of printing an error page as if it were
# the requested content.
response.raise_for_status()

# Decode the raw bytes as UTF-8, silently dropping undecodable bytes.
data = response.content.decode('utf-8', 'ignore')

# NOTE: despite its name, `soup` holds the extracted text (a str), not a
# BeautifulSoup object; the name is kept for backward compatibility.
soup = BeautifulSoup(data, 'html.parser').get_text()
# Only the ASCII space character is removed; newlines and other whitespace
# are left in place.
soup = soup.replace(" ", "")

# ANSI escape codes: "33;1" selects bold yellow, "0" resets the attributes.
print('\033[33;1m' + soup + '\033[0m')