Skip to content

python 单页面爬取数据

python 单页面爬取数据

python
# Single-page scraper: fetches one URL and extracts its text with BeautifulSoup (no XPath is used)
from bs4 import BeautifulSoup
import requests

# Fetch one page, reduce it to plain text, and print it highlighted.
url = "https://www.zhonghuadiancang.com/foxuebaodian/dazhidulun/140376.html"

# requests applies no timeout by default, so an unresponsive server would
# hang the script forever; bound the wait explicitly.
response = requests.get(url, timeout=30)
# Fail loudly on a 4xx/5xx reply instead of printing an error page's text
# as if it were the requested content.
response.raise_for_status()

# Decode the raw bytes as UTF-8, silently dropping undecodable bytes.
data = response.content.decode('utf-8', 'ignore')

# get_text() strips all markup; from here on `soup` is a plain str, not a
# BeautifulSoup object.
soup = BeautifulSoup(data, 'html.parser').get_text()

# Remove every ASCII space character (tabs, newlines and full-width spaces
# are left untouched).
soup = soup.replace(" ", "")

# ANSI SGR codes: "33;1" selects bold yellow, "0" resets the terminal style.
print('\033[33;1m' + soup + '\033[0m')