# 网页数据解析三种方式

## 正则表达式

```python
import re
import requests

resp = requests.get(url=url, headers=headers)
pattern = re.compile(r'正则表达式')
data = pattern.findall(resp.text)
```

## bs4

```python
import bs4
import requests

resp = requests.get(url=url, headers=headers)
# 创建BeautifulSoup对象
soup = bs4.BeautifulSoup(resp.text, 'lxml')
# 通过CSS选择器从页面中提取标签
data = soup.select("css选择器")
```

## xpath

```python
import requests
from lxml import etree

resp = requests.get(url=url, headers=headers)
tree = etree.HTML(resp.text)
data = tree.xpath("xpath路径")
```