import requests
from bs4 import BeautifulSoup
# Fetch the raw HTML of a web page.
def get_html(url, *, timeout=10):
    """Return the body text of ``url``, or ``None`` if it cannot be fetched.

    Args:
        url: Address of the page to download.
        timeout: Seconds to wait for the server before giving up. Without a
            timeout ``requests`` may block indefinitely on a stalled server.

    Returns:
        The response body as text when the server answers with HTTP 200;
        ``None`` for any other status code or when the request itself fails.
    """
    try:
        response = requests.get(url, timeout=timeout)
    except requests.RequestException:
        # Any request-level failure (including a timeout) is reported as
        # "no content" rather than propagated to the caller.
        return None
    if response.status_code == 200:
        return response.text
    return None


# Parse a page and extract the information of interest.
def parse_html(html):
    """Return the text of the page's ``<title>`` element, or ``None`` if absent.

    Args:
        html: HTML markup to parse.
    """
    soup = BeautifulSoup(html, 'html.parser')
    # The piece of information extracted here is the page title.
    title = soup.find('title')
    return title.text if title else None


# Usage example
url = 'https://www.example.com'
html = get_html(url)
if html:
    # Only parse when the download returned a non-empty body.
    parsed_title = parse_html(html)
    print(f"The title of the webpage is: {parsed_title}")
else:
    print("Failed to retrieve the webpage content.")
# Page footer carried over from the source blog post: "Comments are closed."