import requests
from bs4 import BeautifulSoup
import pandas as pd
# NOTE(review): the original User-Agent value was cut off mid-string; confirm
# the intended browser signature before relying on this one.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)',
}
url = 'https://www.xxx.com/xxx'


def extract_titles(soup):
    """Return the text of every ``<h1 class="post_title">`` element in *soup*.

    *soup* is a parsed ``BeautifulSoup`` document. The result is a list of
    plain strings (one per matching heading, in document order), empty when
    the page has no matching heading.
    """
    return [heading.text for heading in soup.find_all('h1', class_='post_title')]


def build_title_frame(titles):
    """Return a one-column DataFrame holding *titles* under the column ``标题``.

    *titles* is an iterable of strings. Naming the column in the constructor
    (instead of assigning ``df.columns`` afterwards) keeps this valid when
    *titles* is empty, which would otherwise raise a length-mismatch error.
    """
    return pd.DataFrame({'标题': list(titles)})


def main():
    """Fetch ``url``, save the post titles to ``output.xlsx`` and print them.

    Prints ``Failed to retrieve the webpage`` when the request cannot be
    completed or the server answers with a status other than 200.
    """
    try:
        # A timeout keeps the script from hanging forever on a stalled server.
        response = requests.get(url, headers=headers, timeout=10)
    except requests.RequestException:
        print('Failed to retrieve the webpage')
        return

    if response.status_code != 200:
        print('Failed to retrieve the webpage')
        return

    soup = BeautifulSoup(response.text, 'html.parser')
    titles = extract_titles(soup)

    # Store the title text, not the Tag objects, so each Excel cell is a string.
    build_title_frame(titles).to_excel('output.xlsx', index=False)

    for title in titles:
        print(title)


if __name__ == '__main__':
    main()
