import requests
from bs4 import BeautifulSoup
import pandas as pd
def _select_text(node, selector):
    """Return the stripped text of the first match for *selector*, or ''.

    ``select_one`` returns ``None`` when nothing matches, so a missing field
    yields an empty string instead of raising ``AttributeError``.
    """
    match = node.select_one(selector)
    return match.text.strip() if match is not None else ''


def get_exhibition_data(timeout=10):
    """Fetch the exhibition listing page and extract one record per item.

    Args:
        timeout: Seconds to wait for the server before giving up.

    Returns:
        A list of dicts, one per ``.exhibition-item`` element, keyed by
        '展会名称', '时间', '行业' and '地址'. A field whose element is missing
        from an item is stored as an empty string. An empty list is returned
        when the request fails or the server answers with a non-200 status.
    """
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'
    }
    url = "https://shanghai.andexpo.com/"

    try:
        # Without a timeout, requests waits indefinitely on a stalled server.
        response = requests.get(url, headers=headers, timeout=timeout)
    except requests.RequestException as exc:
        # Connection errors and timeouts take the same "no data" path as a
        # bad status code instead of crashing with a traceback.
        print("请求失败:", exc)
        return []

    if response.status_code != 200:
        print("请求失败,状态码:", response.status_code)
        return []

    # Force UTF-8 decoding before reading response.text.
    response.encoding = 'utf-8'
    soup = BeautifulSoup(response.text, 'html.parser')

    return [
        {
            '展会名称': _select_text(item, '.title'),
            '时间': _select_text(item, '.time'),
            '行业': _select_text(item, '.industry'),
            '地址': _select_text(item, '.address'),
        }
        for item in soup.select('.exhibition-item')
    ]
def save_to_excel(data, filename='上海展会数据.xlsx'):
    """Write *data* to an Excel workbook and report where it was saved.

    Args:
        data: Records to export; passed directly to ``pd.DataFrame``.
        filename: Destination path of the workbook. Defaults to the name
            the script has always used, so existing callers are unaffected.
    """
    frame = pd.DataFrame(data)
    # index=False keeps the DataFrame's row index out of the sheet.
    frame.to_excel(filename, index=False)
    print(f"数据已保存到 {filename}")
if __name__ == '__main__':
    # Script entry point: scrape first, then export only if something came back.
    exhibition_data = get_exhibition_data()
    if not exhibition_data:
        print("未获取到有效数据")
    else:
        save_to_excel(exhibition_data)