import pandas as pd
from scipy import stats
# One-way ANOVA: does mean Purchase_Amount differ between cities?
file_path = '/mnt/data/A题-沃尔玛客户购买行为数据集.xlsx'
data_new = pd.read_excel(file_path)

# Drop the row labelled 0.
# NOTE(review): presumably a secondary header/description row - confirm
# against the workbook.
data_new_clean = data_new.drop(index=0)

# Coerce the numeric columns; unparseable cells become NaN and are then
# replaced by the column mean.
# The filled column is assigned back instead of calling
# `fillna(..., inplace=True)` on the column selection: that chained in-place
# form operates on a temporary under pandas Copy-on-Write and would leave the
# NaNs in the frame, which in turn makes the ANOVA return nan.
for numeric_column in ('Purchase_Amount', 'Age'):
    numeric_values = pd.to_numeric(
        data_new_clean[numeric_column], errors='coerce'
    )
    data_new_clean[numeric_column] = numeric_values.fillna(
        numeric_values.mean()
    )

data_new_clean['City'] = data_new_clean['City'].astype('category')

# One list of purchase amounts per city. `observed=True` restricts the groups
# to cities actually present in the data and avoids the deprecation warning
# for the implicit default when grouping on a categorical column.
city_purchase_data = (
    data_new_clean.groupby('City', observed=True)['Purchase_Amount']
    .apply(list)
)

# Each city's amounts form one sample of the one-way ANOVA.
f_statistic, p_value = stats.f_oneway(*city_purchase_data)
print("F统计量:", f_statistic)
print("P值:", p_value)