"""Generate an Excel workbook of synthetic order data containing missing values."""

import numpy as np
import pandas as pd

# Number of distinct random amounts the "consume" column is sampled from.
_CONSUME_POOL_SIZE = 90


def build_missing_dataset(n_rows: int = 100) -> pd.DataFrame:
    """Build a test dataset whose columns contain missing values.

    Columns:
        user_id:  consecutive integers starting at 1 (never missing).
        age:      sampled from NaN and the integers 18..54.
        consume:  sampled from NaN and 90 random amounts drawn uniformly
                  from [50, 5000), rounded to 2 decimals.
        pay_time: consecutive days starting at 2025-05-01 (never missing).
        remark:   sampled from NaN and three order-remark labels.

    Sampling uses NumPy's global random state, so callers may call
    ``np.random.seed`` beforehand for reproducible output.

    Args:
        n_rows: Number of rows to generate.

    Returns:
        A DataFrame with ``n_rows`` rows and the five columns above.
    """
    age_pool = [np.nan, *range(18, 55)]
    age = np.random.choice(age_pool, n_rows)

    amounts = np.random.uniform(50, 5000, _CONSUME_POOL_SIZE)
    consume_pool = [np.nan] + [round(x, 2) for x in amounts]
    consume = np.random.choice(consume_pool, n_rows)

    # The pool must be an object array: a plain list mixing NaN with strings
    # is coerced by NumPy to a Unicode array, which turns NaN into the
    # literal text "nan" and leaves the column with no real missing values.
    remark_pool = np.array([np.nan, "正常订单", "加急", "开票"], dtype=object)
    remark = np.random.choice(remark_pool, n_rows)

    return pd.DataFrame(
        {
            "user_id": range(1, n_rows + 1),
            "age": age,
            "consume": consume,
            "pay_time": pd.date_range("2025-05-01", periods=n_rows, freq="D"),
            "remark": remark,
        }
    )


if __name__ == "__main__":
    df = build_missing_dataset()
    # Writing .xlsx requires an Excel writer engine (e.g. openpyxl) to be installed.
    df.to_excel("missing_data.xlsx", index=False)
    print("含缺失值测试数据生成完成")