监控数据质量
def monitor_data_quality(data, *, missing_threshold=0.1, n_sigma=3):
    """Raise an alert on excessive missing data and return price outliers.

    Two checks are performed on ``data``:

    1. The fraction of missing cells is computed per column; if any column
       exceeds ``missing_threshold``, ``alert`` is called with a fixed
       message. ``alert`` is not defined in this function and is expected
       to be available in the enclosing module.
    2. Rows whose ``'price'`` lies more than ``n_sigma`` standard deviations
       above or below the mean of the ``'price'`` column are selected.

    Args:
        data: A pandas DataFrame containing a ``'price'`` column.
        missing_threshold: Per-column missing fraction above which the
            alert fires. Defaults to 0.1.
        n_sigma: Half-width of the accepted price band, in standard
            deviations. Defaults to 3.

    Returns:
        The subset of ``data`` rows whose price falls outside the band
        (empty when there are none).

    Raises:
        KeyError: If ``data`` has no ``'price'`` column.
    """
    # isnull().mean() gives the fraction of missing cells for each column.
    # The comparison therefore yields one boolean per column and must be
    # reduced with .any(); using the Series directly in `if` raises
    # "truth value of a Series is ambiguous".
    missing_ratio = data.isnull().mean()
    if (missing_ratio > missing_threshold).any():
        alert('数据缺失比例过高')

    # Detect outliers: compute the statistics once and reuse them for both
    # bounds.
    price = data['price']
    price_mean = price.mean()
    band = n_sigma * price.std()
    upper_bound = price_mean + band
    lower_bound = price_mean - band
    return data[(price > upper_bound) | (price < lower_bound)]
发布于2025-5-21 00:49 郑州

