def clean_sales_data(raw_data):
    """Clean raw sales records and drop those without a positive amount.

    Each input record is a mapping with ``"date"``, ``"amount"`` and
    ``"region"`` keys. For every record that is kept:

    * ``date`` is copied through unchanged;
    * ``amount`` is converted with ``float()``;
    * ``region`` has surrounding whitespace stripped, and becomes ``"未知"``
      if nothing is left after stripping.

    Records whose amount is not strictly greater than zero (negative *and*
    zero amounts) are discarded.

    Args:
        raw_data: Iterable of record mappings as described above.

    Returns:
        A new list of cleaned record dicts, in input order.

    Raises:
        KeyError: If a record lacks one of the required keys.
        ValueError: If an amount cannot be parsed by ``float()``.
    """
    cleaned = []
    for item in raw_data:
        # Parse once and reuse the value for both the filter and the output.
        amount = float(item["amount"])
        if amount > 0:
            cleaned.append(
                {
                    "date": item["date"],
                    "amount": amount,
                    "region": item["region"].strip() or "未知",
                }
            )
    return cleaned


# Test data
raw = [
    {"date": "2023-08-01", "amount": "1500", "region": " 华东 "},
    {"date": "2023-08-02", "amount": "-999", "region": ""},
]
# Only the first record has a positive amount, so it is the only one kept.
print(clean_sales_data(raw))
# 二、多维度数据统计
def calculate_kpis(data):
    """Compute key business metrics for a collection of sales records.

    Args:
        data: Sized collection of mappings, each with a numeric ``"amount"``
            and a hashable ``"region"``.

    Returns:
        A dict with three keys:

        * ``"total_sales"``: sum of all amounts.
        * ``"avg_daily"``: total divided by the number of records. This is a
          per-day average only if ``data`` holds exactly one record per day;
          the function itself does not look at dates.
        * ``"top_region"``: the region with the largest summed amount. On a
          tie, the region that appears first in ``data`` wins.

        For empty input the result is
        ``{"total_sales": 0, "avg_daily": 0.0, "top_region": None}`` rather
        than a division-by-zero error.
    """
    if not data:
        return {"total_sales": 0, "avg_daily": 0.0, "top_region": None}

    # Single pass: accumulate per-region totals instead of re-summing the
    # whole list once per distinct region.
    region_totals = {}
    for item in data:
        region = item["region"]
        region_totals[region] = region_totals.get(region, 0) + item["amount"]

    total_sales = sum(item["amount"] for item in data)
    return {
        "total_sales": total_sales,
        "avg_daily": total_sales / len(data),
        # dicts keep insertion order and max() returns the first maximal
        # element, so ties are resolved deterministically.
        "top_region": max(region_totals, key=region_totals.get),
    }


# Usage example
sales_data = [
    {"region": "华东", "amount": 1500},
    {"region": "华南", "amount": 2000},
    {"region": "华东", "amount": 1800},
]
print(calculate_kpis(sales_data))
# {'total_sales': 5300, 'avg_daily': 1766.6666666666667, 'top_region': '华东'}