# 数据处理 (Data processing)
# 单次处理 (Processing a single record)
def process_data(single_data):
    """Clean one ad record in place and derive its ROI and strategy fields.

    The record is modified directly and nothing is returned.

    Args:
        single_data: Mutable mapping for one ad plan. The code reads the
            keys '成交金额', 'GMV', '消耗' and '广告计划名称'; the plan name
            must contain at least four '_'-separated parts.

    Raises:
        KeyError: If one of the keys listed above is missing (dict input).
        ZeroDivisionError: If '消耗' is zero (plain Python numbers).
        IndexError: If the plan name has fewer than four '_'-separated parts.
    """
    # Drop the duplicated field.
    del single_data['成交金额']

    # Original note: "fix abnormal value" -- GMV is scaled down by 100.
    # NOTE(review): presumably the raw GMV is recorded at 100x; confirm
    # against the data source.
    single_data['GMV'] = single_data['GMV'] / 100

    # ROI: GMV divided by '消耗' (spend), rounded to two decimals.
    single_data['ROI'] = round(single_data['GMV'] / single_data['消耗'], 2)

    # Ad strategy: the plan name encodes four fields separated by '_'.
    # Split once and index by position; extra trailing parts are ignored.
    name_parts = single_data['广告计划名称'].split('_')
    strategy_fields = ('商品名称', '人群标签', '用户年龄', '用户等级')
    for position, field in enumerate(strategy_fields):
        single_data[field] = name_parts[position]
# Process one record; `ad_list` and `i` are not defined in this excerpt.
process_data(ad_list[i])
# 批量处理 (Batch processing)
def batch_data(data):
    """Clean every ad record in ``data`` in place.

    For each record this removes the duplicated '成交金额' field, scales
    'GMV' down by 100, computes 'ROI' and extracts the four strategy fields
    from '广告计划名称'. Nothing is returned.

    Args:
        data: Iterable of mutable mappings, one per ad plan. Each record
            must provide the keys '成交金额', 'GMV', '消耗' and
            '广告计划名称' (a string with at least four '_'-separated parts).

    Raises:
        KeyError: If a record lacks one of the keys above (dict input).
        ZeroDivisionError: If a record's '消耗' is zero (plain numbers).
        IndexError: If a plan name has fewer than four '_'-separated parts.
    """
    strategy_fields = ('商品名称', '人群标签', '用户年龄', '用户等级')

    # Iterate the records directly instead of indexing via range(len(...)).
    for record in data:
        # Drop the duplicated field.
        del record['成交金额']

        # Original note: "fix abnormal value" -- GMV is scaled down by 100.
        # NOTE(review): presumably the raw GMV is recorded at 100x; confirm.
        record['GMV'] = record['GMV'] / 100

        # ROI: GMV divided by '消耗' (spend), rounded to two decimals.
        record['ROI'] = round(record['GMV'] / record['消耗'], 2)

        # Ad strategy: split the plan name once and index by position;
        # extra trailing parts are ignored.
        name_parts = record['广告计划名称'].split('_')
        for position, field in enumerate(strategy_fields):
            record[field] = name_parts[position]
# Process the whole list in one call; `ad_list` is not defined in this excerpt.
batch_data(ad_list)
# 对批量处理数据简化 (Simplifying the batch processing)
def batch_data(data):
    """Apply ``process_data`` to every record in ``data``.

    Each record is handed to ``process_data`` in order. Nothing is returned
    by this function itself.

    Args:
        data: Iterable of records accepted by ``process_data``.
    """
    # Iterate the records directly instead of indexing via range(len(...)).
    for record in data:
        process_data(record)
# Process the whole list in one call; `ad_list` is not defined in this excerpt.
batch_data(ad_list)