# Excel 文件合并实战 (hands-on: merging data files into one Excel workbook)
import os,zipfile
import pandas as pd
# Zip archives to unpack before any data is loaded.
zip_files = ['sales_data.zip', 'traffic_data.zip']
for file in zip_files:
    # The context manager closes the archive handle even if extraction fails.
    with zipfile.ZipFile(file) as fz:
        fz.extractall()  # unpack into the current working directory
def read_data(file_name):
    """Load one CSV file and tag every row with a date taken from its name.

    The date is the last eight characters of the file name once the
    extension has been removed (expected to be a YYYYMMDD stamp). It is
    stored, as a string, in a new ``日期`` column.

    Args:
        file_name: Path of the CSV file to read.

    Returns:
        The file's contents as a DataFrame with the extra ``日期`` column.
    """
    frame = pd.read_csv(file_name)
    stem, _extension = os.path.splitext(file_name)
    date_stamp = stem[-8:]
    frame['日期'] = date_stamp
    return frame
# Directories to load, one per data source; each yields one combined frame.
two_data_path = ['traffic_data', 'sales_data']
two_df_list = []
for each_path in two_data_path:
    # os.listdir() returns entries in arbitrary order; sort them so the
    # concatenated rows come out in the same order on every run, and skip
    # anything that is not a regular file, which read_data() cannot parse.
    candidates = (
        os.path.join(each_path, name) for name in sorted(os.listdir(each_path))
    )
    files = [path for path in candidates if os.path.isfile(path)]
    df_list = [read_data(path) for path in files]  # one DataFrame per file
    # Stack this source's per-file frames into a single DataFrame.
    two_df_list.append(pd.concat(df_list))
# Outer-join the two combined frames on date and product SKU so that rows
# present in only one of them are kept.
left_df, right_df = two_df_list[0], two_df_list[1]
merge_df = left_df.merge(right_df, how='outer', on=['日期', '产品SKU'])
print(merge_df.head(3))
# Format adjustment: keep only the report columns, in output order.
# .copy() makes an independent frame so the assignment below does not write
# into a slice of merge_df (avoids SettingWithCopyWarning).
report_columns = ['日期', '产品SKU', '产品浏览量', '产品加入购物车次数', '订单产品数量', '订单产品收入']
merge_df2 = merge_df[report_columns].copy()
# pd.datetime no longer exists in current pandas; pd.to_datetime parses the
# whole YYYYMMDD string column in one call.
merge_df2['日期'] = pd.to_datetime(merge_df2['日期'], format='%Y%m%d')
print(merge_df2.head(3))
# Write the result to a standalone Excel file, without the index column.
merge_df2.to_excel('merge_data.xlsx', index=False)