merge_df.py 977 B

12345678910111213
  1. import pandas as pd
  2. # path = r'E:\code\name_classify\data_before\Shopify7月订单-客户数据.xlsx'
  3. # df_origin = pd.read_excel(path)
  4. # df_result = pd.read_csv(r'E:\code\name_classify\data_before\result_1.csv')
  5. # # df_result['classify'] = df_result['v'].apply(lambda x : str(x).replace('Non-Chinese', '非华裔').replace('non-Chinese', '非华裔').replace('Chinese','华裔').replace('可能是华裔','华裔')\
  6. # # .replace('可能华裔','华裔').replace('非华人','华裔').replace('华人','非华裔').replace('是','华裔').replace('否','非华裔'))
  7. # df_final = df_origin.merge(df_result, on='name', how='left')
  8. # df_final = df_origin.merge(df_result, on='name', how='left').drop_duplicates(subset=['Name','name'], keep='first')
  9. df_final = pd.read_excel(r'E:\code\name_classify\output_final.xlsx')
  10. df_final.drop_duplicates(subset=['Name','name'], keep='first')
  11. df_final.to_excel('output_final_8.xlsx')