# Inner join
import pandas as pd
# Load the two score files. low_memory=False tells pandas to parse each file
# in one pass rather than in chunks, avoiding mixed-type column inference.
df1 = pd.read_csv('score_20200625.csv', low_memory=False, encoding='utf_8')
df2 = pd.read_csv('score_20200727.csv', low_memory=False, encoding='utf_8')

# Inner join on bd_code with df2 as the left frame: only bd_code values that
# occur in both frames survive.
df3 = df2.merge(df1, on='bd_code', how='inner')

# Save the inner-join result, including the header row and the index column.
df3.to_csv('inner_join.csv', index=True, header=True)
# Left join
import pandas as pd
# Load the two score files. low_memory=False tells pandas to parse each file
# in one pass rather than in chunks, avoiding mixed-type column inference.
df1 = pd.read_csv(r'score_20200625.csv', encoding='utf_8', low_memory=False)
df2 = pd.read_csv(r'score_20200727.csv', encoding='utf_8', low_memory=False)
# Left join on bd_code with df2 as the left frame. indicator=True adds a
# `_merge` column recording whether each row was found in both frames or
# only in the left one.
df3 = pd.merge(left=df2, right=df1, how='left', on='bd_code', indicator=True)
# Keep only the rows that found no partner in df1. Using the merge indicator
# (rather than "any NaN in the row") avoids misclassifying matched rows that
# merely contain missing values in the source data, and still works when df1
# contributes no columns besides the key.
df3 = df3[df3['_merge'] == 'left_only'].drop(columns='_merge')
# Save the unmatched rows, including the header row and the index column.
df3.to_csv('left_join.csv', header=True, index=True)