import pandas as pd
import datacompy
def build_sample_frames():
    """Build the two small demo DataFrames that the script compares.

    Both frames have the columns ``a``, ``b`` and ``c``. Reading the literal
    data below: the key ``a=2`` appears only in the first frame, ``a=4`` only
    in the second, and for ``a=3`` the value of ``b`` differs (4 vs 9).

    Returns:
        A ``(df, df2)`` tuple of pandas DataFrames.
    """
    columns = ["a", "b", "c"]
    df = pd.DataFrame(data=[(1, 2, 5), (3, 4, 5), (2, 3, 4)], columns=columns)
    df2 = pd.DataFrame(data=[(1, 2, 5), (3, 9, 5), (4, 3, 4)], columns=columns)
    return df, df2


def main():
    """Compare the two sample frames with datacompy and print each result.

    Output order: both input frames, a separator line, then one labelled
    section per datacompy accessor used below.
    """
    df, df2 = build_sample_frames()
    print(df)
    print(df2)
    print("------------------")

    # join_columns act like a unique key: the two frames are joined on
    # these columns before being compared.
    c = datacompy.Compare(df, df2, join_columns=['a'])

    # Label: "rows only in df1"
    print("df1独有的行:")
    print(c.df1_unq_rows)
    # Label: "rows only in df2"
    print("df2独有的行:")
    print(c.df2_unq_rows)
    # Label: "columns only in df1"
    print("df1独有的列:")
    print(c.df1_unq_columns())
    # Label: "columns only in df2"
    print("df2独有的列:")
    print(c.df2_unq_columns())
    # Label: "mismatched rows"
    print("不匹配的行:")
    print(c.all_mismatch())
    # Label: "do the column names match"
    print("列名是否匹配")
    print(c.all_columns_match())
    # Label: "do the frames match"
    print("是否匹配")
    print(c.matches())


# Run the demo only when executed as a script, not when imported.
if __name__ == '__main__':
    main()