1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45
# Demonstrates DataFrame.drop_duplicates with different `subset` / `keep`
# settings on a small two-column frame.
#
# Column A contains one repeated value ('TP601' at rows 1 and 4) and column B
# contains one repeated value ('M5' at rows 1 and 3); no complete row is
# repeated, so de-duplicating on all columns removes nothing.
a = pd.DataFrame({
    'A': ['TP512', 'TP601', 'TP108', 'TP509', 'TP601'],
    'B': ['M7', 'M5', 'M6', 'M5', 'M10'],
})

# All columns considered: every row is unique, so `b` equals `a`.
b = a.drop_duplicates()
# De-duplicate on B, keeping the first 'M5' (row 1) and dropping row 3.
c = a.drop_duplicates(subset='B', keep="first", inplace=False)
# De-duplicate on B, keeping the last 'M5' (row 3) and dropping row 1.
d = a.drop_duplicates(subset='B', keep="last", inplace=False)
# De-duplicate on A, keeping the first 'TP601' (row 1) and dropping row 4.
e = a.drop_duplicates(subset='A', keep="first", inplace=False)

print('没有去重前:', '\n', a)
print('全部列去重,删除重复保留首先出现的:', '\n', b)
print('B列去重,删除重复保留首先出现的:', '\n', c)
print('B列去重,删除重复保留最后出现的:', '\n', d)
# Label fixed: `e` is built with keep="first", so it keeps the FIRST
# occurrence; the previous label claimed the last occurrence was kept.
print('A列去重,删除重复保留首先出现的:', '\n', e)

# Expected output (print's default separator puts one extra space in front of
# each frame's header row):
#
# 没有去重前:
#         A    B
# 0  TP512   M7
# 1  TP601   M5
# 2  TP108   M6
# 3  TP509   M5
# 4  TP601  M10
# 全部列去重,删除重复保留首先出现的:
#         A    B
# 0  TP512   M7
# 1  TP601   M5
# 2  TP108   M6
# 3  TP509   M5
# 4  TP601  M10
# B列去重,删除重复保留首先出现的:
#         A    B
# 0  TP512   M7
# 1  TP601   M5
# 2  TP108   M6
# 4  TP601  M10
# B列去重,删除重复保留最后出现的:
#         A    B
# 0  TP512   M7
# 2  TP108   M6
# 3  TP509   M5
# 4  TP601  M10
# A列去重,删除重复保留首先出现的:
#         A   B
# 0  TP512  M7
# 1  TP601  M5
# 2  TP108  M6
# 3  TP509  M5
|