"""Cross-check the name and ID columns of an Excel export.

Reads two columns from ``download.xlsx``, reports how many distinct names
and distinct IDs they contain, and lists every ID that appears with more
than one name.
"""
import pandas as pd
import json

path = "download.xlsx"
# Zero-based positions of the (name, id) columns read from the sheet.
NAME_ID_COLUMNS = [17, 18]
# ID whose collected names are printed at the end of every run.
PROBE_ID = 'MzUzMjMxNTE3Ng=='


def collect_names_and_ids(rows):
    """Group the names found in *rows* by their ID.

    Args:
        rows: Iterable of sequences where index 0 is the name and index 1
            is the ID.

    Returns:
        A ``(name_set, id_set, name_id_dict)`` tuple: the distinct raw
        names, the distinct IDs, and a dict mapping each ID to the set of
        names (converted with ``str``) seen alongside it.
    """
    name_set = set()
    id_set = set()
    name_id_dict = {}
    for row in rows:
        name, key = row[0], row[1]
        name_set.add(name)
        id_set.add(key)
        # Names are stringified only inside the per-ID mapping; name_set
        # keeps the raw cell value.
        # NOTE(review): empty cells presumably arrive as NaN from pandas
        # and are counted like any other value -- confirm that is intended.
        name_id_dict.setdefault(key, set()).add(str(name))
    return name_set, id_set, name_id_dict


def ids_with_multiple_names(name_id_dict):
    """Return the entries of *name_id_dict* that hold more than one name.

    The order of the input mapping is preserved; ``len()`` of the result
    is the number of conflicting IDs.
    """
    return {
        key: names
        for key, names in name_id_dict.items()
        if len(names) > 1
    }


def main():
    """Load the spreadsheet and print the name/ID consistency report."""
    rows = pd.read_excel(path, usecols=NAME_ID_COLUMNS).values.tolist()
    name_set, id_set, name_id_dict = collect_names_and_ids(rows)

    print(len(name_set))
    print(len(id_set))

    for key, names in ids_with_multiple_names(name_id_dict).items():
        print(key, "\t", names)

    # A plain subscript here would abort the whole report with KeyError
    # when the probe ID is not present in the sheet.
    if PROBE_ID in name_id_dict:
        print(name_id_dict[PROBE_ID])
    else:
        print(f"{PROBE_ID!r} not found in {path}")

    # Optional export of the collected IDs (disabled):
    # with open("fake_id.json", "w", encoding="utf-8") as f:
    #     f.write(json.dumps(list(id_set)))


if __name__ == "__main__":
    main()