import random
import pandas as pd
import numpy as np
# Load the project-tag / person sheet. Ids are cast to text so that they can be
# concatenated into one string per tag below.
df1 = pd.read_excel(r'C:\Users\Administrator\Desktop\项目标签_人员.xlsx')
df1['人员id'] = df1['人员id'].astype('str')


def _join_ids(ids):
    """Concatenate one group's person ids into a single comma-separated string."""
    return ids.str.cat(sep=",")


# One row per project tag; the "人员id" column holds every id seen for that tag,
# joined with commas.
ids_by_tag = df1.groupby("项目标签")["人员id"]
gp = ids_by_tag.apply(_join_ids).reset_index()
gp.head()
# Assign every row of df2 one randomly chosen person id from the ids grouped
# under the same project tag in gp, then export the result to Excel.
#
# NOTE(review): df2 is not defined anywhere in the visible part of this script;
# it must already exist (with a "项目标签" column) before this point - confirm.

# gp holds one row per tag, so a dict built once replaces the original
# row-by-row scan of gp for every df2 entry.
ids_by_tag = {
    tag: joined_ids.split(",")
    for tag, joined_ids in zip(gp["项目标签"], gp["人员id"])
}

flag = []
for bq in df2["项目标签"]:
    candidates = ids_by_tag.get(bq)
    # Only draw when the tag is known, so the random stream is consumed
    # exactly once per matched row.
    picked = random.choice(candidates) if candidates else None
    # An unmatched tag or an empty id is recorded as None.
    flag.append(picked or None)

df2["人员id匹配"] = flag
df2.to_excel(r'C:\Users\Administrator\Desktop\out_put.xlsx', index=False)
# Mark which df2 project tags also occur in df1: the "flag" column repeats the
# tag when it is present in df1 and holds None otherwise.
#
# NOTE(review): df2 is not defined in the visible part of this script, and this
# column is added after the to_excel export above, so it is not part of the
# written file - confirm that this is intended.

# Build the membership set once instead of converting the df1 column to a list
# on every iteration.
known_tags = set(df1['项目标签'].tolist())

flag = [row if row in known_tags else None for row in df2["项目标签"].values]
df2["flag"] = flag
df2.head()