# Sample data: each row records one fruit ('水果') placed in one box ('框').
data = pd.DataFrame(
    {
        '框': list('aabbccddccbbabd'),
        '水果': (
            '香蕉 苹果 香蕉 苹果 香蕉 苹果 香蕉 苹果 '
            '橘子 菠萝 菠萝 山竹 西瓜 草莓 草莓'
        ).split(),
    }
)
像上面这样的数据:有多个框,每个框内放入了不同种类的水果。如何去除所有框都共有的水果,并统计出各个框剩下的"特色水果"?
# Sample data: each row records one fruit ('水果') placed in one box ('框').
data = pd.DataFrame(
    {
        '框': list('aabbccddccbbabd'),
        '水果': (
            '香蕉 苹果 香蕉 苹果 香蕉 苹果 香蕉 苹果 '
            '橘子 菠萝 菠萝 山竹 西瓜 草莓 草莓'
        ).split(),
    }
)
像上面这样的数据:有多个框,每个框内放入了不同种类的水果。如何去除所有框都共有的水果,并统计出各个框剩下的"特色水果"?
def drop_shared_fruits(frame, box_col='框', fruit_col='水果'):
    """Return the rows whose fruit is not present in every box.

    A fruit is "shared" when it appears in each distinct box of
    ``frame``; all rows carrying a shared fruit are removed. The rows
    that remain are sorted by box and given a fresh 0..n-1 index.

    Args:
        frame: DataFrame with one row per (box, fruit) pair.
        box_col: Name of the column holding the box label.
        fruit_col: Name of the column holding the fruit name.

    Returns:
        A new DataFrame; ``frame`` itself is not modified.
    """
    # One set of fruits per box. The whole label is used as the group
    # key, so multi-character box names are handled correctly.
    fruits_per_box = [
        set(fruits) for _, fruits in frame.groupby(box_col)[fruit_col]
    ]
    # set.intersection() needs at least one argument, so guard the
    # "no boxes at all" case explicitly.
    shared = set.intersection(*fruits_per_box) if fruits_per_box else set()

    distinctive = frame[~frame[fruit_col].isin(shared)]
    return distinctive.sort_values(by=box_col).reset_index(drop=True)


# Sample data: each row records one fruit ('水果') placed in one box ('框').
data = pd.DataFrame({
    '框': ['a', 'a', 'b', 'b', 'c', 'c', 'd', 'd', 'c', 'c', 'b', 'b', 'a', 'b', 'd'],
    '水果': ['香蕉', '苹果', '香蕉', '苹果', '香蕉', '苹果', '香蕉', '苹果',
           '橘子', '菠萝', '菠萝', '山竹', '西瓜', '草莓', '草莓'],
})

# Keep only the fruits that are not common to all boxes.
data = drop_shared_fruits(data)
print(data)