import pandas as pd
import numpy as np
# Let printed frames show up to 999 columns before pandas truncates them.
pd.set_option('display.max_columns', 999)

# Load the order sheet and add a 'Year' column taken from each row's 'Date'.
orders = pd.read_excel('D:/Code/.vscode/Orders.xlsx')
orders['Year'] = pd.DatetimeIndex(orders['Date']).year

# One row per (Category, Year): 'sum' is the total of 'Total',
# 'count' is the number of non-null 'ID' values in the group.
groups = orders.groupby(['Category', 'Year'])
pt2 = groups.agg(sum=('Total', 'sum'), count=('ID', 'count'))
print(pt2)
# Note: the snippet above uses groupby to build a new DataFrame.
import pandas as pd
import numpy as np
# Let printed frames show up to 999 columns before pandas truncates them.
pd.options.display.max_columns = 999

# Load the order sheet and add a 'Year' column taken from each row's 'Date'.
orders = pd.read_excel('D:/Code/.vscode/Orders.xlsx')
orders['Year'] = pd.DatetimeIndex(orders.Date).year

# Pivot: one row per Category, one column per Year, each cell the sum of 'Total'.
# The string alias 'sum' is used instead of np.sum: since pandas 2.1 passing the
# NumPy callable emits a FutureWarning (pandas currently swaps it for its own
# group-wise sum, but a future version will call the function directly).
pt1 = orders.pivot_table(
    index='Category',
    columns='Year',
    values='Total',
    aggfunc='sum',
)
print(pt1)
# Note: the snippet above aggregates inside pivot_table via its aggfunc argument (originally NumPy's np.sum).