0%

python库-pandas的使用

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
import pandas as pd

# Build a DataFrame; reading an Excel workbook is used as the example source.
# With the default sheet selection, read_excel already returns a DataFrame,
# so no extra pd.DataFrame(...) wrapper is needed.
excelFile = 'TEMP.xlsx'
df = pd.read_excel(excelFile)

# Column filter: keep only the fields of interest.
df1 = df[['Project Name', 'Status', 'Offer', 'Tax Rate', 'PM']]

# Single-condition row filter: rows whose PM is 'Bob'.
df2 = df1.loc[df1['PM'] == 'Bob']

# Multi-condition row filter: combine the boolean masks with & (each
# comparison must be parenthesised because & binds tighter than ==).
# A single combined mask avoids chaining .loc calls, where the second mask
# is built from the unfiltered frame and has to be realigned by index.
df3 = df1.loc[(df1['PM'] == 'Bob') & (df1['Status'] == 'Completed')]

# Values of one column as a plain Python list: one entry per row, duplicates
# kept.
pmList = df1['PM'].tolist()
print(pmList)

# Iterate over the distinct PMs and print the rows belonging to each one.
# dict.fromkeys de-duplicates like set() but keeps first-seen order, so the
# groups are printed in the same order on every run.
for pm in dict.fromkeys(pmList):
    dfByPM = df1.loc[df1['PM'] == pm]
    print('\r\n')  # separator between consecutive groups
    print(dfByPM)

# Total 'Offer' per PM, collected as rows under a ['PM', 'Offer'] header row.
# pmList holds one entry per data row, so iterate over the distinct PMs
# (first-seen order); looping over pmList directly would append the same
# total once for every row that PM owns.
sum_list = [['PM', 'Offer']]
for pm in dict.fromkeys(pmList):
    dfByPM = df.loc[df['PM'] == pm]
    # Sum the 'Offer' column directly instead of scanning every column name.
    sumValue = dfByPM['Offer'].sum()
    sum_list.append([pm, sumValue])