-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathpandasDFGroupBy2.py
More file actions
43 lines (30 loc) · 1.04 KB
/
Copy pathpandasDFGroupBy2.py
File metadata and controls
43 lines (30 loc) · 1.04 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
# -*- coding: utf-8 -*-
"""
Created on Thu Mar 14 15:08:15 2019
@author: u
"""
import pandas as pd
import numpy as np
df = pd.read_excel('MLBPlayerSalaries.xlsx')
df = pd.read_csv('MBPlayerSalaries200Sample2.csv')
print ('msg 1')
print('1,1',df.iloc[1,1])
print ('msg 2')
print('0:1,0:1\n',df.iloc[0:1,0:5])
print ( df.head())
print ( df.columns )
#Index(['Unnamed: 0', 'Unnamed: 0.1', 'Unnamed: 0.1.1', 'Year', 'Player',
# 'Salary', 'Position', 'Team'],
g1 = df.groupby(["Player"]).size().reset_index(name='Number per player')
print (g1)
g1 = df.groupby(["Team"]).size().reset_index(name='Number per team')
print (g1)
g1 = df.groupby(["Year"]).size().reset_index(name='Number per year')
print (g1)
print ( '-- g1 = df.groupby(["Year"]).sum() --' ) # sums all the number columns
g1 = df.groupby(["Year"]).sum()
print (g1)
grouped = ( df.groupby(['Year']).agg({ "Salary":np.sum} ) ) # sums specified number columns
print(grouped)
g1 = df.groupby(['Year']).agg({ "Salary":np.mean} )
print (g1)