Dsbda 3
Dsbda 3
In [2]: ed=pd.read_csv("Employee_Data.csv")  # read the employee CSV (path is relative to the working directory) into `ed`
In [3]: ed  # show the loaded frame; the output below lists rows 0-34
0 1 5 28 Female 250000
1 2 1 21 Male 50000
2 3 3 23 Female 170000
3 4 2 22 Male 25000
4 5 1 17 Male 10000
5 6 25 62 Male 5001000
6 7 19 54 Female 800000
7 8 2 21 Female 9000
8 9 10 36 Female 61500
9 10 15 54 Female 650000
10 11 4 26 Female 250000
11 12 6 29 Male 1400000
12 13 14 39 Male 6000050
13 14 11 40 Male 220100
14 15 2 23 Male 7500
15 16 4 27 Female 87000
16 17 10 34 Female 930000
17 18 15 54 Female 7900000
18 19 2 21 Male 15000
19 20 10 36 Male 330000
20 21 15 54 Male 6570000
21 22 4 26 Male 25000
22 23 5 29 Male 6845000
23 24 1 21 Female 6000
24 25 4 23 Female 8900
25 26 3 22 Female 20000
26 27 1 18 Male 3000
27 28 27 62 Female 10000000
28 29 19 54 Female 5000000
29 30 2 21 Female 6100
30 31 10 34 Male 80000
31 32 15 54 Male 900000
32 33 20 55 Female 1540000
33 34 19 53 Female 9300000
34 35 16 49 Male 7600000
In [4]: ed.mean()
In [5]: ed.loc[:,'Age'].mean()
35.48571428571429
Out[5]:
In [6]: ed.mean(axis=1)[0:4]
In [7]: ed.median()
In [8]: ed.loc[:,'Age'].median()
29.0
Out[8]:
In [9]: ed.median(axis=1)[0:10]
In [10]: ed.mode()
In [11]: ed.loc[:,'Age'].mode()
0 54
Out[11]:
Name: Age, dtype: int64
In [12]: ed.min()  # per-column minimum; the output below includes the string column Gender
ID 1
Out[12]:
Experience_Years 1
Age 17
Gender Female
Salary 3000
dtype: object
17
Out[13]:
17
Out[14]:
In [15]: ed.max()  # per-column maximum; the output below includes the string column Gender
ID 35
Out[15]:
Experience_Years 27
Age 62
Gender Male
Salary 10000000
dtype: object
62
Out[16]:
62
Out[17]:
In [18]: ed.std()
In [19]: ed.loc[:,'Age'].std()
14.643551940884361
Out[19]:
In [20]: ed.std(axis=1)[0:4]
In [21]: ed.groupby(['Gender'])['Age'].mean()
Gender
Out[21]:
Female 37.111111
Male 33.764706
Name: Age, dtype: float64
Gender
Out[22]:
Female 2.054917e+06
Male 2.063626e+06
Name: Income, dtype: float64
In [24]: enc_ed  # display the encoded frame; presumably a one-hot encoding of Gender built in a cell not shown here - TODO confirm
Out[24]: 0 1
0 1.0 0.0
1 0.0 1.0
2 1.0 0.0
3 0.0 1.0
4 0.0 1.0
5 0.0 1.0
6 1.0 0.0
7 1.0 0.0
8 1.0 0.0
9 1.0 0.0
10 1.0 0.0
11 0.0 1.0
12 0.0 1.0
13 0.0 1.0
14 0.0 1.0
15 1.0 0.0
16 1.0 0.0
17 1.0 0.0
18 0.0 1.0
19 0.0 1.0
20 0.0 1.0
21 0.0 1.0
22 0.0 1.0
23 1.0 0.0
24 1.0 0.0
25 1.0 0.0
26 0.0 1.0
27 1.0 0.0
28 1.0 0.0
29 1.0 0.0
30 0.0 1.0
31 0.0 1.0
32 1.0 0.0
33 1.0 0.0
34 0.0 1.0
In [25]: ed_encode=ed_u.join(enc_ed)  # index-aligned join of enc_ed's columns onto ed_u (ed_u is defined in a cell not shown here)
ed_encode  # display the joined frame
In [30]: iris  # display the iris frame (created in a cell not shown here)
In [32]: print('Iris-setosa')
print(iris[irisSet].describe())
Iris-setosa
Sepal_Length Sepal_Width Petal_Length Petal_Width
count 50.00000 50.000000 50.000000 50.00000
mean 5.00600 3.418000 1.464000 0.24400
std 0.35249 0.381024 0.173511 0.10721
min 4.30000 2.300000 1.000000 0.10000
25% 4.80000 3.125000 1.400000 0.20000
50% 5.00000 3.400000 1.500000 0.20000
75% 5.20000 3.675000 1.575000 0.30000
max 5.80000 4.400000 1.900000 0.60000
In [34]: print('Iris-versicolor')
print(iris[irisVer].describe())
In [36]: print('Iris-virginica')
print(iris[irisVir].describe())
Iris-virginica
Sepal_Length Sepal_Width Petal_Length Petal_Width
count 50.00000 50.000000 50.000000 50.00000
mean 6.58800 2.974000 5.552000 2.02600
std 0.63588 0.322497 0.551895 0.27465
min 4.90000 2.200000 4.500000 1.40000
25% 6.22500 2.800000 5.100000 1.80000
50% 6.50000 3.000000 5.550000 2.00000
75% 6.90000 3.175000 5.875000 2.30000
max 7.90000 3.800000 6.900000 2.50000
In [ ]: