Pandas
Pandas
[3]: 0 4
1 7
2 -5
3 3
dtype: int64
[4]: d 4
b 7
a -5
c 3
dtype: int64
[5]: obj2.index
[6]: d 4
b 7
c 3
dtype: int64
[9]: sdata = {'Ohio': 35000, 'Texas': 71000, 'Oregon': 16000, 'Utah': 5000}
obj3 = pd.Series(sdata)
obj3
1
Manav Tarsariya ET22BTIT132
[9]: Ohio 35000
Texas 71000
Oregon 16000
Utah 5000
dtype: int64
[16]: frame2.columns
[17]: frame2['state']
[18]: frame.year
[18]: 0 2000
1 2001
2 2002
3 2001
4 2002
5 2003
Name: year, dtype: int64
[19]: frame2.loc['three']
3
Manav Tarsariya
ET22BTIT132
[21]: frame2
[23]: frame2
4
Manav Tarsariya ET22BTIT132
[26]: del frame2['eastern']
frame2.columns
[27]: pop = {'Nevada': {2001: 2.4, 2002: 2.9}, 'Ohio': {2000: 1.5, 2001: 1.7, 2002: 3.6}}
frame4 = pd.DataFrame(pop)
frame4
[29]: frame3.T
[35]: frame3.values
5
Manav Tarsariya ET22BTIT132
[35]: array([[2.4, 1.7],
[2.9, 3.6],
[nan, 1.5]])
[36]: frame2.values
[38]: 0 1.5
1 -2.5
2 0.0
dtype: float64
[41]: True
[42]: False
[43]: obj = pd.Series([4.5, 7.2, -5.3, 3.6], index=['d', 'b', 'a', 'c'])
obj
[43]: d 4.5
b 7.2
a -5.3
c 3.6
dtype: float64
6
Manav Tarsariya ET22BTIT132
[44]: a -5.3
b 7.2
c 3.6
d 4.5
e NaN
dtype: float64
[45]: 0 blue
2 purple
4 yellow
dtype: object
[46]: 0 blue
1 blue
2 purple
3 purple
4 yellow
5 yellow
dtype: object
7
Manav Tarsariya ET22BTIT132
[50]: Texas Utah California
a 1 NaN 2
c 4 NaN 5
d 7 NaN 8
[51]: a 0.0
b 1.0
c 2.0
d 3.0
e 4.0
dtype: float64
[52]: a 0.0
b 1.0
d 3.0
e 4.0
dtype: float64
8
Manav Tarsariya ET22BTIT132
New York 12 14 15
[57]: data['two']
[57]: Ohio 1
Colorado 5
Utah 9
New York 13
Name: two, dtype: int32
[60]: data[:2]
9
Manav Tarsariya
ET22BTIT132
Utah 8 9 10 11
New York 12 13 14 15
[62]: two 5
three 6
Name: Colorado, dtype: int32
[63]: four 11
one 8
two 9
Name: Utah, dtype: int32
[65]: Ohio 1
Colorado 5
Utah 9
Name: two, dtype: int32
[67]: a 5.2
c 1.1
d NaN
e 0.0
f NaN
g NaN
dtype: float64
10
Manav Tarsariya ET22BTIT132
[68]: s2+s1
[68]: a 5.2
c 1.1
d NaN
e 0.0
f NaN
g NaN
dtype: float64
df1
[69]: b c d
Ohio 0.0 1.0 2.0
Texas 3.0 4.0 5.0
Colorado 6.0 7.0 8.0
[70]: df2
[70]: b d e
Utah 0.0 1.0 2.0
Ohio 3.0 4.0 5.0
Texas 6.0 7.0 8.0
Oregon 9.0 10.0 11.0
[71]: df1+df2
[71]: b c d e
Colorado NaN NaN NaN NaN
Ohio 3.0 NaN 6.0 NaN
Oregon NaN NaN NaN NaN
Texas 9.0 NaN 12.0 NaN
Utah NaN NaN NaN NaN
[72]: df2+df1
[72]: b c d e
Colorado NaN NaN NaN NaN
Ohio 3.0 NaN 6.0 NaN
Oregon NaN NaN NaN NaN
Texas 9.0 NaN 12.0 NaN
Utah NaN NaN NaN NaN
11
Manav Tarsariya ET22BTIT132
[73]: df1 = pd.DataFrame(np.arange(12.).reshape((3, 4)),columns=list('abcd'))
df2 = pd.DataFrame(np.arange(20.).reshape((4, 5)), columns=list('abcde'))
df2.loc[1, 'b'] = np.nan
df1
[73]: a b c d
0 0.0 1.0 2.0 3.0
1 4.0 5.0 6.0 7.0
2 8.0 9.0 10.0 11.0
[74]: df2
[74]: a b c d e
0 0.0 1.0 2.0 3.0 4.0
1 5.0 NaN 7.0 8.0 9.0
2 10.0 11.0 12.0 13.0 14.0
3 15.0 16.0 17.0 18.0 19.0
[75]: df1+df2
[75]: a b c d e
0 0.0 2.0 4.0 6.0 NaN
1 9.0 NaN 13.0 15.0 NaN
2 18.0 20.0 22.0 24.0 NaN
3 NaN NaN NaN NaN NaN
[76]: df2+df1
[76]: a b c d e
0 0.0 2.0 4.0 6.0 NaN
1 9.0 NaN 13.0 15.0 NaN
2 18.0 20.0 22.0 24.0 NaN
3 NaN NaN NaN NaN NaN
[77]: df1
[77]: a b c d
0 0.0 1.0 2.0 3.0
1 4.0 5.0 6.0 7.0
2 8.0 9.0 10.0 11.0
[78]: df2
[78]: a b c d e
0 0.0 1.0 2.0 3.0 4.0
1 5.0 NaN 7.0 8.0 9.0
2 10.0 11.0 12.0 13.0 14.0
12
Manav Tarsariya ET22BTIT132
3 15.0 16.0 17.0 18.0 19.0
[80]: df2
[80]: a b c d e
0 0.0 1.0 2.0 3.0 4.0
1 5.0 6.0 7.0 8.0 9.0
2 10.0 11.0 12.0 13.0 14.0
3 15.0 16.0 17.0 18.0 19.0
[81]: a b c d e
0 0.0 2.0 4.0 6.0 4.0
1 9.0 11.0 13.0 15.0 9.0
2 18.0 20.0 22.0 24.0 14.0
3 15.0 16.0 17.0 18.0 19.0
[84]: 1 / df1
[84]: a b c d
0 inf 1.000000 0.500000 0.333333
1 0.250 0.200000 0.166667 0.142857
2 0.125 0.111111 0.100000 0.090909
[85]: df1.rdiv(1)
[85]: a b c d
0 inf 1.000000 0.500000 0.333333
1 0.250 0.200000 0.166667 0.142857
2 0.125 0.111111 0.100000 0.090909
[86]: a b c d e
0 0.0 1.0 2.0 3.0 0
13
Manav Tarsariya ET22BTIT132
1 4.0 5.0 6.0 7.0 0
2 8.0 9.0 10.0 11.0 0
[88]: arr[0]
[89]: arr-arr[0]
series = frame.iloc[0]
series
[90]: b 0.0
d 1.0
e 2.0
Name: Utah, dtype: float64
[91]: frame
[91]: b d e
Utah 0.0 1.0 2.0
Ohio 3.0 4.0 5.0
Texas 6.0 7.0 8.0
Oregon 9.0 10.0 11.0
14
Manav Tarsariya ET22BTIT132
[93]: frame.sub(series3, axis='index')
[93]: b d e
Utah -1.0 0.0 1.0
Ohio -1.0 0.0 1.0
Texas -1.0 0.0 1.0
Oregon -1.0 0.0 1.0
frame
[95]: b d e
Utah -1.878290 -0.008359 -0.423879
Ohio -1.838317 -0.319728 -1.481255
Texas 0.265776 -0.403625 0.374745
Oregon 0.671574 -0.775854 1.068877
[96]: np.abs(frame)
[96]: b d e
Utah 1.878290 0.008359 0.423879
Ohio 1.838317 0.319728 1.481255
Texas 0.265776 0.403625 0.374745
Oregon 0.671574 0.775854 1.068877
[97]: b 2.549863
d 0.767494
e 2.550132
dtype: float64
15
Manav Tarsariya ET22BTIT132
Oregon 1.844731
dtype: float64
[99]: frame
[99]: b d e
Utah -1.878290 -0.008359 -0.423879
Ohio -1.838317 -0.319728 -1.481255
Texas 0.265776 -0.403625 0.374745
Oregon 0.671574 -0.775854 1.068877
[100]: b d e
min -1.878290 -0.775854 -1.481255
max 0.671574 -0.008359 1.068877
[101]: b d e
Utah 3.527972 0.000070 0.179674
Ohio 3.379409 0.102226 2.194117
Texas 0.070637 0.162913 0.140434
Oregon 0.451011 0.601949 1.142498
frame.apply(f)
16
Manav Tarsariya ET22BTIT132
[109]: frame.apply(f)
[109]: b None
d None
e None
dtype: object
[115]: b d e
Utah -1.88 -0.01 -0.42
Ohio -1.84 -0.32 -1.48
Texas 0.27 -0.40 0.37
Oregon 0.67 -0.78 1.07
[116]: frame['e'].map(format)
[117]: a 1
b 2
c 3
d 0
dtype: int64
17
Manav Tarsariya ET22BTIT132
frame.sort_index()
[118]: d a b c
one 4 5 6 7
three 0 1 2 3
[119]: frame.sort_index(axis=1)
[119]: a b c d
three 1 2 3 0
one 5 6 7 4
[120]: d c b a
three 0 3 2 1
one 4 7 6 5
[121]: b a
0 4 0
1 7 1
2 -3 0
3 2 1
[122]: frame.sort_values(by='b')
[122]: b a
2 -3 0
3 2 1
0 4 0
1 7 1
[123]: b a
2 -3 0
0 4 0
3 2 1
1 7 1
18
Manav Tarsariya ET22BTIT132
[124]: 0 6.5
1 1.0
2 6.5
3 4.5
4 3.0
5 2.0
6 4.5
dtype: float64
[125]: obj.rank(method='first')
[125]: 0 6.0
1 1.0
2 7.0
3 4.0
4 3.0
5 2.0
6 5.0
dtype: float64
[126]: 0 2.0
1 7.0
2 2.0
3 4.0
4 5.0
5 6.0
6 4.0
dtype: float64
[128]: frame = pd.DataFrame({'b': [4.3, 7, -3, 2], 'a': [0, 1, 0, 1], 'c': [-2, 5, 8, -2.5]})
frame.rank(axis='columns')
frame
[128]: b a c
0 4.3 0 -2.0
1 7.0 1 5.0
2 -3.0 0 8.0
3 2.0 1 -2.5
[129]: frame.rank(axis='columns')
[129]: b a c
0 3.0 2.0 1.0
1 3.0 1.0 2.0
2 1.0 2.0 3.0
19
Manav Tarsariya ET22BTIT132
3 3.0 2.0 1.0
[130]: a 0
a 1
b 2
b 3
c 4
dtype: int64
[131]: obj['a']
[131]: a 0
a 1
dtype: int64
[132]: 0 1 2
a -0.120697 -1.900689 0.659151
a -0.161534 -0.120115 -0.697666
b 1.762015 -0.733370 -1.154350
b -0.476266 -1.405778 1.035751
[133]: df.loc['b']
[133]: 0 1 2
b 1.762015 -0.733370 -1.154350
b -0.476266 -1.405778 1.035751
df
20
Manav Tarsariya ET22BTIT132
[10]: df.sum()
[11]: df.sum(axis='columns')
[11]: a 1.40
b 2.60
c 0.00
d -0.55
dtype: float64
[12]: a NaN
b 1.300
c NaN
d -0.275
dtype: float64
[13]: df.idxmax()
[13]: one b
two d
dtype: object
[14]: df.cumsum()
[15]: df.tail()
[16]: obj = pd.Series(['c', 'a', 'd', 'a', 'a', 'b', 'b', 'c', 'c'])
[17]: obj
21
Manav Tarsariya ET22BTIT132
[17]: 0 c
1 a
2 d
3 a
4 a
5 b
6 b
7 c
8 c
dtype: object
[19]: unique
[20]: obj.value_counts()
[20]: c 3
a 3
b 2
d 1
dtype: int64
[21]: d 1
a 3
b 2
c 3
dtype: int64
[24]: 0 True
1 False
22
Manav Tarsariya ET22BTIT132
2 False
3 False
4 False
5 True
6 True
7 True
8 True
dtype: bool
[25]: obj[mask]
[25]: 0 c
5 b
6 b
7 c
8 c
dtype: object
[ ]:
23
Manav Tarsariya ET22BTIT132