Python Coding Practice
Python Coding Practice
Import libraries
In [1]: import pandas as pd
Creating DataFrame
In [2]: a = {"door":(5,3,4,7,2),"window":(2,5,7,8,6)}  # column name -> tuple of five values
b = pd.DataFrame(a)  # each dict key becomes a column; rows get the default integer index 0..4
b  # bare last expression: the notebook renders the frame as a table
Out[2]:
door window
0 5 2
1 3 5
2 4 7
3 7 8
4 2 6
In [3]: c = {"price":(12,15,72,64,52)}  # a single column with five values, one per row of b
d = pd.DataFrame(c)  # one-column frame with the same default index 0..4 as b
d  # display the new frame
Out[3]:
price
0 12
1 15
2 72
3 64
4 52
Joining DataFrames
pd.concat()
In [4]: e = pd.concat([b,d],axis = 1)  # axis=1 joins column-wise: d's price column is placed beside b's door and window
e  # display the combined frame (door, window, price)
Out[4]:
door window price
0 5 2 12
1 3 5 15
2 4 7 72
3 7 8 64
4 2 6 52
In [5]: e.head()  # first rows of e (up to 5 by default); e has exactly five rows, so the whole frame is shown
Out[5]:
door window price
0 5 2 12
1 3 5 15
2 4 7 72
3 7 8 64
4 2 6 52
In [6]: e.tail()  # last rows of e (up to 5 by default); with five rows this is again the whole frame
Out[6]:
door window price
0 5 2 12
1 3 5 15
2 4 7 72
3 7 8 64
4 2 6 52
In [7]: e.describe()  # per-column summary statistics (count, mean, std, min, quartiles, max for numeric columns)
Out[7]:
door window price
In [8]: e.info()  # prints the index range, per-column non-null counts and dtypes, and memory usage
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 5 entries, 0 to 4
Data columns (total 3 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 door 5 non-null int64
1 window 5 non-null int64
2 price 5 non-null int64
dtypes: int64(3)
memory usage: 248.0 bytes
In [9]: e[['door']]  # a list of labels selects columns and returns a DataFrame (one column here), not a Series
Out[9]:
door
0 5
1 3
2 4
3 7
4 2
Out[10]:
door price
0 5 12
1 3 15
2 4 72
3 7 64
4 2 52
In [11]: e  # display e: all three columns are still present, so the door/price view in Out[10] did not modify e
Out[11]:
door window price
0 5 2 12
1 3 5 15
2 4 7 72
3 7 8 64
4 2 6 52
Out[12]: 7
Out[13]: 7
In [14]: e[e["price"]>20]  # boolean mask: keeps only rows whose price exceeds 20; original index labels (2, 3, 4) are preserved
Out[14]:
door window price
2 4 7 72
3 7 8 64
4 2 6 52
In [15]: e  # display e: all five rows remain, because the filter above returned a new frame
Out[15]:
door window price
0 5 2 12
1 3 5 15
2 4 7 72
3 7 8 64
4 2 6 52
Out[16]:
door price
0 5 12
1 3 15
2 4 72
3 7 64
4 2 52
In [17]: g = {"window":(2,5,7,None,5)}  # None marks a missing value at position 3
h=pd.DataFrame(g)  # the missing value is stored as NaN, which makes the column float (2.0, 5.0, ...)
h  # display the frame with the missing entry
Out[17]:
window
0 2.0
1 5.0
2 7.0
3 NaN
4 5.0
In [18]: h.fillna(3)  # returns a new frame with NaN replaced by the constant 3; h is not modified because the result is not assigned
Out[18]:
window
0 2.0
1 5.0
2 7.0
3 3.0
4 5.0
In [19]: h  # h still holds NaN at index 3: the fillna(3) result above was only displayed, not stored
Out[19]:
window
0 2.0
1 5.0
2 7.0
3 NaN
4 5.0
In [20]: h.fillna(h["window"].mean())  # fill NaN with the mean of the non-missing values: (2+5+7+5)/4 = 4.75
Out[20]:
window
0 2.00
1 5.00
2 7.00
3 4.75
4 5.00
In [21]: h.fillna(h["window"].median())  # fill NaN with the median of the non-missing values (2, 5, 5, 7), which is 5.0
Out[21]:
window
0 2.0
1 5.0
2 7.0
3 5.0
4 5.0
In [22]: h.fillna(h["window"].mode()[0])  # mode() returns a Series of the most frequent value(s); [0] takes the first one (5.0, which occurs twice)
Out[22]:
window
0 2.0
1 5.0
2 7.0
3 5.0
4 5.0
In [23]: e  # display e (door, window, price) before a new column is added
Out[23]:
door window price
0 5 2 12
1 3 5 15
2 4 7 72
3 7 8 64
4 2 6 52
In [24]: e["fan"]=[1,2,5,2,4]  # adds a new column to e in place; the list supplies one value per existing row
e  # the new fan column appears as the last column
Out[24]:
door window price fan
0 5 2 12 1
1 3 5 15 2
2 4 7 72 5
3 7 8 64 2
4 2 6 52 4
In [25]: e[["door","window","fan","price"]]  # selecting with a list returns a new frame with columns in the listed order; e keeps its own order
Out[25]:
door window fan price
0 5 2 1 12
1 3 5 2 15
2 4 7 5 72
3 7 8 2 64
4 2 6 4 52
Out[26]:
door window fan price
0 5 2 1 12
1 3 5 2 15
2 4 7 5 72
3 7 8 2 64
4 2 6 4 52
In [27]: e  # display e: its stored column order is unchanged (door, window, price, fan)
Out[27]:
door window price fan
0 5 2 12 1
1 3 5 15 2
2 4 7 72 5
3 7 8 64 2
4 2 6 52 4
In [28]: e.mean()  # arithmetic mean of each column
In [29]: e.median()  # median of each column
In [30]: e.mode().iloc[0]  # mode() returns a frame of modes per column; .iloc[0] takes its first row, i.e. the first mode of each column
In [31]: e.var()  # variance of each column (pandas defaults to the sample variance, ddof=1)
In [32]: e.std()  # standard deviation of each column (sample standard deviation, ddof=1, by default)
In [33]: e.corr()  # pairwise correlation matrix between the columns (Pearson by default)
Out[33]:
door window price fan
In [34]: e.cov()  # pairwise covariance matrix between the columns
Out[34]:
door window price fan