DSBDA02
DSBDA02
Roll_no : COTB67
Practical 2
In [1]:
# All imports come first so the cell works on a fresh kernel:
# the loading statement below needs `pd` to be bound already.
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the academic-performance CSV into the DataFrame `sp`.
# NOTE(review): this is an absolute, machine-specific path -- consider a
# configurable data directory so the notebook runs on other machines.
sp = pd.read_csv("/home/student/Desktop/Dataset/AcademicPerformanceNEW.csv")

# Boolean frame with the same shape as `sp`: True marks a missing value.
sp.isnull()
In [2]:
In [3]:
Out[3]: gender math reading writing placement club join placement region score score score score year
count
0 False False False False False False False False 1 False False
False False False False False False 2 False False False False False
False False False 3 False False False False False False False False
6 False False False False False False False False 7 False False
9 False False False False False False False False 10 False False False
False False False False True 11 True False False False False False False
False
False False False False False False True 20 False False False
gender
Out[6]: scoremath reading score writing score placementscore club yearjoin
placementcount region
In [7]: sp.notnull()
Out[7]:
gender math reading writing placement club join placement region score score
score score year count
0 True True True True True True True True 1 True True
True True True True True True 2 True True True True True
3 True True True True True True True True 4 True True
6 True True True True True True True True 7 True True
13 True True True True True True True True 14 True True
True True True True True True 15 True True True True
True True True True 16 True True True True True True
True True
17 True True False True True True True True 18 False True True
True True True True True 19 True True True True True True
True False 20 True True True True True True True True
23 True True True True True True True True 24 True True
True True True True True True 25 True True True True
True True True True 26 True True True True True True
In
True True 27 True True True True True True True True 28
# Show a copy of `sp` without the rows that hold at least one missing value.
# The result is not assigned, so `sp` itself keeps its missing entries.
sp.dropna(axis=0, how="any")
Out[8]:
gender math reading writing placement club join placement region score score score score year
count
4 Female 62 65.0 68.0 87 2018.0 3 Mulshi 6 Female 77 100.0 72.0 93 2020.0 3 Karad
# Show a copy of `sp` without the rows in which every column is missing;
# rows that are only partly missing are kept. `sp` is not modified.
sp.dropna(axis="index", how="all")
Out[9]:
gender math reading writing placement club join placement region score score score score year
count
# Show a copy of `sp` without the columns that contain any missing value;
# all rows are kept. `sp` is not modified.
sp.dropna(axis="columns")
Out[10]:
math score placement score placement count
0 66 97 3
1 91 76 22 72 79 23
99 84 24 62 87 3
5 69 50 16 77 93 3
7 62 96 3
8 75 77 29 79 85 3
10 61 80 2
11 61 80 2
12 78 90 3
13 66 98 3 14 80 95 3 15 72 84 2 16 80 79
17 60 85 3 18 80 89 3 19
72 76 2 20 67 91 3 21
69 77 2 22 64 75 2
23 74 100 3
24 77 84 2
25 75 86 3
26 65 96 3 27 64 95 3 28 69 75 2
Out[11]:
gender scoremath reading score writing score placementscore club yearjoin
placementcount region
28
In [12]: print(np.where(sp['math score']>90))
(array([1, 3]),)
In [13]: print(np.where(sp['reading score'] <25))
(array([], dtype=int64),)
[14]:
In [12]:
[18]:
In
[19]: from sklearn.preprocessing import
LabelEncoder le = LabelEncoder()
In [ ]: