Dsbda 3a
Dsbda 3a
Out[84]: Age Gender Education Level Job Title Years of Experience Salary
In [87]: dataset.head()
Out[88]: 33.62085944494181
In [89]: dataset.Age.median()
Out[89]: 32.0
In [90]: dataset.Age.mode()
Out[90]: 0 27.0
Name: Age, dtype: float64
In [91]: dataset.Age.max()
Out[91]: 62.0
In [92]: dataset.Age.min()
Out[92]: 21.0
Out[95]: 115326.96477086132
In [96]: dataset.Salary.mode()
Out[96]: 0 140000.0
Name: Salary, dtype: float64
In [97]: dataset.Salary.median()
Out[97]: 115000.0
In [98]: dataset.Salary.max()
Out[98]: 250000.0
In [99]: dataset.Salary.min()
Out[99]: 350.0
In [102]: dataset.median()
In [103]: dataset.min()
In [104]: dataset.max()
In [105]: dataset.Age.mode()
Out[105]: 0 27.0
Name: Age, dtype: float64
In [106]: dataset.groupby(['Age']).count()
Out[106]: Years of Experience Salary
Age
21.0 18 18
22.0 15 15
40.0 92 92
47.0 47 47
48.0 98 98
49.0 91 91
50.0 88 88
51.0 30 30
52.0 29 29
53.0 7 7
54.0 68 68
55.0 16 16
Years of Experience Salary
Age
56.0 11 11
57.0 9 9
58.0 7 7
60.0 5 5
61.0 2 2
62.0 5 5
In [107]: dataset.isnull()
Box Plot
In [110]: import matplotlib.pyplot as plt
In [111]: dataset = pd.read_csv(r"C:\Users\khush\Desktop\Salary_Data.csv")
In [112]: x = dataset['Age']
y = dataset['Salary']
Interquartile Range
In [114]: first_quartile = np.percentile(Age, 25)
25% : -0.6727350412768447
75% : 0.6434662147791437
75% max
Age
21.0 25000.0 25000.0
22.0 45000.0 51832.0
23.0 52807.0 119836.0
24.0 60000.0 125000.0
25.0 90000.0 169159.0
26.0 85000.0 135000.0
27.0 80000.0 180000.0
28.0 110000.0 175000.0
29.0 95000.0 182000.0
30.0 120000.0 190000.0
31.0 140000.0 195000.0
32.0 145000.0 195000.0
33.0 148000.0 198000.0
34.0 160976.0 196000.0
35.0 140000.0 190000.0
36.0 160000.0 185000.0
37.0 170000.0 195000.0
38.0 155000.0 195000.0
39.0 170000.0 210000.0
40.0 160000.0 215000.0
41.0 185000.0 200000.0
42.0 180000.0 197000.0
43.0 185000.0 198000.0
44.0 170000.0 220000.0
45.0 185000.0 250000.0
46.0 180000.0 220000.0
47.0 190000.0 200000.0
48.0 210000.0 219000.0
49.0 195000.0 228000.0
50.0 200000.0 250000.0
51.0 230000.0 240000.0
52.0 190596.0 250000.0
53.0 188357.0 195000.0
54.0 195000.0 195270.0
55.0 210000.0 210000.0
56.0 195000.0 210000.0
57.0 195000.0 200000.0
58.0 200000.0 200000.0
60.0 188651.0 195000.0
61.0 200000.0 200000.0
62.0 200000.0 200000.0
In [ ]: