Programs of Python Pandas
Programs of Python Pandas
CLASS-12(SCIENCE)
SN PYTHON CODES OF PANDAS PRACTICALLY DEMONSTRATED IN ONLINE
CLASSES:
1 #using NumPy arrays-Creation of array from Pandas Series
import pandas as pd
import numpy as np
# Build an actual pandas Series: with a plain list this program would only
# demonstrate list-to-array conversion, not Series-to-array conversion.
series1 = pd.Series([10, 20, 30, 40])  # series1 is a pandas Series
n1 = np.array(series1)  # n1 is a NumPy array holding the Series values
print(series1)
print(n1)
2 #Binary Operations on Data frames
import pandas as pd
# Two tables of unit-test marks sharing the same row and column labels.
first_marks = {'Unit Test-1': [5, 6, 8, 3, 10],
               'Unit Test-2': [7, 8, 9, 6, 15]}
second_marks = {'Unit Test-1': [3, 3, 6, 6, 8],
                'Unit Test-2': [5, 9, 8, 10, 5]}
ds = pd.DataFrame(first_marks)
ds1 = pd.DataFrame(second_marks)
for frame in (ds, ds1):
    print(frame)

# Each entry pairs the heading to print with the DataFrame method to apply.
# The r-prefixed methods swap the operands (rsub gives ds1 - ds).
binary_ops = (
    ("Subtraction", ds.sub),
    ("rsub", ds.rsub),
    ("Addition", ds.add),
    ("radd", ds.radd),
    ("Multiplication", ds.mul),
    ("Division", ds.div),
)
for heading, operation in binary_ops:
    print(heading)
    print(operation(ds1))
3 #Broadcasting using 1-D array
import pandas as pd
# Two rows of three values each, supplied as a nested list.
rows = [[2, 5, 6],
        [5, 8, 9]]
df = pd.DataFrame(data=rows)
print(df)
4 #Broadcasting on two data frames of same sizes
import pandas as pd
# Two flat lists of equal length, each turned into a one-column DataFrame.
first_values, second_values = [2, 5, 6, 7, 8], [5, 8, 9, 4, 10]
df1 = pd.DataFrame(data=first_values)
df2 = pd.DataFrame(data=second_values)
for frame in (df1, df2):
    print(frame)
5 #Implementing pipelining/chaining by performing addition and division
#operation one after the other using pipe()
import pandas as pd
import numpy as np
import math
#user defined functions
def adder(adder1, adder2):
    """Return the sum of adder1 and adder2."""
    # The body must be indented under the def line to be valid Python.
    return adder1 + adder2
def divide(adder1, adder2):
    """Return adder1 divided by adder2 using true division."""
    # The body must be indented under the def line to be valid Python.
    return adder1 / adder2
import pandas as pd
# Read Employee.csv, then write only the Empid and Name columns to Emp.csv.
df = pd.read_csv("E:\\Data\\Employee.csv")
# to_csv() returns None when it is given a file path, so the result is not
# bound to a name (the earlier `df1 = ...` only ever held None).
df.to_csv("E:\\Data\\Emp.csv", columns=["Empid", 'Name'])
10 #To illustrate pivot_table() function on the dataframe
#generated using .csv file-Employee.csv
import pandas as pd
# Skip the first row of the file and supply our own column names instead.
df = pd.read_csv("E:\\Data\\Employee.csv", skiprows=1,
                 names=['E_id', 'Ename', 'E_age', 'Ecity', 'Esalary'])
print(df)
# Call pivot_table as a method without passing df again: the first
# positional parameter of DataFrame.pivot_table is `values`, so the old
# call handed the whole frame in as the list of value columns.
r = df.pivot_table(index=['Ename'], aggfunc="sum")
print(r)
11 #Implementing iteritems() (removed in pandas 2.0; use items())-displaying dataframe contents columnwise
import pandas as pd
# Quarterly sales keyed first by year, then by quarter.
total_sales = {2015: {'Qtr1': 34500, 'Qtr2': 45000, 'Qtr3': 50000, 'Qtr4': 39000},
               2016: {'Qtr1': 44500, 'Qtr2': 65000, 'Qtr3': 70000, 'Qtr4': 49000},
               2017: {'Qtr1': 44500, 'Qtr2': 65000, 'Qtr3': 70000, 'Qtr4': 49000}}
df = pd.DataFrame(total_sales)  # Converting the nested dictionary into a DataFrame
# items() yields (column label, column Series) pairs. It replaces
# iteritems(), which was removed in pandas 2.0.
for (col, colSeries) in df.items():  # displaying column-wise data
    print("Column Index :", col)
    print("Containing :")
    print(colSeries)
12 #To perform all the aggregate and statistical functions in Pandas
import pandas as pd
import numpy as np
# Build the table from a dictionary holding one Series per column
players = {
    'Name': pd.Series(['Sachin', 'Dhoni', 'Virat', 'Rohit', 'Shikhar']),
    'Age': pd.Series([26, 25, 25, 24, 31]),
    'Score': pd.Series([87, 67, 89, 55, 47]),
}
df = pd.DataFrame(players)
print("Dataframecontents")
print(df)
print(df.count())

# Double brackets select one-column DataFrames, so every result below
# stays labelled with its column name when printed.
age = df[['Age']]
score = df[['Score']]
print("count age", age.count())
print("sum of score", score.sum())
print("minimum age", age.min())
print("maximum score", score.max())
print("mean age", age.mean())
print("mode of age", age.mode())
print("median of score", score.median())
13 #Creating data frame by passing a list of dictionaries
import pandas as pd
# Each dictionary supplies one row; a name missing from a row leaves that
# cell empty (NaN) in the resulting DataFrame.
marks_by_row = [
    {'Rinku': 67, 'Ritu': 78, 'Ajay': 75, 'Pankaj': 88, 'Aditya': 92},
    {'Rinku': 77, 'Ritu': 58, 'Ajay': 87, 'Pankaj': 65},
    {'Rinku': 88, 'Ajay': 67, 'Pankaj': 74, 'Aditya': 70},
]
newdf = pd.DataFrame(data=marks_by_row)
print(newdf)
14 # Use of Histogram and hist() method
import pandas as pd
import matplotlib.pyplot as plt
print("\n")
print("Dataframe of Values\n")
# One record per sale: salesman, sale amount, quarter and district.
monthlysale = {'Salesman': ["Ankur", "Pawan", "Jiten", "Rahul", "Pawan",
                            "Ankur", "Karan", "Akshit", "Mudit", "Jiten",
                            "Karan", "Rinku"],
               'Sales': [1000, 300, 800, 900, 1000, 500, 60, 1000, 900, 50, 600, 450],
               'Quarter': [1, 1, 1, 2, 2, 2, 3, 3, 3, 4, 4, 4],
               'District': ['Wazirabad', 'Sirmore', 'Dehradun', 'Solan',
                            'Mandi', 'Kangra', 'Chail', 'Dehradun',
                            'Kangra', 'Solan', 'Mandi', 'Sirmore']}
df = pd.DataFrame(monthlysale)
# Show the frame that the heading above announces; it was never printed.
print(df)
df.hist()  # hist() by default creates a histogram for every numeric column
plt.show()
15 #Implementing iterrows()
import pandas as pd
# Quarterly sales keyed first by year, then by quarter.
total_sales = {2015: {'Qtr1': 34500, 'Qtr2': 45000, 'Qtr3': 50000, 'Qtr4': 39000},
               2016: {'Qtr1': 44500, 'Qtr2': 65000, 'Qtr3': 70000, 'Qtr4': 49000},
               2017: {'Qtr1': 44500, 'Qtr2': 65000, 'Qtr3': 70000, 'Qtr4': 49000}}
df = pd.DataFrame(total_sales)  # Converting the nested dictionary into a DataFrame
# iterrows() yields (row label, row Series) pairs; the loop body must be
# indented under the for line to be valid Python.
for (row, rowSeries) in df.iterrows():
    print("RowIndex :", row)
    print("Containing :")
    print(rowSeries)
16 #Creating data frame from student list
import pandas as pd1
# Each inner list is one student: [name, age].
data1 = [['Shreya', 20], ['Rakshit', 22], ['Srijan', 18]]
# Defining column names to be displayed as headings.
# (This comment used to wrap onto its own line, leaving a bare `names`
# statement that raised NameError.)
df1 = pd1.DataFrame(data1, columns=['Name', 'Age'])
print(df1)
17 #Creating data frame from student list
import pandas as pd1
# Each inner list is one student: [name, age].
data1 = [['Shreya', 20], ['Rakshit', 22], ['Srijan', 18]]
# Defining column names to be displayed as headings.
# (This comment used to wrap onto its own line, leaving a bare `names`
# statement that raised NameError.)
df1 = pd1.DataFrame(data1, columns=['Name', 'Age'])
print(df1)
# Build a second DataFrame from the first and inspect its labels.
table = pd1.DataFrame(df1)
print(table)
print("Index Value")
print(table.index)
print("Column Name")
print(table.columns)
18 #Sorting the data in a data frame
import pandas as pd
# Marks and ages are kept in separate Series that share the student names
# as their index labels.
marks = {'Vijaya': 80, 'Rahul': 92, 'Meghna': 67, 'Radhika': 95, 'Shaurya': 97}
ages = {'Vijaya': 32, 'Rahul': 28, 'Meghna': 30, 'Radhika': 25, 'Shaurya': 20}
student_marks = pd.Series(marks)
student_age = pd.Series(ages)
student_df = pd.DataFrame({'Marks': student_marks, 'Age': student_age})
print(student_df)
# Sorting the data on the basis of Marks, highest first (descending order)
ranked = student_df.sort_values(by=['Marks'], ascending=False)
print(ranked)
19 #Altering dataframe labels
import pandas as pd
# Note: despite its name, df is a plain dictionary of two equal-length lists.
df = {
    'Name': ['Rinku', 'Ritu', 'Ajay', 'Pankaj', 'Aditya'],
    'IP': [78, 88, 98, 90, 87],
}
print(df)
# A Series built from this dictionary has one element per key, and each
# element is the whole list stored under that key.
table = pd.Series(data=df)
table1 = pd.DataFrame(data=table)
print(table)
for heading, labels in (("Index Value", table1.index),
                        ("Column Name", table1.columns)):
    print(heading)
    print(labels)
21 #Pivoting using pivot() method
#Creating a DataFrame
import pandas as pd
# One entry per (student, subject) result. No backslash continuations are
# needed because the braces already keep the literal open across lines.
ClassXII_result = {
    'Name': ['Radhika', 'Sonia', 'Shaurya', 'Radhika'],
    'Subject': ['IP', 'CS', 'Maths', 'Phy'],
    'Marks': [98, 87, 99, 87],
    'Grade': ['A1', 'A2', 'A1', 'B'],
}
# The assignment and the constructor call must form one logical line; a
# dangling `df=` followed by a newline is a SyntaxError.
df = pd.DataFrame(ClassXII_result,
                  columns=['Name', 'Subject', 'Marks', 'Grade'])
print(df)
22 #Illustrating the use of pivot_table() method
import pandas as pd
# One row per payment: the invigilator's name and the amount paid.
name_dict = {
    'INVIGILATOR': ["Rajesh", "Naveen", "Anil", "Naveen", "Rajesh"],
    'AMOUNT': [550, 550, 550, 550, 550],
}
df = pd.DataFrame(name_dict)
print(df)
# Total AMOUNT per INVIGILATOR. The result is printed explicitly because a
# bare expression displays nothing when the program runs as a script.
result = pd.pivot_table(df, index=['INVIGILATOR'], aggfunc="sum")
print(result)
23 #Illustrate pivot_table for all the columns with Filtering
import pandas as pd
# One row per sale: item name, amount and quantity.
sale_dict = {
    'ITEM_NAME': ["NOTEBOOK", "PEN", "INKPEN", "NOTEBOOK", "PEN"],
    'AMOUNT': [100, 50, 30, 100, 50],
    'QUANTITY': [2, 5, 3, 3, 5],
}
df = pd.DataFrame(sale_dict)
print(df)
# All three columns are used as index keys here, so no column is left over
# to be aggregated. The result is printed explicitly because a bare
# expression displays nothing when the program runs as a script.
result = pd.pivot_table(df, index=['ITEM_NAME', 'AMOUNT', 'QUANTITY'],
                        aggfunc='sum')
print(result)
24 #Program on Quantile
import pandas as pd
import numpy as np
# Four rows; column 'a' grows linearly and column 'b' by powers of ten.
values = np.array([[1, 1], [2, 10], [3, 100], [4, 1000]])
df = pd.DataFrame(values, columns=['a', 'b'])
print(df)
median = df.quantile(0.5)  # 50% quantile or median
print(median)
25 #To compute variance for the given data set
import numpy as np
dataset = [2, 6, 8, 12, 18, 24, 28, 32]
# `variance` was printed without ever being computed (NameError).
# np.var uses ddof=0 by default, i.e. it returns the population variance.
variance = np.var(dataset)
print(variance)
DATE:11/12/20