0% found this document useful (0 votes)
4 views

Notes for Dataframe ip

The document provides various methods for creating Pandas DataFrames using different data structures such as numpy arrays, lists of dictionaries, and dictionaries of lists. It also demonstrates how to customize index labels for rows and columns and how to select specific rows and columns from a DataFrame. Additionally, it includes examples of selecting single and multiple columns using different methods.

Uploaded by

Jayabharathi
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as DOCX, PDF, TXT or read online on Scribd
0% found this document useful (0 votes)
4 views

Notes for Dataframe ip

The document provides various methods for creating Pandas DataFrames using different data structures such as numpy arrays, lists of dictionaries, and dictionaries of lists. It also demonstrates how to customize index labels for rows and columns and how to select specific rows and columns from a DataFrame. Additionally, it includes examples of selecting single and multiple columns using different methods.

Uploaded by

Jayabharathi
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as DOCX, PDF, TXT or read online on Scribd
You are on page 1/ 7

DataFrame

'''#Creation of Empty DataFrame


import pandas as pd
df=pd.DataFrame()
print(df)

#Creation of DataFrame from numpy ndarrays


import pandas as pd
import numpy as np
arr=np.array([11,12,13,14])
df=pd.DataFrame(arr)
print(df)

#Creation of DataFrame from numpy ndarrays


import pandas as pd
import numpy as np
arr=np.array([11,12,13,14])
arr1=np.array([1,2,3,4])
arr2=np.array([101,102,103,104])
df=pd.DataFrame([arr,arr1,arr2])
print(df)

#Creation of DataFrame from numpy ndarrays with custom index label


import pandas as pd
import numpy as np
arr=np.array([11,12,13,14])
arr1=np.array([1,2,3,4])
arr2=np.array([101,102,103,104])
df=pd.DataFrame([arr,arr1,arr2],index=['R1','R2','R3'],columns=['C1','C2','C3','C4'])
print(df)

#Creation of DataFrame from List of Dictionaries


import pandas as pd
D1={'Name':'Jaya','Marks':87}
D2={'Name':'Abi','Age':17,'Marks':87}

1
D3={'Name':'Kavi','Age':18,'Marks':76}
l=[D1,D2,D3]
df=pd.DataFrame(l)
print(df)

#Creation of DataFrame from List of Dictionaries with custom index value for rows
import pandas as pd
D1={'Name':'Jaya','Marks':87}
D2={'Name':'Abi','Age':17,'Marks':87}
D3={'Name':'Kavi','Age':18,'Marks':76}
l=[D1,D2,D3]
df=pd.DataFrame(l,index=['R1','R2','R3'])
print(df)

#Creation of DataFrame from List of Dictionaries with custom index value for columns
import pandas as pd
D1={'Name':'Jaya','Marks':87}
D2={'Name':'Abi','Age':17,'Marks':87}
D3={'Name':'Kavi','Age':18,'Marks':76}
l=[D1,D2,D3]
df=pd.DataFrame(l,index=['R1','R2','R3'],columns=['a1','a2','a3'])
print(df)

#Creation of DataFrame from List of Dictionaries with key values as column but changing sequence
import pandas as pd
D1={'Name':'Jaya','Marks':87}
D2={'Name':'Abi','Age':17,'Marks':87}
D3={'Name':'Kavi','Age':18,'Marks':76}
l=[D1,D2,D3]
df=pd.DataFrame(l,index=['R1','R2','R3'],columns=['Name','Age','Marks'])
print(df)

2
#Creation of DataFrame from Dictionary of Lists
import pandas as pd
N=['jaya','bala','krish']
A=[14,17,15]
M=[98,78,68]
D={'Name':N,'Age':A,'Marks':M}
df=pd.DataFrame(D)
print(df)

#Creation of DataFrame from Dictionary of List with custom index value for rows
import pandas as pd
N=['jaya','bala','krish']
A=[14,17,15]
M=[98,78,68]
D={'Name':N,'Age':A,'Marks':M}
df=pd.DataFrame(D,index=['R1','R2','R3'])
print(df)

#Creation of DataFrame from Dictionary of List with custom index value for columns
import pandas as pd
N=['jaya','bala','krish']
A=[14,17,15]
M=[98,78,68]
D={'Name':N,'Age':A,'Marks':M}
df=pd.DataFrame(D,index=['R1','R2','R3'],columns=['a1','a2','a3'])
print(df)

#Creation of DataFrame from Dictionary of List with changing sequence of column
import pandas as pd
N=['jaya','bala','krish']
A=[14,17,15]
M=[98,78,68]

3
D={'Name':N,'Age':A,'Marks':M}
df=pd.DataFrame(D,index=['R1','R2','R3'],columns=['Marks','Age','Name'])
print(df)

#Creation of DataFrame from Series(includes dtype)


import pandas as pd
L=[14,17,15]
s=pd.Series(L)
print(s)

#Creation of DataFrame from Series(dtype not include)


import pandas as pd
s1=pd.Series([11,12,13,14,15])
s2=pd.Series([1,2,3,4,5])
s3=pd.Series([111,122,133,144,155])
s4=pd.Series([21,22,23,24,9])
df=pd.DataFrame([s1,s2,s3,s4])
print(df)

#Creation of DataFrame from Series (dtype not included) with Custom index label for rows
import pandas as pd
s1=pd.Series([11,12,13,14,15])
s2=pd.Series([1,2,3,4,5])
s3=pd.Series([111,122,133,144,155])
s4=pd.Series([21,22,23,24,9])
df=pd.DataFrame([s1,s2,s3,s4],index=['a','b','c','d'])
print(df)

#Creation of DataFrame from Series with Custom index label for columns
import pandas as pd
s1=pd.Series([11,12,13,14,15],index=['a','b','c','d','e'])
s2=pd.Series([1,2,3,4,5],index=['a','b','c','d','e'])
s3=pd.Series([111,122,133,144,155],index=['a','b','c','d','e'])
s4=pd.Series([21,22,23,24,45],index=['a','b','c','d','e'])
df=pd.DataFrame([s1,s2,s3,s4])

4
print(df)

#Creation of DataFrame from Series with Custom index label for columns and rows
import pandas as pd
s1=pd.Series([11,12,13,14,15],index=['a','b','c','d','e'])
s2=pd.Series([1,2,3,4,5],index=['a','b','c','d','e'])
s3=pd.Series([111,122,133,144,155],index=['a','b','c','d','e'])
s4=pd.Series([21,22,23,24,45],index=['a','b','c','d','e'])
df=pd.DataFrame([s1,s2,s3,s4],index=['aa','bb','cc','dd'])
print(df)

#Creation of DataFrame from Series (includes dtype) with Custom index label for rows
import pandas as pd
L=[14,17,15]
s=pd.Series(L,index=['R1','R2','R3'])
print(s)

#Creation of DataFrame from Series (includes dtype) with Custom index label for column
import pandas as pd
L=[14,17,15]
s=pd.Series(L,index=['R1','R2','R3'])
df=pd.DataFrame(s,columns=['C1'])
print(df)'''

# Creation of DataFrame from a dictionary of Series.
# Each dictionary key becomes a column label and the Series stored under
# that key supplies the values of the column.
import pandas as pd

s1, s2, s3, s4 = (
    pd.Series(values)
    for values in (
        [11, 12, 13, 14, 15],
        [1, 2, 3, 4, 5],
        [111, 122, 133, 144, 155],
        [21, 22, 23, 24, 9],
    )
)

# Pair every column label with its Series, in order.
D = dict(zip(('key1', 'key2', 'key3', 'key4'), (s1, s2, s3, s4)))

df = pd.DataFrame(D)
print(df)

5
# Creation of DataFrame from a dictionary of dictionaries.
# Outer keys become the column labels; inner keys become the row labels.
import pandas as pd

D1 = dict(Name='Jaya', Marks=87)  # has no 'Age' key, so that cell is NaN
D2 = dict(Name='Abi', Age=17, Marks=87)
D3 = dict(Name='Kavi', Age=18, Marks=76)

# Map each stream name to its student record, in order.
DD = dict(zip(("Humanities", "Medical", "Non Med"), (D1, D2, D3)))

df = pd.DataFrame(DD)
print(df)

# Select options in rows and columns
#
# Builds one sample DataFrame (rows labelled R1..R8) and then prints the
# result of several column- and row-selection techniques, each separated
# by a line of asterisks.
import pandas as pd

N = ['jaya', 'bala', 'krish', 'sakthi', 'abi', 'bharathi', 'geetha', 'sandhya']
A = [14, 17, 15, 15, 13, 14, 13, 12]
M = [98, 78, 68, 65, 87, 98, 76, 65]
S = ['cs', 'bio', 'pe', 'ip', 'cs', 'ip', 'bio', 'cs']
D = {'Name': N, 'Age': A, 'Marks': M, 'Subject': S}

# NOTE: the 'Age' label must stay on one line; the original text had the
# string literal split across two lines, which is a syntax error.
df = pd.DataFrame(
    D,
    index=['R1', 'R2', 'R3', 'R4', 'R5', 'R6', 'R7', 'R8'],
    columns=['Name', 'Age', 'Marks', 'Subject'],
)
print(df)
print("************************************")

# Selecting a single column
# Method-1: using square brackets
print(df['Name'])
print("************************************")
print(df['Marks'])
print("************************************")

# Method-2: using dot notation
print(df.Name)
print("************************************")

# Selecting multiple columns
# Method-1: using double square brackets (a list of column labels)
print(df[['Name', 'Age']])
print("************************************")

# Method-2: accessing data using loc
# A single slice passed to loc is applied to the ROW labels. No row label
# lies between 'Name' and 'Marks', so this prints an empty DataFrame.
print(df.loc['Name':'Marks'])
print("************************************")

# ':' keeps every row; the second slice selects columns by label, from
# 'Name' through 'Marks' (the stop label is included).
print(df.loc[:, 'Name':'Marks'])
print("************************************")

# Selecting multiple rows
# Label slices with loc include the stop label, so R4 is part of the result.
print(df.loc['R2':'R4'])
print("************************************")

# Same rows as above, with the "all columns" slice written explicitly.
print(df.loc['R2':'R4', :])

You might also like