0% found this document useful (0 votes)

8 views6 pages

Etl1 6

Uploaded by

23bsds152sanjays

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

8 views6 pages

Etl1 6

Uploaded by

23bsds152sanjays

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 6

EX-1

CODE
import pandas as pd

# Replace every blank in the sample text with its least frequent character.
str1 = 'abc def abcdef icd'
print("Original series:", str1, sep="\n")

# One Series element per character so pandas can tally occurrences.
ser = pd.Series(list(str1))
element_freq = ser.value_counts()
print(element_freq)

# value_counts() sorts by descending count, so the final index label is
# the rarest character.
current_freq = element_freq.dropna().index[-1]

# Substitute the blanks, then stitch the characters back into one string.
filled = ser.replace(' ', current_freq)
result = "".join(filled)
print(result)

OUTPUT

EX-2

CODE
import pandas as pd
# Three columns of five values each; the DataFrame gets the default
# integer index because none is supplied.
scores = {
    'X': [78, 85, 96, 80, 86],
    'Y': [84, 94, 89, 83, 86],
    'Z': [86, 97, 96, 72, 83],
}
df = pd.DataFrame(scores)
print(df)
OUTPUT

EX-3

CODE
import pandas as pd

import numpy as np

# Sample exam records, one list entry per student; np.nan marks a missing
# score.
exam_data = {
    'name': ['Anasstasia', 'Dima', 'Katherine', 'James', 'Emily',
             'Michael', 'Matthew', 'Laura', 'Kelvin', 'Jonas'],
    'score': [12.5, 9, 16.5, np.nan, 9, 20, 14.5, np.nan, 8, 19],
    'attempts': [1, 3, 2, 3, 2, 3, 1, 1, 2, 1],
    'qualify': ['yes', 'no', 'yes', 'no', 'no',
                'yes', 'yes', 'no', 'no', 'yes'],
}

# Row labels used as the DataFrame index, one per record above.
labels = ['a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j']

df = pd.DataFrame(exam_data, index=labels)

print("Summary of the basic information about this DataFrame and its data:")

# DataFrame.info() writes the summary itself and returns None, so wrapping
# the call in print() would append a stray "None" line to the output.
df.info()

OUTPUT
EX-4

CODE
import pandas as pd

# Show every row when printing instead of truncating long frames.
pd.set_option('display.max_rows', None)

# Student records keyed by the labels S1..S6; each column list holds one
# value per student, in index order.
student_data = pd.DataFrame(
    {
        'name': ['Alberto Franco', 'Gino Mcneill', 'Ryan Parkes',
                 'Eesha Hinton', 'Gino Mcne', 'David Parkes'],
        'date_Of_Birth': ['15/05/2002', '17/05/2002', '16/02/1999',
                          '25/09/1998', '11/05/2002', '15/09/1997'],
        'roll_no': ['s001', 's002', 's003', 's001', 's002', 's004'],
        'class': ['V', 'V', 'VI', 'VI', 'V', 'VI'],
        'age': [12, 12, 13, 13, 14, 12],
        'height': [173, 192, 186, 167, 151, 159],
        'weight': [35, 32, 33, 30, 31, 32],
        'address': ['street1', 'street2', 'street3',
                    'street', 'street2', 'street4'],
    },
    index=['S1', 'S2', 'S3', 'S4', 'S5', 'S6'],
)

print("Original DataFrame:")
print(student_data)

# The rows are grouped by the 'name' column (there is no school column in
# this frame), so the heading names that key.
print('\nMean, min, and max value of age for each name:')

# Produces one row per distinct name with a (age, mean/min/max) column
# MultiIndex.
grouped_single = student_data.groupby('name').agg({'age': ['mean', 'min', 'max']})
print(grouped_single)

OUTPUT
EX-5

CODE

import pandas as pd

import numpy as np

# Show every row when printing instead of truncating long frames.
pd.set_option('display.max_rows', None)

# Twelve sample orders; np.nan marks a value that is missing from the
# record.
df = pd.DataFrame({
    'ord_no': [70001, np.nan, 70002, 70004, np.nan, 70005,
               np.nan, 70010, 70003, 70012, np.nan, 70013],
    'purch_amt': [150.5, 270.65, 65.26, 110.5, 948.5, 2400.6,
                  5760, 1983.43, 2480.4, 250.45, 75.29, 3045.6],
    'ord_date': ['2012-10-05', '2012-09-10', np.nan, '2012-08-17',
                 '2012-09-10', '2012-07-27', '2012-09-10', '2012-10-10',
                 '2012-10-10', '2012-06-27', '2012-08-17', '2012-04-25'],
    'customer_id': [3002, 3001, 3001, 3003, 3002, 3001,
                    3001, 3004, 3003, 3002, 3001, 3001],
    'salesman_id': [5002, 5003, 5001, np.nan, 5002, 5001,
                    5001, np.nan, 5003, 5002, 5003, np.nan],
})

print("Original Orders DataFrame:")
print(df)

print("\nNumber of missing values in the DataFrame:")
# isna() flags each missing cell; summing the flags gives a per-column count.
print(df.isna().sum())

OUTPUT
EX-6

CODE

import pandas as pd

import numpy as np

# Fixed seed so the random columns are reproducible between runs.
np.random.seed(24)

# Column A holds ten evenly spaced values from 1 to 10; columns B-E hold
# standard-normal draws.
base = pd.DataFrame({'A': np.linspace(1, 10, 10)})
noise = pd.DataFrame(np.random.randn(10, 4), columns=list('BCDE'))
df = pd.concat([base, noise], axis=1)

# Blank out one cell in each random column, addressed by (row, column)
# position.
for row, col in ((0, 2), (3, 3), (4, 1), (9, 4)):
    df.iloc[row, col] = np.nan

print("Original DataFrame:")
print(df)

def highlight_max(s):
    """Return CSS strings that shade the maximum of a Series green.

    Args:
        s: A pandas Series (or any object supporting ``s.max()`` and an
            element-wise ``==`` comparison).

    Returns:
        A list with one entry per element of ``s``:
        ``'background-color: green'`` where the element equals the
        maximum, and ``''`` elsewhere. Every element tied for the
        maximum is highlighted.
    """
    # Element-wise comparison against the maximum yields a boolean mask.
    is_max = s == s.max()
    return ['background-color: green' if v else '' for v in is_max]

print("\nHighlight the maximum value in each column:")

# Limit the styling to columns B-E; column A is left unstyled.
random_columns = pd.IndexSlice[:, ['B', 'C', 'D', 'E']]

# NOTE(review): the Styler returned here is neither assigned nor printed;
# presumably this relies on notebook display of the last expression — confirm.
df.style.apply(highlight_max, subset=random_columns)

OUTPUT

DA Lab Manual r22
No ratings yet
DA Lab Manual r22
31 pages
Ip Class 12 Practical File
No ratings yet
Ip Class 12 Practical File
61 pages
Final Class 12 Commerce Practical File
No ratings yet
Final Class 12 Commerce Practical File
19 pages
Ip-12-2023-24 Practical File
No ratings yet
Ip-12-2023-24 Practical File
19 pages
IP Lab Record
No ratings yet
IP Lab Record
23 pages
Class 12 IP Final Practical
No ratings yet
Class 12 IP Final Practical
21 pages
CSC - 310 Advanced Python Programming Continuous Assessment-2 Assignment:Ca2
No ratings yet
CSC - 310 Advanced Python Programming Continuous Assessment-2 Assignment:Ca2
33 pages
Data Frame Creation
No ratings yet
Data Frame Creation
10 pages
Python Pandas
No ratings yet
Python Pandas
13 pages
Ip Practical File
No ratings yet
Ip Practical File
20 pages
Programs of Python Pandas
No ratings yet
Programs of Python Pandas
15 pages
Lab Programs
No ratings yet
Lab Programs
53 pages
Ip Project
No ratings yet
Ip Project
27 pages
Xii Ip Practical File 24-25
No ratings yet
Xii Ip Practical File 24-25
111 pages
12 Pandas
100% (1)
12 Pandas
21 pages
PythonFinal (8,9,10,11) Removed
No ratings yet
PythonFinal (8,9,10,11) Removed
8 pages
Solution
No ratings yet
Solution
8 pages
Even Students
No ratings yet
Even Students
36 pages
PDF&Rendition 1
No ratings yet
PDF&Rendition 1
47 pages
BSC CSIT Final Year Project Report On Sword of Warrior Game Project Report
No ratings yet
BSC CSIT Final Year Project Report On Sword of Warrior Game Project Report
52 pages
Oddstudents
No ratings yet
Oddstudents
35 pages
FDS Slot 3
No ratings yet
FDS Slot 3
15 pages
Practicals
No ratings yet
Practicals
11 pages
Dealing With Missing Values
No ratings yet
Dealing With Missing Values
19 pages
Ds Pract 2 Vedanti
No ratings yet
Ds Pract 2 Vedanti
7 pages
XII IP Practical Code and Output
No ratings yet
XII IP Practical Code and Output
4 pages
Info Programs Questions
No ratings yet
Info Programs Questions
18 pages
Pandasmatplotlib Practical File
No ratings yet
Pandasmatplotlib Practical File
15 pages
Module 1: Introduction To CAD Software
100% (1)
Module 1: Introduction To CAD Software
8 pages
Creation of Series Using List, Dictionary & Ndarray
No ratings yet
Creation of Series Using List, Dictionary & Ndarray
65 pages
4 Arrays in 'C'
100% (10)
4 Arrays in 'C'
19 pages
Excel XP Pivot Tables Exercises
No ratings yet
Excel XP Pivot Tables Exercises
6 pages
Project Prog
No ratings yet
Project Prog
6 pages
Create A Pandas Series From A Dictionary of Values and An Ndarray
No ratings yet
Create A Pandas Series From A Dictionary of Values and An Ndarray
15 pages
M90 User Guide
No ratings yet
M90 User Guide
60 pages
Xii Record (Dataframe & CSV)
No ratings yet
Xii Record (Dataframe & CSV)
11 pages
Microsoft Certified: Azure Security Engineer Associate
No ratings yet
Microsoft Certified: Azure Security Engineer Associate
78 pages
Session 11 Lecture 1
No ratings yet
Session 11 Lecture 1
6 pages
PYTHON PROGRAMMING: Data Handling
No ratings yet
PYTHON PROGRAMMING: Data Handling
12 pages
ML Lab Manual Final
No ratings yet
ML Lab Manual Final
36 pages
Lift Book
No ratings yet
Lift Book
277 pages
Answers Practical File
No ratings yet
Answers Practical File
19 pages
Document (4) - 1
No ratings yet
Document (4) - 1
15 pages
DAV Practicals
No ratings yet
DAV Practicals
26 pages
Data Analyzer
No ratings yet
Data Analyzer
10 pages
Info Practical
No ratings yet
Info Practical
56 pages
ImageJ User Guide
100% (1)
ImageJ User Guide
199 pages
Xii Ip Practical List 2022-23-1
No ratings yet
Xii Ip Practical List 2022-23-1
23 pages
50 Excel Shortcuts To Save Time and Effort in Articleship
No ratings yet
50 Excel Shortcuts To Save Time and Effort in Articleship
9 pages
AD3301 - Data - Transformation - Ipynb - Colaboratory
No ratings yet
AD3301 - Data - Transformation - Ipynb - Colaboratory
27 pages
Q1 SUMMATIVE TEST 2 Trends and Issues in ICT
No ratings yet
Q1 SUMMATIVE TEST 2 Trends and Issues in ICT
2 pages
12 IP File Programs 6 To 17
No ratings yet
12 IP File Programs 6 To 17
9 pages
Data (MCS102) Module 1
No ratings yet
Data (MCS102) Module 1
40 pages
Journal 12
No ratings yet
Journal 12
54 pages
VLAN Interview Questions and Answers
100% (1)
VLAN Interview Questions and Answers
2 pages
Practical-9 PYTHON
No ratings yet
Practical-9 PYTHON
5 pages
ConVox CCS NRHM
No ratings yet
ConVox CCS NRHM
29 pages
Term 1 IP AK
No ratings yet
Term 1 IP AK
6 pages
10) Merging Dataframes: # Detecting Duplicates
No ratings yet
10) Merging Dataframes: # Detecting Duplicates
7 pages
Practical File IP
No ratings yet
Practical File IP
27 pages
Dsbda Assignment 1
No ratings yet
Dsbda Assignment 1
5 pages
Ip Practical File
No ratings yet
Ip Practical File
18 pages
Recursion, As A Different Way of Solving Problems. Example Programs Such As Finding Factorial. Fibon
No ratings yet
Recursion, As A Different Way of Solving Problems. Example Programs Such As Finding Factorial. Fibon
11 pages
12 Pandas
No ratings yet
12 Pandas
14 pages
List of Practical Ip065 Xii Session 2025 CKC Academy
No ratings yet
List of Practical Ip065 Xii Session 2025 CKC Academy
19 pages
Lab Record IP
No ratings yet
Lab Record IP
13 pages
Bca C++ Pratical
No ratings yet
Bca C++ Pratical
35 pages
Unit3 - 3) Pandas - Ipynb - Colab
No ratings yet
Unit3 - 3) Pandas - Ipynb - Colab
11 pages
Lab2.2 Kritika
No ratings yet
Lab2.2 Kritika
10 pages
Code Explanation For Date Types
No ratings yet
Code Explanation For Date Types
8 pages
Exp3 Python
No ratings yet
Exp3 Python
15 pages
Exp 3
No ratings yet
Exp 3
10 pages
Encoder:: US/.html
No ratings yet
Encoder:: US/.html
2 pages
4 Marks Questions
No ratings yet
4 Marks Questions
17 pages
Ok55-Fb - Dindllb Eng Web Mfl70504378
No ratings yet
Ok55-Fb - Dindllb Eng Web Mfl70504378
46 pages
HVM100 Blaze Manual
No ratings yet
HVM100 Blaze Manual
70 pages
Practical File Questions With Answers
No ratings yet
Practical File Questions With Answers
7 pages
iON Digital Assessment: Redefining The Future of Assessment Process
No ratings yet
iON Digital Assessment: Redefining The Future of Assessment Process
8 pages
Practice Questions2
No ratings yet
Practice Questions2
2 pages
Walchand Institute of Technology, Solapur: Direct Linking Loaders
No ratings yet
Walchand Institute of Technology, Solapur: Direct Linking Loaders
14 pages
2020 Marvell Product Selector Guide: Total Solutions From Marvell
No ratings yet
2020 Marvell Product Selector Guide: Total Solutions From Marvell
29 pages
Jonah Marindoque Balicoco SAS 21 Nursing InformaticsFINAL
No ratings yet
Jonah Marindoque Balicoco SAS 21 Nursing InformaticsFINAL
9 pages
80305a PDF
No ratings yet
80305a PDF
7 pages
Shared Mailboxes - Owner's Guide 15feb 2022
No ratings yet
Shared Mailboxes - Owner's Guide 15feb 2022
12 pages
Quotation For Real Estate
No ratings yet
Quotation For Real Estate
4 pages
Department of Computer Science & Engineering: B.Tech. Semester - 4 Question Bank 2101CS402 - Madf
No ratings yet
Department of Computer Science & Engineering: B.Tech. Semester - 4 Question Bank 2101CS402 - Madf
2 pages
Oracle: Question & Answers
No ratings yet
Oracle: Question & Answers
7 pages
Sheet No. Sheet Name: Hierarchical Block
No ratings yet
Sheet No. Sheet Name: Hierarchical Block
8 pages
Office 2013 Keys
No ratings yet
Office 2013 Keys
1 page
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet

Etl1 6

Uploaded by

Etl1 6

Uploaded by

EX-1

str1 = 'abc def abcdef icd'

result = "".join(ser.replace(' ', current_freq))

'name': ['Alberto Franco','Gino Mcneill','Ryan Parkes','Eesha

grouped_single = student_data.groupby('name').agg({'age': ['mean', 'min',

df = pd.DataFrame({'ord_no': [70001, np.nan, 70002, 70004, np.nan, 70005,

print("Original Orders DataFrame:")

print("\nNumber of missing values in the DataFrame:")

df = pd.DataFrame({'A': np.linspace(1, 10, 10)})

df = pd.concat([df, pd.DataFrame(np.random.randn(10, 4),

Highlight the maximum in a Series green.

return ['background-color: green' if v else '' for v in is_max]

print("\nHighlight the maximum value in each column:")

df.style.apply(highlight_max, subset=pd.IndexSlice[:, ['B', 'C', 'D', 'E']])

You might also like