0% found this document useful (0 votes)

56 views27 pages

CSV Python Annotated

This document discusses reading and writing CSV files in Python using the csv module. It covers reading data from a CSV file, accessing specific columns, writing data to a CSV file, and various formatting options like delimiters, quoting styles, and escape characters.

Uploaded by

Suman Das

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

56 views27 pages

CSV Python Annotated

Uploaded by

Suman Das

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 27

100 DAYS OF DATA

WORKING WITH CSV

DATA ANALYSIS OF TITANIC DATA SET INCLUDED

Data analysis from a CSV file in Python

Learn to read and write CSV files in Python

•
COPY

name,age,height(cm),weight(kg)
Lenin,30,188,90
Phil,42,178,76
Claire,40,165,54
Alex,18,140,46

csv

pandas
csv.reader

COPY

import csv

# Read my_family.csv row by row and print one sentence per person.
# newline='' lets the csv module do its own newline handling, as the csv
# documentation recommends for every file passed to reader/writer.
with open('my_family.csv', newline='') as csv_file:
    csv_reader = csv.reader(csv_file, delimiter=',')
    line_count = 0
    for row in csv_reader:
        if line_count == 0:
            # The first row holds the column names, not a person.
            print(f'Header row - {", ".join(row)}')
        else:
            print(f'{row[0]} is {row[1]} years old, {row[2]} cm tall and {row[3]} kg heavy')
        line_count += 1
    # The total includes the header row.
    print(f'Total: {line_count} lines')

COPY

Header row - name, age, height(cm), weight(kg)

Lenin is 30 years old, 188 cm tall and 90 kg heavy
Phil is 42 years old, 178 cm tall and 76 kg heavy
Claire is 40 years old, 165 cm tall and 54 kg heavy
Alex is 18 years old, 140 cm tall and 46 kg heavy
Total: 5 lines
line_count

To skip the header row when using csv.reader, call next(reader object, None) before looping over the rows.

COPY

import csv

# Print one sentence per person, skipping the header row up front.
with open('my_family.csv', newline='') as csv_file:
    csv_reader = csv.reader(csv_file, delimiter=',')
    line_count = 0
    # Consume the header; the None default avoids StopIteration on an empty file.
    next(csv_reader, None)
    for row in csv_reader:
        print(f'{row[0]} is {row[1]} years old, {row[2]} cm tall and {row[3]} kg heavy')
        line_count += 1
    # Only data rows are counted here, because the header was skipped.
    print(f'Total: {line_count} lines')

COPY

Lenin is 30 years old, 188 cm tall and 90 kg heavy

Phil is 42 years old, 178 cm tall and 76 kg heavy
Claire is 40 years old, 165 cm tall and 54 kg heavy
Alex is 18 years old, 140 cm tall and 46 kg heavy
Total: 4 lines

csv.DictReader

DictReader

COPY

import csv

# Read my_family.csv with DictReader so each column is addressed by the
# name given in the file's header row instead of by position.
with open('my_family.csv', newline='') as csv_file:
    csv_reader = csv.DictReader(csv_file, delimiter=',')
    for row in csv_reader:
        print(f'{row["name"]} is {row["age"]} years old, {row["height(cm)"]} cm tall and {row["weight(kg)"]} kg heavy')
    # line_num is the number of lines read from the file, header included.
    print(f'Total: {csv_reader.line_num} lines')

csv_reader.line_num

csv.DictReader

csv.DictReader
csv.writer

COPY

import csv

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']

data = [
    ['Phil', 42, 178, 76],
    ['Alex', 18, 140, 46],
    ['Claire', 40, 165, 54],
]

filename = "my_family.csv"

# newline='' stops the text layer from translating the line endings the csv
# writer emits (otherwise rows end in \r\r\n on Windows).
with open(filename, 'w', newline='') as output:
    csvwriter = csv.writer(output)

    # Write a single list
    csvwriter.writerow(header)

    # Writing a list of lists
    csvwriter.writerows(data)
COPY

Name,Age,Height(cm),Weight(kg)
Phil,42,178,76
Alex,18,140,46
Claire,40,165,54

writerow

writerows

csv.writer ,

delimiter

COPY

import csv

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']

data = [
    ['Phil', 42, 178, 76],
    ['Alex', 18, 140, 46],
    ['Claire', 40, 165, 54],
]

filename = "my_family.csv"

# newline='' stops the text layer from translating the line endings the csv
# writer emits (otherwise rows end in \r\r\n on Windows).
with open(filename, 'w', newline='') as output:
    # Fields are separated by '|' instead of the default ','.
    csvwriter = csv.writer(output, delimiter='|')

    # Write a single list
    csvwriter.writerow(header)

    # Writing a list of lists
    csvwriter.writerows(data)

COPY

Name|Age|Height(cm)|Weight(kg)
Phil|42|178|76
Alex|18|140|46
Claire|40|165|54

DictWriter

fieldnames

COPY

import csv

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']

# One dict per row; the keys must match the fieldnames given to DictWriter.
data = [
    {"Name": "Phil", "Age": 42, "Height(cm)": 178, "Weight(kg)": 76},
    {"Name": "Claire", "Age": 40, "Height(cm)": 165, "Weight(kg)": 54},
    {"Name": "Alex", "Age": 18, "Height(cm)": 140, "Weight(kg)": 46},
]

filename = "my_family.csv"

# newline='' stops the text layer from translating the line endings the csv
# writer emits (otherwise rows end in \r\r\n on Windows).
with open(filename, 'w', newline='') as output:
    csvwriter = csv.DictWriter(output, fieldnames=header)
    # The header row is not written automatically; emit it from fieldnames.
    csvwriter.writeheader()
    for row in data:
        csvwriter.writerow(row)

COPY

Name,Age,Height(cm),Weight(kg)
Phil,42,178,76
Claire,40,165,54
Alex,18,140,46

writerows

COPY

import csv

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']

# One dict per row; the keys must match the fieldnames given to DictWriter.
data = [
    {"Name": "Phil", "Age": 42, "Height(cm)": 178, "Weight(kg)": 76},
    {"Name": "Claire", "Age": 40, "Height(cm)": 165, "Weight(kg)": 54},
    {"Name": "Alex", "Age": 18, "Height(cm)": 140, "Weight(kg)": 46},
]

filename = "my_family.csv"

# newline='' stops the text layer from translating the line endings the csv
# writer emits (otherwise rows end in \r\r\n on Windows).
with open(filename, 'w', newline='') as output:
    csvwriter = csv.DictWriter(output, fieldnames=header)
    csvwriter.writeheader()
    # writerows takes the whole list at once, replacing the explicit loop.
    csvwriter.writerows(data)

COPY

Name,Age,Height(cm),Weight(kg)
Phil,42,178,76
Claire,40,165,54
Alex,18,140,46

"
"

COPY

Name,Age,Height(cm),Weight(kg),Address
Phil,42,178,76,'Gryffindor room, Hogwarts'
Claire,40,165,54,'Snapes room, Hogwarts'
Alex,18,140,46,'4 Private Drive, Little Whinging'

quotechar

COPY

import csv

filename = "my_family.csv"

# The file wraps fields containing commas in single quotes, so the reader is
# told to treat ' (not the default ") as the quote character.
with open(filename, 'r', newline='') as csv_file:
    csvreader = csv.reader(csv_file, quotechar="'")
    for row in csvreader:
        print(row)
COPY

['Name', 'Age', 'Height(cm)', 'Weight(kg)', 'Address']

['Phil', '42', '178', '76', 'Gryffindor room, Hogwarts']
['Claire', '40', '165', '54', 'Snapes room, Hogwarts']
['Alex', '18', '140', '46', '4 Private Drive, Little Whinging']

quoting

csv.QUOTE_MINIMAL

csv.QUOTE_ALL

csv.QUOTE_NONNUMERIC

csv.QUOTE_NONE

COPY

import csv

filename = "my_family.csv"

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)', 'Address']

data = [
    ['Phil', 42, 178, 76, 'Gryffindor room, Hogwarts'],
    ['Claire', 40, 165, 54, 'Snapes room, Hogwarts'],
    ['Alex', 18, 140, 46, '4 Private Drive, Little Whinging'],
]

# newline='' stops the text layer from translating the line endings the csv
# writer emits (otherwise rows end in \r\r\n on Windows).
with open(filename, 'w', newline='') as output:
    # QUOTE_ALL wraps every field, numbers included, in the quote character.
    csvwriter = csv.writer(output, quotechar="'", quoting=csv.QUOTE_ALL)
    csvwriter.writerow(header)
    csvwriter.writerows(data)

csv.QUOTE_ALL

COPY

'Name','Age','Height(cm)','Weight(kg)','Address'
'Phil','42','178','76','Gryffindor room, Hogwarts'
'Claire','40','165','54','Snapes room, Hogwarts'
'Alex','18','140','46','4 Private Drive, Little Whinging'

csv.QUOTE_NONE

COPY

import csv

filename = "my_family.csv"

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)', 'Address']

data = [
    ['Phil', 42, 178, 76, 'Gryffindor room, Hogwarts'],
    ['Claire', 40, 165, 54, 'Snapes room, Hogwarts'],
    ['Alex', 18, 140, 46, '4 Private Drive, Little Whinging'],
]

# newline='' stops the text layer from translating the line endings the csv
# writer emits (otherwise rows end in \r\r\n on Windows).
with open(filename, 'w', newline='') as output:
    # QUOTE_NONE never quotes a field. No escapechar is set here, so the
    # writer has no way to emit the commas inside the addresses.
    csvwriter = csv.writer(output, quotechar="'", quoting=csv.QUOTE_NONE)
    csvwriter.writerow(header)
    # Deliberate demonstration: this call raises
    # "_csv.Error: need to escape, but no escapechar set".
    csvwriter.writerows(data)

COPY

Traceback (most recent call last):

File "main.py", line 16, in <module>
csvwriter.writerows(data)
_csv.Error: need to escape, but no escapechar set

csv.QUOTE_NONE csv

escapechar
\

COPY

import csv

filename = "my_family.csv"

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)', 'Address']

data = [
    ['Phil', 42, 178, 76, 'Gryffindor room, Hogwarts'],
    ['Claire', 40, 165, 54, 'Snapes room, Hogwarts'],
    ['Alex', 18, 140, 46, '4 Private Drive, Little Whinging'],
]

# newline='' stops the text layer from translating the line endings the csv
# writer emits (otherwise rows end in \r\r\n on Windows).
with open(filename, 'w', newline='') as output:
    # With QUOTE_NONE nothing is quoted, so an escapechar is required: each
    # comma inside a field is written as "\," instead of raising an error.
    csvwriter = csv.writer(output, quotechar="'", quoting=csv.QUOTE_NONE, escapechar='\\')
    csvwriter.writerow(header)
    csvwriter.writerows(data)

COPY

Name,Age,Height(cm),Weight(kg),Address
Phil,42,178,76,Gryffindor room\, Hogwarts
Claire,40,165,54,Snapes room\, Hogwarts
Alex,18,140,46,4 Private Drive\, Little Whinging
\

COPY

Name, Age, Height(cm), Weight(kg), Address

Phil, 42, 178, 76, 'Gryffindor room, Hogwarts'
Claire, 40, 165, 54, 'Snapes room, Hogwarts'
Alex, 18, 140, 46, '4 Private Drive, Little Whinging'

skipinitialspace

COPY

import csv

# Read a file whose delimiters are followed by a space. Without
# skipinitialspace the space stays in each field, so the opening quote is no
# longer the first character and the quoted addresses are split at the comma.
with open('my_family.csv', 'r', newline='') as f:
    csv_reader = csv.reader(f, quotechar="'")

    for line in csv_reader:
        print(line)

COPY

['Name', ' Age', ' Height(cm)', ' Weight(kg)', ' Address']

['Phil', ' 42', ' 178', ' 76', " 'Gryffindor room", " Hogwarts'"]
['Claire', ' 40', ' 165', ' 54', " 'Snapes room", " Hogwarts'"]
['Alex', ' 18', ' 140', ' 46', " '4 Private Drive", " Little Whinging'"]

skipinitialspace

True

COPY

import csv

# skipinitialspace=True drops the space that follows each delimiter, so the
# quoted addresses are recognised and kept as a single field.
with open('my_family.csv', 'r', newline='') as f:
    csv_reader = csv.reader(f, quotechar="'", skipinitialspace=True)

    for line in csv_reader:
        print(line)

COPY

['Name', 'Age', 'Height(cm)', 'Weight(kg)', 'Address']

['Phil', '42', '178', '76', 'Gryffindor room, Hogwarts']
['Claire', '40', '165', '54', 'Snapes room, Hogwarts']
['Alex', '18', '140', '46', '4 Private Drive, Little Whinging']

COPY

import pandas as pd

# Load the whole CSV file into a DataFrame and display it.
family = pd.read_csv('my_family.csv')
print(family)

COPY

Name Age Height(cm) Weight(kg)

0 Phil 42 178 76
1 Claire 40 165 54
2 Alex 18 140 46
COPY

import pandas as pd

family = pd.read_csv('my_family.csv')

# Print the type of the first value in each numeric column.
for column in ('Age', 'Height(cm)', 'Weight(kg)'):
    print(type(family[column][0]))

COPY

names
pd.read_csv()

COPY

Phil,42,178,76
Claire,40,165,54
Alex,18,140,46

COPY

import pandas as pd

# Column labels are passed explicitly through names=, and the Name column
# becomes the row index.
column_names = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']
family = pd.read_csv('my_family.csv', names=column_names, index_col='Name')
print(family)

COPY

Age Height(cm) Weight(kg)

Name
Phil 42 178 76
Claire 40 165 54
Alex 18 140 46
df.to_csv

COPY

import pandas as pd

# Load the data with explicit column labels and Name as the index, then
# write the DataFrame back out to a new CSV file.
column_names = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']
family = pd.read_csv('my_family.csv', names=column_names, index_col='Name')
family.to_csv('my_new_family.csv')

COPY

Age Height(cm) Weight(kg)

Name
Phil 42 178 76
Claire 40 165 54
Alex 18 140 46
COPY

import pandas as pd

# Load the csv file
passengers = pd.read_csv('train.csv')

# Column names
print(passengers.columns)

sex_column = passengers['Sex']

# Number of passengers of each sex
print(sex_column.value_counts())

# Share of passengers of each sex (fractions that sum to 1)
print(sex_column.value_counts(normalize=True))
COPY

Index(['PassengerId', 'Survived', 'Pclass', 'Name', 'Sex', 'Age', 'SibSp',

'Parch', 'Ticket', 'Fare', 'Cabin', 'Embarked'],
dtype='object')
male 577
female 314
Name: Sex, dtype: int64
male 0.647587
female 0.352413
Name: Sex, dtype: float64

COPY

import pandas as pd

# Load the csv file
passengers = pd.read_csv('train.csv')

# Column names
print(passengers.columns)

# Keep only the rows where Survived is 1, then look at their Sex column.
survivor_sex = passengers[passengers["Survived"] == 1]['Sex']

# Number of surviving passengers of each sex
print(survivor_sex.value_counts())

# Share of surviving passengers of each sex (fractions that sum to 1)
print(survivor_sex.value_counts(normalize=True))

COPY

Index(['PassengerId', 'Survived', 'Pclass', 'Name', 'Sex', 'Age', 'SibSp',

'Parch', 'Ticket', 'Fare', 'Cabin', 'Embarked'],
dtype='object')
female 233
male 109
Name: Sex, dtype: int64
female 0.681287
male 0.318713
Name: Sex, dtype: float64

value_counts()

COPY

import pandas as pd

# Load the csv file
passengers = pd.read_csv('train.csv')

# Median age of each sex: select the Age values of the matching rows, then
# take their median.
is_male = passengers['Sex'] == 'male'
is_female = passengers['Sex'] == 'female'
median_age_men = passengers.loc[is_male, 'Age'].median()
median_age_women = passengers.loc[is_female, 'Age'].median()

print(f"The median age of men is {median_age_men}")
print(f"The median age of women is {median_age_women}")

COPY

The median age of men is 29.0

The median age of women is 27.0

XII CS Unit1 CSV Notes
No ratings yet
XII CS Unit1 CSV Notes
6 pages
Grade 10 Module 2 Computer
No ratings yet
Grade 10 Module 2 Computer
2 pages
Computer Science
No ratings yet
Computer Science
35 pages
40 R Programming Interview Questions & Answers For All Levels - DataCamp
No ratings yet
40 R Programming Interview Questions & Answers For All Levels - DataCamp
22 pages
Working With CSV Files in Python
No ratings yet
Working With CSV Files in Python
4 pages
Laravel 5 Simple Crud Application Using Reactjs Part 1
No ratings yet
Laravel 5 Simple Crud Application Using Reactjs Part 1
5 pages
40VCC617FQEE-IOM-06 2021 XCT7 Controls Touchscreen 240607 172015
No ratings yet
40VCC617FQEE-IOM-06 2021 XCT7 Controls Touchscreen 240607 172015
276 pages
CSV Files in Python
No ratings yet
CSV Files in Python
6 pages
Programming Fundamental Teaching Plan
No ratings yet
Programming Fundamental Teaching Plan
4 pages
Python CSV Files
No ratings yet
Python CSV Files
9 pages
Salesforce Administrator Practice Test Results
No ratings yet
Salesforce Administrator Practice Test Results
13 pages
ML
No ratings yet
ML
131 pages
12 Pandas
100% (1)
12 Pandas
21 pages
12 - CS - CSV File
No ratings yet
12 - CS - CSV File
4 pages
Amazon EKS Cheatsheet 1703176742
No ratings yet
Amazon EKS Cheatsheet 1703176742
8 pages
CSV File Reading and Writing: Module Contents
No ratings yet
CSV File Reading and Writing: Module Contents
9 pages
CSV BoardQuestions
No ratings yet
CSV BoardQuestions
3 pages
CSV FILES Online
No ratings yet
CSV FILES Online
84 pages
3D Occlusograms
100% (1)
3D Occlusograms
9 pages
Research Diary - How To Build CryptDB
No ratings yet
Research Diary - How To Build CryptDB
7 pages
PROG3112 Programming Java NCIII Part 2 WEEK 10 FIRST
100% (1)
PROG3112 Programming Java NCIII Part 2 WEEK 10 FIRST
5 pages
CSV File Handling
No ratings yet
CSV File Handling
16 pages
Kontakt Script Language Manual
No ratings yet
Kontakt Script Language Manual
35 pages
CSV File
No ratings yet
CSV File
30 pages
Data Sci
No ratings yet
Data Sci
29 pages
???? ???????????? ???? ??????
No ratings yet
???? ???????????? ???? ??????
63 pages
Csv-Files Final
No ratings yet
Csv-Files Final
21 pages
CSV Files
No ratings yet
CSV Files
28 pages
Csvfiles 2
No ratings yet
Csvfiles 2
28 pages
CSV Files
No ratings yet
CSV Files
22 pages
CSV File Handling
No ratings yet
CSV File Handling
20 pages
CSV Files
No ratings yet
CSV Files
24 pages
CVS File Handlinng
No ratings yet
CVS File Handlinng
5 pages
What Is It Riddles
No ratings yet
What Is It Riddles
11 pages
CSL 410 L16
No ratings yet
CSL 410 L16
22 pages
ITU07427 - Lab Worksheet
No ratings yet
ITU07427 - Lab Worksheet
7 pages
Notebook PYTHON DATA SCIENCE
No ratings yet
Notebook PYTHON DATA SCIENCE
16 pages
CSV File: Python With CSV Files
No ratings yet
CSV File: Python With CSV Files
19 pages
18 Useful Spanish Greetings Fo
No ratings yet
18 Useful Spanish Greetings Fo
4 pages
Iteration 1 Object-Oriented Analysis and Design
100% (1)
Iteration 1 Object-Oriented Analysis and Design
281 pages
Python Unit 5
No ratings yet
Python Unit 5
21 pages
Notes On CSV Filespdf
No ratings yet
Notes On CSV Filespdf
11 pages
CSV Files
No ratings yet
CSV Files
8 pages
Fds Unit - III
No ratings yet
Fds Unit - III
58 pages
CSV
No ratings yet
CSV
9 pages
Project IP 2023
No ratings yet
Project IP 2023
16 pages
Dataset Visualization Basic Ml-1
No ratings yet
Dataset Visualization Basic Ml-1
12 pages
45 of The Best Compressor Plugins in The World Gtps PDF Free
No ratings yet
45 of The Best Compressor Plugins in The World Gtps PDF Free
37 pages
CSV Comma Separated Values
No ratings yet
CSV Comma Separated Values
7 pages
CSV Note
No ratings yet
CSV Note
6 pages
CRISP DM1 - Chapter 2
No ratings yet
CRISP DM1 - Chapter 2
22 pages
EDA - Session-1 - Basic Dataframe Opertaions-1
No ratings yet
EDA - Session-1 - Basic Dataframe Opertaions-1
7 pages
Ip Project
No ratings yet
Ip Project
11 pages
Ip Project SM
No ratings yet
Ip Project SM
11 pages
CSV File
No ratings yet
CSV File
5 pages
File Handling
No ratings yet
File Handling
6 pages
CSV New
No ratings yet
CSV New
4 pages
7th Class of CSV and DataFrame
No ratings yet
7th Class of CSV and DataFrame
9 pages
CSV Programs
No ratings yet
CSV Programs
3 pages
CSV File Handling
No ratings yet
CSV File Handling
4 pages
CSV Files
No ratings yet
CSV Files
3 pages
Dsbda Assignment 1
No ratings yet
Dsbda Assignment 1
5 pages
Exercise: CSV File Handling in Python
No ratings yet
Exercise: CSV File Handling in Python
3 pages
Data Transfer Between Files, SQL Databases & Dataframes: Comma To Separate Each Specific Data Value. CSV Advantages
No ratings yet
Data Transfer Between Files, SQL Databases & Dataframes: Comma To Separate Each Specific Data Value. CSV Advantages
6 pages
Data Analytics Lab3 2100290110032
No ratings yet
Data Analytics Lab3 2100290110032
4 pages
CSV File Handling
No ratings yet
CSV File Handling
3 pages
Anshu.30.da Lab Exp 3
No ratings yet
Anshu.30.da Lab Exp 3
4 pages
CSV Files
No ratings yet
CSV Files
4 pages
CSV File Handling
No ratings yet
CSV File Handling
2 pages
Reading and Writing CSV Files
No ratings yet
Reading and Writing CSV Files
3 pages
CSV Operations With Screenshot
No ratings yet
CSV Operations With Screenshot
4 pages
Cheat Sheet
No ratings yet
Cheat Sheet
2 pages
Week1 Lecture1 2
No ratings yet
Week1 Lecture1 2
38 pages
Building An MSI File
No ratings yet
Building An MSI File
16 pages
Web Development in Modern Technologies 1
No ratings yet
Web Development in Modern Technologies 1
7 pages
# Alternative To CSV - Reader and Int Indexing of Rows
No ratings yet
# Alternative To CSV - Reader and Int Indexing of Rows
1 page
40 Questions To Test Your Skill On R For Data Science
No ratings yet
40 Questions To Test Your Skill On R For Data Science
32 pages
CSV 40
No ratings yet
CSV 40
2 pages
Python File Handling
No ratings yet
Python File Handling
4 pages
Csvfile
No ratings yet
Csvfile
2 pages
CSC Session Plan Unit I
No ratings yet
CSC Session Plan Unit I
16 pages
Ant Ds Pas69278p Street
No ratings yet
Ant Ds Pas69278p Street
2 pages
ABCSir - Assignment - Solution - Mar 18 2024 - 17-32
No ratings yet
ABCSir - Assignment - Solution - Mar 18 2024 - 17-32
48 pages
Legea Societatilor Comerciale 31 - 1990
No ratings yet
Legea Societatilor Comerciale 31 - 1990
4 pages
Final Thesis Presentation
100% (4)
Final Thesis Presentation
5 pages
Learning To Program With Haiku Lesson 18
No ratings yet
Learning To Program With Haiku Lesson 18
7 pages
Fitness App SRS
No ratings yet
Fitness App SRS
3 pages
Exam Questions Examples
No ratings yet
Exam Questions Examples
5 pages
Pointers and Reference Parameters: CSE 251 Dr. Charles B. Owen Programming in C 1
No ratings yet
Pointers and Reference Parameters: CSE 251 Dr. Charles B. Owen Programming in C 1
44 pages
Survey Sparrow
No ratings yet
Survey Sparrow
3 pages
Erreur 0 104 PDF
No ratings yet
Erreur 0 104 PDF
2 pages
FGH
No ratings yet
FGH
5 pages
Jaudat Ali-Resume Updated
No ratings yet
Jaudat Ali-Resume Updated
2 pages
Full Stack Software Developer
No ratings yet
Full Stack Software Developer
1 page

CSV Python Annotated

Uploaded by

CSV Python Annotated

Uploaded by

100 DAYS OF DATA

WORKING WITH CSV

Data analysis from a CSV file in Python

with open('my_family.csv') as input:

Header row - name, age, height(cm), weight(kg)

csv.reader next(reader object,

with open('my_family.csv') as input:

Lenin is 30 years old, 188 cm tall and 90 kg heavy

with open('my_family.csv') as input:

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']

data = [ ['Phil', 42, 178, 76],

with open(filename, 'w') as output:

# Write a single list

# Writing a list of lists

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']

data = [ ['Phil', 42, 178, 76],

# Write a single list

# Writing a list of lists

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']

with open(filename, 'w') as output:

header = ['Name', 'Age', 'Height(cm)', 'Weight(kg)']

with open(filename, 'w') as output:

with open(filename, 'r') as output:

['Name', 'Age', 'Height(cm)', 'Weight(kg)', 'Address']

with open(filename, 'w') as output:

with open(filename, 'w') as output:

Traceback (most recent call last):

with open(filename, 'w') as output:

Name, Age, Height(cm), Weight(kg), Address

with open('my_family.csv', 'r') as f:

for line in csv_reader:

['Name', ' Age', ' Height(cm)', ' Weight(kg)', ' Address']

with open('my_family.csv', 'r') as f:

for line in csv_reader:

['Name', 'Age', 'Height(cm)', 'Weight(kg)', 'Address']

Name Age Height(cm) Weight(kg)

Age Height(cm) Weight(kg)

Age Height(cm) Weight(kg)

#load the csv file

# Count unique values in Sex column

# Percentage of male and female passengers

Index(['PassengerId', 'Survived', 'Pclass', 'Name', 'Sex', 'Age',

#load the csv file

# Count unique values in Sex column

Index(['PassengerId', 'Survived', 'Pclass', 'Name', 'Sex', 'Age',

#load the csv file

# median age of each sex

print(f"The median age of men is {median_age_men}")

The median age of men is 29.0

You might also like