0% found this document useful (0 votes)
5 views2 pages

To Collect Bowling Data

The document is a Python script that uses Selenium to scrape bowling statistics for cricket players from a website. It initializes a Chrome webdriver, navigates to the bowling sections for specified players and formats, extracts relevant data, and stores it in a Pandas DataFrame. Finally, it saves the collected data to a CSV file on the user's desktop if any data was successfully scraped.

Uploaded by

995aarvee
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as TXT or PDF, or read online on Scribd
0% found this document useful (0 votes)
5 views2 pages

To Collect Bowling Data

The document is a Python script that uses Selenium to scrape bowling statistics for cricket players from a website. It initializes a Chrome webdriver, navigates to the bowling sections for specified players and formats, extracts relevant data, and stores it in a Pandas DataFrame. Finally, it saves the collected data to a CSV file on the user's desktop if any data was successfully scraped.

Uploaded by

995aarvee
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as TXT or PDF, or read online on Scribd
You are on page 1/ 2

import os
import time
from urllib.parse import quote_plus

import pandas as pd
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.support.ui import WebDriverWait

# Launch a Chrome browser session (chromedriver must be discoverable on PATH).
driver = webdriver.Chrome()

# Accumulator for every scraped table; per-player/per-format rows are
# concatenated onto this frame as the loops below run.
final_data = pd.DataFrame()

# Players whose bowling figures will be collected (replace with real targets).
players = ["RG Sharma", "Virat Kohli", "Jasprit Bumrah"]

# Match-format tab ids exposed on the cricmetric stats page.
formats = ["Test", "ODI", "T20I", "TWENTY20"]

def navigate_to_bowling_section(player, fmt):
    """Open the cricmetric stats page for *player* and activate its Bowling tab.

    Parameters
    ----------
    player : str
        Player name as shown on cricmetric (e.g. ``"RG Sharma"``).
    fmt : str
        Format tab id prefix: ``"Test"``, ``"ODI"``, ``"T20I"`` or
        ``"TWENTY20"``.

    Returns
    -------
    bool
        ``True`` once the format's bowling table is visible, ``False`` on
        any navigation or timeout failure (the error is printed, not raised).
    """
    # quote_plus encodes spaces as '+' (same as the old manual replace) and
    # additionally handles any other URL-unsafe characters in the name.
    url = (
        "http://www.cricmetric.com/playerstats.py"
        f"?player={quote_plus(player)}&role=all&format=all"
        f"&groupby=year#{fmt}-Bowling"
    )
    driver.get(url)
    try:
        # Wait for the Bowling tab to become clickable, then click it.
        bowling_tab = WebDriverWait(driver, 20).until(
            EC.element_to_be_clickable((By.XPATH, f'//*[@id="{fmt}-Bowling-tab"]'))
        )
        bowling_tab.click()

        # Wait until the bowling stats table itself has rendered.
        WebDriverWait(driver, 20).until(
            EC.visibility_of_element_located(
                (By.XPATH, f'//*[@id="{fmt}-Bowling"]/div/table')
            )
        )
        print(f"Successfully navigated to Bowling section for {player} in {fmt}")
        return True
    except Exception as e:  # broad on purpose: any Selenium failure skips this format
        print(f"Error navigating to Bowling section for {player} in {fmt}: {e}")
        return False

# Iterate over each player and format, scraping the bowling table for each.
for player in players:
    for fmt in formats:
        try:
            if navigate_to_bowling_section(player, fmt):
                # Grab the rendered table's visible text.
                table = driver.find_element(
                    By.XPATH, f'//*[@id="{fmt}-Bowling"]/div/table'
                ).text

                # First line is the header row; the rest are data rows.
                lines = table.split('\n')
                headers = lines[0].split()  # whitespace-delimited columns

                # Keep only the columns of interest, preserving on-page order.
                required_columns = ["Year", "Innings", "Overs", "Runs",
                                    "Wickets", "Econ", "Avg", "SR", "5W",
                                    "BBI", "4s", "6s", "Dot%"]
                filtered_headers = [h for h in headers if h in required_columns]
                # Resolve each wanted column's position ONCE, instead of
                # calling headers.index() per header per row.
                col_idx = [headers.index(h) for h in filtered_headers]
                # Highest index we will read; -1 when no columns matched.
                max_idx = max(col_idx, default=-1)

                data = []
                for line in lines[1:]:
                    row_data = line.split()
                    # Skip footer/short rows instead of letting an
                    # IndexError abort the whole player/format (the old
                    # behaviour under the broad except below).
                    if len(row_data) <= max_idx:
                        continue
                    data.append([row_data[i] for i in col_idx])

                # Build the per-format frame and tag rows with provenance.
                df = pd.DataFrame(data, columns=filtered_headers)
                df['Player'] = player
                df['Format'] = fmt
                df['Section'] = "Bowling"

                # Accumulate into the run-wide frame.
                final_data = pd.concat([final_data, df], ignore_index=True)

                print(f"Successfully collected bowling data for {player} in {fmt}")

        except Exception as e:
            print(f"Error processing {player} for {fmt} Bowling: {e}")
            continue

# Release the browser session.
driver.quit()

# Build the output path on the user's Desktop. expanduser('~') resolves via
# USERPROFILE on Windows and HOME on POSIX, unlike the original
# os.environ['USERPROFILE'] which raises KeyError off Windows. The original
# nested os.path.join(os.path.join(x), 'Desktop') was also redundant: a
# single-argument join is a no-op.
desktop_path = os.path.join(os.path.expanduser('~'), 'Desktop')
csv_file_path = os.path.join(desktop_path, 'cricmetric_player_bowling_stats.csv')

# Debugging: quick look at what was collected.
print(final_data.head())

# Persist only if at least one row was scraped.
if not final_data.empty:
    final_data.to_csv(csv_file_path, index=False)
    print(f"Bowling data collection complete. Saved to '{csv_file_path}'.")
else:
    print("No bowling data collected. Please check your scraping process.")

You might also like