0% found this document useful (0 votes)

50 views, 3 pages

Split and Create Py File

This Python script performs the following tasks: 1. It combines all CSV files in the current directory into a single file called "combine_param.csv" and deletes the original files. 2. It removes duplicate rows from the combined data. 3. It keeps only the rows where a user-selected column is True. 4. It splits the rows for the BANKNIFTY, NIFTY and FINNIFTY index values into a user-specified number of CSV files each, written to the output directory (the current directory by default). 5. It optionally converts an IPython notebook into a Python script and creates one customized copy of that script for each parameter file.

Uploaded by

kakashi hatake

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

50 views, 3 pages

Split and Create Py File

Uploaded by

kakashi hatake

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1/ 3

import os, sys

import numpy as np
import pandas as pd
from glob import glob

### combine parameter

print("Combine Parameters")
all_parameters = glob('*.csv')

### Combine ###

# Read every CSV once and concatenate in a single call; growing a DataFrame
# inside the loop re-copies all previously read rows on each iteration.
frames = []
for file in all_parameters:
    print(file)
    frames.append(pd.read_csv(file))

# pd.concat raises ValueError on an empty list, so fall back to an empty frame
# when the current directory holds no CSV files.
Combine_data = pd.concat(frames, ignore_index=True) if frames else pd.DataFrame()

# Write the combined file BEFORE deleting the inputs, so a failed write cannot
# lose the only copy of the data.
Combine_data.to_csv("combine_param.csv", index=False)

for file in all_parameters:
    # A combine_param.csv left over from an earlier run is matched by the glob
    # too; it has just been rewritten above and must not be deleted.
    if file != "combine_param.csv":
        os.remove(file)
# --------------------------------------------------------------------------

### Remove Duplicates ###

if not Combine_data.empty:
    print("Remove Duplicates")

    # Row count before de-duplication; reported and used for the delta below.
    initial_length = Combine_data.shape[0]
    print('Total Rows -', initial_length)

    # Drop rows that repeat an earlier row, modifying the frame in place.
    Combine_data.drop_duplicates(inplace=True)

    final_length = Combine_data.shape[0]
    print('Dublicates Rows -', initial_length - final_length)
# ---------------------------------------------------------------------------

# remove false rows

if not Combine_data.empty:
    print("\nRemove False Parameter")

    # Show each column name next to its positional number so the user can
    # pick the flag column by index.
    numbered_columns = Combine_data.columns.to_series().reset_index(drop=True)
    print(numbered_columns)

    col_index = int(input('Column True/False Index : '))
    col_name = Combine_data.columns[col_index]

    initial_length = len(Combine_data)
    print('Total Rows -', initial_length)

    # Keep only the rows whose chosen column compares equal to True.
    keep_mask = Combine_data[col_name].eq(True)
    Combine_data = Combine_data[keep_mask]

    final_length = len(Combine_data)
    print('Falsed Rows -', initial_length - final_length)
# ---------------------------------------------------------------------------

if not Combine_data.empty:

    # Prefix for the output files; '' writes into the current directory.
    # NOTE: the prefix is concatenated directly with the file name, so a
    # directory must include its trailing path separator (e.g. 'out/').
    output_path = ''

    if output_path != '':
        # exist_ok avoids the check-then-create race of isdir() + mkdir().
        os.makedirs(output_path, exist_ok=True)

    bn_data = Combine_data[Combine_data['index'] == 'BANKNIFTY']
    nf_data = Combine_data[Combine_data['index'] == 'NIFTY']
    fn_data = Combine_data[Combine_data['index'] == 'FINNIFTY']

    print('Total Rows -', len(Combine_data))

    print('BANKNIFTY Rows -', len(bn_data))
    print('NIFTY Rows-', len(nf_data))
    print('FINNIFTY Rows-', len(fn_data))

    # One pass per index replaces three copies of the same split code.
    for index_name, prefix, index_rows in (
        ('BANKNIFTY', 'bn', bn_data),
        ('NIFTY', 'nf', nf_data),
        ('FINNIFTY', 'fn', fn_data),
    ):
        if index_rows.empty:
            continue

        no_of_param = int(input(f"{index_name} Parameter No : "))

        # Split row POSITIONS rather than the DataFrame itself:
        # np.array_split on a DataFrame goes through the deprecated
        # DataFrame.swapaxes. The chunk sizes are the same either way.
        positions = np.arange(len(index_rows))
        for idx, chunk in enumerate(np.array_split(positions, no_of_param)):
            index_rows.iloc[chunk].to_csv(
                f"{output_path}{prefix}_{idx}.csv", index=False
            )

# Everything below this point only applies when the user asks for the
# per-parameter .py files, so stop here otherwise. Written as a guard clause
# so the remaining steps stay flat top-level statements.
# os and sys are already imported at the top of the file.
if input("create py files y/n ? : ") != "y":
    sys.exit(0)

### convert into py files

# Fail fast when the conversion fails instead of continuing with a missing or
# stale script file.
if os.system('jupyter nbconvert --to script *.ipynb') != 0:
    sys.exit("jupyter nbconvert failed; no .py files were created")

def prepend_line(file_name, line, name):
    """Write a copy of ``file_name`` to ``name`` with ``line`` inserted first.

    The source file itself is left untouched; only ``name`` is created or
    replaced.

    Args:
        file_name: Path of the file whose contents are copied.
        line: Text written ahead of the copied contents; a newline is
            appended to it.
        name: Path of the file to create. An existing file is overwritten.
    """
    # Build the result in a temporary sibling file first so that ``name``
    # never holds a half-written result.
    dummy_file = file_name + '.bak'
    with open(file_name, 'r') as read_obj, open(dummy_file, 'w') as write_obj:
        write_obj.write(line + '\n')
        # Stream the original contents after the new first line.
        write_obj.writelines(read_obj)

    # os.replace overwrites an existing target on every platform, whereas
    # os.rename raises FileExistsError on Windows when ``name`` exists
    # (for example on a second run).
    os.replace(dummy_file, name)

def code_script(name):
    """Return the header source that is prepended to a generated script.

    The header imports ``os``, ``sys`` and ``ctypes``, derives ``code_name``
    from ``sys.argv[0]``, passes it to
    ``ctypes.windll.kernel32.SetConsoleTitleW``, prints it, and assigns
    ``parameter_path``.

    Args:
        name: Path of the parameter CSV the generated script should load.

    Returns:
        The header as a string ending in a newline.
    """
    # ``{name!r}`` emits a valid Python string literal. Interpolating the raw
    # path between quotes would turn backslashes in Windows paths into escape
    # sequences (``'out\bn_0.csv'`` contains a backspace) in the generated code.
    header = f"""import os
import sys
code_name = sys.argv[0].split('\\\\')[-1].replace('.py', '')
import ctypes
ctypes.windll.kernel32.SetConsoleTitleW(code_name)
print(code_name)
parameter_path = {name!r}
"""
    return header

# Parameter files found under the output prefix. The combined file is
# excluded by base name so the exclusion also works when the glob result
# carries a directory prefix. Sorted for a reproducible processing order.
parameters = sorted(
    path for path in glob(f'{output_path}*.csv')
    if os.path.basename(path) != "combine_param.csv"
)

notebooks = glob("*.ipynb")
if not notebooks:
    sys.exit("No .ipynb notebook found in the current directory")

# Swap only the extension; str.replace('ipynb', 'py') would also rewrite any
# other 'ipynb' occurring in the file name.
# NOTE(review): assumes nbconvert wrote <notebook>.py next to the notebook.
code = os.path.splitext(notebooks[0])[0] + '.py'

import fileinput

# Comment out the script's own parameter_path assignment. fileinput's
# in-place mode redirects print() into the file being rewritten, which avoids
# writing through a second handle on a file that is still being read.
with fileinput.input(code, inplace=True) as script_lines:
    for line in script_lines:
        print(line.replace('parameter_path =', '# parameter_path ='), end='')

for file in parameters:
    # One script per parameter file, named after it with a .py extension.
    prepend_line(code, code_script(file), os.path.splitext(file)[0] + '.py')

# The unparameterized script was only a template for the copies above.
os.remove(code)

Totally Tweens And Teens Diane P Tuccillo instant download
100% (1)
Totally Tweens And Teens Diane P Tuccillo instant download
36 pages
Thrive: Solar LED Home Lighting System
No ratings yet
Thrive: Solar LED Home Lighting System
2 pages
A Voice of My Own: Essays and Stories by Rolando Hinojosa
No ratings yet
A Voice of My Own: Essays and Stories by Rolando Hinojosa
159 pages
Bermocoll EHM 300 PDS
No ratings yet
Bermocoll EHM 300 PDS
3 pages
Data Analysis 6060
No ratings yet
Data Analysis 6060
6 pages
big data EX 1
No ratings yet
big data EX 1
3 pages
ex1,2_EDA
No ratings yet
ex1,2_EDA
6 pages
Advance Python
No ratings yet
Advance Python
5 pages
student data-Hanok,ataullah
No ratings yet
student data-Hanok,ataullah
5 pages
Oxy Metre
No ratings yet
Oxy Metre
17 pages
cs practical
No ratings yet
cs practical
8 pages
Theory of Cognitive Development (Jean Piaget)
No ratings yet
Theory of Cognitive Development (Jean Piaget)
6 pages
Week1 Numpy, Pandas (178) .Ipynb Colab
No ratings yet
Week1 Numpy, Pandas (178) .Ipynb Colab
6 pages
Computer: Supermarket Management System
No ratings yet
Computer: Supermarket Management System
11 pages
Data Analysis in Python_ML
No ratings yet
Data Analysis in Python_ML
21 pages
12th board practical
No ratings yet
12th board practical
8 pages
add a column to file
No ratings yet
add a column to file
2 pages
XX
No ratings yet
XX
4 pages
25 March CSV PYQs Qs
No ratings yet
25 March CSV PYQs Qs
6 pages
EDA (2)
No ratings yet
EDA (2)
7 pages
data analytics lab manual
No ratings yet
data analytics lab manual
26 pages
All Programs 2024 to back 2021 CSV Qs
No ratings yet
All Programs 2024 to back 2021 CSV Qs
8 pages
Menu Driven Programs
No ratings yet
Menu Driven Programs
7 pages
Ip 12
No ratings yet
Ip 12
5 pages
Weather Forecasting
No ratings yet
Weather Forecasting
5 pages
imp programs[1]
No ratings yet
imp programs[1]
8 pages
Data_preprocessing_example_programs1
No ratings yet
Data_preprocessing_example_programs1
9 pages
IP Project
No ratings yet
IP Project
8 pages
Assignment 7
No ratings yet
Assignment 7
1 page
Pandas NumPy Practice Questions
No ratings yet
Pandas NumPy Practice Questions
2 pages
Pre - DT Report ZBGR - 4331 - TDD
No ratings yet
Pre - DT Report ZBGR - 4331 - TDD
4 pages
Chapter2 - Data Wrangling
No ratings yet
Chapter2 - Data Wrangling
48 pages
csv files
No ratings yet
csv files
22 pages
EX-02-Data manipulation pandas matplot
No ratings yet
EX-02-Data manipulation pandas matplot
9 pages
MLC Practical
No ratings yet
MLC Practical
51 pages
TataChemicals
No ratings yet
TataChemicals
5 pages
EXP-3
No ratings yet
EXP-3
10 pages
Apr 2023
No ratings yet
Apr 2023
32 pages
Imagination
No ratings yet
Imagination
178 pages
DATASCIENCE_INTERNSHIP[1]
No ratings yet
DATASCIENCE_INTERNSHIP[1]
43 pages
Shiva Teja
No ratings yet
Shiva Teja
19 pages
1
No ratings yet
1
12 pages
CS Project CSV
No ratings yet
CS Project CSV
32 pages
SLM Report
No ratings yet
SLM Report
7 pages
Pre-Processing Example - 1
No ratings yet
Pre-Processing Example - 1
6 pages
ProductionMGmt XII IP ProjectReprotFinal
No ratings yet
ProductionMGmt XII IP ProjectReprotFinal
16 pages
Altair 240 - 4pp Brochure
No ratings yet
Altair 240 - 4pp Brochure
4 pages
EmployeeMgmt XII IP ProjectReprot 2022 23
No ratings yet
EmployeeMgmt XII IP ProjectReprot 2022 23
16 pages
CSV File Handling
No ratings yet
CSV File Handling
20 pages
Introduction to Pandas Programming 2
No ratings yet
Introduction to Pandas Programming 2
3 pages
Unit 5.Software Reliability
No ratings yet
Unit 5.Software Reliability
15 pages
Exp_1_Introduction to Data Analytics and Python fundamentals_sdk_ok
No ratings yet
Exp_1_Introduction to Data Analytics and Python fundamentals_sdk_ok
9 pages
DHP Journal
No ratings yet
DHP Journal
29 pages
External
No ratings yet
External
11 pages
Info
No ratings yet
Info
31 pages
Reading and Writing To File
No ratings yet
Reading and Writing To File
2 pages
Class Xii Computer Science Practical Programs - 2022-23 2
No ratings yet
Class Xii Computer Science Practical Programs - 2022-23 2
33 pages
Bruker: Technical Manual
No ratings yet
Bruker: Technical Manual
27 pages
Fds PDF
No ratings yet
Fds PDF
58 pages
Tom Tom Spark Cardio+Music
No ratings yet
Tom Tom Spark Cardio+Music
3 pages
Chapter 1-3 Research Paper Notes
No ratings yet
Chapter 1-3 Research Paper Notes
7 pages
Economy of Different Countries
No ratings yet
Economy of Different Countries
24 pages
LM 8E User Manual
No ratings yet
LM 8E User Manual
17 pages
Assignment 61
100% (2)
Assignment 61
4 pages
Syllabus of Applied Math in Cu
No ratings yet
Syllabus of Applied Math in Cu
98 pages
FDS RECORD-1-4
No ratings yet
FDS RECORD-1-4
18 pages
INFORMATIC Complete Project
No ratings yet
INFORMATIC Complete Project
27 pages
Applications of SM Processes
No ratings yet
Applications of SM Processes
110 pages
Ilovepdf Merged (2) Merged
No ratings yet
Ilovepdf Merged (2) Merged
65 pages
Semiotics and Methodology
No ratings yet
Semiotics and Methodology
3 pages
ML 1-11
No ratings yet
ML 1-11
27 pages
The Mathematics of Decisions, Elections, and Games
No ratings yet
The Mathematics of Decisions, Elections, and Games
242 pages
Department of Education: Sergia Soriano Esteban Integrated School Ii
No ratings yet
Department of Education: Sergia Soriano Esteban Integrated School Ii
8 pages
LibraryMgmt XII IP ProjectReportFinal
No ratings yet
LibraryMgmt XII IP ProjectReportFinal
19 pages
SalesMgmtSystem XII IP Projectreport 2022 23
No ratings yet
SalesMgmtSystem XII IP Projectreport 2022 23
18 pages
Ship of Theseus Was Rebuilt Over The Centuries F
No ratings yet
Ship of Theseus Was Rebuilt Over The Centuries F
5 pages
3rd Semester DDM AI DAA DEV Print Pages For Spiral Record 25-1-24 - Removed
No ratings yet
3rd Semester DDM AI DAA DEV Print Pages For Spiral Record 25-1-24 - Removed
28 pages
(Philips) Technical Handbook Book 4 Part IC02a Integrated Circuits MAB8031AH-2 To TDA1524A ... (PDFDrive)
No ratings yet
(Philips) Technical Handbook Book 4 Part IC02a Integrated Circuits MAB8031AH-2 To TDA1524A ... (PDFDrive)
1,136 pages
Assignment 3
No ratings yet
Assignment 3
4 pages
Fds Unit - III
No ratings yet
Fds Unit - III
58 pages
GTS-100N: Electronic Total Station Series GTS-102N GTS-105N
No ratings yet
GTS-100N: Electronic Total Station Series GTS-102N GTS-105N
20 pages
Techno-Commercial Proposal: Rooftop Solar Power Plant - 100 KW NTPC Limited
No ratings yet
Techno-Commercial Proposal: Rooftop Solar Power Plant - 100 KW NTPC Limited
11 pages
Chapter 3
No ratings yet
Chapter 3
15 pages
Kunj Project 2
No ratings yet
Kunj Project 2
31 pages
Hotel Management
No ratings yet
Hotel Management
25 pages
The Unofficial Essential Skills / Revision Guide For Mpm1D Grade 9 Academic Mathematics in Ontario by Mark Burke
No ratings yet
The Unofficial Essential Skills / Revision Guide For Mpm1D Grade 9 Academic Mathematics in Ontario by Mark Burke
44 pages
Pitched Roof
No ratings yet
Pitched Roof
2 pages
Product Brochure: Manufacturers and Stockists of High Pressure Pipeline and Drilling Equipment
No ratings yet
Product Brochure: Manufacturers and Stockists of High Pressure Pipeline and Drilling Equipment
30 pages
BA WA HD70 HD75 en H152
100% (1)
BA WA HD70 HD75 en H152
112 pages
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet

Split and Create Py File

Uploaded by

Split and Create Py File

Uploaded by

import os, sys

### combine parameter

### Combine ###

for file in all_parameters:

### Remove Duplicates ###

# remove false rows

col_index = int(input('Column True/False Index : '))

if not os.path.isdir(output_path) and output_path != '':

print('Total Rows -', len(Combine_data))

# Split BANKNIFTY data

no_of_param = int(input("BANKNIFTY Parameter No : "))

for idx, data in enumerate(np.array_split(bn_data, no_of_param)):

# Split NIFTY data

no_of_param = int(input("NIFTY Parameter No : "))

for idx, data in enumerate(np.array_split(nf_data, no_of_param)):

# Split FINNIFTY data

no_of_param = int(input("FINNIFTY Parameter No : "))

for idx, data in enumerate(np.array_split(fn_data, no_of_param)):

if input("create py files y/n ? : ") == "y":

### convert into py files

def prepend_line(file_name, line, name):

tempFile = open(code, 'r+')

for file in parameters:

You might also like