0% found this document useful (0 votes)

59 views3 pages

Split and Create Py File

This Python script performs the following tasks: 1. It combines all CSV files in the current directory into a single file called "combine_param.csv" and deletes the original CSV files. 2. It then removes any duplicate rows from the combined data. 3. It keeps only the rows in which a user-selected column is True. 4. It splits the rows for each of the index values BANKNIFTY, NIFTY and FINNIFTY into a user-specified number of CSV files and writes them to the output directory (the current directory by default). 5. It optionally converts a Jupyter (IPython) notebook into a Python script and creates one customized copy of that script for each parameter file.

Uploaded by

kakashi hatake

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

59 views3 pages

Split and Create Py File

Uploaded by

kakashi hatake

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1/ 3

import os, sys

import numpy as np
import pandas as pd
from glob import glob

### combine parameter
# Merge every CSV in the current directory into "combine_param.csv" and
# then delete the individual input files.

print("Combine Parameters")
# glob() returns names in arbitrary order; sorting keeps the row order of
# the combined file (and therefore of the later splits) reproducible.
all_parameters = sorted(glob('*.csv'))

### Combine ###

frames = []
for file in all_parameters:
    print(file)
    try:
        frames.append(pd.read_csv(file))
    except pd.errors.EmptyDataError:
        # A CSV with no parsable columns (for example a zero-byte file)
        # carries no rows, so skip it instead of aborting the whole run.
        print('Skipped empty file -', file)

# Concatenate once instead of growing the frame inside the loop, which
# re-copies all previously read rows on every iteration.
if frames:
    Combine_data = pd.concat(frames, ignore_index=True)
else:
    Combine_data = pd.DataFrame()

# Write the combined file BEFORE deleting the inputs: if the write fails
# the original data is still on disk.
Combine_data.to_csv("combine_param.csv", index=False)

for file in all_parameters:
    # A previous run's combined file is also matched by '*.csv'; it has just
    # been overwritten above and must not be deleted.
    if file != "combine_param.csv":
        os.remove(file)
# --------------------------------------------------------------------------

### Remove Duplicates ###
# Drop fully identical rows from the combined data and report how many
# were removed. Skipped entirely when there is no data.

if not Combine_data.empty:
    print("Remove Duplicates")
    rows_before = len(Combine_data)
    print('Total Rows -', rows_before)

    # Keep the first occurrence of every distinct row.
    Combine_data = Combine_data.drop_duplicates()
    rows_after = len(Combine_data)
    print('Dublicates Rows -', rows_before - rows_after)
# ---------------------------------------------------------------------------

# remove false rows
# Ask the user which column holds the True/False flag and keep only the
# rows where that column equals True.

if not Combine_data.empty:
    print("\nRemove False Parameter")
    # Show every column name next to its positional index so the user can
    # pick one by number.
    print(Combine_data.columns.to_series().reset_index(drop=True))

    column_names = Combine_data.columns.to_list()
    # Re-prompt on bad input instead of crashing: by this point the source
    # CSV files have already been deleted, so an abort is costly.
    while True:
        try:
            col_index = int(input('Column True/False Index : '))
            col_name = column_names[col_index]
        except ValueError:
            print('Please enter a whole number.')
        except IndexError:
            print('Index must be between 0 and', len(column_names) - 1)
        else:
            break

    initial_length = len(Combine_data)
    print('Total Rows -', initial_length)

    # Element-wise comparison that builds a boolean row mask; "is True" or
    # plain truthiness would not work on a pandas Series.
    Combine_data = Combine_data[Combine_data[col_name] == True]  # noqa: E712
    final_length = len(Combine_data)
    print('Falsed Rows -', initial_length - final_length)
# ---------------------------------------------------------------------------

# Split the combined data per index (BANKNIFTY / NIFTY / FINNIFTY) into a
# user-chosen number of parameter files.

# Directory that receives the split files; '' means the current directory.
# Defined outside the "if" so that later code can read it even when there
# is no data to split.
output_path = ''


def _ask_positive_int(prompt):
    """Prompt repeatedly until the user enters an integer >= 1."""
    while True:
        try:
            value = int(input(prompt))
        except ValueError:
            print('Please enter a whole number.')
            continue
        if value >= 1:
            return value
        print('Please enter a number greater than zero.')


def _split_rows(frame, parts):
    """Yield `parts` contiguous row slices of `frame`.

    Slice sizes differ by at most one row, with the larger slices first
    (the same sizing rule as numpy.array_split). Slicing with .iloc avoids
    passing a DataFrame through numpy.array_split, which depends on the
    deprecated DataFrame.swapaxes.
    """
    base, extra = divmod(len(frame), parts)
    start = 0
    for position in range(parts):
        stop = start + base + (1 if position < extra else 0)
        yield frame.iloc[start:stop]
        start = stop


if not Combine_data.empty:

    if output_path:
        # makedirs also creates missing parent directories and does not
        # fail when the directory already exists.
        os.makedirs(output_path, exist_ok=True)

    # NOTE: rows whose 'index' value is none of the three names below are
    # not written to any split file.
    bn_data = Combine_data[Combine_data['index'] == 'BANKNIFTY']
    nf_data = Combine_data[Combine_data['index'] == 'NIFTY']
    fn_data = Combine_data[Combine_data['index'] == 'FINNIFTY']

    print('Total Rows -', len(Combine_data))

    print('BANKNIFTY Rows -', len(bn_data))
    print('NIFTY Rows-', len(nf_data))
    print('FINNIFTY Rows-', len(fn_data))

    # (index name used in the prompt, output file prefix, rows of that index)
    for label, prefix, frame in (
        ('BANKNIFTY', 'bn', bn_data),
        ('NIFTY', 'nf', nf_data),
        ('FINNIFTY', 'fn', fn_data),
    ):
        if frame.empty:
            continue

        no_of_param = _ask_positive_int(f"{label} Parameter No : ")
        if no_of_param > len(frame):
            # More files than rows would only produce header-only files.
            print(f'Only {len(frame)} rows available - writing {len(frame)} files')
            no_of_param = len(frame)

        for idx, data in enumerate(_split_rows(frame, no_of_param)):
            data.to_csv(os.path.join(output_path, f"{prefix}_{idx}.csv"), index=False)

### convert into py files
# Optionally convert the notebook to a script and create one copy of that
# script per parameter CSV, each starting with a header that points at its
# own parameter file.


def prepend_line(file_name, line, name):
    """Write `line` followed by the full contents of `file_name` to `name`.

    `file_name` itself is only read. The output is first written to
    `file_name + '.bak'` and then moved onto `name`.
    """
    # define name of temporary dummy file
    dummy_file = file_name + '.bak'
    # nbconvert writes its scripts as UTF-8, so read and write with that
    # encoding instead of the platform default.
    with open(file_name, 'r', encoding='utf-8') as read_obj, \
            open(dummy_file, 'w', encoding='utf-8') as write_obj:
        # Write given line to the dummy file
        write_obj.write(line + '\n')
        # Copy the original file line by line after the inserted text
        for source_line in read_obj:
            write_obj.write(source_line)

    # os.replace overwrites an existing target on every platform; os.rename
    # raises on Windows when `name` is left over from an earlier run.
    os.replace(dummy_file, name)


def code_script(name):
    """Return the header text placed at the top of a generated script.

    The header sets the console window title to the script's own name via
    ctypes.windll (available on Windows only), prints that name and assigns
    `name` to `parameter_path`.
    """
    # {name!r} emits a valid Python string literal, so backslashes or quotes
    # in the path cannot turn into escape sequences or a syntax error.
    header = f"""import os
import sys
code_name = sys.argv[0].split('\\\\')[-1].replace('.py', '')
import ctypes
ctypes.windll.kernel32.SetConsoleTitleW(code_name)
print(code_name)
parameter_path = {name!r}
"""
    return header


def _create_py_files(params_dir):
    """Convert the first notebook and emit one script per parameter CSV."""
    import subprocess

    notebooks = sorted(glob("*.ipynb"))
    if not notebooks:
        print('No .ipynb file found - nothing to convert')
        return
    notebook = notebooks[0]
    # Swap only the extension; a plain str.replace would also rewrite any
    # other "ipynb" inside the file name.
    code = os.path.splitext(notebook)[0] + '.py'

    # Argument-list form: no shell involved, and the exit status is checked.
    try:
        result = subprocess.run(['jupyter', 'nbconvert', '--to', 'script', notebook])
    except OSError as error:
        print('Could not start jupyter nbconvert -', error)
        return
    if result.returncode != 0 or not os.path.isfile(code):
        print('Notebook conversion failed -', notebook)
        return

    # Every CSV in the parameter directory except the combined file, in a
    # stable order.
    parameters = sorted(
        path
        for path in glob(os.path.join(params_dir, '*.csv'))
        if os.path.basename(path) != "combine_param.csv"
    )

    # Comment out the notebook's own parameter_path assignments so the value
    # from the generated header stays in effect. Read everything first and
    # write afterwards: rewriting through a second handle while the file is
    # still being read can overwrite lines that have not been read yet.
    with open(code, 'r', encoding='utf-8') as handle:
        source_text = handle.read()
    with open(code, 'w', encoding='utf-8') as handle:
        handle.write(source_text.replace('parameter_path =', '# parameter_path ='))

    for file in parameters:
        target = os.path.splitext(file)[0] + '.py'
        prepend_line(code, code_script(file), target)

    # The converted notebook script was only a template for the copies.
    os.remove(code)


if input("create py files y/n ? : ") == "y":
    try:
        params_dir = output_path
    except NameError:
        # output_path is not defined when the split step did not run;
        # fall back to the current directory.
        params_dir = ''
    _create_py_files(params_dir)

Assignment 61
100% (2)
Assignment 61
4 pages
General Mathematics: Functions
No ratings yet
General Mathematics: Functions
27 pages
ProductionMGmt XII IP ProjectReprotFinal
No ratings yet
ProductionMGmt XII IP ProjectReprotFinal
16 pages
25 March CSV PYQs Qs
No ratings yet
25 March CSV PYQs Qs
6 pages
Hotel Management
No ratings yet
Hotel Management
25 pages
csv file classwork
No ratings yet
csv file classwork
4 pages
Varnitjain 2300290120277 Cs3d Pythonassignment02
No ratings yet
Varnitjain 2300290120277 Cs3d Pythonassignment02
14 pages
LibraryMgmt XII IP ProjectReportFinal
No ratings yet
LibraryMgmt XII IP ProjectReportFinal
19 pages
All Programs 2024 To Back 2021 CSV Qs
No ratings yet
All Programs 2024 To Back 2021 CSV Qs
8 pages
Economy of Different Countries
No ratings yet
Economy of Different Countries
24 pages
Add A Column To File
No ratings yet
Add A Column To File
2 pages
Shiva Teja
No ratings yet
Shiva Teja
19 pages
Pythonfile
No ratings yet
Pythonfile
37 pages
Data Analytics Lab Manual
No ratings yet
Data Analytics Lab Manual
26 pages
3rd Semester DDM AI DAA DEV Print Pages For Spiral Record 25-1-24 - Removed
No ratings yet
3rd Semester DDM AI DAA DEV Print Pages For Spiral Record 25-1-24 - Removed
28 pages
IP Project
No ratings yet
IP Project
8 pages
EX-02-Data Manipulation Pandas Matplot
No ratings yet
EX-02-Data Manipulation Pandas Matplot
9 pages
CS Project CSV
No ratings yet
CS Project CSV
32 pages
Info
No ratings yet
Info
31 pages
Data Analysis 6060
No ratings yet
Data Analysis 6060
6 pages
SalesMgmtSystem XII IP Projectreport 2022 23
No ratings yet
SalesMgmtSystem XII IP Projectreport 2022 23
18 pages
ML 1-11
No ratings yet
ML 1-11
27 pages
60065a82-615a-4e51-b149-dc8601c42b3f
No ratings yet
60065a82-615a-4e51-b149-dc8601c42b3f
4 pages
Fds Unit - III
No ratings yet
Fds Unit - III
58 pages
External
No ratings yet
External
11 pages
CSV Files
No ratings yet
CSV Files
22 pages
DSC Lab Programs
No ratings yet
DSC Lab Programs
24 pages
CSV Operations - FH
No ratings yet
CSV Operations - FH
4 pages
Datascience Internship
No ratings yet
Datascience Internship
43 pages
Chapter2 - Data Wrangling
No ratings yet
Chapter2 - Data Wrangling
48 pages
Exp - 1 - Introduction To Data Analytics and Python Fundamentals - SDK - Ok
No ratings yet
Exp - 1 - Introduction To Data Analytics and Python Fundamentals - SDK - Ok
9 pages
FDS Record-1-4
No ratings yet
FDS Record-1-4
18 pages
CSV File Handling
No ratings yet
CSV File Handling
20 pages
Kunj Project 2
No ratings yet
Kunj Project 2
31 pages
12th Board Practical
No ratings yet
12th Board Practical
8 pages
Pre-Processing Example - 1
No ratings yet
Pre-Processing Example - 1
6 pages
XX
No ratings yet
XX
4 pages
INFORMATIC Complete Project
No ratings yet
INFORMATIC Complete Project
27 pages
Student Data-Hanok, Ataullah
No ratings yet
Student Data-Hanok, Ataullah
5 pages
NumPy and Pandas Step
No ratings yet
NumPy and Pandas Step
9 pages
Exp 3
No ratings yet
Exp 3
10 pages
Reading and Writing To File
No ratings yet
Reading and Writing To File
2 pages
Ilovepdf Merged (2) Merged
No ratings yet
Ilovepdf Merged (2) Merged
65 pages
Menu Driven Programs
No ratings yet
Menu Driven Programs
7 pages
Imp Programs
No ratings yet
Imp Programs
8 pages
PYTHON PROGRAMMING: Data Handling
No ratings yet
PYTHON PROGRAMMING: Data Handling
12 pages
Week1 Numpy, Pandas (178) .Ipynb Colab
No ratings yet
Week1 Numpy, Pandas (178) .Ipynb Colab
6 pages
Fds PDF
No ratings yet
Fds PDF
58 pages
Python Programs FDP
No ratings yet
Python Programs FDP
20 pages
Introduction To Pandas Programming 2
No ratings yet
Introduction To Pandas Programming 2
3 pages
Cs Practical
No ratings yet
Cs Practical
8 pages
10) Merging Dataframes: # Detecting Duplicates
No ratings yet
10) Merging Dataframes: # Detecting Duplicates
7 pages
Class Xii Computer Science Practical Programs - 2022-23 2
No ratings yet
Class Xii Computer Science Practical Programs - 2022-23 2
33 pages
Data Preprocessing Example Programs1
No ratings yet
Data Preprocessing Example Programs1
9 pages
Weather Forecasting
No ratings yet
Weather Forecasting
5 pages
Advance Python
No ratings yet
Advance Python
5 pages
Computer: Supermarket Management System
No ratings yet
Computer: Supermarket Management System
11 pages
Ip 12
No ratings yet
Ip 12
5 pages
IP Project Sample
No ratings yet
IP Project Sample
15 pages
MLC Practical
No ratings yet
MLC Practical
51 pages
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
File No-1739517216MHE-032 Intelligent Transportion Systems
No ratings yet
File No-1739517216MHE-032 Intelligent Transportion Systems
2 pages
L1 Nutrition in Plants
No ratings yet
L1 Nutrition in Plants
4 pages
Fit India Letter
No ratings yet
Fit India Letter
2 pages
Student Notes-Greener Brominations
No ratings yet
Student Notes-Greener Brominations
9 pages
CMS Sample Paper - Class 9 Mathematics
No ratings yet
CMS Sample Paper - Class 9 Mathematics
9 pages
Model Code - XC-CPU101-C256K-8DI-6DO
No ratings yet
Model Code - XC-CPU101-C256K-8DI-6DO
6 pages
Control Panel Catalogue
No ratings yet
Control Panel Catalogue
20 pages
Operations Guide Baby-G Watch 5059
No ratings yet
Operations Guide Baby-G Watch 5059
4 pages
Tingari
No ratings yet
Tingari
62 pages
Alkohol Tata Nama
No ratings yet
Alkohol Tata Nama
4 pages
02 Decision Theory-Blockwood
No ratings yet
02 Decision Theory-Blockwood
5 pages
Maya
No ratings yet
Maya
3 pages
12th CHEM NAMING RXNS
No ratings yet
12th CHEM NAMING RXNS
43 pages
TX Topper Bi Filar
No ratings yet
TX Topper Bi Filar
1 page
ICSE Class 8 Maths Selina Solutions Chapter 7 Percent and Percentage
No ratings yet
ICSE Class 8 Maths Selina Solutions Chapter 7 Percent and Percentage
6 pages
Concepts of Probability
No ratings yet
Concepts of Probability
32 pages
Condensing Unit lbt2 q728 0y 2t
No ratings yet
Condensing Unit lbt2 q728 0y 2t
6 pages
A Word and Its Relatives: Derivation
No ratings yet
A Word and Its Relatives: Derivation
23 pages
Typhoon J-9918A 50738 - E - Manual
No ratings yet
Typhoon J-9918A 50738 - E - Manual
19 pages
Ess of Coal Mill-1 &2 - 1
No ratings yet
Ess of Coal Mill-1 &2 - 1
28 pages
Manual Instalare TRE4x4 TR135
No ratings yet
Manual Instalare TRE4x4 TR135
35 pages
Aditya Academy (Aass) Maths Class X
No ratings yet
Aditya Academy (Aass) Maths Class X
4 pages
Chapter 3 Part 2 - PVPrinciple
No ratings yet
Chapter 3 Part 2 - PVPrinciple
11 pages
Manufacturing Process of Chlorpyrifos TC
No ratings yet
Manufacturing Process of Chlorpyrifos TC
3 pages
Technical Specification
No ratings yet
Technical Specification
13 pages
Comparative Analysis of Field Oriented Control of BLDC Motor Using SPWM and SVPWM Techniques
No ratings yet
Comparative Analysis of Field Oriented Control of BLDC Motor Using SPWM and SVPWM Techniques
6 pages
Avalanche Rescue: Summary of Key Points
No ratings yet
Avalanche Rescue: Summary of Key Points
41 pages
Benjamin Franklin ° 1752 ° Michael Faraday ° 1831 °
No ratings yet
Benjamin Franklin ° 1752 ° Michael Faraday ° 1831 °
1 page
4 Practical Approaches To Minimize Voltage Drop Problems
No ratings yet
4 Practical Approaches To Minimize Voltage Drop Problems
6 pages

Split and Create Py File

Uploaded by

Split and Create Py File

Uploaded by

import os, sys

### combine parameter

### Combine ###

for file in all_parameters:

### Remove Duplicates ###

# remove false rows

col_index = int(input('Column True/False Index : '))

if not os.path.isdir(output_path) and output_path != '':

print('Total Rows -', len(Combine_data))

# Split BANKNIFTY data

no_of_param = int(input("BANKNIFTY Parameter No : "))

for idx, data in enumerate(np.array_split(bn_data, no_of_param)):

# Split NIFTY data

no_of_param = int(input("NIFTY Parameter No : "))

for idx, data in enumerate(np.array_split(nf_data, no_of_param)):

# Split FINNIFTY data

no_of_param = int(input("FINNIFTY Parameter No : "))

for idx, data in enumerate(np.array_split(fn_data, no_of_param)):

if input("create py files y/n ? : ") == "y":

### convert into py files

def prepend_line(file_name, line, name):

tempFile = open(code, 'r+')

for file in parameters:

You might also like