
import polars as pl

import pathlib
from pathlib import Path, PurePath
import os
from datetime import datetime, time, timedelta
import pytz
from polars.exceptions import ComputeError
import torch
import torch.jit
import torch.nn as nn
import numpy as np
import pandas as pd
from typing import Optional
import plotly.graph_objects as go
import plotly.io as pio
from colorama import init, Fore, Back, Style

def setup_file_paths():
    # Directory where the script is located
    directory_script = Path(__file__).resolve().parent
    # Absolute script path
    absolute_path = PurePath(directory_script, Path(__file__).name)
    # Change the current working directory
    os.chdir(str(directory_script))
    return absolute_path

class CSVProcessor:
    """
    Summary:
        Class to process CSV files with a defined schema.

    Attributes:
        default_schema (dict): Default schema for the data.
        schema (dict): Schema used to process the data.
    """

    def __init__(self, csv_name: str, schema: dict = None) -> None:
        # Define a name for the csv database
        self.csv_name = csv_name
        # Define the complete file name for the csv database
        self.csv_file_name = f"{csv_name}.csv"
        # Define the complete file name for the main 1-minute csv database
        self.csv_main_file_name = f"{csv_name}_1m.csv"
        # Define the default schema (32-bit floats are cheaper than 64-bit)
        self.default_schema = {
            "Date": pl.String,
            "Open": pl.Float32,
            "High": pl.Float32,
            "Low": pl.Float32,
            "Close": pl.Float32,
        }
        # Main data frame holding the full 1-minute history
        self.df_1m = None
        # If no valid schema is provided, use the default schema
        if schema is not None and isinstance(schema, dict):
            self.schema = schema
        else:
            self.schema = self.default_schema
        # Verify the csv files exist, creating them if needed
        self.check_and_create_csv()
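
    # --- Hedged aside (added, not in the original) --------------------- #
    # Example of overriding the default schema at construction time. The
    # column names must match the generated csv headers; the Float64 types
    # below are illustrative, not a recommendation from the author:
    #
    # custom_schema = {
    #     "Date": pl.String, "Open": pl.Float64, "High": pl.Float64,
    #     "Low": pl.Float64, "Close": pl.Float64,
    # }
    # xauusd = CSVProcessor(csv_name="XAUUSD", schema=custom_schema)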

    def validate_input(self):
        # Check if the input data is valid
        pass

    def csv_processor(
        self,
        show: bool = False,
        return_tensor: bool = False,
        start_date: str = None,
        end_date: str = None,
        generate_csv_file: bool = False,
    ) -> tuple[pl.DataFrame, Optional[torch.Tensor]]:
        """Process a CSV file and optionally return a Polars DataFrame and a
        PyTorch tensor.

        Args:
            show (bool, optional): Show the data frame. Defaults to False.
            return_tensor (bool, optional): Return a tensor. Defaults to False.
            start_date (str, optional): Start date for the selection (format:
                "YYYY-MM-DD"). Defaults to None.
            end_date (str, optional): End date for the selection (format:
                "YYYY-MM-DD"). Defaults to None.
            generate_csv_file (bool, optional): Write the result to the main
                1-minute csv file. Defaults to False.

        Returns:
            tuple[pl.DataFrame, Optional[torch.Tensor]]: A Polars data frame
            and, if requested, a tensor.

        Example:
            >>> df, tensor = csv_processor(show=True, start_date="2019-01-07",
            ...                            end_date="2019-01-08")
        """
        try:
            # Load the CSV as a LazyFrame
            df = pl.scan_csv(self.csv_file_name, has_header=False)

            # Convert str to datetime
            df = df.with_columns(
                [
                    pl.col("column_1")
                    .str.strptime(pl.Date, "%Y.%m.%d")
                    .alias("column_1"),
                    pl.col("column_2")
                    .str.strptime(pl.Time, "%H:%M")
                    .alias("column_2"),
                ]
            )
            df = df.with_columns(
                pl.col("column_1").dt.combine(pl.col("column_2")).alias("column_1")
            )

            # First, interpret the column as America/Lima time zone (UTC-5).
            df = df.with_columns(
                pl.coalesce("column_1").dt.replace_time_zone("America/Lima")
            )

            # Second, convert the column to the New York time zone, which
            # observes daylight saving time (UTC-4 in summer, UTC-5 in winter).
            df = df.with_columns(
                pl.col("column_1").dt.convert_time_zone("America/New_York")
            )

            # Finally, delete the unnecessary columns
            df = df.drop(["column_2", "column_7"])

            # Rename the columns
            df = df.rename(
                {
                    "column_1": "Date",
                    "column_3": "Open",
                    "column_4": "High",
                    "column_5": "Low",
                    "column_6": "Close",
                }
            )
            # Convert the date strings to time-zone-aware datetimes
            if start_date is not None:
                start_date = datetime.strptime(start_date, "%Y-%m-%d").astimezone(
                    pytz.timezone("America/New_York")
                )
            if end_date is not None:
                end_date = datetime.strptime(end_date, "%Y-%m-%d").astimezone(
                    pytz.timezone("America/New_York")
                )
            # Filter the table by start and end date; each bound is optional,
            # so apply them independently
            if start_date is not None:
                df = df.filter(pl.col("Date") >= start_date)
            if end_date is not None:
                df = df.filter(pl.col("Date") <= end_date)

            # Materialize (convert the lazy frame into a data frame)
            df = df.collect()
            if return_tensor is True:
                # Convert the 'Date' column to a number (timestamp)
                df_int = df.with_columns(
                    pl.col("Date").cast(pl.Int64)  # Int64 cast yields the timestamp
                )
                df_tensor = df_int.to_torch(return_type="tensor")
                torch.set_printoptions(sci_mode=False)
            else:
                df_tensor = None
            if show is True:
                print(df.shape)
                print(
                    "\nData frame:\n",
                    df,
                    "\nData frame converted to tensor:\n",
                    df_tensor,
                )
            if generate_csv_file is True:
                # Define the path of the CSV file
                path = pathlib.Path(self.csv_main_file_name)
                # Write a text-formatted copy so the file keeps a plain 'Date'
                # format while the returned frame keeps real datetimes
                df_out = df.with_columns(
                    pl.col("Date").dt.to_string("%Y-%m-%d %H:%M:%S").alias("Date")
                )
                df_out.write_csv(path)

            return df, df_tensor

        except ComputeError:
            print("Error when making transformations")
            return None
        except (FileNotFoundError, OSError) as e:
            print(f"Error loading CSV: {e}")
            return None
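
    # --- Hedged aside (added, not in the original) --------------------- #
    # The two time-zone steps in csv_processor behave differently:
    #   * replace_time_zone("America/Lima") re-labels the naive timestamps
    #     as Lima wall-clock time (UTC-5, no DST) without shifting them;
    #   * convert_time_zone("America/New_York") then shifts each instant to
    #     New York wall-clock time, which does observe DST.
    # A minimal sketch of the same idea with plain datetimes and pytz:
    #
    # lima = pytz.timezone("America/Lima")
    # new_york = pytz.timezone("America/New_York")
    # t = lima.localize(datetime(2019, 7, 1, 9, 0))  # 09:00 in Lima (UTC-5)
    # print(t.astimezone(new_york))                  # 10:00 in New York (EDT)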

    def group_and_write_csv_by(self, time_frame: str | list):
        """Group 1-minute candles into one or more larger time frames and
        write each result to its own csv file.

        Args:
            time_frame (str | list): Time frame(s), like '5m', '10m', '15m',
                '1h', etc.

        Example:
            >>> group_and_write_csv_by('5m')  # 5-minute candlesticks
            >>> group_and_write_csv_by('1h')  # 1-hour candlesticks
        """
        # Make sure the 1-minute history is available (scan it lazily if this
        # method is reached before the main data frame was loaded)
        if self.df_1m is None:
            self.df_1m = self.scan_csv("1m")

        # Group 1-minute candles to create x-minute candles and write them to
        # a csv file
        def write_csv_time_frame():
            # Transform 1-minute Japanese candlesticks to the specified time frame
            df_grouped = (
                self.df_1m.lazy()
                .group_by(
                    # Round the timestamp of each 1-minute candle down to the
                    # start of the nearest interval, then group by interval
                    pl.col("Date").dt.truncate(time_frame)
                )
                .agg(
                    [
                        pl.first("Open").alias("Open"),  # Open of the group's first candle
                        pl.max("High").alias("High"),  # Maximum of the group
                        pl.min("Low").alias("Low"),  # Minimum of the group
                        pl.last("Close").alias("Close"),  # Close of the group's last candle
                    ]
                )
                .sort("Date")  # Sort by the truncated interval
            )

            # To avoid wrong formats in the 'Date' column, time is converted to text
            df_grouped = df_grouped.with_columns(
                pl.col("Date").dt.to_string("%Y-%m-%d %H:%M:%S").alias("Date")
            )
            # Materialize the lazy frame
            df_grouped = df_grouped.collect()
            # Create a csv file by writing the data frame
            df_grouped.write_csv(pathlib.Path(f"{self.csv_name}_{time_frame}.csv"))

        # If it is a str, call once; if it is a list, call as needed
        if isinstance(time_frame, str):
            write_csv_time_frame()
        elif isinstance(time_frame, list):
            # Iterate through the list of time frames to create the csv files
            for tm in time_frame:
                # If the file already exists, skip it
                if os.path.exists(f"{self.csv_name}_{tm}.csv"):
                    print(f"{self.csv_name}_{tm}.csv already exists, pass...")
                # If it does not exist, create it
                else:
                    self.group_and_write_csv_by(tm)
                    print(f"{self.csv_name}_{tm}.csv successfully created...")

    def check_and_create_csv(self) -> None:
        """Check whether the main 1-minute CSV file exists and, if it does
        not, create it together with the common time frames."""
        # If the 1-minute candlestick csv file exists, there is nothing to do
        if os.path.exists(self.csv_main_file_name):
            pass
        # If it does not exist, create it and the common time frames
        else:
            # Step 1: Create the 1-minute candlestick csv file
            self.df_1m, _ = self.csv_processor(
                show=False, return_tensor=False, generate_csv_file=True
            )
            # Step 2: Create the common time frames (group by time frame and
            # write the principal csv files)
            self.group_and_write_csv_by(["5m", "10m", "15m", "30m", "1h", "4h", "1d"])

    def scan_csv(
        self, time_frame, materialize: bool = False
    ) -> pl.LazyFrame | pl.DataFrame:
        """Scan a CSV file and return a LazyFrame or a DataFrame.

        Args:
            time_frame (str): Time frame of the file to scan, like '1m' or '5m'.
            materialize (bool, optional): If True, return a materialized
                DataFrame. Defaults to False.

        Returns:
            pl.LazyFrame | pl.DataFrame: A LazyFrame if materialize is False,
            or a DataFrame if materialize is True.
        """
        # File name that will be scanned when the function is called
        csv_file_name = f"{self.csv_name}_{time_frame}.csv"

        def scan():
            # Headers: Date,Open,High,Low,Close
            # The schema (one data type per column) is set explicitly for
            # greater scanning efficiency
            df = pl.scan_csv(
                csv_file_name, has_header=True, schema_overrides=self.schema
            )
            # Convert text to datetime
            df = df.with_columns(
                pl.col("Date")
                .str.strptime(pl.Datetime, format="%Y-%m-%d %H:%M:%S")
                .alias("Date")
            )
            return df

        # If the file does not exist yet, create it first, then scan it
        if not os.path.exists(csv_file_name):
            self.group_and_write_csv_by(time_frame)
        df = scan()
        if materialize is True:
            df = df.collect()
        return df
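
# --- Added usage sketch (not in the original script) ----------------------- #
# A minimal illustration of how CSVProcessor might be driven on its own. The
# ticker name and date range are illustrative placeholders; the raw
# "XAUUSD.csv" export is assumed to have the column layout handled by
# csv_processor() above.
def example_csv_processor_usage():
    processor = CSVProcessor(csv_name="XAUUSD")
    # Build the 1-minute base and also get a tensor view of it
    df, tensor = processor.csv_processor(
        show=True,
        return_tensor=True,
        start_date="2019-01-07",
        end_date="2019-01-08",
    )
    # Scan a derived time frame lazily and materialize it
    df_5m = processor.scan_csv(time_frame="5m", materialize=True)
    return df, tensor, df_5m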

# This class is in charge of the exploratory analysis of the data (EDA).
class DataExplorer:
    pass


# This class deals with the analysis of fundamental news.
class FinancialNewsAnalyzer:
    pass

# This class stores all trading strategies.
class StrategyFactory:

    def __init__(self):
        self.check_format()

    def check_format(self):
        # Check if the format of the output is correct
        pass

    def strategy_1(
        self,
        df: pl.LazyFrame,
        entry_time: str = "8:00",
        order: str = "buy",
        tp: int = 10,
        sl: int = 2,
        limit_time: str = "13:00:00",
        lot_size: float = 0.05,
    ) -> pl.DataFrame:
        # Parse the entry time
        try:
            hours, minutes = map(int, entry_time.split(":"))
        except ValueError as exc:
            raise ValueError(f"The format of entry_time must be 'HH:MM'. {exc}") from exc
        # Get the data frame filtered by time
        df = df.filter(
            (pl.col("Date").dt.hour() == hours)
            & (pl.col("Date").dt.minute() == minutes)
        )
        # Rename the column
        df = df.rename(
            {
                "Date": "entry_time",
            }
        )
        # Get tp and sl
        df = df.with_columns(
            [
                (pl.col("High") + int(tp)).alias("tp"),
                (pl.col("Low") - int(sl)).alias("sl"),
            ]
        )

        # =================================================================== #
        # This part gets the max and min values; do not delete this logic,
        # just optimize it.
        # =================================================================== #

        # Materialize the lazy frame because a LazyFrame has no 'transpose'
        # method but a DataFrame does
        df = df.collect()

        # Get the max and min columns
        df = df.with_columns(
            df.select(["tp", "sl"])
            .transpose()
            .max()
            .transpose()
            .to_series()
            .alias("max"),
            df.select(["tp", "sl"])
            .transpose()
            .min()
            .transpose()
            .to_series()
            .alias("min"),
        )

        # Delete unnecessary columns
        df = df.drop(["High", "Low", "Close"])

        # =================================================================== #
        # This part sets the time limit of the operation (extremely important
        # to avoid excessive RAM consumption in later filters).
        # =================================================================== #
        hour, minute, second = limit_time.split(":")
        # Create the Date_max column
        df = df.with_columns(
            pl.datetime(
                pl.col("entry_time").dt.year(),
                pl.col("entry_time").dt.month(),
                pl.col("entry_time").dt.day(),
                int(hour),  # new hour
                int(minute),  # new minute
                int(second),  # new second
            ).alias("Date_max")
        )
        return df
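
    # --- Hedged aside (added, not in the original) --------------------- #
    # The transpose trick above forces an early .collect(). Recent Polars
    # versions provide row-wise reducers that stay lazy; if available, the
    # same 'max'/'min' columns could be built with:
    #
    # df = df.with_columns(
    #     pl.max_horizontal("tp", "sl").alias("max"),
    #     pl.min_horizontal("tp", "sl").alias("min"),
    # )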

    def strategy_2(
        self,
        df: pl.LazyFrame,
        lower_time_limit: str = "8:00",
        upper_time_limit: str = "13:00",
        min_candle_body: int = 2,
        tp: int = 10,
        sl: int = 3,
    ):
        # Parse the time limits
        try:
            lower_time_limit = datetime.strptime(lower_time_limit, "%H:%M").time()
            upper_time_limit = datetime.strptime(upper_time_limit, "%H:%M").time()
        except ValueError as exc:
            raise ValueError(f"The format of time must be 'HH:MM'. {exc}") from exc
        # Create a Time column to filter by
        df = df.with_columns(pl.col("Date").dt.time().alias("Time"))

        # Get the data frame filtered by time
        df = df.filter(
            (pl.col("Time") >= lower_time_limit)
            & (pl.col("Time") <= upper_time_limit)
        )
        # Create a candle_body column to filter by
        df = df.with_columns(
            abs(pl.col("Open") - pl.col("Close")).round(0).alias("candle_body")
        )
        # ======= Get the first candle of each day with a minimum body ======= #
        # Keep only candles larger than 'min_candle_body'
        dates = df.filter(pl.col("candle_body") >= min_candle_body)
        # Create a new column called 'Date_only' without the time
        dates = dates.with_columns(pl.col("Date").dt.date().alias("Date_only"))
        # Keep only the first candle of each day greater than 'min_candle_body'
        dates = (
            dates.group_by("Date_only")  # Group by 'Date_only'
            .agg(pl.col("Date").first())  # Get the first time of the day
            .sort("Date")  # Order by the Date column
            .select("Date")  # Select only the Date column
        )
        # Add 5 minutes because the entry is at the close of the candle with
        # the specified minimum number of pips
        dates = dates.with_columns((pl.col("Date") + pl.duration(minutes=5)))
        # Filter the original dataframe by those dates
        df = df.join(dates, on="Date", how="inner")
        # Delete unnecessary columns (time will no longer be used)
        df = df.drop(["Time", "candle_body"])
        # Get the take profit
        df = df.with_columns(
            pl.when(pl.col("Open") < pl.col("Close"))
            .then(pl.col("Open") + tp)  # Buy order
            .otherwise(pl.col("Open") - tp)  # Sell order
            .alias("tp")
        )
        # Get the stop loss
        df = df.with_columns(
            pl.when(pl.col("Open") > pl.col("Close"))
            .then(pl.col("Open") + sl)  # Sell order: stop above the entry
            .otherwise(pl.col("Open") - sl)  # Buy order: stop below the entry
            .alias("sl")
        )

        df = df.select(["Date", "Open", "tp", "sl"])

        # =================================================================== #
        # This part gets the max and min values; do not delete this logic,
        # just optimize it.
        # =================================================================== #

        # Materialize the lazy frame because a LazyFrame has no 'transpose'
        # method but a DataFrame does
        df = df.collect()

        # Get the max and min columns
        df = df.with_columns(
            df.select(["tp", "sl"])
            .transpose()
            .max()
            .transpose()
            .to_series()
            .alias("max"),
            df.select(["tp", "sl"])
            .transpose()
            .min()
            .transpose()
            .to_series()
            .alias("min"),
        )

        # =================================================================== #
        # This part sets the time limit of the operation (extremely important
        # to avoid excessive RAM consumption in later filters).
        # =================================================================== #
        # Get the Date_max column
        df = df.with_columns(
            pl.col("Date")
            .dt.date()  # Extract only the date from the 'Date' column
            .cast(pl.Datetime)  # Convert to datetime
            .dt.offset_by(
                f"{upper_time_limit.hour}h{upper_time_limit.minute}m"
            )  # Add the time stored in the variable
            .alias("Date_max")  # New column with the resulting datetime
        )

        # Rename the column
        df = df.rename(
            {
                "Date": "entry_time",
            }
        )

        return df
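
    # --- Hedged aside (added, not in the original) --------------------- #
    # The group_by("Date_only").agg(pl.col("Date").first()) step keeps one
    # row per day: the earliest candle whose body passed the filter (this
    # relies on the frame being in chronological order). A toy illustration
    # with invented data:
    #
    # toy = pl.DataFrame({
    #     "Date_only": ["2019-01-07", "2019-01-07", "2019-01-08"],
    #     "Date": ["08:05", "09:10", "08:20"],
    # })
    # toy.group_by("Date_only").agg(pl.col("Date").first())
    # # -> one row per Date_only, keeping 08:05 and 08:20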

    def strategy_3(self):
        pass

    # ...

# This class is in charge of performing historical back testing.
class BackTesting:
    def __init__(self):
        self.validate_format()

    def validate_format(self):
        """Validate the format of the input data."""
        # Check if the input data is in the correct format
        pass

    # Make back testing using the CPU
    def back_tester_cpu(self, parameters, df_1m):
        """Perform back testing using the CPU.

        Args:
            parameters (pl.DataFrame): Parameters of the trades to review.
            df_1m (pl.DataFrame): The 1-minute database.
        """
        # Declare variables
        entry_time = parameters["entry_time"]
        max_v = parameters["max"]
        min_v = parameters["min"]
        date_max = parameters["Date_max"]
        max_db = df_1m["High"]
        min_db = df_1m["Low"]
        # List for storing the one-row data frames
        data_frames = []
        # Loop to find the closing date of each trade
        for entry_time_i, max_i, min_i, date_max_i, _max_db_i, _min_db_i in zip(
            entry_time, max_v, min_v, date_max, max_db, min_db
        ):
            # In this section, three filters are applied
            # Select only the necessary columns
            df_1m_limits = df_1m.select(["Date", "High", "Low"])
            # First, filter the database by time
            df_filtered_by_time = df_1m_limits.filter(
                (pl.col("Date") >= entry_time_i) & (pl.col("Date") <= date_max_i)
            )
            # Second, filter the database by high and low
            df = df_filtered_by_time.filter(
                (pl.col("High") >= max_i) | (pl.col("Low") <= min_i)
            )
            # Third, keep only the first row that fulfils the condition
            df = df.head(1)
            # If empty, close the order at the maximum time limit
            if df.is_empty():
                df = df_filtered_by_time.select(pl.all().last())
            # Fourth, store the one-row data frame in the list
            data_frames.append(df)
        # Join the data frames
        df_concat = pl.concat(data_frames)
        # Rename
        df_concat = df_concat.rename(
            {
                "Date": "exit_time",
            }
        )
        # Concatenate both data frames and delete the unnecessary column
        df_concat = pl.concat([parameters, df_concat], how="horizontal").drop(
            "Date_max"
        )

        # Get the close price
        df_concat = df_concat.with_columns(
            pl.when(pl.col("High") >= pl.col("max"))
            .then(pl.col("max"))  # max is the tp if buying but the sl if selling
            .otherwise(pl.col("min"))  # min is the sl if buying but the tp if selling
            .alias("close_price")
        )
        # Get the order type
        df_concat = df_concat.with_columns(
            pl.when(pl.col("tp") > pl.col("sl"))
            .then(pl.lit("buy"))
            .otherwise(pl.lit("sell"))
            .alias("max")
        )
        df_concat = df_concat.rename(
            {
                "max": "type",  # Rename the column
            }
        )
        # Drop unnecessary columns
        df_concat = df_concat.drop(["High", "Low", "min"])

        # Get the utility (profit or loss) of each trade
        df_concat = df_concat.with_columns(
            pl.when(
                (
                    (pl.col("type") == pl.lit("buy"))
                    & (pl.col("close_price") > pl.col("Open"))
                )
                | (
                    (pl.col("type") == pl.lit("sell"))
                    & (pl.col("close_price") < pl.col("Open"))
                )
            )
            .then(abs(pl.col("Open") - pl.col("tp")))
            .otherwise(-abs(pl.col("Open") - pl.col("sl")))
            .alias("utility")
        )
        # Profit accumulation
        df_concat = df_concat.with_columns(
            pl.col("utility")
            .cum_sum()
            .alias("Cumulative_utility")  # Calculate the cumulative sum
        )
        return df_concat
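
    # --- Hedged usage sketch (added, not in the original) -------------- #
    # The expected call shape, assuming 'parameters_1' is the collected
    # output of StrategyFactory.strategy_1 and 'df_1m' the materialized
    # 1-minute history (see main() below):
    #
    # bt = BackTesting()
    # results = bt.back_tester_cpu(parameters=parameters_1, df_1m=df_1m)
    # print(results.select(["entry_time", "exit_time", "type", "utility"]))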

    # Make back testing using the GPU (faster than the CPU)
    def back_tester_GPU(self, parameters, df_1m):
        """Perform back testing using the GPU (not implemented yet).

        Args:
            parameters (pl.DataFrame): Parameters of the trades to review.
            df_1m (pl.DataFrame): The 1-minute database.
        """
        # <==============================================================>#
        # <==================== GPU BACKTESTER ==========================>#
        # <==============================================================>#
        pass

# This class is in charge of data visualization.
class DataVisualizer:
    def __init__(self):
        self.logo_ASCII()
        init()  # colorama

    # This is just for decorative purposes
    def logo_ASCII(self):
        """Display the logo of the application."""
        # Gold / Dollar
        print(Fore.YELLOW)
        print("<================================================>")
        print("██╗ ██╗ █████╗ ██╗ ██╗██╗ ██╗███████╗██████╗")
        print("╚██╗██╔╝██╔══██╗██║ ██║██║ ██║██╔════╝██╔══██╗")
        print(" ╚███╔╝ ███████║██║ ██║██║ ██║███████╗██║ ██║")
        print(" ██╔██╗ ██╔══██║██║ ██║██║ ██║╚════██║██║ ██║")
        print("██╔╝ ██╗██║ ██║╚██████╔╝╚██████╔╝███████║██████╔╝")
        print("╚═╝ ╚═╝╚═╝ ╚═╝ ╚═════╝ ╚═════╝ ╚══════╝╚═════╝")
        print("<============= by Joel Pasapera ================>")
        print(Style.RESET_ALL)

    def new_function(self):
        print("Here will be a new function")

    def write_csv(
        self, df: pl.DataFrame, file_name: str = "back_test", show: bool = False
    ) -> None:
        """Write a DataFrame to a CSV file.

        Args:
            df (pl.DataFrame): Dataframe to be written into the CSV file.
            file_name (str, optional): Name of the output CSV file. Defaults
                to "back_test".
            show (bool, optional): Show the results. Defaults to False.
        """
        # < ============================================================>#
        # <==================== SAVE IN CSV FILE =======================>#
        # < ============================================================>#
        # To avoid wrong formats in the date columns, time is converted to text
        df = df.with_columns(
            pl.col(["entry_time", "exit_time"]).dt.to_string("%Y-%m-%d %H:%M:%S")
        )
        # Generate the path
        csv_path = f"{file_name}.csv"
        # Create a csv file by writing the data frame
        df.write_csv(pathlib.Path(csv_path))
        if show is True:
            print(f"Data saved in {csv_path}")
            print(df)

    def save_graph_as_png(
        self,
        df: pl.DataFrame,
        file_name: str = "chart",
        title: str = "Graph",
        x_title: str = "exit_time",
        y_title: str = "Cumulative_utility",
    ) -> None:
        """Plot a dataframe column and save the figure as a PNG file.

        Args:
            df (pl.DataFrame): Dataframe to be graphed and saved as a png file.
            file_name (str, optional): Name of the output png file. Defaults
                to "chart".
            title (str, optional): Title of the graph. Defaults to "Graph".
            x_title (str, optional): Name of the dataframe column used as the
                x axis. Defaults to "exit_time".
            y_title (str, optional): Name of the dataframe column used as the
                y axis. Defaults to "Cumulative_utility".
        """
        # < ============================================================>#
        # < =============== SAVE UTILITY IN PNG FILE ===================>#
        # < ============================================================>#
        # Create the figure
        fig = go.Figure(
            go.Scatter(
                x=df[x_title],
                y=df[y_title],
                mode="lines",
                name=title,
            )
        )

        # Update the design of the graph (optional)
        fig.update_layout(
            title=title,
            xaxis_title=x_title,
            yaxis_title=y_title,
            plot_bgcolor="white",
        )
        # Save the graph with a png extension, e.g. profitability_chart.png
        image_path = f"{file_name}.png"
        pio.write_image(fig, image_path)
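
    # --- Hedged note (added, not in the original) ----------------------- #
    # pio.write_image delegates static-image export to a separate engine; in
    # current Plotly versions this requires the 'kaleido' package
    # (pip install kaleido), otherwise the call fails at runtime.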

# This class evaluates technical aspects of a trading strategy, such as
# performing Monte Carlo tests and obtaining metrics such as profit factor
# and win rate.
class StrategyEvaluator:
    def __init__(self, df):
        self.df = df
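
    # --- Hedged sketch (added, not in the original) --------------------- #
    # One possible metrics helper, assuming self.df is a back-test result
    # with the 'utility' column produced by BackTesting.back_tester_cpu:
    #
    # def basic_metrics(self) -> dict:
    #     wins = self.df.filter(pl.col("utility") > 0)["utility"]
    #     losses = self.df.filter(pl.col("utility") < 0)["utility"]
    #     gross_profit = wins.sum() or 0.0
    #     gross_loss = abs(losses.sum() or 0.0)
    #     return {
    #         "win_rate": len(wins) / max(len(self.df), 1),
    #         "profit_factor": gross_profit / gross_loss if gross_loss else float("inf"),
    #     }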

# This class runs back testing with millions of different parameter
# combinations until the right strategy is found.
class IntensiveBackTesting:
    def __init__(self, df, strategy, risk_management, data_visualizer, strategy_eval):
        self.df = df
        self.strategy = strategy
        self.risk_management = risk_management
        self.data_visualizer = data_visualizer
        self.strategy_eval = strategy_eval

# This is the main function
def main():
    # Run everything from the same location as this script
    setup_file_paths()
    # Create an instance of the data visualizer
    view = DataVisualizer()
    # Create an object 'xauusd' which represents the gold data
    xauusd = CSVProcessor(csv_name="XAUUSD")
    # Create lazy frames (pl.LazyFrame) for xauusd
    df_1m = xauusd.scan_csv(time_frame="1m")  # 1-minute (1m) candlestick
    df_5m = xauusd.scan_csv(time_frame="5m")  # 5-minute (5m) candlestick
    # Get the parameters of each strategy
    get_parameters = StrategyFactory()
    # Strategy 1
    parameters_1 = get_parameters.strategy_1(df_1m)
    # Strategy 2
    parameters_2 = None
    # Materialize before running the back testing (THIS IS MANDATORY)
    df_1m = df_1m.collect()
    # Run the back testing
    review = BackTesting()
    review.back_tester_cpu(parameters=parameters_1, df_1m=df_1m)
    # Show results
    view.new_function()

# This is the test variant of the main function
def main_test():
    # Run everything from the same location as this script
    setup_file_paths()
    # Create an instance of the data visualizer
    view = DataVisualizer()
    # Create an object 'xauusd' which represents the gold data
    xauusd = CSVProcessor(csv_name="XAUUSD")
    # Create lazy frames (pl.LazyFrame) for xauusd
    df_1m = xauusd.scan_csv(time_frame="1m")  # 1-minute (1m) candlestick
    df_5m = xauusd.scan_csv(time_frame="5m")  # 5-minute (5m) candlestick
    # Get the parameters of each strategy
    get_parameters = StrategyFactory()
    # Strategy 2
    parameters_2 = get_parameters.strategy_2(df_5m)
    # Materialize before running the back testing (THIS IS MANDATORY)
    df_1m = df_1m.collect()
    # Run the back testing
    review = BackTesting()
    review.back_tester_cpu(parameters=parameters_2, df_1m=df_1m)
    # Show results
    view.new_function()


if __name__ == "__main__":
    main_test()
