The date is used as the index, so it does not need to be normalized
This commit is contained in:
@@ -22,7 +22,7 @@ def pull():
|
|||||||
# Remove the ticker column
|
# Remove the ticker column
|
||||||
df.columns = df.columns.get_level_values(0)
|
df.columns = df.columns.get_level_values(0)
|
||||||
|
|
||||||
# Make sure Date is actually a Date Object
|
# Make sure Date is a number object
|
||||||
df = df.reset_index()
|
df = df.reset_index()
|
||||||
df['Date'] = pd.to_numeric(pd.to_datetime(df['Date']))
|
df['Date'] = pd.to_numeric(pd.to_datetime(df['Date']))
|
||||||
|
|
||||||
@@ -47,8 +47,7 @@ def pull():
|
|||||||
print("Processing data")
|
print("Processing data")
|
||||||
final_df = pd.concat(all_data)
|
final_df = pd.concat(all_data)
|
||||||
|
|
||||||
# Normalize the Date
|
# Make date the index so it doesn't influence the training
|
||||||
final_df['Date'] = (final_df['Date'] - final_df['Date'].min()) / (final_df['Date'].max() - final_df['Date'].min())
|
|
||||||
final_df.set_index('Date', inplace=True)
|
final_df.set_index('Date', inplace=True)
|
||||||
|
|
||||||
# Drop rows with null values
|
# Drop rows with null values
|
||||||
|
|||||||
Reference in New Issue
Block a user