The date is an index, so it is not important
This commit is contained in:
@@ -22,7 +22,7 @@ def pull():
|
||||
# Remove the ticker column
|
||||
df.columns = df.columns.get_level_values(0)
|
||||
|
||||
# Make sure Date is actually a Date Object
|
||||
# Make sure Date is a number object
|
||||
df = df.reset_index()
|
||||
df['Date'] = pd.to_numeric(pd.to_datetime(df['Date']))
|
||||
|
||||
@@ -47,8 +47,7 @@ def pull():
|
||||
print("Processing data")
|
||||
final_df = pd.concat(all_data)
|
||||
|
||||
# Normalize the Date
|
||||
final_df['Date'] = (final_df['Date'] - final_df['Date'].min()) / (final_df['Date'].max() - final_df['Date'].min())
|
||||
# Make date the index so it doesn't influence the training
|
||||
final_df.set_index('Date', inplace=True)
|
||||
|
||||
# Drop rows with null values
|
||||
|
||||
Reference in New Issue
Block a user