forked from a-phung/BeaverHacks_Spring2021_Project
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathml.py
106 lines (76 loc) · 3.24 KB
/
ml.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import pandas_datareader as web
import datetime as dt
from sklearn.preprocessing import MinMaxScaler
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Dropout, LSTM
def delphi(ticker, future_date):
#load data
company = ticker
start = dt.datetime(2018,1,1)
end = dt.datetime(2020,1,1)
future_days = int(future_date)
data = web.DataReader(company, 'yahoo', start, end)
#prepare data
scaler = MinMaxScaler(feature_range = (0,1))
scaled_data = scaler.fit_transform(data['Adj Close'].values.reshape(-1,1))
#uses the adjusted close price
prediction_days = 100
x_train = []
y_train = []
for x in range(prediction_days, len(scaled_data)):
x_train.append(scaled_data[x-prediction_days:x,0])
y_train.append(scaled_data[x,0])
x_train = np.array(x_train)
y_train = np.array(y_train)
x_train = np.reshape(x_train, (x_train.shape[0], x_train.shape[1],1))
#print(len(x_train))
#build model (simple tree)
model = Sequential()
#https://www.tensorflow.org/api_docs/python/tf/keras/Sequential
model.add(LSTM(units = 50, return_sequences = True, input_shape = (x_train.shape[1],1)))
model.add(Dropout(0.2))
model.add(LSTM(units = 50, return_sequences = True))
model.add(Dropout(0.2))
model.add(LSTM(units = 50))
model.add(Dropout(0.2))
model.add(Dense(units = 1)) #prediction of next closing day
model.compile(optimizer = 'rmsprop', loss = 'mean_squared_error')
#fitting
model.fit(x_train, y_train, epochs = 50, batch_size = None)
print(model.summary())
#print(model.evaluate())
#model accuracy
test_start = dt.datetime(2020,1,1)
test_end = dt.datetime.now()
test_data = web.DataReader(company, 'yahoo', test_start, test_end)
actual_prices = test_data['Adj Close'].values
total_dataset = pd.concat((data['Adj Close'], test_data['Adj Close']), axis = 0)
model_inputs = total_dataset[len(total_dataset) - len(test_data) - prediction_days:].values
model_inputs = model_inputs.reshape(-1,1)
model_inputs = scaler.transform(model_inputs)
x_test = []
for x in range(prediction_days, len(model_inputs)):
x_test.append(model_inputs[x-prediction_days:x,0])
x_test = np.array(x_test)
x_test = np.reshape(x_test, (x_test.shape[0], x_test.shape[1], 1))
predicted_prices = model.predict(x_test, batch_size=None)
predicted_prices = scaler.inverse_transform(predicted_prices)
# make predictions on test data
real_data = [model_inputs[len(model_inputs) + future_days - prediction_days:len(model_inputs + future_days), 0]]
real_data = np.array(real_data)
real_data = np.reshape(real_data, (real_data.shape[0], real_data.shape[1], 1))
prediction = model.predict(real_data, batch_size=None)
prediction = scaler.inverse_transform(prediction)
print('prediction')
print(prediction)
#plotting
plt.plot(actual_prices, color = 'blue', label = 'Actual Price')
plt.plot(predicted_prices, color = 'red', label = 'Predicted Price')
plt.title('Share Price')
plt.xlabel('Time (days)')
plt.ylabel('Share Price (USD)')
plt.legend()
plt.show()