# StockSaint/basic.py at main · 1Bit-Developers/StockSaint · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
import subprocess
import sys

# try:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import mplcyberpunk


#     # import seaborn as sns
#     # from sklearn.metrics import r2_score, median_absolute_error, mean_absolute_error
#     # from sklearn.metrics import median_absolute_error, mean_squared_error, mean_squared_log_error
#     # from scipy.optimize import minimize
#     # import statsmodels.tsa.api as smt
#     # import statsmodels.api as sm
#     # from tqdm import tqdm_notebook
#     # from itertools import product
#
# except ImportError:
#     subprocess.check_call([sys.executable, "-m", "pip", "install", 'pandas'])
#     subprocess.check_call([sys.executable, "-m", "pip", "install", 'numpy'])
#     subprocess.check_call([sys.executable, "-m", "pip", "install", 'matplotlib'])
#     subprocess.check_call([sys.executable, "-m", "pip", "install", 'mplcyberpunk'])
#     # subprocess.check_call([sys.executable, "-m", "pip", "install", 'seaborn'])
#     # subprocess.check_call([sys.executable, "-m", "pip", "install", 'sklearn'])
#     # subprocess.check_call([sys.executable, "-m", "pip", "install", 'scipy'])
#     # subprocess.check_call([sys.executable, "-m", "pip", "install", 'statsmodels'])
#     # subprocess.check_call([sys.executable, "-m", "pip", "install", 'tqdm'])
#     # subprocess.check_call([sys.executable, "-m", "pip", "install", 'itertools'])
#
# finally:
#     import pandas as pd
#     import numpy as np
#     import matplotlib.pyplot as plt
#     import mplcyberpunk
#     # import seaborn as sns
#     # from sklearn.metrics import r2_score, median_absolute_error, mean_absolute_error
#     # from sklearn.metrics import median_absolute_error, mean_squared_error, mean_squared_log_error
#     # from scipy.optimize import minimize
#     # import statsmodels.tsa.api as smt
#     # import statsmodels.api as sm
#     # from tqdm import tqdm_notebook
#     # from itertools import product


# Getting the data in string format from NodeJS.
# NodeJS passes the CSV payload as the first command-line argument (sys.argv[1]).
data = sys.argv[1]

# Split the payload into rows of fields.
# - Stripping a trailing '\r' makes parsing independent of the line-ending
#   style ("\n" or "\r\n"), so the header names never carry a stray '\r'.
# - Skipping blank lines removes the empty record produced by a trailing
#   newline without relying on it sitting at a fixed row index.
rows = [line.rstrip('\r').split(',') for line in data.split('\n') if line.strip()]
if not rows:
    raise ValueError("No CSV data supplied in sys.argv[1]")

# Creating a pandas DataFrame: the first row is the header, the rest are records.
my_data_new = pd.DataFrame(rows[1:], columns=rows[0])

# Rearranging and cleaning the data.
# These two columns are not used by the rest of the script; errors='ignore'
# keeps the script working for payloads that do not contain them.
my_data_new = my_data_new.drop(
    columns=['dividend_amount', 'split_coefficient'], errors='ignore'
)
my_data_new = my_data_new.iloc[::-1].reset_index(drop=True)   # reverse all rows

# Converting the data type of each column (close, high, low etc.) from "object"
# to numeric. Assigning by column label replaces the column, so the new dtype
# is actually stored.
for column in my_data_new.columns:
    try:
        my_data_new[column] = pd.to_numeric(my_data_new[column])
    except (ValueError, TypeError):
        # Deliberate: columns that cannot be parsed as numbers (e.g. the
        # timestamp strings) are left unchanged.
        pass

# Important Functions
# 1) Mean absolute percentage error (MAPE) between the true and the predicted values
def mean_absolute_percentage_error(y_true, y_pred):
    """Return the mean of |(y_true - y_pred) / y_true|, expressed as a percentage."""
    relative_error = (y_true - y_pred) / y_true
    absolute_error = np.abs(relative_error)
    return np.mean(absolute_error) * 100

# 2) Rolling (moving) average of a series
def plot_moving_average(series, window, my_name):
    """Return the rolling mean of ``series`` taken over ``window`` consecutive points.

    series: pandas object exposing ``rolling`` (e.g. one DataFrame column).
    window: window size handed to ``rolling``.
    my_name: accepted for call compatibility; this function does not use it.

    Despite its name, this function draws nothing: it only returns the
    rolling-mean values so the caller can plot them and finish the prediction.
    """
    return series.rolling(window).mean()

def gen_my_plot(prediction, original, my_name, my_technique_label):
    """Draw the prediction curve and the actual values on one figure and save it.

    prediction: values plotted against ``my_data_new.timestamp`` (green, 'o' markers).
    original: actual values, passed on their own to ``plt.plot`` (red, 'D' markers).
    my_name: name of the market dynamic; 'volume' selects the volume y-label,
        anything else a price label whose currency depends on ``sys.argv[2]``.
        It is also embedded in the output file name.
    my_technique_label: legend label for the prediction curve.

    The figure is written to /tmp/fig_basic_prediction_<my_name>.png.
    """
    plt.figure(figsize=(20, 10))

    # Prediction first, then the actual data, both on the same axes.
    plt.plot(my_data_new.timestamp, prediction, marker='o', label=my_technique_label, color='green')
    plt.plot(original, label='Actual values', marker='D', color='red')

    tick_positions = np.arange(0, 100, step=10)  # label locations on the x-axis
    plt.xticks(tick_positions)
    plt.tick_params(labelsize=12)
    plt.legend(loc='best')
    plt.grid(True)
    plt.xlabel('TIMESTAMP', fontsize=15)

    if my_name != 'volume':
        # Prices are labelled in rupees for the BSE exchange, dollars otherwise.
        currency_suffix = " (in Rs.)" if sys.argv[2] == 'BSE' else " (in $)"
        plt.ylabel('PRICES' + currency_suffix, fontsize=15)
    else:
        plt.ylabel('VOLUME (in Units)')

    plt.legend()
    mplcyberpunk.add_glow_effects()

    plt.savefig("/tmp/fig_basic_prediction_" + my_name + '.png')

# 3) Prediction function for the Market Dynamic
# The caller passes the 2nd-last point (x1, y1) and the last point (x2, y2) and
# asks for the value at X = x2 + 1. Any X can be used, but the further X lies
# from the two points, the larger the expected error.
def my_prediction(x1, y1, x2, y2, X):
    """Extend the straight line through (x1, y1) and (x2, y2) to ``X``.

    Returns a tuple ``(y, slope)``: the line's value at ``X`` and its slope.
    """
    rise = y2 - y1
    run = x2 - x1
    gradient = rise / run
    return y1 + gradient * (X - x1), gradient

# 4) Market Mood Predicting Function
# Maps the slope between the last 2 rolling-mean values to the Up / Down
# direction of the prediction plot.
def mood(slope):
    """Return "Up" when ``slope`` is zero or positive, otherwise "Down"."""
    return "Up" if slope >= 0 else "Down"

# Number of rows and columns in the DataFrame; the row count fixes the
# x-positions of the last two rolling-mean points used for the prediction.
r, c = my_data_new.shape

# Final result: "<predicted value>%<mood>%" appended once per market dynamic.
result_prediction = ""

# ===============================   Generating Prediction FOR BASIC USER ===========================
window = 3
plot_technique = "moving_average"
plt.style.use("cyberpunk")
pleasePlot = ["close", "open"]

# Supported market dynamics (DataFrame column names) mapped to the name used
# in the generated figure file names.
_FIGURE_NAMES = {"open": "opening", "close": "closing"}


def _plot_original(series, my_name):
    """Plot the raw ``series`` and save it to /tmp/fig_basic_<my_name>.png."""
    plt.figure(figsize=(20, 10))
    plt.plot(my_data_new.timestamp, series, marker='d', color='red')
    plt.xticks(np.arange(0, 100, step=10))  # Set label locations.
    plt.tick_params(labelsize=12)
    plt.legend(loc='best')
    plt.grid(True)
    plt.xlabel('TIMESTAMP', fontsize=15)

    # Prices are labelled in rupees for the BSE exchange, dollars otherwise.
    lab = 'PRICES'
    if sys.argv[2] == 'BSE':
        lab = lab + " (in Rs.)"
    else:
        lab = lab + " (in $)"
    plt.ylabel(lab, fontsize=15)

    plt.legend()
    mplcyberpunk.add_glow_effects()
    plt.savefig("/tmp/fig_basic_" + my_name + ".png")


def _predict_next(series, my_name):
    """Plot the smoothed ``series`` and return ``(next value, slope)``.

    The next value is the linear extension of the last two rolling-mean
    points, located at x = r - 2 and x = r - 1, to x = r.
    """
    if plot_technique != 'moving_average':
        # The original fallback (exponential smoothing with
        # alpha = 2 / (window + 1)) called plot_exponential_smoothing, which
        # is not defined in this file; fail with an explicit message instead.
        raise NotImplementedError(
            "Unsupported plot technique: " + str(plot_technique)
        )

    smoothed = plot_moving_average(series, window, my_name)
    x1, y1 = r - 2, smoothed.iloc[-2]
    x2, y2 = r - 1, smoothed.iloc[-1]

    gen_my_plot(smoothed, series, my_name, "Moving Average")
    return my_prediction(x1, y1, x2, y2, x2 + 1)


for dynamic in pleasePlot:
    my_name = _FIGURE_NAMES.get(dynamic)
    if my_name is None:
        print("No Market Dynamic Found to Plot")
        continue

    series = my_data_new[dynamic]

    # Plot the original data, then the prediction plot and the predicted value.
    _plot_original(series, my_name)
    prediction, slope = _predict_next(series, my_name)

    # Adding the results obtained, i.e. predicted value and mood, to
    # "result_prediction" using "%" as a separator.
    result_prediction += str(prediction) + "%" + mood(slope) + "%"

# returning the results
print(result_prediction)

# flush must be *called*; a bare "sys.stdout.flush" only names the method.
sys.stdout.flush()