You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132
  1. import numpy as np
  2. import tensorflow as tf
  3. import pandas as pd
  4. import matplotlib.pyplot as plt
  5. import wilshire
  6. import tensorflow_addons as tfa
  7. from statsmodels.tsa.arima.model import ARIMA
  8. def snake(x):
  9. return(x+(tf.math.sin(50*x)**2)/50)
  10. def sinus(x):
  11. return(tf.math.sin(x))
  12. def sinus_cosinus(x):
  13. return(tf.math.sin(x)+tf.math.cos(x))
  14. def swish(x):
  15. return(x*tf.math.sigmoid(x))
  16. #activations = [tf.keras.activations.relu,swish,sinus_cosinus,sinus,snake]
  17. activations = [snake]
  18. def prepare_data(filename="WILL5000INDFC2.csv"):
  19. df_train,df_test,index = wilshire.preprocess(filename)
  20. x_train = np.arange(df_train.shape[0])
  21. maximum = np.max(x_train)
  22. x_train = x_train / maximum
  23. y_train=df_train["WILL5000INDFC"]
  24. y_train.to_numpy()
  25. x_test = np.arange(df_train.shape[0]+1,df_train.shape[0]+df_test.shape[0]+1)
  26. y_test = df_test["WILL5000INDFC"]
  27. y_test.to_numpy()
  28. x_test=x_test / maximum
  29. return x_train,x_test,y_train,y_test,maximum,index
  30. def arima_pred(y_train,y_test,orders=[[2,1,1],[2,2,1],[3,1,1],[2,1,2]],n=5):
  31. mse=[]
  32. for order in orders :
  33. mean_err=np.array()
  34. for k in range(n):
  35. train = y_train
  36. preds = []
  37. for test in range(len(y_test)):
  38. model = ARIMA(train, order=(order[0],order[1],order[2]))
  39. model = model.fit()
  40. output = model.forecast()
  41. preds.append(output[0])
  42. #train.append(y_test[te
  43. mean_err.append((np.square(np.array(preds) - np.array(y_test))).mean())
  44. mse.append(mean_err.mean())
  45. return(mse)
  46. def create_model(activation):
  47. model = tf.keras.Sequential()
  48. model.add(tf.keras.layers.Dense(1,input_shape=[1,],activation=activation))
  49. model.add(tf.keras.layers.Dense(64,activation=activation))
  50. model.add(tf.keras.layers.Dense(64,activation=activation))
  51. model.add(tf.keras.layers.Dense(1))
  52. opt = tf.keras.optimizers.SGD(learning_rate=0.01,momentum=0.9)
  53. model.compile(optimizer=opt, loss='mse')
  54. model.build()
  55. model.summary()
  56. return model
  57. def training_testing(n=5,activations = [tf.keras.activations.relu,swish,sinus_cosinus,sinus,snake]):
  58. x_train,x_test,y_train,y_test,maximum,index = prepare_data(filename="WILL5000INDFC2.csv")
  59. models = []
  60. errors_train,errors_test = [],[]
  61. mean_y_train,mean_y_test,std_y_test=[],[],[]
  62. for activation in activations :
  63. y_train_5=[]
  64. y_test_5=[]
  65. errors_train_5=[]
  66. errors_test_5=[]
  67. for k in range(n):
  68. model = create_model(activations)
  69. model.fit(x_train,y_train, batch_size=1, epochs=1)
  70. y_pred_test = model.predict(x_test)
  71. y_pred_train = model.predict(x_train)
  72. y_train_5.append(y_pred_train)
  73. y_test_5.append(y_pred_test)
  74. errors_test_5.append(model.evaluate(x_test,y_test))
  75. errors_train_5.append(model.evaluate(x_train,y_train))
  76. models.append(model)
  77. mean_y_train.append(np.mean(y_train_5,axis=0))
  78. mean_y_test.append(np.mean(y_test_5,axis=0))
  79. std_y_test.append(np.std(y_test_5,axis=0))
  80. errors_train.append([np.mean(errors_train_5),np.std(errors_train_5)])
  81. errors_test.append([np.mean(errors_test_5),np.std(errors_test_5)])
  82. # y_preds_train.append(y_pred_train)
  83. # y_preds_test.append(y_pred_test)
  84. return models,errors_train,errors_test
  85. def final_plot(models,errors_test,arima_err):
  86. x_train,x_test,y_train,y_test,maximum,index = prepare_data(filename="WILL5000INDFC2.csv")
  87. x = np.arange(9000)
  88. x_n = x / maximum
  89. future_preds = models[-1].predict(x_n) ## Calculated with a website the number of working days between 01-06-2020 and 01-01-2024
  90. #x=np.arange(df_train.shape[0]+df_test.shape[0]+908)
  91. y_true = np.concatenate((y_train,y_test))
  92. x_cut = np.arange(x_train.shape[0]+x_test.shape[0])
  93. print("----- ARIMA Test MSE -----")
  94. orders_ARIMA = ["[2,1,1]","[2,2,1]","[3,1,1]","[2,1,2]"]
  95. for k in range(len(orders_ARIMA)):
  96. print("ARIMA"+orders_ARIMA[k]+" : "+str(arima_err[k]))
  97. print("----- DNN Test MSE -----")
  98. activations = ["ReLU","Swish","Sinus Cosinus","Sinus","Snake"]
  99. for k in range(len(activations)):
  100. print("DNN "+activations[k]+" : "+str(errors_test[k]))
  101. plt.figure()
  102. plt.plot(x_cut,y_true,label="True data")
  103. plt.plot(x,future_preds,label="Predictions")
  104. plt.xticks(range(0, 9000, 250), range(1995, 2031, 1))
  105. plt.xlabel("Années")
  106. plt.ylabel("Index Willshire5000 normalisé")
  107. plt.vlines([index,index+85],ymin=0,ymax=1,colors="r",label="Test Samples")
  108. plt.legend()
  109. plt.show()