One-step-ahead prediction using the last lag (grid search)

Code
import tensorflow as tf
from tensorflow.keras.callbacks import CSVLogger, EarlyStopping
import matplotlib as mpl
import matplotlib.pyplot as plt
import numpy as np
import os
import pandas as pd
import seaborn as sns
import time
import gc
import sys
from statsmodels.graphics.tsaplots import plot_acf
from statsmodels.graphics.tsaplots import plot_pacf
Code
print(f"Tensorflow Version: {tf.__version__}")
print(f"Pandas Version: {pd.__version__}")
print(f"Numpy Version: {np.__version__}")
print(f"System Version: {sys.version}")

mpl.rcParams['figure.figsize'] = (17, 5)
mpl.rcParams['axes.grid'] = False
sns.set_style("whitegrid")

notebookstart = time.time()
Code
import IPython
import IPython.display

0.1 Data preparation

Code
# Read in the series
Bitcoin = pd.read_csv("C:/Users/dofca/Desktop/series/datos/BTC-Daily.csv",
                   header = 0, usecols = [1,6])
Bitcoin.rename(columns={"date": "Fecha", "close": "Valor"}, inplace=True)
Bitcoin['Fecha'] = pd.to_datetime(Bitcoin['Fecha'])
Bitcoin.sort_values(by=['Fecha'], inplace=True)
ventana = (Bitcoin['Fecha'] >= '2017-01-01') & (Bitcoin['Fecha'] <= '2021-12-31')
Bitcoin = Bitcoin.loc[ventana]
Bitcoin = Bitcoin.reset_index(drop = True)

Bitcoin
            Fecha     Valor
0      2017-01-01    998.80
1      2017-01-02   1014.10
2      2017-01-03   1036.99
3      2017-01-04   1122.56
4      2017-01-05    994.02
...           ...       ...
1821   2021-12-27  50718.11
1822   2021-12-28  47543.30
1823   2021-12-29  46483.36
1824   2021-12-30  47150.71
1825   2021-12-31  46214.37

1826 rows × 2 columns

Code
features_considered = ['Valor'] # the predictor variable is the series itself
Code
features = Bitcoin[features_considered] # only the 'Valor' column is used for prediction
features.index = Bitcoin['Fecha'] # time index (the series is daily)
features
Code
features.plot(subplots = True) # plot of the time series
array([<Axes: xlabel='Fecha'>], dtype=object)

Code
# split the dataset into training, validation, and test sets
column_indices = {name: i for i, name in enumerate(features.columns)} # index = 0

n = len(features) 
train_df = features[0:int(n*0.7)] 
val_df = features[int(n*0.7):int(n*0.9)] 
test_df = features[int(n*0.9):] 

num_features = features.shape[1]
Code
print("longitud dataframe entrenamiento:", train_df.shape)
print("longitud dataframe validación:", val_df.shape)
print("longitud dataframe prueba:", test_df.shape)
longitud dataframe entrenamiento: (1278, 1)
longitud dataframe validación: (365, 1)
longitud dataframe prueba: (183, 1)
Code
# Normalize the observations using training-set statistics only
train_mean = train_df.mean()
train_std = train_df.std()

train_df = (train_df - train_mean) / train_std
val_df = (val_df - train_mean) / train_std
test_df = (test_df - train_mean) / train_std
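
For later use, predictions on the normalized scale can be mapped back to the original units by inverting this transformation, as is done explicitly in section 2.3. A minimal sketch (the denormalize helper is illustrative, not part of the original notebook):

Code
# Sketch: undo the standardization to recover values on the original scale.
def denormalize(z, mean=train_mean['Valor'], std=train_std['Valor']):
    return z * std + mean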
Code
# the full dataframe normalized with train_mean and train_std
df_std = (features - train_mean) / train_std
df_std = df_std.melt(var_name='Column', value_name='Normalized')
df_std
Code
plt.figure(figsize=(9, 5))
ax = sns.violinplot(x = 'Column', y = 'Normalized', data = df_std)
_ = ax.set_xticklabels(features.keys(), rotation=90)

0.2 Class and function definitions for the machine-learning problem

Code
class WindowGenerator():
  def __init__(self, input_width, label_width, shift,
               train_df=train_df, val_df=val_df, test_df=test_df,
               label_columns=None):
    # Store the raw data.
    self.train_df = train_df
    self.val_df = val_df
    self.test_df = test_df

    # Work out the label column indices.
    self.label_columns = label_columns
    if label_columns is not None:
      self.label_columns_indices = {name: i for i, name in
                                    enumerate(label_columns)}
    self.column_indices = {name: i for i, name in
                           enumerate(train_df.columns)}

    # Work out the window parameters.
    self.input_width = input_width
    self.label_width = label_width
    self.shift = shift

    self.total_window_size = input_width + shift

    self.input_slice = slice(0, input_width)
    self.input_indices = np.arange(self.total_window_size)[self.input_slice]

    self.label_start = self.total_window_size - self.label_width
    self.labels_slice = slice(self.label_start, None)
    self.label_indices = np.arange(self.total_window_size)[self.labels_slice]

  def __repr__(self):
    return '\n'.join([
        f'Total window size: {self.total_window_size}',
        f'Input indices: {self.input_indices}',
        f'Label indices: {self.label_indices}',
        f'Label column name(s): {self.label_columns}'])

0.3 Split

Given a list of consecutive inputs, the split_window method converts them into a window of inputs and a window of labels; a usage sketch follows the code below.

Code
def split_window(self, features):
  inputs = features[:, self.input_slice, :]
  labels = features[:, self.labels_slice, :]
  if self.label_columns is not None:
    labels = tf.stack(
        [labels[:, :, self.column_indices[name]] for name in self.label_columns],
        axis=-1)

  # Slicing doesn't preserve static shape information, so set the shapes
  # manually. This way the `tf.data.Datasets` are easier to inspect.
  inputs.set_shape([None, self.input_width, None])
  labels.set_shape([None, self.label_width, None])

  return inputs, labels

WindowGenerator.split_window = split_window
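
As a minimal usage sketch (not part of the original notebook; w_demo is a throwaway window with input_width = label_width = shift = 1), we can stack three length-2 slices of train_df into a batch and split it:

Code
# Sketch: stack three windows of length total_window_size (= 2) from train_df
# and split each into a one-step input and a one-step label.
w_demo = WindowGenerator(input_width=1, label_width=1, shift=1,
                         label_columns=['Valor'])
example_window = tf.stack([np.array(train_df[0:w_demo.total_window_size]),
                           np.array(train_df[100:100 + w_demo.total_window_size]),
                           np.array(train_df[200:200 + w_demo.total_window_size])])
example_inputs, example_labels = w_demo.split_window(example_window)
print('Window shape:', example_window.shape)   # (3, 2, 1)
print('Inputs shape:', example_inputs.shape)   # (3, 1, 1)
print('Labels shape:', example_labels.shape)   # (3, 1, 1)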

0.4 Convert our objects to TensorFlow datasets

Batch size = 32.

Code
def make_dataset(self, data):
  data = np.array(data, dtype=np.float32)
  ds = tf.keras.utils.timeseries_dataset_from_array(
      data=data,
      targets=None,
      sequence_length=self.total_window_size,
      sequence_stride=1,
      shuffle=False,
      batch_size=32,) 

  ds = ds.map(self.split_window)

  return ds

WindowGenerator.make_dataset = make_dataset
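
Reusing w_demo from the sketch above, a quick sanity check (again a sketch, not in the original notebook): a series of length n yields n - total_window_size + 1 windows, so the 1278 training rows should give 1277 windows.

Code
# Sketch: count the windows produced by make_dataset on train_df.
ds_demo = w_demo.make_dataset(train_df)
n_windows = sum(inputs.shape[0] for inputs, labels in ds_demo)
print(n_windows, len(train_df) - 1)  # both should be 1277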
Code
@property
def train(self):
  return self.make_dataset(self.train_df)

@property
def val(self):
  return self.make_dataset(self.val_df)

@property
def test(self):
  return self.make_dataset(self.test_df)

@property
def example(self):
  """Get and cache an example batch of `inputs, labels` for plotting."""
  result = getattr(self, '_example', None)
  if result is None:
    # No example batch was found, so get one from the `.train` dataset
    result = next(iter(self.train))
    # And cache it for next time
    self._example = result
  return result

WindowGenerator.train = train
WindowGenerator.val = val
WindowGenerator.test = test
WindowGenerator.example = example

1 Define the plots to visualize what we want to predict in terms of the inputs

Code
def plot(self, model=None, plot_col='Valor', max_subplots=3):
  inputs, labels = self.example
  plt.figure(figsize=(12, 8))
  plot_col_index = self.column_indices[plot_col]
  max_n = min(max_subplots, len(inputs))
  for n in range(max_n):
    plt.subplot(max_n, 1, n+1)
    plt.ylabel(f'{plot_col} [normed]')
    plt.plot(self.input_indices, inputs[n, :, plot_col_index],
             label='Inputs', marker='.', zorder=-10)

    if self.label_columns:
      label_col_index = self.label_columns_indices.get(plot_col, None)
    else:
      label_col_index = plot_col_index

    if label_col_index is None:
      continue

    plt.scatter(self.label_indices, labels[n, :, label_col_index],
                edgecolors='k', label='Labels', c='#2ca02c', s=64)
    if model is not None:
      predictions = model(inputs)
      plt.scatter(self.label_indices, predictions[n, :, label_col_index],
                  marker='X', edgecolors='k', label='Predictions',
                  c='#ff7f0e', s=64)

    if n == 0:
      plt.legend()

  plt.xlabel('Time [d]')

WindowGenerator.plot = plot

2 Model-fitting configuration

Code
# Define the required number of epochs and the loss function
MAX_EPOCHS = 20

def compile_and_fit(model, window, patience=2): # patience = number of epochs to wait before stopping
  # Early stopping to avoid overfitting
  early_stopping = tf.keras.callbacks.EarlyStopping(monitor='val_loss',
                                                    patience=patience,
                                                    mode='min')

  model.compile(loss=tf.losses.MeanSquaredError(),
                optimizer=tf.optimizers.Adam(),
                metrics=[tf.metrics.MeanAbsoluteError()])

  history = model.fit(window.train, epochs=MAX_EPOCHS,
                      validation_data=window.val,
                      callbacks=[early_stopping])
  return history
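
compile_and_fit is not called directly by the grid search below, but a hypothetical usage would look as follows (a sketch: baseline is an illustrative toy model, and w_demo is the throwaway window from section 0.3, which by now has the train/val properties attached):

Code
# Sketch: fit a small baseline LSTM with early stopping on a 1-step window.
baseline = tf.keras.Sequential([
    tf.keras.layers.LSTM(32),
    tf.keras.layers.Dense(1)
])
history = compile_and_fit(baseline, w_demo)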

2.1 Model configuration

Code
w1 = WindowGenerator(input_width=1, label_width=1, shift=1,
                     label_columns=['Valor'])
w1
Code
for batch in w1.train.take(1):
    inputs_train,targets_train = batch
    
print("Input shape:", inputs_train.numpy().shape)
print("Target shape:", targets_train.numpy().shape)
Input shape: (32, 1, 1)
Target shape: (32, 1, 1)
Code
for batch in w1.val.take(1):
    inputs_val,targets_val = batch

print("Input shape:", inputs_val.numpy().shape)
print("Target shape:", targets_val.numpy().shape)
Code
for batch in w1.test.take(1):
    inputs_test, targets_test = batch

print("Input shape:", inputs_test.numpy().shape)
print("Target shape:", targets_test.numpy().shape)
Code
w1.train.element_spec
Code
w1.plot()

Code
## Example of the batches in the training data
i = 1
for batch in w1.train.take(1):
    inputs, targets = batch
    print("Covariate or input", i, inputs)
    print("Response or label", i, targets)
    i = i + 1
Code
## Example of the batches in the validation data
i = 1
for batch in w1.val.take(1):
    inputs, targets = batch
    print("Covariate or input", i, inputs)
    print("Response or label", i, targets)
    i = i + 1
Code
## Example of the batches in the test data
i = 1
for batch in w1.test.take(10):
    inputs, targets = batch
    print("Covariate or input", i, inputs)
    print("Response or label", i, targets)
    i = i + 1
Code
input_dataset_train = w1.train.map(lambda x,y: x)
target_dataset_train = w1.train.map(lambda x,y: y)
Code
input_dataset_val = w1.val.map(lambda x,y: x)
target_dataset_val = w1.val.map(lambda x,y: y)
Code
input_dataset_test = w1.test.map(lambda x,y: x)
target_dataset_test = w1.test.map(lambda x,y: y)

2.2 Hyperparameter search and model implementation

Code
from tensorflow import keras
import keras_tuner as kt
from keras.models import Sequential
from keras.layers import Dense, LSTM, Dropout
from tensorflow.keras import layers
Code
def build_model(hp):
    model = keras.Sequential()
    # First LSTM layer: tune the number of units and the activation.
    model.add(layers.LSTM(units=hp.Int('input_unit', min_value=32, max_value=512, step=32),
                          activation=hp.Choice("activation", ["relu", "tanh"]),
                          return_sequences=True))
    # Between 1 and 4 additional stacked LSTM layers.
    for i in range(hp.Int('n_layers', 1, 4)):
        model.add(layers.LSTM(hp.Int(f'lstm_{i}_units', min_value=32, max_value=512, step=32),
                              activation=hp.Choice("activation", ["relu", "tanh"]),
                              return_sequences=True))
    # Final LSTM layer returns only the last output.
    model.add(layers.LSTM(hp.Int('layer_2_neurons', min_value=32, max_value=512, step=32),
                          activation=hp.Choice("activation", ["relu", "tanh"])))
    model.add(layers.Dropout(hp.Float('Dropout_rate', min_value=0, max_value=0.5, step=0.1)))
    model.add(layers.Dense(1, activation="linear"))
    model.compile(loss='mean_squared_error', optimizer='adam', metrics=['mse'])
    return model
Code
tuner_LSTM = kt.GridSearch(
    hypermodel=build_model,
    objective="val_loss",
    max_trials=50,
    seed=1234,
    overwrite=True,
    directory="dirsalida",
    project_name="helloworld"
)
Code
stop_early = tf.keras.callbacks.EarlyStopping(monitor="val_loss",patience=0)
Code
# tuner_LSTM.search_space_summary()
Code
tuner_LSTM.search(w1.train, epochs=20, validation_data=w1.val, callbacks=[stop_early])
Code
# Get the top 2 models.
models_LSTM = tuner_LSTM.get_best_models(num_models=2)
best_model_LSTM = models_LSTM[0]
# Build the model.
# Needed for `Sequential` without specified `input_shape`.
best_model_LSTM.build(input_shape=(32, 1, 1))
best_model_LSTM.summary()
Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 lstm (LSTM)                 (32, 1, 32)               4352      
                                                                 
 lstm_1 (LSTM)               (32, 1, 32)               8320      
                                                                 
 lstm_2 (LSTM)               (32, 32)                  8320      
                                                                 
 dropout (Dropout)           (32, 32)                  0         
                                                                 
 dense (Dense)               (32, 1)                   33        
                                                                 
=================================================================
Total params: 21025 (82.13 KB)
Trainable params: 21025 (82.13 KB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________
Code
tuner_LSTM.results_summary()
Code
train_plus_val = w1.train.concatenate(w1.val)  # concatenate the training and validation tf.data.Datasets
Code
# Get the top 5 hyperparameter configurations.
best_hps_LSTM = tuner_LSTM.get_best_hyperparameters(5)
# Build the model with the best hyperparameters.
callback = tf.keras.callbacks.EarlyStopping(monitor="loss", patience=0)
model_LSTM = build_model(best_hps_LSTM[0])
# Refit on the entire training + validation dataset.
model_LSTM.fit(train_plus_val, epochs=20, callbacks=[callback])

Once the model is retrained with the hyperparameter configuration found above, the MSE on the training + validation set is:

Code
model_LSTM.evaluate(train_plus_val, verbose=0)
[1.1643624305725098, 1.1643624305725098]


and the MSE on the test set:

Code
model_LSTM.evaluate(w1.test, verbose=0)
[6.678896903991699, 6.678896903991699]
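
Since the model is evaluated on normalized data, this MSE can also be expressed in the original units (a sketch, not in the original notebook; the RMSE simply scales with the training standard deviation):

Code
# Sketch: translate the normalized test MSE into an RMSE in original units.
mse_norm = model_LSTM.evaluate(w1.test, verbose=0)[0]
rmse_original = np.sqrt(mse_norm) * train_std['Valor']
print("approx. RMSE (original scale):", rmse_original)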


2.3 Prediction on the test set

Code
prediction_test = model_LSTM.predict(w1.test, verbose=1) * train_std['Valor'] + train_mean['Valor']
print(prediction_test.shape)
Code
# Collect all test labels from the batched dataset into a single array.
targets_test = np.concatenate([batch.numpy() for batch in target_dataset_test], axis=0)

print(targets_test.shape)
Code
true_series = targets_test * train_std['Valor'] + train_mean['Valor']
true_series = true_series.reshape((182, 1))  # match prediction_test's shape so the metric compares elementwise
print(true_series.shape)

Once the predictions on the test set are made, they are compared with the actual values, yielding the following RMSE (on the original scale); a NumPy cross-check is sketched after the code below:

Code
errors_squared = tf.keras.metrics.mean_squared_error(true_series, prediction_test).numpy()
print("RMSE:", errors_squared.mean()**0.5)
RMSE: 16257.529455609176
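
As a cross-check (a sketch, not part of the original notebook), the same RMSE can be computed directly with NumPy:

Code
# Sketch: RMSE on the original scale, flattening both arrays elementwise.
rmse = np.sqrt(np.mean((true_series.reshape(-1) - prediction_test.reshape(-1)) ** 2))
print("RMSE:", rmse)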
Code
test_index=test_df.index[:182]
true_series_final=true_series.reshape(182)
prediction_test_final=prediction_test.reshape(182)
Code
plt.plot(true_series_final)
plt.plot(prediction_test_final)
plt.legend(['Actual response', 'Predicted response'], loc='lower right', fontsize=15)
plt.ylabel(r'$Y$ and $\hat{Y}$ on the test set', fontsize=15)
plt.title('Recurrent neural network: predictions on the test set', fontsize=20)
Text(0.5, 1.0, 'Recurrent neural network: predictions on the test set')

Code
predicciones_prueba = model_LSTM.predict(w1.test) * train_std['Valor'] + train_mean['Valor']
train_val_predict = model_LSTM.predict(train_plus_val) * train_std['Valor'] + train_mean['Valor']
Code
plt.figure(figsize=(20,10))
plt.title('Recurrent neural network for the Bitcoin time series', fontsize=20)
plt.xlabel('Date', fontsize=18)
plt.ylabel('Bitcoin closing price', fontsize=18)
plt.plot(Bitcoin['Fecha'], Bitcoin['Valor'])
plt.plot(Bitcoin['Fecha'][1:1642], train_val_predict)
plt.plot(Bitcoin['Fecha'][1644:1826], predicciones_prueba)
plt.legend(['Original series', 'Predictions on training + validation', 'Predictions on test'], loc='lower right',
          fontsize=15)
plt.show()


2.4 Model prediction errors


2.4.1 On the training set

Code
labels_train = np.concatenate([y for x, y in w1.train], axis=0)
labels_train.shape
Code
lista = list(w1.train.unbatch().map(lambda x, y: (x, y)))  # materialize (input, label) pairs for inspection
Code
prediccion_intra_muestra = model_LSTM.predict(w1.train, verbose=1)
prediccion_intra_muestra = prediccion_intra_muestra.reshape(1277, 1, 1)
Code
error_prediction_train = labels_train - prediccion_intra_muestra
Code
x_vals = train_df.index[1:]
Code
print(error_prediction_train.shape)
print(x_vals.shape)
Code
error_prediction_train = error_prediction_train.reshape(error_prediction_train.shape[0])
error_prediction_train.shape
Code
fig = plt.figure(figsize=(15,8))
plt.plot(error_prediction_train)
plt.ylabel(r'$Y-\hat{Y}$', fontsize=14)
plt.title('Prediction error on the training data', fontsize=16);

Code
graficapacf = plot_pacf(error_prediction_train, lags=50, method='ldbiased')  # method='ywmle' can also be used
graficaacf = plot_acf(error_prediction_train, lags=50, adjusted=True)  # plot_acf's `adjusted` expects a boolean


2.4.2 On the test set

Code
labels_test = np.concatenate([y for x, y in w1.test], axis=0)
prediccion_conjunto_test = model_LSTM.predict(w1.test, verbose=1)
prediccion_conjunto_test = prediccion_conjunto_test.reshape(182, 1, 1)
error_prediction_test = labels_test - prediccion_conjunto_test
error_prediction_test = error_prediction_test.reshape(error_prediction_test.shape[0])
Code
fig1 = plt.figure(figsize=(15,8))
plt.plot(error_prediction_test)
plt.ylabel(r'$Y-\hat{Y}$', fontsize=14)
plt.title('Prediction error on the test data', fontsize=16)
Text(0.5, 1.0, 'Prediction error on the test data')

Code
graficapacf = plot_pacf(error_prediction_test, lags=50, method='ldbiased')  # method='ywmle' can also be used
graficaacf = plot_acf(error_prediction_test, lags=50, adjusted=True)
