Thiết kế website giá rẻ

Question

I want to reconstruct the ECG signal from PPG using a vanilla Transformer model. However, as shown in the attached image, the reconstruction is not very successful. Although it is true that I have only run it for 1 epoch, the model fails to follow the shape at all, and I am wondering if there might be an issue with the model. I set the start token to -3.

enter image description here

<code>#%% Transformer model

import tensorflow as tf

from tensorflow import keras

from tensorflow.keras import layers

import numpy as np

def transformer_encoder(inputs, head_size, num_heads, ff_dim, dropout=0):

x = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)(inputs, inputs)

x = layers.Dropout(dropout)(x)

x = layers.LayerNormalization(epsilon=1e-6)(x)

x = layers.Add()([inputs, x])

res = layers.Dense(ff_dim, activation='relu')(x)

res = layers.Dense(inputs.shape[-1])(res)

res = layers.LayerNormalization(epsilon=1e-6)(res)

res = layers.Add()([x, res])

return res

def transformer_decoder(inputs, encoder_outputs, head_size, num_heads, ff_dim, dropout=0):

seq_len = tf.shape(inputs)[1]

look_ahead_mask = tf.linalg.band_part(tf.ones((seq_len, seq_len)), -1, 0)

look_ahead_mask = look_ahead_mask[tf.newaxis, tf.newaxis, :, :]

attention_output = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)(

inputs, inputs, attention_mask=look_ahead_mask

)

attention_output = layers.Dropout(dropout)(attention_output)

attention_output = layers.LayerNormalization(epsilon=1e-6)(attention_output)

out1 = layers.Add()([inputs, attention_output])

attention_output = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)(

out1, encoder_outputs

)

attention_output = layers.Dropout(dropout)(attention_output)

attention_output = layers.LayerNormalization(epsilon=1e-6)(attention_output)

out2 = layers.Add()([out1, attention_output])

res = layers.Dense(ff_dim, activation='relu')(out2)

res = layers.Dense(inputs.shape[-1])(res)

res = layers.LayerNormalization(epsilon=1e-6)(res)

out3 = layers.Add()([out2, res])

return out3

def get_positional_encoding(seq_length, d_model):

position = np.arange(seq_length)[:, np.newaxis]

div_term = np.exp(np.arange(0, d_model, 2) * -(np.log(10000.0) / d_model))

positional_encoding = np.zeros((seq_length, d_model))

positional_encoding[:, 0::2] = np.sin(position * div_term)

positional_encoding[:, 1::2] = np.cos(position * div_term)

return tf.cast(positional_encoding, dtype=tf.float32)

def build_encoder_decoder_model(

ppg_input_shape,

ecg_input_shape,

head_size,

num_heads,

ff_dim,

num_transformer_blocks,

dropout=0,

mlp_units=[128],

mlp_dropout=0.4,

):

ppg_seq_length, ppg_d_model = ppg_input_shape

ecg_seq_length, ecg_d_model = ecg_input_shape

encoder_inputs = keras.Input(shape=(ppg_seq_length, ppg_d_model), name="encoder_inputs")

decoder_inputs = keras.Input(shape=(ecg_seq_length, ecg_d_model), name="decoder_inputs")

# Encoder

positional_encoding = get_positional_encoding(ppg_seq_length, ppg_d_model)

x = encoder_inputs + positional_encoding

for _ in range(num_transformer_blocks):

x = transformer_encoder(x, head_size, num_heads, ff_dim, dropout)

encoder_outputs = x

# Decoder

positional_encoding = get_positional_encoding(ecg_seq_length, ecg_d_model)

x = decoder_inputs + positional_encoding

for _ in range(num_transformer_blocks):

x = transformer_decoder(x, encoder_outputs, head_size, num_heads, ff_dim, dropout)

x = layers.Dense(ff_dim, activation='relu')(x)

x = layers.Dense(ecg_d_model)(x)

# Output shape should match ecg_seq_length

x = x[:, 1:, :]

model = keras.Model(inputs=[encoder_inputs, decoder_inputs], outputs=x)

return model

# Example usage:

ppg_input_shape = (200, 1)

ecg_input_shape = (201, 1)

head_size = 64

num_heads = 8

ff_dim = 128

num_transformer_blocks = 4

dropout = 0.1

mlp_units = [128]

mlp_dropout = 0.4

model = build_encoder_decoder_model(

ppg_input_shape,

ecg_input_shape,

head_size,

num_heads,

ff_dim,

num_transformer_blocks,

dropout,

mlp_units,

mlp_dropout

)

model.compile(

optimizer=keras.optimizers.Adam(learning_rate=0.0001),

loss='mse',

metrics=['mae']

)

model.summary()

hist = model.fit([X_train_ppg, y_train_ecg], y_train_ecg[:,1:,:], epochs=1, validation_data=([X_val_ppg, y_val_ecg], y_val_ecg[:,1:,:]), batch_size=4)

import matplotlib.pyplot as plt

def mean_squared_error(y_true, y_pred):

y_true = np.array(y_true)

y_pred = np.array(y_pred)

mse = np.mean((y_true - y_pred) ** 2)

return mse

ppg_test = X_test_ppg[1].reshape(1,200,1)

decoder_input = add_elements_to_samples(np.zeros(ppg_test.shape),-3)

predictions = model.predict([ppg_test, decoder_input])

print(mean_squared_error(y_test_ecg[1,1:,],predictions))

plt.plot(ppg_test.reshape(-1))

plt.plot(predictions.reshape(-1))

plt.plot(y_test_ecg[1,1:,].reshape(-1))

</code>

<code>#%% Transformer model import tensorflow as tf from tensorflow import keras from tensorflow.keras import layers import numpy as np def transformer_encoder(inputs, head_size, num_heads, ff_dim, dropout=0): x = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)(inputs, inputs) x = layers.Dropout(dropout)(x) x = layers.LayerNormalization(epsilon=1e-6)(x) x = layers.Add()([inputs, x]) res = layers.Dense(ff_dim, activation='relu')(x) res = layers.Dense(inputs.shape[-1])(res) res = layers.LayerNormalization(epsilon=1e-6)(res) res = layers.Add()([x, res]) return res def transformer_decoder(inputs, encoder_outputs, head_size, num_heads, ff_dim, dropout=0): seq_len = tf.shape(inputs)[1] look_ahead_mask = tf.linalg.band_part(tf.ones((seq_len, seq_len)), -1, 0) look_ahead_mask = look_ahead_mask[tf.newaxis, tf.newaxis, :, :] attention_output = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)( inputs, inputs, attention_mask=look_ahead_mask ) attention_output = layers.Dropout(dropout)(attention_output) attention_output = layers.LayerNormalization(epsilon=1e-6)(attention_output) out1 = layers.Add()([inputs, attention_output]) attention_output = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)( out1, encoder_outputs ) attention_output = layers.Dropout(dropout)(attention_output) attention_output = layers.LayerNormalization(epsilon=1e-6)(attention_output) out2 = layers.Add()([out1, attention_output]) res = layers.Dense(ff_dim, activation='relu')(out2) res = layers.Dense(inputs.shape[-1])(res) res = layers.LayerNormalization(epsilon=1e-6)(res) out3 = layers.Add()([out2, res]) return out3 def get_positional_encoding(seq_length, d_model): position = np.arange(seq_length)[:, np.newaxis] div_term = np.exp(np.arange(0, d_model, 2) * -(np.log(10000.0) / d_model)) positional_encoding = np.zeros((seq_length, d_model)) positional_encoding[:, 0::2] = np.sin(position * div_term) positional_encoding[:, 1::2] = np.cos(position * div_term) return tf.cast(positional_encoding, dtype=tf.float32) def build_encoder_decoder_model( ppg_input_shape, ecg_input_shape, head_size, num_heads, ff_dim, num_transformer_blocks, dropout=0, mlp_units=[128], mlp_dropout=0.4, ): ppg_seq_length, ppg_d_model = ppg_input_shape ecg_seq_length, ecg_d_model = ecg_input_shape encoder_inputs = keras.Input(shape=(ppg_seq_length, ppg_d_model), name="encoder_inputs") decoder_inputs = keras.Input(shape=(ecg_seq_length, ecg_d_model), name="decoder_inputs") # Encoder positional_encoding = get_positional_encoding(ppg_seq_length, ppg_d_model) x = encoder_inputs + positional_encoding for _ in range(num_transformer_blocks): x = transformer_encoder(x, head_size, num_heads, ff_dim, dropout) encoder_outputs = x # Decoder positional_encoding = get_positional_encoding(ecg_seq_length, ecg_d_model) x = decoder_inputs + positional_encoding for _ in range(num_transformer_blocks): x = transformer_decoder(x, encoder_outputs, head_size, num_heads, ff_dim, dropout) x = layers.Dense(ff_dim, activation='relu')(x) x = layers.Dense(ecg_d_model)(x) # Output shape should match ecg_seq_length x = x[:, 1:, :] model = keras.Model(inputs=[encoder_inputs, decoder_inputs], outputs=x) return model # Example usage: ppg_input_shape = (200, 1) ecg_input_shape = (201, 1) head_size = 64 num_heads = 8 ff_dim = 128 num_transformer_blocks = 4 dropout = 0.1 mlp_units = [128] mlp_dropout = 0.4 model = build_encoder_decoder_model( ppg_input_shape, ecg_input_shape, head_size, num_heads, ff_dim, num_transformer_blocks, dropout, mlp_units, mlp_dropout ) model.compile( optimizer=keras.optimizers.Adam(learning_rate=0.0001), loss='mse', metrics=['mae'] ) model.summary() hist = model.fit([X_train_ppg, y_train_ecg], y_train_ecg[:,1:,:], epochs=1, validation_data=([X_val_ppg, y_val_ecg], y_val_ecg[:,1:,:]), batch_size=4) import matplotlib.pyplot as plt def mean_squared_error(y_true, y_pred): y_true = np.array(y_true) y_pred = np.array(y_pred) mse = np.mean((y_true - y_pred) ** 2) return mse ppg_test = X_test_ppg[1].reshape(1,200,1) decoder_input = add_elements_to_samples(np.zeros(ppg_test.shape),-3) predictions = model.predict([ppg_test, decoder_input]) print(mean_squared_error(y_test_ecg[1,1:,],predictions)) plt.plot(ppg_test.reshape(-1)) plt.plot(predictions.reshape(-1)) plt.plot(y_test_ecg[1,1:,].reshape(-1)) </code>

#%% Transformer model
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers
import numpy as np

def transformer_encoder(inputs, head_size, num_heads, ff_dim, dropout=0):
    x = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)(inputs, inputs)
    x = layers.Dropout(dropout)(x)
    x = layers.LayerNormalization(epsilon=1e-6)(x)
    x = layers.Add()([inputs, x])
    
    res = layers.Dense(ff_dim, activation='relu')(x)
    res = layers.Dense(inputs.shape[-1])(res)
    res = layers.LayerNormalization(epsilon=1e-6)(res)
    res = layers.Add()([x, res])
    
    return res

def transformer_decoder(inputs, encoder_outputs, head_size, num_heads, ff_dim, dropout=0):
    
    seq_len = tf.shape(inputs)[1]
    look_ahead_mask = tf.linalg.band_part(tf.ones((seq_len, seq_len)), -1, 0)
    look_ahead_mask = look_ahead_mask[tf.newaxis, tf.newaxis, :, :]
    
    attention_output = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)(
        inputs, inputs, attention_mask=look_ahead_mask
    )
    attention_output = layers.Dropout(dropout)(attention_output)
    attention_output = layers.LayerNormalization(epsilon=1e-6)(attention_output)
    out1 = layers.Add()([inputs, attention_output])
    
    attention_output = layers.MultiHeadAttention(key_dim=head_size, num_heads=num_heads, dropout=dropout)(
        out1, encoder_outputs
    )
    attention_output = layers.Dropout(dropout)(attention_output)
    attention_output = layers.LayerNormalization(epsilon=1e-6)(attention_output)
    out2 = layers.Add()([out1, attention_output])
    
    res = layers.Dense(ff_dim, activation='relu')(out2)
    res = layers.Dense(inputs.shape[-1])(res)
    res = layers.LayerNormalization(epsilon=1e-6)(res)
    out3 = layers.Add()([out2, res])
    
    return out3

def get_positional_encoding(seq_length, d_model):
    position = np.arange(seq_length)[:, np.newaxis]
    div_term = np.exp(np.arange(0, d_model, 2) * -(np.log(10000.0) / d_model))
    positional_encoding = np.zeros((seq_length, d_model))
    positional_encoding[:, 0::2] = np.sin(position * div_term)
    positional_encoding[:, 1::2] = np.cos(position * div_term)
    return tf.cast(positional_encoding, dtype=tf.float32)

def build_encoder_decoder_model(
    ppg_input_shape,
    ecg_input_shape,
    head_size,
    num_heads,
    ff_dim,
    num_transformer_blocks,
    dropout=0,
    mlp_units=[128],
    mlp_dropout=0.4,
):
    ppg_seq_length, ppg_d_model = ppg_input_shape
    ecg_seq_length, ecg_d_model = ecg_input_shape
    
    encoder_inputs = keras.Input(shape=(ppg_seq_length, ppg_d_model), name="encoder_inputs")
    decoder_inputs = keras.Input(shape=(ecg_seq_length, ecg_d_model), name="decoder_inputs")

    # Encoder
    positional_encoding = get_positional_encoding(ppg_seq_length, ppg_d_model)
    x = encoder_inputs + positional_encoding

    for _ in range(num_transformer_blocks):
        x = transformer_encoder(x, head_size, num_heads, ff_dim, dropout)
    
    encoder_outputs = x
    
    # Decoder
    positional_encoding = get_positional_encoding(ecg_seq_length, ecg_d_model)
    x = decoder_inputs + positional_encoding

    for _ in range(num_transformer_blocks):
        x = transformer_decoder(x, encoder_outputs, head_size, num_heads, ff_dim, dropout)
    
    x = layers.Dense(ff_dim, activation='relu')(x)
    x = layers.Dense(ecg_d_model)(x)
    
    # Output shape should match ecg_seq_length
    x = x[:, 1:, :]
    
    model = keras.Model(inputs=[encoder_inputs, decoder_inputs], outputs=x)
    return model

# Example usage:
ppg_input_shape = (200, 1)  
ecg_input_shape = (201, 1)  
head_size = 64
num_heads = 8
ff_dim = 128
num_transformer_blocks = 4
dropout = 0.1
mlp_units = [128]
mlp_dropout = 0.4

model = build_encoder_decoder_model(
    ppg_input_shape,
    ecg_input_shape,
    head_size,
    num_heads,
    ff_dim,
    num_transformer_blocks,
    dropout,
    mlp_units,
    mlp_dropout
)

model.compile(
    optimizer=keras.optimizers.Adam(learning_rate=0.0001),
    loss='mse',
    metrics=['mae']
)
model.summary()

hist = model.fit([X_train_ppg, y_train_ecg], y_train_ecg[:,1:,:], epochs=1, validation_data=([X_val_ppg, y_val_ecg], y_val_ecg[:,1:,:]), batch_size=4)

import matplotlib.pyplot as plt

def mean_squared_error(y_true, y_pred):
    y_true = np.array(y_true)
    y_pred = np.array(y_pred)
    mse = np.mean((y_true - y_pred) ** 2)
    return mse

ppg_test = X_test_ppg[1].reshape(1,200,1)
decoder_input = add_elements_to_samples(np.zeros(ppg_test.shape),-3)
predictions = model.predict([ppg_test, decoder_input])


print(mean_squared_error(y_test_ecg[1,1:,],predictions))


plt.plot(ppg_test.reshape(-1))
plt.plot(predictions.reshape(-1))
plt.plot(y_test_ecg[1,1:,].reshape(-1))

The dataset consists of approximately 1.8 million samples, so I believe the amount of data should be sufficient, but the model seems unable to follow the shape of the ECG at all, making me wonder if there is a problem with the model.

Thiết kế website giá rẻ

Danh mục

Transformer model to reconstruction ECG from PPG signal