Keras中可变序列长度的序列到序列分类

如果它对某人有帮助，以下是我最终实施解决方案的方式：import tensorflow as tfimport numpy as np# Load data from filex_list, y_list = loadSequences("train.csv")# x_list is now a list of arrays (m,n) of float64, where m is the timesteps# and n is the number of features.# y_list is a list of arrays (m,1) of Boolean.assert len(x_list) == len(y_list)num_sequences = len(x_list)num_features = len(x_list[0][0])batch_size = 10batches_per_epoch = 5assert batch_size * batches_per_epoch == num_sequencesdef train_generator():    # Sort by length so the number of timesteps in each batch is minimized    x_list.sort(key=len)    y_list.sort(key=len)    # Generate batches    while True:        for b in range(batches_per_epoch):            longest_index = (b + 1) * batch_size - 1            timesteps = len(x_list[longest_index])            x_train = np.zeros((batch_size, timesteps, num_features))            y_train = np.zeros((batch_size, timesteps, 1))            for i in range(batch_size):                li = b * batch_size + i                x_train[i, 0:len(x_list[li]), :] = x_list[li]                y_train[i, 0:len(y_list[li]), 0] = y_list[li]            yield x_train, y_trainmodel = tf.keras.models.Sequential([            tf.keras.layers.Masking(mask_value=0., input_shape=(None,num_features)),            tf.keras.layers.LSTM(32, return_sequences=True),            tf.keras.layers.Dense(2, activation=tf.nn.softmax)        ])model.compile(optimizer='adam',            loss='sparse_categorical_crossentropy',            metrics=['accuracy'])model.fit_generator(train_generator(), steps_per_epoch=batches_per_epoch, epochs=100)

Keras中可变序列长度的序列到序列分类

2回答