I want to train a single variational autoencoder model (or even a standard autoencoder) jointly over many datasets (e.g. MNIST, CIFAR, SVHN, etc., with all images resized to the same input shape). Here is the VAE tutorial in TensorFlow which I am using as a starting point: https://www.tensorflow.org/tutorials/generative/cvae.
For training the model, I would want to sample (choose) a dataset from my set of datasets and then obtain a batch of images from that dataset at each gradient update step in the training loop. I could combine all the datasets into one big dataset, but I want to leverage the fact that all images in a given batch come from the same dataset as side information (I'm still figuring out this part, but the details aren't too important since my question focuses on the data pipeline).
I am not sure how exactly to go about the data pipeline setup. The tutorial specifies the dataset pipeline as follows:
train_dataset = (tf.data.Dataset.from_tensor_slices(train_images)
                 .shuffle(train_size).batch(batch_size))
test_dataset = (tf.data.Dataset.from_tensor_slices(test_images)
                .shuffle(test_size).batch(batch_size))
where train_images and test_images are the processed MNIST data. So it creates a TensorFlow dataset, shuffles the entire dataset, and batches the data into batches of size batch_size. In my case, I assume I would want to create a separate train_dataset/test_dataset for each dataset in my set of datasets (e.g. cifar_train_dataset/cifar_test_dataset, mnist_train_dataset/mnist_test_dataset, etc.).
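For concreteness, here is roughly what I have in mind for the per-dataset pipelines (just a sketch, untested; the common 32x32x3 target shape, the grayscale-to-RGB conversion, the shuffle buffer size, and loading only MNIST and CIFAR-10 via tf.keras.datasets are all arbitrary choices on my part):

import tensorflow as tf

TARGET_SHAPE = (32, 32)   # common spatial size for all sources (arbitrary choice)
BATCH_SIZE = 64

def make_pipeline(images, batch_size=BATCH_SIZE):
    """Build a shuffled, batched, repeating pipeline from a raw uint8 image array."""
    if images.ndim == 3:              # grayscale arrays like MNIST: add a channel axis
        images = images[..., None]
    ds = tf.data.Dataset.from_tensor_slices(images)

    def preprocess(x):
        x = tf.cast(x, tf.float32) / 255.0
        if x.shape[-1] == 1:          # force a common 3-channel format
            x = tf.image.grayscale_to_rgb(x)
        return tf.image.resize(x, TARGET_SHAPE)

    return ds.map(preprocess).shuffle(10_000).batch(batch_size).repeat()

# one pipeline per source, keyed by name so the name can double as side information
(mnist_train, _), (mnist_test, _) = tf.keras.datasets.mnist.load_data()
(cifar_train, _), (cifar_test, _) = tf.keras.datasets.cifar10.load_data()

train_datasets = {'mnist': make_pipeline(mnist_train), 'cifar': make_pipeline(cifar_train)}
test_datasets = {'mnist': make_pipeline(mnist_test), 'cifar': make_pipeline(cifar_test)}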
When it comes to training, they specify the procedure as follows:
for epoch in range(1, epochs + 1):
    for train_x in train_dataset:
        train_step(model, train_x, optimizer)

    loss = tf.keras.metrics.Mean()
    for test_x in test_dataset:
        loss(compute_loss(model, test_x))
    elbo = -loss.result()
    print('Epoch: {}, Test set ELBO: {}'.format(epoch, elbo))
Instead of specifying epochs, I could just specify a total number of training iterations/steps (e.g. 500,000). Within each training step, I would want to sample a dataset from the set of datasets (assuming equal probabilities) instead of assuming a single training dataset as above.
Now comes the part I'm not sure about. The line

for train_x in train_dataset:

is a loop that iterates over the entire dataset in batches. Instead, I would just want to obtain a single batch of images from the dataset I have sampled, make a model update, and repeat the process. However, I am not sure whether specifying the datasets as I have described above provides this flexibility. Is there any way to index into / obtain a single batch, as opposed to iterating over all the batches?
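Concretely, I'm imagining something like the following inside the training loop, though I'm not sure whether this is correct or efficient with tf.data (train_datasets here is the dict of per-source pipelines from my sketch above):

import numpy as np

# sample a source uniformly, then try to pull exactly one batch from it
name = np.random.choice(list(train_datasets.keys()))
batch = next(iter(train_datasets[name]))   # does this restart the dataset every step?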
In summary, I want to train a single model over multiple datasets by sampling a batch of images from a given dataset at each training step when making model updates. I am completely open to other suggestions and approaches that address this problem. Thanks!
Answer
If I understand your question correctly, you want to control the number of batches that you pull from your train and test sets, instead of iterating over them completely before doing an update. You can turn your dataset into an iterator by wrapping it in iter() and then call next() on it to grab the next batch.
Example:
import numpy as np
import tensorflow as tf

# fake mnist data
train_imgs = tf.random.normal([100, 28, 28, 1])
test_imgs = tf.random.normal([100, 28, 28, 1])
train_labels = tf.one_hot(
    tf.random.uniform([100,], minval=0, maxval=10, dtype=tf.int64), 10)
test_labels = tf.one_hot(
    tf.random.uniform([100,], minval=0, maxval=10, dtype=tf.int64), 10)

# create train/test dataset
train_ds = tf.data.Dataset.from_tensor_slices((train_imgs, train_labels))
train_ds = train_ds.repeat().shuffle(1 << 6).batch(8)
test_ds = tf.data.Dataset.from_tensor_slices((test_imgs, test_labels))
test_ds = test_ds.repeat().shuffle(1 << 6).batch(8)

# simple mnist network
x_in = tf.keras.Input((28, 28, 1))
x = tf.keras.layers.Flatten()(x_in)
x = tf.keras.layers.Dense(100)(x)
x_out = tf.keras.layers.Dense(10)(x)

# simple mnist model
model = tf.keras.Model(x_in, x_out)

# make datasets iterators
train_iter = iter(train_ds)
test_iter = iter(test_ds)

# loss
def xent_loss(y_true, y_pred):
    ce = tf.keras.losses.CategoricalCrossentropy()
    return ce(y_true, y_pred)

# simple training loop where you control the batches per epoch
# for your train and test datasets
NUM_EPOCHS = 10
NUM_TRAIN_BATCHES_PER_EPOCH = 20
NUM_TEST_BATCHES_PER_EPOCH = 5

for epoch in range(NUM_EPOCHS):
    train_losses = []
    # train
    for _ in range(NUM_TRAIN_BATCHES_PER_EPOCH):
        X_train, y_train = next(train_iter)
        y_hat = model(X_train)
        loss = xent_loss(y_train, y_hat)
        train_losses.append(loss)
        # do gradient update ...

    # report train loss
    print(f"epoch: {epoch}\ttrain_loss: {np.mean(train_losses):.4f}")
    train_losses = []

    # validate
    test_losses = []
    for _ in range(NUM_TEST_BATCHES_PER_EPOCH):
        X_test, y_test = next(test_iter)
        y_hat = model(X_test)
        loss = xent_loss(y_test, y_hat)
        test_losses.append(loss)

    # report validation loss
    print(f"epoch: {epoch}\ttest_loss: {np.mean(test_losses):.4f}")
    test_losses = []
    print('-' * 40)

# epoch: 0    train_loss: 7.3092
# epoch: 0    test_loss: 7.3427
# ----------------------------------------
# epoch: 1    train_loss: 6.8050
# epoch: 1    test_loss: 8.4867
# ----------------------------------------
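To adapt this to your multi-dataset setting, keep one persistent iterator per source (created once, outside the loop) and sample which one to draw from at each step. Here is a rough sketch along those lines; the fake per-source pipelines, the uniform sampling, and the step count are placeholders, and the actual update would be the train_step from the tutorial you linked:

import numpy as np
import tensorflow as tf

# stand-ins for your per-source pipelines; each yields batches of a common shape
def fake_pipeline():
    imgs = tf.random.normal([100, 32, 32, 3])
    return tf.data.Dataset.from_tensor_slices(imgs).repeat().shuffle(1 << 6).batch(8)

train_datasets = {'mnist': fake_pipeline(), 'cifar': fake_pipeline(), 'svhn': fake_pipeline()}

# one persistent iterator per source, created once outside the training loop
train_iters = {name: iter(ds) for name, ds in train_datasets.items()}
dataset_names = list(train_iters.keys())

TOTAL_STEPS = 1000   # e.g. 500000 in your case

for step in range(TOTAL_STEPS):
    # sample a source uniformly at random for this update
    name = np.random.choice(dataset_names)
    # pull a single batch from that source; repeat() above means it never runs out
    batch = next(train_iters[name])
    # `name` tells you which dataset the batch came from (your side information)
    # train_step(model, batch, optimizer)   # your VAE update goes here

If you would rather keep everything inside tf.data, another option is tf.data.experimental.sample_from_datasets: if you batch each source dataset before passing it in, every element it yields is a full batch drawn from a single source, although you would need to map a dataset id into each pipeline beforehand if you want to keep the source as side information.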