markub3327 · May 14, 2022 18:26 · markub3327 · May 14, 2022
diff --git a/get_dataset_partitions_tf.py b/get_dataset_partitions_tf.py
 def get_dataset_partitions_tf(ds, ds_size, train_split=0.7, val_split=0.15, test_split=0.15, shuffle=True, shuffle_size=10000, batch_size=32):
     """Split a dataset into batched train / validation / test partitions.

     Args:
         ds: Dataset object exposing ``shuffle``, ``take``, ``skip`` and
             ``batch`` (presumably a ``tf.data.Dataset`` -- confirm with callers).
         ds_size: Number of elements in ``ds``; used to compute partition sizes.
         train_split: Fraction of ``ds_size`` assigned to the training partition.
         val_split: Fraction of ``ds_size`` assigned to the validation partition.
         test_split: Fraction for the test partition. It is only used to
             validate that the fractions sum to 1; the test partition receives
             every element left after the train and validation partitions.
         shuffle: When true, shuffle ``ds`` once with a fixed seed before
             splitting.
         shuffle_size: Buffer size passed to that initial shuffle.
         batch_size: Batch size of each partition; each partition is also
             shuffled with a buffer of ``batch_size * 8`` before batching,
             regardless of ``shuffle``.

     Returns:
         A ``(train_ds, val_ds, test_ds)`` tuple of batched datasets.

     Raises:
         AssertionError: If the three fractions do not sum to 1 (within
             floating-point tolerance).
     """
     import math  # local import keeps this function self-contained

     # Fractions such as 0.6 + 0.3 + 0.1 evaluate to 0.9999999999999999 in
     # binary floating point, so an exact ``== 1`` check rejects valid input.
     total = train_split + test_split + val_split
     if not math.isclose(total, 1.0):
         # AssertionError is kept so existing callers see the same exception type.
         raise AssertionError(
             f"train_split + val_split + test_split must sum to 1, got {total!r}"
         )

     if shuffle:
         # Specify seed to always have the same split distribution between runs
         ds = ds.shuffle(shuffle_size, seed=12, reshuffle_each_iteration=False)

     # int() truncates, so any rounding remainder ends up in the test partition.
     train_size = int(train_split * ds_size)
     val_size = int(val_split * ds_size)
     split_buffer = batch_size * 8

     train_ds = ds.take(train_size).shuffle(buffer_size=split_buffer).batch(batch_size)
     val_ds = ds.skip(train_size).take(val_size).shuffle(buffer_size=split_buffer).batch(batch_size)
     test_ds = ds.skip(train_size).skip(val_size).shuffle(buffer_size=split_buffer).batch(batch_size)

     return train_ds, val_ds, test_ds
	def get_dataset_partitions_tf(ds, ds_size, train_split=0.7, val_split=0.15, test_split=0.15, shuffle=True, shuffle_size=10000, batch_size=32):
		"""Split a dataset into batched train / validation / test partitions.

		Args:
			ds: Dataset object exposing ``shuffle``, ``take``, ``skip`` and
				``batch`` (presumably a ``tf.data.Dataset`` -- confirm with callers).
			ds_size: Number of elements in ``ds``; used to compute partition sizes.
			train_split: Fraction of ``ds_size`` assigned to the training partition.
			val_split: Fraction of ``ds_size`` assigned to the validation partition.
			test_split: Fraction for the test partition. It is only used to
				validate that the fractions sum to 1; the test partition receives
				every element left after the train and validation partitions.
			shuffle: When true, shuffle ``ds`` once with a fixed seed before
				splitting.
			shuffle_size: Buffer size passed to that initial shuffle.
			batch_size: Batch size of each partition; each partition is also
				shuffled with a buffer of ``batch_size * 8`` before batching,
				regardless of ``shuffle``.

		Returns:
			A ``(train_ds, val_ds, test_ds)`` tuple of batched datasets.

		Raises:
			AssertionError: If the three fractions do not sum to 1 (within
				floating-point tolerance).
		"""
		import math  # local import keeps this function self-contained

		# Fractions such as 0.6 + 0.3 + 0.1 evaluate to 0.9999999999999999 in
		# binary floating point, so an exact ``== 1`` check rejects valid input.
		total = train_split + test_split + val_split
		if not math.isclose(total, 1.0):
			# AssertionError is kept so existing callers see the same exception type.
			raise AssertionError(
				f"train_split + val_split + test_split must sum to 1, got {total!r}"
			)

		if shuffle:
			# Specify seed to always have the same split distribution between runs
			ds = ds.shuffle(shuffle_size, seed=12, reshuffle_each_iteration=False)

		# int() truncates, so any rounding remainder ends up in the test partition.
		train_size = int(train_split * ds_size)
		val_size = int(val_split * ds_size)
		split_buffer = batch_size * 8

		train_ds = ds.take(train_size).shuffle(buffer_size=split_buffer).batch(batch_size)
		val_ds = ds.skip(train_size).take(val_size).shuffle(buffer_size=split_buffer).batch(batch_size)
		test_ds = ds.skip(train_size).skip(val_size).shuffle(buffer_size=split_buffer).batch(batch_size)

		return train_ds, val_ds, test_ds
No results found