Keras Functional API Example
# Resource: https://keras.io/getting-started/functional-api-guide/
import keras.backend as K
from keras.datasets import mnist
from keras.layers import Dense, Input, Lambda
from keras.models import Model
from keras.optimizers import Adam
from keras.utils import to_categorical
import numpy as np

# Create an input layer, which allocates a tf.placeholder tensor.
input_tensor = Input(shape = (28, 28))

# I could use a Keras Flatten layer like this:
# from keras.layers import Flatten
# flattened_input = Flatten()(input_tensor)
#
# But here I will use the Keras interface to low-level TF. To do this, I
# create a "Lambda" layer. Lambda layers are custom layers in which I can
# run backend (TF) operations directly.
flatten_layer = Lambda(
    lambda ipt: K.reshape(ipt, (-1, 28 * 28))
)
flattened_input = flatten_layer(input_tensor)
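
# Optional sanity check: after the reshape, the static shape of the flattened
# tensor should be (None, 784), where None is the batch dimension.
print(K.int_shape(flattened_input))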

# Create a dense hidden layer and feed the flattened input into it.
# Note: it is more common to write Dense(10, activation = 'relu')(flattened_input)
# in a single step; the two-step version makes the layer/tensor distinction explicit.
hidden_layer = Dense(10, activation = 'relu')
hidden_output = hidden_layer(flattened_input)

output_layer = Dense(10, activation = 'softmax')
classification_output = output_layer(hidden_output)
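
# For reference, the same two layers in the more common chained style
# (an equivalent sketch of the two-step version above):
# hidden_output = Dense(10, activation = 'relu')(flattened_input)
# classification_output = Dense(10, activation = 'softmax')(hidden_output)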

# We specify which tensors will be fed in and which tensors are the
# final outputs of the model.
model = Model([input_tensor], [classification_output])
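# model.summary() prints the layer graph and parameter counts, a quick way
# to confirm everything got wired up as intended.
model.summary()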

# Build the optimizer.
LEARNING_RATE = 0.001
optimizer = Adam(lr = LEARNING_RATE)

# "Custom" loss function: a by-hand version of categorical cross-entropy.
def categorical_cross_entropy(y_true, y_pred):
    # Let's see what comes into this function. They should be TF Tensor objects.
    print(y_true)
    print(y_pred)

    # keras.backend is conventionally imported as K. It is the Keras
    # abstraction over TensorFlow; you're basically using a nicer interface
    # to TF here. This is lower level than the Keras layers API. K functions
    # typically manipulate TF tensors directly.
    #
    # Note I must use K.epsilon() because taking the log of a zero
    # probability gives -inf, which poisons the loss. The epsilon adds a
    # small nudge so nothing is exactly zero. This problem wouldn't happen
    # if I worked in logits, but I used softmax at the final layer.
    return K.mean(
        K.sum(y_true * -K.log(y_pred + K.epsilon()), axis = 1)
    )
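
# Optional: sanity-check the loss on a tiny hand-made batch with
# K.constant / K.eval. The numbers here are purely illustrative.
# _y_true = K.constant([[0., 1.], [1., 0.]])
# _y_pred = K.constant([[0.2, 0.8], [0.9, 0.1]])
# print(K.eval(categorical_cross_entropy(_y_true, _y_pred)))
# # => mean(-log(0.8), -log(0.9)) ~= 0.16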

model.compile(
    # This says to use our CE function. We could have just passed the string
    # 'categorical_crossentropy' and Keras would have looked up its built-in
    # version for us. The manual form is what you'd use for a fancier loss.
    loss = [categorical_cross_entropy],
    # You can have multiple outputs, in which case you specify one loss
    # (and one weight) per output. Of course, we have only one output here.
    loss_weights = [1.0],
    optimizer = optimizer,
    metrics = ['accuracy'],
)
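
# If the model had a second output (a hypothetical other_output), compile
# would take one loss and one weight per output, roughly like this:
# model = Model([input_tensor], [classification_output, other_output])
# model.compile(
#     loss = [categorical_cross_entropy, 'mse'],
#     loss_weights = [1.0, 0.5],
#     optimizer = optimizer,
# )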

# Download (if necessary) and load the MNIST dataset as numpy arrays.
(x_train, y_train), (x_test, y_test) = mnist.load_data()

x_mean = np.mean(x_train)
x_stddev = np.std(x_train)

# Normalize x values to zero mean and unit variance.
x_train = (x_train - x_mean) / x_stddev
x_test = (x_test - x_mean) / x_stddev

# One-hot encode the labels.
y_train = to_categorical(y_train, 10)
y_test = to_categorical(y_test, 10)
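
# to_categorical turns each integer label into a length-10 one-hot row, e.g.
# the digit 3 becomes [0, 0, 0, 1, 0, 0, 0, 0, 0, 0].
# print(y_train.shape, y_test.shape)  # expected: (60000, 10) (10000, 10)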

model.fit(
    x_train,
    y_train,
    validation_data = (x_test, y_test),
    epochs = 3
)
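
# After training, we can score the test set and peek at a few predictions.
# With metrics = ['accuracy'], evaluate returns [loss, accuracy].
test_loss, test_acc = model.evaluate(x_test, y_test)
print('test accuracy:', test_acc)
predictions = model.predict(x_test[:5])
print('predicted digits:', np.argmax(predictions, axis = 1))
print('true digits:', np.argmax(y_test[:5], axis = 1))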