🐗

Justin Evans eustin

🐗

Learning

eustin / letor-part-1-model-sentences.py

Created May 25, 2020 22:35

eustin / letor-part-1-model-tokeniser.py

Created May 25, 2020 22:35

	# Create a Keras text tokenizer and fit it on the corpus.
	# NOTE(review): `sentences` is not defined in any visible snippet —
	# presumably it comes from the "letor-part-1-model-sentences.py" gist; confirm.
	tokeniser = tf.keras.preprocessing.text.Tokenizer()
	tokeniser.fit_on_texts(sentences)

	# Display the fitted tokenizer's word -> integer index mapping.
	print(tokeniser.word_index)

eustin / letor-part-1-model-sequences.py

Created May 25, 2020 22:36

	# Encode every sentence as a list of integer word indices using the fitted
	# tokenizer, then print each encoded sentence on its own line.
	sequences = tokeniser.texts_to_sequences(sentences)
	for x in sequences:
	    print(x)

eustin / letor-part-1-model-vocab-size.py

Created May 25, 2020 22:37

	# One more than the largest index held by the tokenizer, so that the largest
	# index is itself a valid position in a table of VOCAB_SIZE rows.
	VOCAB_SIZE = 1 + max(tokeniser.index_word)
	print(f"VOCAB_SIZE: {VOCAB_SIZE}")

eustin / letor-part-1-model-skipgrams.py

Created May 25, 2020 22:38

	def make_skipgrams():
	    """Build skip-gram word pairs and labels from every encoded sentence.

	    Reads the module-level ``sequences`` and ``VOCAB_SIZE``. Each sequence is
	    passed to ``tf.keras.preprocessing.sequence.skipgrams`` with
	    ``window_size=1``, ``negative_samples=1.0`` and ``shuffle=True``; the
	    resulting pairs and labels are accumulated across all sequences.

	    NOTE(review): the visible snippet ends right after ``train_x`` is turned
	    into an array, with no ``return`` statement shown. The training loop
	    unpacks three values from this function, so a return presumably follows
	    in the full gist — confirm before relying on this definition.
	    """
	    train_x, all_labels = [], []
	    for sequence in sequences:
	        pairs, labels = tf.keras.preprocessing.sequence.skipgrams(
	            sequence, VOCAB_SIZE, negative_samples=1.0, window_size=1, shuffle=True
	        )
	        train_x.extend(pairs)
	        all_labels.extend(labels)

	    # Stack the accumulated pairs into a single array.
	    train_x = np.array(train_x)

eustin / letor-part-1-model-model-arch.py

Created May 25, 2020 22:40

	# --- inputs: two integer inputs of shape (1,), one per word of a pair ---
	content_input = tf.keras.layers.Input(
	    shape=(1, ),
	    dtype=tf.int32,
	    name='content_word',
	)
	context_input = tf.keras.layers.Input(
	    shape=(1, ),
	    dtype=tf.int32,
	    name='context_word',
	)

	# --- layers ---
	# One embedding layer (VOCAB_SIZE entries, 2 outputs each) used for both inputs.
	embeddings = tf.keras.layers.Embedding(
	    input_dim=VOCAB_SIZE,
	    output_dim=2,
	    name='embeddings',
	)
	# Normalised dot product over axis 2; constructed here but not applied
	# anywhere in the visible snippet.
	dot_prod = tf.keras.layers.Dot(
	    axes=2,
	    normalize=True,
	    name='dot_product',
	)

	# --- graph: pass both inputs through the same embedding layer ---
	content_embedding = embeddings(content_input)
	context_embedding = embeddings(context_input)

eustin / letor-part-1-model-training-loop.py

Last active May 27, 2020 20:41

	# NOTE(review): nothing in the visible snippet adds to loss_hist; the gist
	# preview may be cut off before that happens — confirm.
	loss_hist = []

	# Run 20 single-epoch fits, printing the loss after each one.
	# Assumes content_words, context_words and labels already exist before the
	# first pass (e.g. from an earlier make_skipgrams() call) — TODO confirm.
	for i in range(20):
	    # From the second pass onwards, call make_skipgrams() again to get a new
	    # set of training pairs and labels.
	    if i > 0:
	        content_words, context_words, labels = make_skipgrams()

	    hist = model.fit([content_words, context_words], labels, epochs=1, verbose=0)
	    print(f"loss: {hist.history['loss'][-1]:.4f}")

eustin / letor-part-2-packages.py

Created June 8, 2020 03:24

	import itertools
	import random

	import matplotlib.pyplot as plt
	import numpy as np

	# Seed both the standard-library and NumPy random generators with 1.
	random.seed(1)
	np.random.seed(1)

	# Use the 'ggplot' matplotlib style for all plots.
	plt.style.use('ggplot')

eustin / letor-part-2-objects-to-rank.py

Created June 8, 2020 03:29

# Set of the three item names that serve as the objects to rank.
objects_to_rank = {
    'dress',
    'shirt',
    'pants',
}

eustin / letor-part-2-all-permutations.py

Created June 8, 2020 03:30

	# Every ordering of the objects, as a list of tuples. objects_to_rank is a
	# set of strings, whose iteration order can differ between interpreter runs,
	# so the permutations are sorted once here to give the list a stable order.
	all_permutations = sorted(itertools.permutations(objects_to_rank))

	for x in all_permutations:
	    print(x)