kevinrobinson · December 7, 2015 18:48
diff --git a/dictionary.py b/dictionary.py
 # example input:
 sentence = 'The quick brown fox jumped over the lazy dog.'

 # tokenize and normalize words, building the set of all vocabulary ever seen
 # (kept as a dict mapping word -> True, so `word in words_set` and
 # `words_set[word]` both work)
 words_set = {}


 def tokenize(sentence):
     """Return the lowercased words of `sentence` as a list.

     Surrounding whitespace is ignored and trailing sentence punctuation
     ('.', '!', '?') is removed only when it is actually present, so a
     sentence without a final period keeps its last letter. Words are split
     on any run of whitespace, so repeated spaces (or an empty sentence)
     never produce empty-string tokens.
     """
     return [word.lower() for word in sentence.strip().rstrip('.!?').split()]


 words_set.update((word, True) for word in tokenize(sentence))

 # build an index for the vocabulary; the words are sorted first so that the
 # numbering is reproducible -- plain dict iteration order differs between
 # Python versions (and between runs when string hashing is randomized)
 word2index = {word: index for index, word in enumerate(sorted(words_set))}
 index2word = {index: word for word, index in word2index.items()}

 # output:
 # >>> word2index
 # {'brown': 0, 'dog': 1, 'fox': 2, 'jumped': 3, 'lazy': 4, 'over': 5, 'quick': 6, 'the': 7}
 # >>> index2word
 # {0: 'brown', 1: 'dog', 2: 'fox', 3: 'jumped', 4: 'lazy', 5: 'over', 6: 'quick', 7: 'the'}
	# example input:
	sentence = 'The quick brown fox jumped over the lazy dog.'

	# tokenize and normalize words, building the set of all vocabulary ever seen
	# (kept as a dict mapping word -> True, so `word in words_set` and
	# `words_set[word]` both work)
	words_set = {}


	def tokenize(sentence):
	    """Return the lowercased words of `sentence` as a list.

	    Surrounding whitespace is ignored and trailing sentence punctuation
	    ('.', '!', '?') is removed only when it is actually present, so a
	    sentence without a final period keeps its last letter. Words are split
	    on any run of whitespace, so repeated spaces (or an empty sentence)
	    never produce empty-string tokens.
	    """
	    return [word.lower() for word in sentence.strip().rstrip('.!?').split()]


	words_set.update((word, True) for word in tokenize(sentence))

	# build an index for the vocabulary; the words are sorted first so that the
	# numbering is reproducible -- plain dict iteration order differs between
	# Python versions (and between runs when string hashing is randomized)
	word2index = {word: index for index, word in enumerate(sorted(words_set))}
	index2word = {index: word for word, index in word2index.items()}

	# output:
	# >>> word2index
	# {'brown': 0, 'dog': 1, 'fox': 2, 'jumped': 3, 'lazy': 4, 'over': 5, 'quick': 6, 'the': 7}
	# >>> index2word
	# {0: 'brown', 1: 'dog', 2: 'fox', 3: 'jumped', 4: 'lazy', 5: 'over', 6: 'quick', 7: 'the'}
No results found