avanishgiri · November 12, 2013 08:03 · avanishgiri · Nov 12, 2013
diff --git a/frequencies.rb b/frequencies.rb
 # Returns the +k+ most frequent whitespace-separated words of +string+,
 # ordered from most to least frequent.
 #
 # Words are bucketed by their occurrence count (a counting sort), so the
 # work is linear in the number of words. Among words with the same count,
 # the one that first appears later in +string+ is ranked first.
 #
 # string - the text to analyse; runs of whitespace separate words.
 # k      - how many words to return. If fewer than +k+ distinct words
 #          exist, all of them are returned.
 #
 # Returns a flat Array of Strings (empty when there are no words or
 # +k+ is not positive).
 def word_frequencies(string, k)
   # No-argument split collapses runs of whitespace and drops leading
   # blanks, so empty strings are never counted as words.
   words = string.split
   return [] if words.empty? || k <= 0

   # word --> number of occurrences
   frequencies = words.each_with_object(Hash.new(0)) do |word, counts|
     counts[word] += 1
   end

   # Counting sort: buckets[f] collects the words seen exactly f times,
   # in the order they were first encountered.
   buckets = Array.new(frequencies.values.max + 1) { [] }
   frequencies.each { |word, frequency| buckets[frequency] << word }

   # Flattening gives ascending frequency; reversing puts the most
   # frequent words first. first(k) never over-runs a short list.
   buckets.flatten.reverse.first(k)
 end


 # Demo: print the four most frequent words of a sample sentence.
 text = "hi hello hi my name is what what hi hello hi this is a test test test test hi hi hi what hello these are some words these these"

 top_words = word_frequencies(text, 4)
 p top_words
	# Returns the +k+ most frequent whitespace-separated words of +string+,
	# ordered from most to least frequent.
	#
	# Words are bucketed by their occurrence count (a counting sort), so the
	# work is linear in the number of words. Among words with the same count,
	# the one that first appears later in +string+ is ranked first.
	#
	# string - the text to analyse; runs of whitespace separate words.
	# k      - how many words to return. If fewer than +k+ distinct words
	#          exist, all of them are returned.
	#
	# Returns a flat Array of Strings (empty when there are no words or
	# +k+ is not positive).
	def word_frequencies(string, k)
		# No-argument split collapses runs of whitespace and drops leading
		# blanks, so empty strings are never counted as words.
		words = string.split
		return [] if words.empty? || k <= 0

		# word --> number of occurrences
		frequencies = words.each_with_object(Hash.new(0)) do |word, counts|
			counts[word] += 1
		end

		# Counting sort: buckets[f] collects the words seen exactly f times,
		# in the order they were first encountered.
		buckets = Array.new(frequencies.values.max + 1) { [] }
		frequencies.each { |word, frequency| buckets[frequency] << word }

		# Flattening gives ascending frequency; reversing puts the most
		# frequent words first. first(k) never over-runs a short list.
		buckets.flatten.reverse.first(k)
	end


	# Demo: print the four most frequent words of a sample sentence.
	text = "hi hello hi my name is what what hi hello hi this is a test test test test hi hi hi what hello these are some words these these"

	top_words = word_frequencies(text, 4)
	p top_words