dreamr · December 28, 2015 01:19 · dreamr · Nov 11, 2013
diff --git a/split_dict b/split_dict
 #!/usr/bin/env ruby
 # encoding: utf-8

 # So this is basically a data flow problem
 # I could have gotten lambda on it, made it lazy
 # and that would speed this up a lot. However, it
 # would not be readable by anyone who isn't into
 # functional coding and lambda madness (tm)

 # Returns every run of four consecutive letters found in +string+,
 # upcased, in order of appearance (repeats are kept).
 #
 # Everything that is not an ASCII letter is removed before the windows are
 # taken, so letters on either side of a digit, underscore or punctuation
 # mark become neighbours. Underscores are removed explicitly: a \W-based
 # filter would keep them, because "_" counts as a word character.
 #
 # string - the String to scan.
 #
 # Returns an Array of 4-character Strings; empty when fewer than four
 # letters remain.
 def get_sequences(string)
   letters = string.delete('^A-Za-z').upcase.chars
   # each_cons yields only full-width windows, so no short tail slices
   # have to be filtered out afterwards.
   letters.each_cons(4).map(&:join)
 end

 # Maps each dictionary word to its four-letter sequences.
 #
 # dict_lines - either a collection of lines (e.g. the Array returned by
 #              File.readlines) or a single String holding one word per
 #              line.
 #
 # The line terminator is chomped off each word before it is used as a key,
 # so keys never carry a trailing "\n". The hash is filled in place;
 # building it with Hash#merge would copy the whole hash once per word.
 #
 # Returns a Hash of word String => Array returned by get_sequences.
 def dict_to_hash(dict_lines)
   # A String is not Enumerable, so walk it line by line instead.
   lines = dict_lines.respond_to?(:each_line) ? dict_lines.each_line : dict_lines
   lines.each_with_object({}) do |line, hash|
     word = line.chomp
     hash[word] = get_sequences(word)
   end
 end

 # Writes the results to "words.txt" and "sequences.txt" in the current
 # directory.
 #
 # hash - Hash of word => Array of sequences.
 #
 # Every word that has at least one sequence gets a line in words.txt, and
 # its distinct sequences get one line each in sequences.txt, in the hash's
 # iteration order. Words with no sequences are skipped entirely.
 #
 # Both files are opened once in "w" mode, which truncates earlier output
 # and creates the file when it is absent. Deleting the files up front
 # would raise Errno::ENOENT on a first run, and appending per word would
 # reopen both files for every entry.
 def log_results(hash)
   File.open("words.txt", "w") do |words_file|
     File.open("sequences.txt", "w") do |sequences_file|
       hash.each do |word, sequences|
         next if sequences.empty?
         words_file.puts word
         # puts writes each element of a non-empty Array on its own line.
         sequences_file.puts sequences.uniq
       end
     end
   end
 end

 # Script entry point: reads every line of "dictionary.txt", converts the
 # lines with dict_to_hash and hands the resulting hash to log_results.
 def split_that_shit!
   log_results(dict_to_hash(File.readlines("dictionary.txt")))
 end

 # Kick off the run; this executes unconditionally whenever the file is loaded.
 split_that_shit!

 require 'minitest/autorun'

 # Spec for log_results: feeds it a small word => sequences hash and checks
 # both output files. '10th' has no sequences, so it must not show up.
 describe "#log_results" do
   let(:hash) {{
     'Aarhus' => %w(AARH ARHU RHUS),
     '10th' => [],
     'AAAS' => %w(AAAS)
   }}

   it "must log the sequences" do
     log_results(hash)
     File.read("words.txt").must_equal(
       "Aarhus\nAAAS\n"
     )
     # The example promises sequences, so sequences.txt is checked as well.
     File.read("sequences.txt").must_equal(
       "AARH\nARHU\nRHUS\nAAAS\n"
     )
   end
 end

 # Spec for dict_to_hash: a three-word dictionary must come back as a hash
 # of word => sequences.
 describe "#dict_to_hash" do
   let(:dictionary) { "Aarhus\n10th\nAAAS\n" }
   let(:expected) do
     {
       'Aarhus' => %w(AARH ARHU RHUS),
       '10th' => [],
       'AAAS' => %w(AAAS)
     }
   end

   it "must return a hash" do
     dict_to_hash(dictionary).must_equal(expected)
   end
 end

 # Specs for get_sequences, one example per sample dictionary entry.
 describe "#get_sequences" do
   it "will correctly get da sequences for 'Aarhus'" do
     get_sequences("Aarhus").must_equal(%w(AARH ARHU RHUS))
   end

   it "will correctly get da sequences for '10th'" do
     get_sequences("10th").must_equal([])
   end

   it "will correctly get da sequences for 'AAAS'" do
     get_sequences("AAAS").must_equal(%w(AAAS))
   end
 end
	#!/usr/bin/env ruby
	# encoding: utf-8

	# So this is basically a data flow problem
	# I could have gotten lambda on it, made it lazy
	# and that would speed this up a lot. However, it
	# would not be readable by anyone who isn't into
	# functional coding and lambda madness (tm)

	# Returns every run of four consecutive letters found in +string+,
	# upcased, in order of appearance (repeats are kept).
	#
	# Everything that is not an ASCII letter is removed before the windows are
	# taken, so letters on either side of a digit, underscore or punctuation
	# mark become neighbours. Underscores are removed explicitly: a \W-based
	# filter would keep them, because "_" counts as a word character.
	#
	# string - the String to scan.
	#
	# Returns an Array of 4-character Strings; empty when fewer than four
	# letters remain.
	def get_sequences(string)
	  letters = string.delete('^A-Za-z').upcase.chars
	  # each_cons yields only full-width windows, so no short tail slices
	  # have to be filtered out afterwards.
	  letters.each_cons(4).map(&:join)
	end

	# Maps each dictionary word to its four-letter sequences.
	#
	# dict_lines - either a collection of lines (e.g. the Array returned by
	#              File.readlines) or a single String holding one word per
	#              line.
	#
	# The line terminator is chomped off each word before it is used as a key,
	# so keys never carry a trailing "\n". The hash is filled in place;
	# building it with Hash#merge would copy the whole hash once per word.
	#
	# Returns a Hash of word String => Array returned by get_sequences.
	def dict_to_hash(dict_lines)
	  # A String is not Enumerable, so walk it line by line instead.
	  lines = dict_lines.respond_to?(:each_line) ? dict_lines.each_line : dict_lines
	  lines.each_with_object({}) do |line, hash|
	    word = line.chomp
	    hash[word] = get_sequences(word)
	  end
	end

	# Writes the results to "words.txt" and "sequences.txt" in the current
	# directory.
	#
	# hash - Hash of word => Array of sequences.
	#
	# Every word that has at least one sequence gets a line in words.txt, and
	# its distinct sequences get one line each in sequences.txt, in the hash's
	# iteration order. Words with no sequences are skipped entirely.
	#
	# Both files are opened once in "w" mode, which truncates earlier output
	# and creates the file when it is absent. Deleting the files up front
	# would raise Errno::ENOENT on a first run, and appending per word would
	# reopen both files for every entry.
	def log_results(hash)
	  File.open("words.txt", "w") do |words_file|
	    File.open("sequences.txt", "w") do |sequences_file|
	      hash.each do |word, sequences|
	        next if sequences.empty?
	        words_file.puts word
	        # puts writes each element of a non-empty Array on its own line.
	        sequences_file.puts sequences.uniq
	      end
	    end
	  end
	end

	# Script entry point: reads every line of "dictionary.txt", converts the
	# lines with dict_to_hash and hands the resulting hash to log_results.
	def split_that_shit!
	  log_results(dict_to_hash(File.readlines("dictionary.txt")))
	end

	# Kick off the run; this executes unconditionally whenever the file is loaded.
	split_that_shit!

	require 'minitest/autorun'

	# Spec for log_results: feeds it a small word => sequences hash and checks
	# both output files. '10th' has no sequences, so it must not show up.
	describe "#log_results" do
	  let(:hash) {{
	    'Aarhus' => %w(AARH ARHU RHUS),
	    '10th' => [],
	    'AAAS' => %w(AAAS)
	  }}

	  it "must log the sequences" do
	    log_results(hash)
	    File.read("words.txt").must_equal(
	      "Aarhus\nAAAS\n"
	    )
	    # The example promises sequences, so sequences.txt is checked as well.
	    File.read("sequences.txt").must_equal(
	      "AARH\nARHU\nRHUS\nAAAS\n"
	    )
	  end
	end

	# Spec for dict_to_hash: a three-word dictionary must come back as a hash
	# of word => sequences.
	describe "#dict_to_hash" do
	  let(:dictionary) { "Aarhus\n10th\nAAAS\n" }
	  let(:expected) do
	    {
	      'Aarhus' => %w(AARH ARHU RHUS),
	      '10th' => [],
	      'AAAS' => %w(AAAS)
	    }
	  end

	  it "must return a hash" do
	    dict_to_hash(dictionary).must_equal(expected)
	  end
	end

	# Specs for get_sequences, one example per sample dictionary entry.
	describe "#get_sequences" do
	  it "will correctly get da sequences for 'Aarhus'" do
	    get_sequences("Aarhus").must_equal(%w(AARH ARHU RHUS))
	  end

	  it "will correctly get da sequences for '10th'" do
	    get_sequences("10th").must_equal([])
	  end

	  it "will correctly get da sequences for 'AAAS'" do
	    get_sequences("AAAS").must_equal(%w(AAAS))
	  end
	end