Skip to content

Instantly share code, notes, and snippets.

@axiak
Created June 8, 2012 00:12
Show Gist options
  • Save axiak/2892539 to your computer and use it in GitHub Desktop.
Save axiak/2892539 to your computer and use it in GitHub Desktop.
name denormalizer
class NameDenormalizer(object):
def __init__(self, filename=None):
filename = filename or 'names1.1.csv'
lookup = collections.defaultdict(list)
with open(filename) as f:
reader = csv.reader(f)
for line in reader:
matches = set(line)
for match in matches:
lookup[match].append(matches)
self.lookup = lookup
def __getitem__(self, name):
name = name.lower()
if name not in self.lookup:
raise KeyError(name)
names = reduce(operator.or_, self.lookup[name])
if name in names:
names.remove(name)
return names
def get(self, name, default=None):
try:
return self[name]
except KeyError:
return default
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment