serrasqueiro · November 2, 2024 19:02
diff --git a/pangram-de.md b/pangram-de.md
diff --git a/pangram-pt.md b/pangram-pt.md
diff --git a/pangrama.md b/pangrama.md
diff --git a/show.py b/show.py
 #!/usr/bin/env python
 # show.py -- (c)2024 Henrique Moreira

 """ Show west-european Pangrams
 """

 import unicodedata

 # More basic, but works for German lang. better!
 from unidecode import unidecode

 # Language codes handled by this script, in the order they are shown.
 LANG = ["pt", "de"]

 # English description for each language code listed in LANG.
 WHOT = {
     "pt": "portuguese",  # native name: Portugues (with a circumflex on the 'e')
     "de": "german",  # native name: Deutsch
 }

 def main():
     """ Print a heading and the pangram for every language code in LANG.

     The description of each code is looked up in WHOT, and the file name
     "pangram-<code>.md" is handed to show_pangram().
     """
     for code in LANG:
         print(f"Showing pangram for {code}: {WHOT[code]}")
         show_pangram(code, f"pangram-{code}.md")

 def strip_acc(astr:str) -> str:
     """ Return `astr` without accents.

     The string is decomposed with Unicode NFD normalization, then every
     character whose category is 'Mn' (non-spacing mark) is dropped.
     Characters that have no decomposition are returned unchanged.

     Technique referenced at:
     https://stackoverflow.com/questions/517923/what-is-the-best-way-to-remove-accents-normalize-in-a-python-unicode-string
     """
     decomposed = unicodedata.normalize('NFD', astr)
     kept = [char for char in decomposed if unicodedata.category(char) != 'Mn']
     return ''.join(kept)

 def show_pangram(lang:str, fname:str):
     """ Print the pangram stored in the UTF-8 text file `fname`.

     The file content is passed to pangram() together with `lang`; the
     result is printed as "- <pangram>" followed by an empty line.
     Always returns True.
     """
     with open(fname, "r", encoding="utf-8") as handle:
         content = handle.read()
     sentence = pangram(content, lang)
     print("-", sentence, end="\n\n")
     return True

 def pangram(text, lang=""):
     """ Return the pangram contained in `text`, reduced to plain ASCII.

     The pangram is the last line of `text` that is not blank and does not
     start with a space. Accents are removed with strip_acc().

     text: the whole content of a pangram file.
     lang: language code; only used in the warning message.

     Returns:
     - the accent-free pangram when it is pure ASCII;
     - "" when `text` has no candidate line (e.g. empty text);
     - "?" when non-ASCII characters remain after removing accents; in that
       case a warning and the unidecode() rendering of the line are printed.
     """
     candidates = [
         line for line in text.splitlines()
         if line.strip() and line[0] != ' '
     ]
     if not candidates:
         # Nothing to show; avoid IndexError on an empty candidate list.
         return ""
     last = candidates[-1]
     astr = strip_acc(last)
     # Dropping every non-ASCII character and comparing tells whether
     # `astr` was already pure ASCII.
     rec = astr.encode("ASCII", errors='ignore').decode("ASCII")
     if astr != rec:
         # Language codes such as "pt"/"de" are ISO 639-1 (ISO 3166-1 is countries).
         print("# Warning NFD for language (ISO 639-1 code):", lang)
         print("# last:", unidecode(last))
         return "?"
     return astr

 # Run main() only when this file is executed as a script, not when imported.
 if __name__ == "__main__":
    main()
	#!/usr/bin/env python
	# show.py -- (c)2024 Henrique Moreira

	""" Show west-european Pangrams
	"""

	import unicodedata

	# More basic, but works for German lang. better!
	from unidecode import unidecode

	# Language codes handled by this script, in the order they are shown.
	LANG = ["pt", "de"]

	# English description for each language code listed in LANG.
	WHOT = {
	    "pt": "portuguese",  # native name: Portugues (with a circumflex on the 'e')
	    "de": "german",  # native name: Deutsch
	}

	def main():
	    """ Print a heading and the pangram for every language code in LANG.

	    The description of each code is looked up in WHOT, and the file name
	    "pangram-<code>.md" is handed to show_pangram().
	    """
	    for language in LANG:
	        desc = WHOT[language]
	        print(f"Showing pangram for {language}: {desc}")
	        fname = f"pangram-{language}.md"
	        show_pangram(language, fname)

	def strip_acc(astr:str) -> str:
	    """ Return `astr` without accents.

	    The string is decomposed with Unicode NFD normalization, then every
	    character whose category is 'Mn' (non-spacing mark) is dropped.
	    Characters that have no decomposition are returned unchanged.

	    Technique referenced at:
	    https://stackoverflow.com/questions/517923/what-is-the-best-way-to-remove-accents-normalize-in-a-python-unicode-string
	    """
	    astr = ''.join(
	        achr for achr in unicodedata.normalize('NFD', astr)
	        if unicodedata.category(achr) != 'Mn'
	    )
	    return astr

	def show_pangram(lang:str, fname:str):
	    """ Print the pangram stored in the UTF-8 text file `fname`.

	    The file content is passed to pangram() together with `lang`; the
	    result is printed as "- <pangram>" followed by an empty line.
	    Always returns True.
	    """
	    with open(fname, "r", encoding="utf-8") as fdin:
	        astr = pangram(fdin.read(), lang)
	    print("-", astr, end="\n\n")
	    return True

	def pangram(text, lang=""):
	    """ Return the pangram contained in `text`, reduced to plain ASCII.

	    The pangram is the last line of `text` that is not blank and does not
	    start with a space. Accents are removed with strip_acc().

	    text: the whole content of a pangram file.
	    lang: language code; only used in the warning message.

	    Returns:
	    - the accent-free pangram when it is pure ASCII;
	    - "" when `text` has no candidate line (e.g. empty text);
	    - "?" when non-ASCII characters remain after removing accents; in that
	      case a warning and the unidecode() rendering of the line are printed.
	    """
	    candidates = [
	        line for line in text.splitlines()
	        if line.strip() and line[0] != ' '
	    ]
	    if not candidates:
	        # Nothing to show; avoid IndexError on an empty candidate list.
	        return ""
	    last = candidates[-1]
	    astr = strip_acc(last)
	    # Dropping every non-ASCII character and comparing tells whether
	    # `astr` was already pure ASCII.
	    rec = astr.encode("ASCII", errors='ignore').decode("ASCII")
	    if astr != rec:
	        # Language codes such as "pt"/"de" are ISO 639-1 (ISO 3166-1 is countries).
	        print("# Warning NFD for language (ISO 639-1 code):", lang)
	        print("# last:", unidecode(last))
	        return "?"
	    return astr

	# Run main() only when this file is executed as a script, not when imported.
	if __name__ == "__main__":
	    main()