February 10, 2016 04:27
diff --git a/convert-html-entities.py b/convert-html-entities.py
 import html
 import re

 # Lookup table used when rewriting numeric character references.
 # Key:   decimal code point of a Private Use Area character (U+F701..U+F714),
 #        exactly as it appears between "&#" and ";".
 # Value: numeric character reference of the standard Thai combining mark
 #        (U+0E31..U+0E4C) to emit instead.
 # NOTE(review): the PUA code points look like font-specific positional
 # variants of these marks -- confirm against the tool that produced the HTML.
 pua = {
     # above-base vowels
     '63233': '&#3636;',  # U+F701 -> U+0E34 SARA I
     '63234': '&#3637;',  # U+F702 -> U+0E35 SARA II
     '63235': '&#3638;',  # U+F703 -> U+0E36 SARA UE
     '63236': '&#3639;',  # U+F704 -> U+0E37 SARA UEE
     # tone marks
     '63237': '&#3656;',  # U+F705 -> U+0E48 MAI EK
     '63238': '&#3657;',  # U+F706 -> U+0E49 MAI THO
     '63242': '&#3656;',  # U+F70A -> U+0E48 MAI EK
     '63243': '&#3657;',  # U+F70B -> U+0E49 MAI THO
     # other marks
     '63246': '&#3660;',  # U+F70E -> U+0E4C THANTHAKHAT
     '63248': '&#3633;',  # U+F710 -> U+0E31 MAI HAN-AKAT
     '63250': '&#3655;',  # U+F712 -> U+0E47 MAITAIKHU
     # tone marks (third set of PUA positions)
     '63251': '&#3656;',  # U+F713 -> U+0E48 MAI EK
     '63252': '&#3657;',  # U+F714 -> U+0E49 MAI THO
 }

 def thaiPUA(matchobj):
     """Return the replacement text for one matched numeric character reference.

     Intended for use as the replacement callback of ``re.sub``.

     Args:
         matchobj: A regex match object. Group 1 must be the decimal code
             point of the reference; group 0 is the whole reference.

     Returns:
         The ``pua`` entry for that code point when one exists. Otherwise the
         matched text is returned unchanged, so references that are not in
         the table pass through instead of aborting with ``KeyError``.
     """
     return pua.get(matchobj.group(1), matchobj.group(0))

 # Decimal numeric character references with five or more digits;
 # group 1 captures the digits.
 p = re.compile(r'\&\#(\d{5,})\;')

 # The input is opened first so that a missing input file does not leave a
 # truncated 'new.html' behind, and ``with`` closes both files even when a
 # line fails to convert.
 # The encoding is explicit because the output contains Thai characters and
 # the platform default encoding may not be able to represent them.
 # NOTE(review): assumes the input is UTF-8 (or pure ASCII with entities) --
 # confirm against the actual file.
 with open('constitution-draft-20160129.html', 'r', encoding='utf-8') as inputf, \
         open('new.html', 'w', encoding='utf-8') as outputf:
     for line in inputf:
         # First swap the table's references, then decode every remaining
         # HTML entity in the line.
         text = p.sub(thaiPUA, line)
         # write() rather than writelines(): the argument is a single string,
         # which writelines() would iterate one character at a time.
         outputf.write(html.unescape(text))
	import html
	import re

	# Lookup table used when rewriting numeric character references.
	# Key:   decimal code point of a Private Use Area character (U+F701..U+F714),
	#        exactly as it appears between "&#" and ";".
	# Value: the standard Thai combining mark (U+0E31..U+0E4C) to emit instead,
	#        stored here as the literal character.
	# NOTE(review): the PUA code points look like font-specific positional
	# variants of these marks -- confirm against the tool that produced the HTML.
	pua = {
		# above-base vowels
		'63233': 'ิ',  # U+F701 -> U+0E34 SARA I
		'63234': 'ี',  # U+F702 -> U+0E35 SARA II
		'63235': 'ึ',  # U+F703 -> U+0E36 SARA UE
		'63236': 'ื',  # U+F704 -> U+0E37 SARA UEE
		# tone marks
		'63237': '่',  # U+F705 -> U+0E48 MAI EK
		'63238': '้',  # U+F706 -> U+0E49 MAI THO
		'63242': '่',  # U+F70A -> U+0E48 MAI EK
		'63243': '้',  # U+F70B -> U+0E49 MAI THO
		# other marks
		'63246': '์',  # U+F70E -> U+0E4C THANTHAKHAT
		'63248': 'ั',  # U+F710 -> U+0E31 MAI HAN-AKAT
		'63250': '็',  # U+F712 -> U+0E47 MAITAIKHU
		# tone marks (third set of PUA positions)
		'63251': '่',  # U+F713 -> U+0E48 MAI EK
		'63252': '้',  # U+F714 -> U+0E49 MAI THO
	}

	def thaiPUA(matchobj):
		"""Return the replacement text for one matched numeric character reference.

		Intended for use as the replacement callback of ``re.sub``.

		Args:
			matchobj: A regex match object. Group 1 must be the decimal code
				point of the reference; group 0 is the whole reference.

		Returns:
			The ``pua`` entry for that code point when one exists. Otherwise the
			matched text is returned unchanged, so references that are not in
			the table pass through instead of aborting with ``KeyError``.
		"""
		return pua.get(matchobj.group(1), matchobj.group(0))

	# Decimal numeric character references with five or more digits;
	# group 1 captures the digits.
	p = re.compile(r'\&\#(\d{5,})\;')

	# The input is opened first so that a missing input file does not leave a
	# truncated 'new.html' behind, and ``with`` closes both files even when a
	# line fails to convert.
	# The encoding is explicit because the output contains Thai characters and
	# the platform default encoding may not be able to represent them.
	# NOTE(review): assumes the input is UTF-8 (or pure ASCII with entities) --
	# confirm against the actual file.
	with open('constitution-draft-20160129.html', 'r', encoding='utf-8') as inputf, \
			open('new.html', 'w', encoding='utf-8') as outputf:
		for line in inputf:
			# First swap the table's references, then decode every remaining
			# HTML entity in the line.
			text = p.sub(thaiPUA, line)
			# write() rather than writelines(): the argument is a single string,
			# which writelines() would iterate one character at a time.
			outputf.write(html.unescape(text))
No results found