Created
June 4, 2026 08:26
-
-
Save lordlinus/db5ce3bb84a98328bc37d99475d09f01 to your computer and use it in GitHub Desktop.
SCB Thai TTS PLS lexicon for Azure Voice Live
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| <?xml version="1.0" encoding="UTF-8"?> | |
| <lexicon version="1.0" | |
| xmlns="http://www.w3.org/2005/01/pronunciation-lexicon" | |
| xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" | |
| xsi:schemaLocation="http://www.w3.org/2005/01/pronunciation-lexicon | |
| http://www.w3.org/TR/2007/CR-pronunciation-lexicon-20071212/pls.xsd" | |
| alphabet="ipa" xml:lang="th-TH"> | |
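| <!-- | |
| SCOPE: Only override words the th-TH voice mispronounces or symbols it does | |
| not expand. Numbers, dates, and currency AMOUNTS are read correctly by the | |
| native voice and are intentionally NOT listed (overriding them risks | |
| regressions, and a lexeme only matches an exact, isolated token). All phonemes | |
| use IPA in decomposed Unicode (NFD), as required by Azure custom lexicon. | |
| NOTE(review): the month names and everyday words listed below appear to fall | |
| outside this stated scope; confirm that each one is actually mispronounced by | |
| the voice before keeping it. | |
| --> | |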
| <!-- THAI CURRENCY | |
| Alias entries: the grapheme is replaced by Thai text rather than given a | |
| phoneme string. | |
| ฿ (baht sign) is read as บาท (baht) | |
| THB (currency code) is read as บาทไทย (Thai baht) | |
| --> | |
| <lexeme> | |
| <grapheme>฿</grapheme> | |
| <alias>บาท</alias> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>THB</grapheme> | |
| <alias>บาทไทย</alias> | |
| </lexeme> | |
| <!-- COMMON THAI WORDS & PHRASES | |
| IPA overrides; tone is written as a diacritic on the vowel and an unmarked | |
| vowel is mid tone. | |
| สวัสดี hello | |
| ค่ะ polite sentence-final particle (female speaker) | |
| ครับ polite sentence-final particle (male speaker) | |
| ใช่ yes | |
| ไม่ no / not | |
| --> | |
| <lexeme> | |
| <grapheme>สวัสดี</grapheme> | |
| <phoneme>sà.wàt.diː</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>ค่ะ</grapheme> | |
| <phoneme>kʰâ</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>ครับ</grapheme> | |
| <phoneme>kʰráp</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>ใช่</grapheme> | |
| <phoneme>tɕʰâj</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>ไม่</grapheme> | |
| <phoneme>mâj</phoneme> | |
| </lexeme> | |
| <!-- TIME EXPRESSIONS | |
| IPA overrides for parts of the day. | |
| เช้า morning (pronounced with a long vowel despite the short spelling, | |
| hence the length mark in the phoneme string) | |
| บ่าย afternoon | |
| เย็น evening | |
| คืน night | |
| --> | |
| <lexeme> | |
| <grapheme>เช้า</grapheme> | |
| <phoneme>tɕʰáːw</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>บ่าย</grapheme> | |
| <phoneme>bàːj</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>เย็น</grapheme> | |
| <phoneme>jen</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>คืน</grapheme> | |
| <phoneme>kʰɯːn</phoneme> | |
| </lexeme> | |
| <!-- MONTHS (Jan-Jun) | |
| IPA overrides for the Thai month names January through June. | |
| The glide written ย is transcribed as IPA j. The letter y is NOT used for | |
| it, because in IPA y denotes the close front rounded vowel; using it would | |
| request a different sound than the one intended. | |
| --> | |
| <lexeme> | |
| <grapheme>มกราคม</grapheme> | |
| <phoneme>mók.kà.raː.kʰom</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>กุมภาพันธ์</grapheme> | |
| <phoneme>kum.pʰaː.pʰan</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>มีนาคม</grapheme> | |
| <phoneme>miː.naː.kʰom</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>เมษายน</grapheme> | |
| <phoneme>meː.sǎː.jon</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>พฤษภาคม</grapheme> | |
| <phoneme>pʰrɯ́t.sà.pʰaː.kʰom</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>มิถุนายน</grapheme> | |
| <phoneme>mí.tʰù.naː.jon</phoneme> | |
| </lexeme> | |
| <!-- MONTHS continued (Jul-Dec) | |
| IPA overrides for the Thai month names July through December. | |
| The glide written ย is transcribed as IPA j. The letter y is NOT used for | |
| it, because in IPA y denotes the close front rounded vowel; using it would | |
| request a different sound than the one intended. | |
| --> | |
| <lexeme> | |
| <grapheme>กรกฎาคม</grapheme> | |
| <phoneme>kà.rá.kà.daː.kʰom</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>สิงหาคม</grapheme> | |
| <phoneme>sǐŋ.hǎː.kʰom</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>กันยายน</grapheme> | |
| <phoneme>kan.jaː.jon</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>ตุลาคม</grapheme> | |
| <phoneme>tù.laː.kʰom</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>พฤศจิกายน</grapheme> | |
| <phoneme>pʰrɯ́t.sà.tɕì.kaː.jon</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>ธันวาคม</grapheme> | |
| <phoneme>tʰan.waː.kʰom</phoneme> | |
| </lexeme> | |
| <!-- COMMON FINANCIAL TERMS | |
| IPA overrides for banking vocabulary. | |
| สินเชื่อ credit / loan | |
| บัตรเครดิต credit card | |
| ดอกเบี้ย interest | |
| บัญชี account | |
| NOTE(review): the length mark inside the diphthong of ดอกเบี้ย (iːa) is | |
| unusual; confirm the voice accepts it and renders it as intended. | |
| --> | |
| <lexeme> | |
| <grapheme>สินเชื่อ</grapheme> | |
| <phoneme>sǐn.tɕʰɯ̂a</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>บัตรเครดิต</grapheme> | |
| <phoneme>bàt.kʰreː.dìt</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>ดอกเบี้ย</grapheme> | |
| <phoneme>dɔ̀ːk.bîːa</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>บัญชี</grapheme> | |
| <phoneme>ban.tɕʰiː</phoneme> | |
| </lexeme> | |
| <!-- FORMAL PARTICLES (high-frequency function words) | |
| These three are everyday function words rather than politeness particles. | |
| ที่ that / which / at | |
| เป็น to be | |
| มี to have / there is | |
| NOTE(review): every occurrence of these very common words is overridden; | |
| confirm that the voice really mispronounces them. | |
| --> | |
| <lexeme> | |
| <grapheme>ที่</grapheme> | |
| <phoneme>tʰîː</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>เป็น</grapheme> | |
| <phoneme>pen</phoneme> | |
| </lexeme> | |
| <lexeme> | |
| <grapheme>มี</grapheme> | |
| <phoneme>miː</phoneme> | |
| </lexeme> | |
| </lexicon> |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment