-
Notifications
You must be signed in to change notification settings - Fork 0
/
searchindex.js
1 lines (1 loc) · 96.1 KB
/
searchindex.js
1
Search.setIndex({"alltitles": {"Additional Functions": [[1, "additional-functions"]], "BPEmbAug Class": [[1, "bpembaug-class"]], "Bigram": [[8, "bigram"]], "Citations": [[26, "citations"]], "Command Line": [[28, null]], "ConceptNet": [[6, "conceptnet"]], "Coreference Resolution Function": [[5, "coreference-resolution-function"]], "DEFAULT_SPELL_CHECKER": [[14, "default-spell-checker"]], "Definition": [[6, "definition"]], "Dependencies": [[24, "dependencies"]], "EntityLinker": [[7, "entitylinker"]], "Example": [[7, "example"], [8, "example"], [9, "example"], [11, "example"]], "FAQ": [[27, null], [30, "faq"]], "FastTextAug and Thai2transformersAug Classes": [[1, "fasttextaug-and-thai2transformersaug-classes"]], "Functions": [[2, "functions"]], "Getting Started": [[29, null]], "Indices and tables": [[26, "indices-and-tables"]], "Installation": [[30, null]], "Introduction": [[1, "introduction"], [2, "introduction"], [5, "introduction"]], "KeyBERT": [[15, "keybert"]], "Keyword Extraction Engines": [[15, "keyword-extraction-engines"]], "KhaveeVerifier": [[9, "khaveeverifier"]], "License": [[31, null]], "Modules": [[0, "modules"], [6, "modules"], [8, "modules"], [9, "modules"], [11, "modules"], [12, "modules"], [13, "modules"], [14, "modules"], [15, "modules"], [16, "modules"], [17, "modules"], [18, "modules"], [19, "modules"], [20, "modules"], [21, "modules"], [22, "modules"], [23, "modules"], [24, "modules"], [25, "modules"]], "NorvigSpellChecker": [[14, "norvigspellchecker"]], "Notes": [[26, null]], "OSCAR": [[6, "oscar"]], "Package reference:": [[26, null]], "PyThaiNLP documentation": [[26, null]], "Quality Evaluation": [[2, "quality-evaluation"]], "References": [[13, "references"], [14, "references"], [16, "references"], [20, "references"], [22, "references"], [23, "references"], [24, "references"]], "Runtime Configurations": [[30, "runtime-configurations"]], "Sentence level": [[17, "sentence-level"]], "Subword level": [[17, "subword-level"]], "Synset": [[6, "synset"]], "Tagger Engines": [[16, "tagger-engines"]], "TextAugment Class": [[1, "textaugment-class"]], "Tokenization": [[2, "tokenization"]], "Tokenization Engines": [[17, "tokenization-engines"]], "Transliteration Engines": [[20, "transliteration-engines"]], "Trigram": [[8, "trigram"]], "Tutorial Notebooks": [[29, "tutorial-notebooks"]], "Unigram": [[8, "unigram"]], "Usage": [[2, "usage"], [5, "usage"], [8, "usage"], [11, "usage"]], "Util": [[6, "util"]], "Word level": [[17, "word-level"]], "Word2VecAug, Thai2fitAug, LTW2VAug Classes": [[1, "word2vecaug-thai2fitaug-ltw2vaug-classes"]], "WordNet": [[6, "wordnet"]], "WordNetAug Class": [[1, "wordnetaug-class"]], "correct": [[14, "correct"]], "correct_sent": [[14, "correct-sent"]], "countries": [[6, "countries"]], "dependency_parsing": [[11, "dependency-parsing"]], "download": [[6, "download"]], "find_synonym": [[6, "find-synonym"]], "get_corpus": [[6, "get-corpus"]], "get_corpus_as_is": [[6, "get-corpus-as-is"]], "get_corpus_db": [[6, "get-corpus-db"]], "get_corpus_db_detail": [[6, "get-corpus-db-detail"]], "get_corpus_default_db": [[6, "get-corpus-default-db"]], "get_corpus_path": [[6, "get-corpus-path"]], "lk82": [[13, "lk82"]], "metasound": [[13, "metasound"]], "perceptron": [[16, "perceptron"]], "prayut_and_somchaip": [[13, "prayut-and-somchaip"]], "provinces": [[6, "provinces"]], "pythainlp.ancient": [[0, null]], "pythainlp.augment": [[1, null]], "pythainlp.benchmarks": [[2, null]], "pythainlp.chat": [[3, null]], "pythainlp.classify": [[4, null]], "pythainlp.coref": [[5, null]], "pythainlp.corpus": [[6, null]], "pythainlp.corpus.conceptnet.edges": [[6, "pythainlp-corpus-conceptnet-edges"]], "pythainlp.corpus.oscar.unigram_word_freqs": [[6, "pythainlp-corpus-oscar-unigram-word-freqs"]], "pythainlp.corpus.oscar.word_freqs": [[6, "pythainlp-corpus-oscar-word-freqs"]], "pythainlp.corpus.th_en_translit.get_transliteration_dict": [[6, "pythainlp-corpus-th-en-translit-get-transliteration-dict"]], "pythainlp.corpus.tnc.bigram_word_freqs": [[6, "pythainlp-corpus-tnc-bigram-word-freqs"]], "pythainlp.corpus.tnc.trigram_word_freqs": [[6, "pythainlp-corpus-tnc-trigram-word-freqs"]], "pythainlp.corpus.tnc.unigram_word_freqs": [[6, "pythainlp-corpus-tnc-unigram-word-freqs"]], "pythainlp.corpus.tnc.word_freqs": [[6, "pythainlp-corpus-tnc-word-freqs"]], "pythainlp.corpus.ttc.unigram_word_freqs": [[6, "pythainlp-corpus-ttc-unigram-word-freqs"]], "pythainlp.corpus.ttc.word_freqs": [[6, "pythainlp-corpus-ttc-word-freqs"]], "pythainlp.corpus.util.find_badwords": [[6, "pythainlp-corpus-util-find-badwords"]], "pythainlp.corpus.util.revise_newmm_default_wordset": [[6, "pythainlp-corpus-util-revise-newmm-default-wordset"]], "pythainlp.corpus.util.revise_wordset": [[6, "pythainlp-corpus-util-revise-wordset"]], "pythainlp.corpus.wordnet.all_lemma_names": [[6, "pythainlp-corpus-wordnet-all-lemma-names"]], "pythainlp.corpus.wordnet.all_synsets": [[6, "pythainlp-corpus-wordnet-all-synsets"]], "pythainlp.corpus.wordnet.custom_lemmas": [[6, "pythainlp-corpus-wordnet-custom-lemmas"]], "pythainlp.corpus.wordnet.langs": [[6, "pythainlp-corpus-wordnet-langs"]], "pythainlp.corpus.wordnet.lch_similarity": [[6, "pythainlp-corpus-wordnet-lch-similarity"]], "pythainlp.corpus.wordnet.lemma": [[6, "pythainlp-corpus-wordnet-lemma"]], "pythainlp.corpus.wordnet.lemma_from_key": [[6, "pythainlp-corpus-wordnet-lemma-from-key"]], "pythainlp.corpus.wordnet.lemmas": [[6, "pythainlp-corpus-wordnet-lemmas"]], "pythainlp.corpus.wordnet.morphy": [[6, "pythainlp-corpus-wordnet-morphy"]], "pythainlp.corpus.wordnet.path_similarity": [[6, "pythainlp-corpus-wordnet-path-similarity"]], "pythainlp.corpus.wordnet.synset": [[6, "pythainlp-corpus-wordnet-synset"]], "pythainlp.corpus.wordnet.synsets": [[6, "pythainlp-corpus-wordnet-synsets"]], "pythainlp.corpus.wordnet.wup_similarity": [[6, "pythainlp-corpus-wordnet-wup-similarity"]], "pythainlp.el": [[7, null]], "pythainlp.generate": [[8, null]], "pythainlp.generate.thai2fit.gen_sentence": [[8, "pythainlp-generate-thai2fit-gen-sentence"]], "pythainlp.generate.wangchanglm.WangChanGLM": [[8, "pythainlp-generate-wangchanglm-wangchanglm"]], "pythainlp.khavee": [[9, null]], "pythainlp.morpheme": [[10, null]], "pythainlp.parse": [[11, null]], "pythainlp.phayathaibert": [[12, null]], "pythainlp.soundex": [[13, null]], "pythainlp.soundex.sound.audio_vector": [[13, "pythainlp-soundex-sound-audio-vector"]], "pythainlp.soundex.sound.word2audio": [[13, "pythainlp-soundex-sound-word2audio"]], "pythainlp.soundex.sound.word_approximation": [[13, "pythainlp-soundex-sound-word-approximation"]], "pythainlp.spell": [[14, null]], "pythainlp.summarize": [[15, null]], "pythainlp.tag": [[16, null]], "pythainlp.tokenize": [[17, null]], "pythainlp.tools": [[18, null]], "pythainlp.translate": [[19, null]], "pythainlp.transliterate": [[20, null]], "pythainlp.ulmfit": [[21, null]], "pythainlp.util": [[22, null]], "pythainlp.wangchanberta": [[23, null]], "pythainlp.word_vector": [[24, null]], "pythainlp.wsd": [[25, null]], "remove": [[6, "remove"]], "soundex": [[13, "soundex"]], "spell": [[14, "spell"]], "spell_sent": [[14, "spell-sent"]], "thai_dict": [[6, "thai-dict"]], "thai_family_names": [[6, "thai-family-names"]], "thai_female_names": [[6, "thai-female-names"]], "thai_male_names": [[6, "thai-male-names"]], "thai_negations": [[6, "thai-negations"]], "thai_orst_words": [[6, "thai-orst-words"]], "thai_stopwords": [[6, "thai-stopwords"]], "thai_syllables": [[6, "thai-syllables"]], "thai_synonyms": [[6, "thai-synonyms"]], "thai_words": [[6, "thai-words"]], "thai_wsd_dict": [[6, "thai-wsd-dict"]], "udom83": [[13, "udom83"]], "unigram": [[16, "unigram"]]}, "docnames": ["api/ancient", "api/augment", "api/benchmarks", "api/chat", "api/classify", "api/coref", "api/corpus", "api/el", "api/generate", "api/khavee", "api/morpheme", "api/parse", "api/phayathaibert", "api/soundex", "api/spell", "api/summarize", "api/tag", "api/tokenize", "api/tools", "api/translate", "api/transliterate", "api/ulmfit", "api/util", "api/wangchanberta", "api/word_vector", "api/wsd", "index", "notes/FAQ", "notes/command_line", "notes/getting_started", "notes/installation", "notes/license"], "envversion": {"sphinx": 64, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinx.ext.todo": 2, "sphinx.ext.viewcode": 1}, "filenames": ["api/ancient.rst", "api/augment.rst", "api/benchmarks.rst", "api/chat.rst", "api/classify.rst", "api/coref.rst", "api/corpus.rst", "api/el.rst", "api/generate.rst", "api/khavee.rst", "api/morpheme.rst", "api/parse.rst", "api/phayathaibert.rst", "api/soundex.rst", "api/spell.rst", "api/summarize.rst", "api/tag.rst", "api/tokenize.rst", "api/tools.rst", "api/translate.rst", "api/transliterate.rst", "api/ulmfit.rst", "api/util.rst", "api/wangchanberta.rst", "api/word_vector.rst", "api/wsd.rst", "index.rst", "notes/FAQ.rst", "notes/command_line.rst", "notes/getting_started.rst", "notes/installation.rst", "notes/license.rst"], "indexentries": {"__dict__ (pythainlp.khavee.khaveeverifier attribute)": [[9, "pythainlp.khavee.KhaveeVerifier.__dict__", false]], "__dict__ (pythainlp.spell.norvigspellchecker attribute)": [[14, "pythainlp.spell.NorvigSpellChecker.__dict__", false]], "__init__() (pythainlp.el.entitylinker method)": [[7, "pythainlp.el.EntityLinker.__init__", false]], "__init__() (pythainlp.generate.bigram method)": [[8, "pythainlp.generate.Bigram.__init__", false]], "__init__() (pythainlp.generate.trigram method)": [[8, "pythainlp.generate.Trigram.__init__", false]], "__init__() (pythainlp.generate.unigram method)": [[8, "pythainlp.generate.Unigram.__init__", false]], "__init__() (pythainlp.khavee.khaveeverifier method)": [[9, "pythainlp.khavee.KhaveeVerifier.__init__", false]], "__init__() (pythainlp.spell.norvigspellchecker method)": [[14, "pythainlp.spell.NorvigSpellChecker.__init__", false]], "__init__() (pythainlp.tag.ner method)": [[16, "pythainlp.tag.NER.__init__", false]], "__init__() (pythainlp.tag.nner method)": [[16, "pythainlp.tag.NNER.__init__", false]], "__init__() (pythainlp.tag.thainer.thainametagger method)": [[16, "pythainlp.tag.thainer.ThaiNameTagger.__init__", false]], "__init__() (pythainlp.tokenize.longest.longestmatchtokenizer method)": [[17, "pythainlp.tokenize.longest.LongestMatchTokenizer.__init__", false]], "__init__() (pythainlp.tokenize.multi_cut.latticestring method)": [[17, "pythainlp.tokenize.multi_cut.LatticeString.__init__", false]], "__init__() (pythainlp.tokenize.tokenizer method)": [[17, "pythainlp.tokenize.Tokenizer.__init__", false]], "__init__() (pythainlp.util.trie method)": [[22, "pythainlp.util.Trie.__init__", false]], "__init__() (pythainlp.util.trie.node method)": [[22, "pythainlp.util.Trie.Node.__init__", false]], "__module__ (pythainlp.khavee.khaveeverifier attribute)": [[9, "pythainlp.khavee.KhaveeVerifier.__module__", false]], "__module__ (pythainlp.spell.norvigspellchecker attribute)": [[14, "pythainlp.spell.NorvigSpellChecker.__module__", false]], "add() (pythainlp.util.trie method)": [[22, "pythainlp.util.Trie.add", false]], "aksonhan_to_current() (in module pythainlp.ancient)": [[0, "pythainlp.ancient.aksonhan_to_current", false]], "bigram (class in pythainlp.generate)": [[8, "pythainlp.generate.Bigram", false]], "check_aek_too() (pythainlp.khavee.khaveeverifier method)": [[9, "pythainlp.khavee.KhaveeVerifier.check_aek_too", false]], "check_karu_lahu() (pythainlp.khavee.khaveeverifier method)": [[9, "pythainlp.khavee.KhaveeVerifier.check_karu_lahu", false]], "check_klon() (pythainlp.khavee.khaveeverifier method)": [[9, "pythainlp.khavee.KhaveeVerifier.check_klon", false]], "check_marttra() (pythainlp.khavee.khaveeverifier method)": [[9, "pythainlp.khavee.KhaveeVerifier.check_marttra", false]], "check_sara() (pythainlp.khavee.khaveeverifier method)": [[9, "pythainlp.khavee.KhaveeVerifier.check_sara", false]], "children (pythainlp.util.trie.node attribute)": [[22, "pythainlp.util.Trie.Node.children", false]], "chunk_parse() (in module pythainlp.tag)": [[16, "pythainlp.tag.chunk_parse", false]], "coreference_resolution() (in module pythainlp.coref)": [[5, "pythainlp.coref.coreference_resolution", false]], "correct() (in module pythainlp.spell)": [[14, "pythainlp.spell.correct", false]], "correct() (pythainlp.spell.norvigspellchecker method)": [[14, "pythainlp.spell.NorvigSpellChecker.correct", false]], "correct_sent() (in module pythainlp.spell)": [[14, "pythainlp.spell.correct_sent", false]], "default_spell_checker (in module pythainlp.spell)": [[14, "pythainlp.spell.DEFAULT_SPELL_CHECKER", false]], "dependency_parsing() (in module pythainlp.parse)": [[11, "pythainlp.parse.dependency_parsing", false]], "dictionary() (pythainlp.spell.norvigspellchecker method)": [[14, "pythainlp.spell.NorvigSpellChecker.dictionary", false]], "end (pythainlp.util.trie.node attribute)": [[22, "pythainlp.util.Trie.Node.end", false]], "entitylinker (class in pythainlp.el)": [[7, "pythainlp.el.EntityLinker", false]], "environment variable": [[18, "index-0", false], [30, "envvar-PYTHAINLP_DATA_DIR", false], [30, "envvar-PYTHAINLP_READ_MODE", false]], "extract_keywords() (in module pythainlp.summarize)": [[15, "pythainlp.summarize.extract_keywords", false]], "find_all_segment() (in module pythainlp.tokenize.multi_cut)": [[17, "pythainlp.tokenize.multi_cut.find_all_segment", false]], "freq() (pythainlp.spell.norvigspellchecker method)": [[14, "pythainlp.spell.NorvigSpellChecker.freq", false]], "gen_sentence() (pythainlp.generate.bigram method)": [[8, "pythainlp.generate.Bigram.gen_sentence", false]], "gen_sentence() (pythainlp.generate.trigram method)": [[8, "pythainlp.generate.Trigram.gen_sentence", false]], "gen_sentence() (pythainlp.generate.unigram method)": [[8, "pythainlp.generate.Unigram.gen_sentence", false]], "get_el() (pythainlp.el.entitylinker method)": [[7, "pythainlp.el.EntityLinker.get_el", false]], "get_ner() (pythainlp.tag.thainer.thainametagger method)": [[16, "pythainlp.tag.thainer.ThaiNameTagger.get_ner", false]], "get_sense() (in module pythainlp.wsd)": [[25, "pythainlp.wsd.get_sense", false]], "handle_karun_sound_silence() (pythainlp.khavee.khaveeverifier method)": [[9, "pythainlp.khavee.KhaveeVerifier.handle_karun_sound_silence", false]], "is_sumpus() (pythainlp.khavee.khaveeverifier method)": [[9, "pythainlp.khavee.KhaveeVerifier.is_sumpus", false]], "khaveeverifier (class in pythainlp.khavee)": [[9, "pythainlp.khavee.KhaveeVerifier", false]], "known() (pythainlp.spell.norvigspellchecker method)": [[14, "pythainlp.spell.NorvigSpellChecker.known", false]], "latticestring (class in pythainlp.tokenize.multi_cut)": [[17, "pythainlp.tokenize.multi_cut.LatticeString", false]], "list_to_string() (in module pythainlp.tokenize.thaisumcut)": [[17, "pythainlp.tokenize.thaisumcut.list_to_string", false]], "lk82() (in module pythainlp.soundex)": [[13, "pythainlp.soundex.lk82", false]], "load_engine() (pythainlp.tag.ner method)": [[16, "pythainlp.tag.NER.load_engine", false]], "load_engine() (pythainlp.tag.nner method)": [[16, "pythainlp.tag.NNER.load_engine", false]], "longestmatchtokenizer (class in pythainlp.tokenize.longest)": [[17, "pythainlp.tokenize.longest.LongestMatchTokenizer", false]], "metasound() (in module pythainlp.soundex)": [[13, "pythainlp.soundex.metasound", false]], "middle_cut() (in module pythainlp.tokenize.thaisumcut)": [[17, "pythainlp.tokenize.thaisumcut.middle_cut", false]], "mmcut() (in module pythainlp.tokenize.multi_cut)": [[17, "pythainlp.tokenize.multi_cut.mmcut", false]], "module": [[17, "module-pythainlp.tokenize.etcc", false], [17, "module-pythainlp.tokenize.longest", false], [17, "module-pythainlp.tokenize.multi_cut", false], [17, "module-pythainlp.tokenize.newmm", false], [17, "module-pythainlp.tokenize.tcc", false], [17, "module-pythainlp.tokenize.tcc_p", false], [17, "module-pythainlp.tokenize.thaisumcut", false], [20, "module-pythainlp.transliterate.royin.romanize", false]], "ner (class in pythainlp.tag)": [[16, "pythainlp.tag.NER", false]], "nighit() (in module pythainlp.morpheme)": [[10, "pythainlp.morpheme.nighit", false]], "nner (class in pythainlp.tag)": [[16, "pythainlp.tag.NNER", false]], "norvigspellchecker (class in pythainlp.spell)": [[14, "pythainlp.spell.NorvigSpellChecker", false]], "pos_tag() (in module pythainlp.tag)": [[16, "pythainlp.tag.pos_tag", false]], "pos_tag_sents() (in module pythainlp.tag)": [[16, "pythainlp.tag.pos_tag_sents", false]], "prayut_and_somchaip() (in module pythainlp.soundex)": [[13, "pythainlp.soundex.prayut_and_somchaip", false]], "prefixes() (pythainlp.util.trie method)": [[22, "pythainlp.util.Trie.prefixes", false]], "prob() (pythainlp.generate.bigram method)": [[8, "pythainlp.generate.Bigram.prob", false]], "prob() (pythainlp.generate.trigram method)": [[8, "pythainlp.generate.Trigram.prob", false]], "prob() (pythainlp.spell.norvigspellchecker method)": [[14, "pythainlp.spell.NorvigSpellChecker.prob", false]], "pythainlp.tokenize.etcc": [[17, "module-pythainlp.tokenize.etcc", false]], "pythainlp.tokenize.longest": [[17, "module-pythainlp.tokenize.longest", false]], "pythainlp.tokenize.multi_cut": [[17, "module-pythainlp.tokenize.multi_cut", false]], "pythainlp.tokenize.newmm": [[17, "module-pythainlp.tokenize.newmm", false]], "pythainlp.tokenize.tcc": [[17, "module-pythainlp.tokenize.tcc", false]], "pythainlp.tokenize.tcc_p": [[17, "module-pythainlp.tokenize.tcc_p", false]], "pythainlp.tokenize.thaisumcut": [[17, "module-pythainlp.tokenize.thaisumcut", false]], "pythainlp.transliterate.royin.romanize": [[20, "module-pythainlp.transliterate.royin.romanize", false]], "pythainlp_data_dir": [[18, "index-0", false], [30, "envvar-PYTHAINLP_DATA_DIR", false]], "pythainlp_read_mode": [[30, "envvar-PYTHAINLP_READ_MODE", false]], "remove() (pythainlp.util.trie method)": [[22, "pythainlp.util.Trie.remove", false]], "segment() (in module pythainlp.tokenize.etcc)": [[17, "pythainlp.tokenize.etcc.segment", false]], "segment() (in module pythainlp.tokenize.longest)": [[17, "pythainlp.tokenize.longest.segment", false]], "segment() (in module pythainlp.tokenize.multi_cut)": [[17, "pythainlp.tokenize.multi_cut.segment", false]], "segment() (in module pythainlp.tokenize.newmm)": [[17, "pythainlp.tokenize.newmm.segment", false]], "segment() (in module pythainlp.tokenize.tcc)": [[17, "pythainlp.tokenize.tcc.segment", false]], "segment() (in module pythainlp.tokenize.tcc_p)": [[17, "pythainlp.tokenize.tcc_p.segment", false]], "set_tokenize_engine() (pythainlp.tokenize.tokenizer method)": [[17, "pythainlp.tokenize.Tokenizer.set_tokenize_engine", false]], "soundex() (in module pythainlp.soundex)": [[13, "pythainlp.soundex.soundex", false]], "spell() (in module pythainlp.spell)": [[14, "pythainlp.spell.spell", false]], "spell() (pythainlp.spell.norvigspellchecker method)": [[14, "pythainlp.spell.NorvigSpellChecker.spell", false]], "spell_sent() (in module pythainlp.spell)": [[14, "pythainlp.spell.spell_sent", false]], "split_into_sentences() (pythainlp.tokenize.thaisumcut.thaisentencesegmentor method)": [[17, "pythainlp.tokenize.thaisumcut.ThaiSentenceSegmentor.split_into_sentences", false]], "summarize() (in module pythainlp.summarize)": [[15, "pythainlp.summarize.summarize", false]], "tag() (pythainlp.tag.ner method)": [[16, "pythainlp.tag.NER.tag", false]], "tag() (pythainlp.tag.nner method)": [[16, "pythainlp.tag.NNER.tag", false]], "tag_provinces() (in module pythainlp.tag)": [[16, "pythainlp.tag.tag_provinces", false]], "tcc() (in module pythainlp.tokenize.tcc)": [[17, "pythainlp.tokenize.tcc.tcc", false]], "tcc() (in module pythainlp.tokenize.tcc_p)": [[17, "pythainlp.tokenize.tcc_p.tcc", false]], "tcc_pos() (in module pythainlp.tokenize.tcc)": [[17, "pythainlp.tokenize.tcc.tcc_pos", false]], "tcc_pos() (in module pythainlp.tokenize.tcc_p)": [[17, "pythainlp.tokenize.tcc_p.tcc_pos", false]], "thainametagger (class in pythainlp.tag.thainer)": [[16, "pythainlp.tag.thainer.ThaiNameTagger", false]], "thaisentencesegmentor (class in pythainlp.tokenize.thaisumcut)": [[17, "pythainlp.tokenize.thaisumcut.ThaiSentenceSegmentor", false]], "tokenize() (pythainlp.tokenize.longest.longestmatchtokenizer method)": [[17, "pythainlp.tokenize.longest.LongestMatchTokenizer.tokenize", false]], "tokenizer (class in pythainlp.tokenize)": [[17, "pythainlp.tokenize.Tokenizer", false]], "trie (class in pythainlp.util)": [[22, "pythainlp.util.Trie", false]], "trie.node (class in pythainlp.util)": [[22, "pythainlp.util.Trie.Node", false]], "trigram (class in pythainlp.generate)": [[8, "pythainlp.generate.Trigram", false]], "udom83() (in module pythainlp.soundex)": [[13, "pythainlp.soundex.udom83", false]], "unigram (class in pythainlp.generate)": [[8, "pythainlp.generate.Unigram", false]], "word_tokenize() (pythainlp.tokenize.tokenizer method)": [[17, "pythainlp.tokenize.Tokenizer.word_tokenize", false]]}, "objects": {"": [[30, 6, 1, "-", "PYTHAINLP_DATA_DIR"], [30, 6, 1, "-", "PYTHAINLP_READ_MODE"]], "pythainlp.ancient": [[0, 0, 1, "", "aksonhan_to_current"]], "pythainlp.coref": [[5, 0, 1, "", "coreference_resolution"]], "pythainlp.el": [[7, 1, 1, "", "EntityLinker"]], "pythainlp.el.EntityLinker": [[7, 2, 1, "", "__init__"], [7, 2, 1, "", "get_el"]], "pythainlp.generate": [[8, 1, 1, "", "Bigram"], [8, 1, 1, "", "Trigram"], [8, 1, 1, "", "Unigram"]], "pythainlp.generate.Bigram": [[8, 2, 1, "", "__init__"], [8, 2, 1, "", "gen_sentence"], [8, 2, 1, "", "prob"]], "pythainlp.generate.Trigram": [[8, 2, 1, "", "__init__"], [8, 2, 1, "", "gen_sentence"], [8, 2, 1, "", "prob"]], "pythainlp.generate.Unigram": [[8, 2, 1, "", "__init__"], [8, 2, 1, "", "gen_sentence"]], "pythainlp.khavee": [[9, 1, 1, "", "KhaveeVerifier"]], "pythainlp.khavee.KhaveeVerifier": [[9, 3, 1, "", "__dict__"], [9, 2, 1, "", "__init__"], [9, 3, 1, "", "__module__"], [9, 2, 1, "", "check_aek_too"], [9, 2, 1, "", "check_karu_lahu"], [9, 2, 1, "", "check_klon"], [9, 2, 1, "", "check_marttra"], [9, 2, 1, "", "check_sara"], [9, 2, 1, "", "handle_karun_sound_silence"], [9, 2, 1, "", "is_sumpus"]], "pythainlp.morpheme": [[10, 0, 1, "", "nighit"]], "pythainlp.parse": [[11, 0, 1, "", "dependency_parsing"]], "pythainlp.soundex": [[13, 0, 1, "", "lk82"], [13, 0, 1, "", "metasound"], [13, 0, 1, "", "prayut_and_somchaip"], [13, 0, 1, "", "soundex"], [13, 0, 1, "", "udom83"]], "pythainlp.spell": [[14, 4, 1, "", "DEFAULT_SPELL_CHECKER"], [14, 1, 1, "", "NorvigSpellChecker"], [14, 0, 1, "", "correct"], [14, 0, 1, "", "correct_sent"], [14, 0, 1, "", "spell"], [14, 0, 1, "", "spell_sent"]], "pythainlp.spell.NorvigSpellChecker": [[14, 3, 1, "", "__dict__"], [14, 2, 1, "", "__init__"], [14, 3, 1, "", "__module__"], [14, 2, 1, "", "correct"], [14, 2, 1, "", "dictionary"], [14, 2, 1, "", "freq"], [14, 2, 1, "", "known"], [14, 2, 1, "", "prob"], [14, 2, 1, "", "spell"]], "pythainlp.summarize": [[15, 0, 1, "", "extract_keywords"], [15, 0, 1, "", "summarize"]], "pythainlp.tag": [[16, 1, 1, "", "NER"], [16, 1, 1, "", "NNER"], [16, 0, 1, "", "chunk_parse"], [16, 0, 1, "", "pos_tag"], [16, 0, 1, "", "pos_tag_sents"], [16, 0, 1, "", "tag_provinces"]], "pythainlp.tag.NER": [[16, 2, 1, "", "__init__"], [16, 2, 1, "", "load_engine"], [16, 2, 1, "", "tag"]], "pythainlp.tag.NNER": [[16, 2, 1, "", "__init__"], [16, 2, 1, "", "load_engine"], [16, 2, 1, "", "tag"]], "pythainlp.tag.thainer": [[16, 1, 1, "", "ThaiNameTagger"]], "pythainlp.tag.thainer.ThaiNameTagger": [[16, 2, 1, "", "__init__"], [16, 2, 1, "", "get_ner"]], "pythainlp.tokenize": [[17, 1, 1, "", "Tokenizer"], [17, 5, 0, "-", "etcc"], [17, 5, 0, "-", "longest"], [17, 5, 0, "-", "multi_cut"], [17, 5, 0, "-", "newmm"], [17, 5, 0, "-", "tcc"], [17, 5, 0, "-", "tcc_p"], [17, 5, 0, "-", "thaisumcut"]], "pythainlp.tokenize.Tokenizer": [[17, 2, 1, "", "__init__"], [17, 2, 1, "", "set_tokenize_engine"], [17, 2, 1, "", "word_tokenize"]], "pythainlp.tokenize.etcc": [[17, 0, 1, "", "segment"]], "pythainlp.tokenize.longest": [[17, 1, 1, "", "LongestMatchTokenizer"], [17, 0, 1, "", "segment"]], "pythainlp.tokenize.longest.LongestMatchTokenizer": [[17, 2, 1, "", "__init__"], [17, 2, 1, "", "tokenize"]], "pythainlp.tokenize.multi_cut": [[17, 1, 1, "", "LatticeString"], [17, 0, 1, "", "find_all_segment"], [17, 0, 1, "", "mmcut"], [17, 0, 1, "", "segment"]], "pythainlp.tokenize.multi_cut.LatticeString": [[17, 2, 1, "", "__init__"]], "pythainlp.tokenize.newmm": [[17, 0, 1, "", "segment"]], "pythainlp.tokenize.tcc": [[17, 0, 1, "", "segment"], [17, 0, 1, "", "tcc"], [17, 0, 1, "", "tcc_pos"]], "pythainlp.tokenize.tcc_p": [[17, 0, 1, "", "segment"], [17, 0, 1, "", "tcc"], [17, 0, 1, "", "tcc_pos"]], "pythainlp.tokenize.thaisumcut": [[17, 1, 1, "", "ThaiSentenceSegmentor"], [17, 0, 1, "", "list_to_string"], [17, 0, 1, "", "middle_cut"]], "pythainlp.tokenize.thaisumcut.ThaiSentenceSegmentor": [[17, 2, 1, "", "split_into_sentences"]], "pythainlp.transliterate.royin": [[20, 5, 0, "-", "romanize"]], "pythainlp.util": [[22, 1, 1, "", "Trie"]], "pythainlp.util.Trie": [[22, 1, 1, "", "Node"], [22, 2, 1, "", "__init__"], [22, 2, 1, "", "add"], [22, 2, 1, "", "prefixes"], [22, 2, 1, "", "remove"]], "pythainlp.util.Trie.Node": [[22, 2, 1, "", "__init__"], [22, 3, 1, "", "children"], [22, 3, 1, "", "end"]], "pythainlp.wsd": [[25, 0, 1, "", "get_sense"]]}, "objnames": {"0": ["py", "function", "Python function"], "1": ["py", "class", "Python class"], "2": ["py", "method", "Python method"], "3": ["py", "attribute", "Python attribute"], "4": ["py", "data", "Python data"], "5": ["py", "module", "Python module"], "6": ["std", "envvar", "environment variable"]}, "objtypes": {"0": "py:function", "1": "py:class", "2": "py:method", "3": "py:attribute", "4": "py:data", "5": "py:module", "6": "std:envvar"}, "terms": {"": [5, 6, 7, 8, 9, 11, 14, 16, 17, 18, 20, 22, 23, 28], "0": [5, 6, 7, 8, 11, 14, 15, 16, 17, 20, 22, 25, 26, 28, 30, 31], "00": [6, 22], "000": [14, 16], "0000": 28, "0006959172792052158": 14, "001": 8, "01": 22, "01234567890": 22, "02": 23, "03": 22, "05": [14, 22], "05055": 16, "05gb": 6, "06": 22, "09": 22, "09319090843200684": 25, "09635": 23, "0974416732788086": 25, "0d": 22, "0e46": 22, "1": [6, 8, 11, 13, 14, 15, 16, 17, 20, 22, 25, 28, 30, 31], "10": [5, 6, 15, 16, 22, 30], "100": 22, "1000": 28, "10021889": 22, "1005704402923584": 25, "103": 16, "10400": 16, "10th": 22, "11": [7, 13, 16, 17, 22], "11130": 16, "114k": 6, "1153": 28, "1180": 10, "11940": 20, "12": 22, "1200": 16, "122": 22, "123": 22, "12473666667938232": 25, "127": 17, "12l": 17, "13": [22, 30], "14": 16, "1478": 28, "14ibg": 17, "15": [16, 22], "15637": 28, "16": 16, "1618": 24, "17": 22, "17654": 28, "18": [13, 22], "18807": 28, "189": 16, "19": [5, 17], "19132": 28, "1941": 22, "1946": 22, "198": 16, "1982": 13, "1983": 13, "1998": 13, "1999": 16, "1l": 17, "1st": 22, "1utqgxxmrxor9jp1b1jcq1frbnvorhtbq": 17, "1v1z657_5eswpo8rlfvrwa0a5e4vkg7si": 17, "2": [6, 8, 9, 11, 13, 14, 15, 16, 17, 22, 26, 30, 31], "20": 16, "200": 22, "2000": [16, 17], "2001": 17, "2004": 16, "2006": 20, "2007": 14, "2008": 16, "2009": 13, "2014": 24, "2016": 31, "2019": 22, "2020": [16, 17], "2021": 23, "2022": [13, 22], "2023": [22, 26, 31], "21": [16, 17, 22], "2101": 23, "23": [7, 22, 23], "2300612": 22, "234": 17, "234\u0e1a\u0e32\u0e1719": 17, "24": 22, "2410": 22, "243": 13, "2438": 22, "2499": 16, "24h": 22, "25": [6, 22, 26], "2519": 22, "2526": 13, "255": 13, "2551": 6, "2555": 22, "2556": 22, "2562": 22, "2565": 22, "2566": 22, "26": 6, "2670": 16, "27": [22, 23], "3": [6, 8, 11, 13, 15, 16, 22, 28, 30], "30": [14, 16, 22], "30301809310913086": 7, "31": 22, "312": 23, "32": [6, 30], "3223": 14, "32\u0e19": 17, "36": [26, 28], "3639": 14, "37": 17, "3734": 22, "3rd": 26, "4": [6, 8, 9, 11, 13, 16, 20, 22, 31], "40": [14, 17, 22], "400": 22, "41": 6, "42caj4e6bk1f5b1j": 22, "434330506948445": 6, "434k": 6, "4641016151377544": 6, "482306849763902e": 14, "49": 16, "4th": 22, "5": [13, 14, 15, 16, 17, 22, 28, 30], "50": [5, 22], "50755": 28, "52": [5, 13], "543": 22, "56": 22, "59": 22, "5mb": 6, "5x": 17, "6": [6, 7, 13, 18, 22, 30], "61": 16, "62": [22, 30], "620": 22, "6399497389793396": 7, "64": [23, 30], "65": 23, "66": 22, "690kb": 6, "6h": 22, "7": [7, 16, 22, 23], "7142490744590759": 7, "7th": 22, "8": [9, 13, 17, 22, 23], "8173": 28, "8314": 28, "8657019734382629": 7, "8888": 16, "89": 23, "9": [14, 15, 16, 22, 23], "9227": 28, "9387": 28, "95": [16, 22], "980": 22, "993": 28, "A": [5, 6, 10, 13, 14, 15, 17, 20, 22, 29, 30], "AND": 22, "AS": 31, "And": 14, "As": 29, "BE": 22, "By": [6, 14, 15, 18, 22, 25, 30], "For": [1, 6, 15, 16, 17, 22, 23, 29, 30, 31], "If": [6, 11, 14, 15, 16, 17, 18, 20, 22, 23, 26, 30], "In": [13, 17, 22, 26, 29], "It": [1, 6, 8, 9, 10, 11, 13, 14, 16, 17, 19, 20, 22, 24, 29, 30], "No": [6, 11, 16, 20, 29], "OF": 31, "OR": 31, "Of": [16, 28], "One": 20, "The": [1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 29], "Then": [14, 15], "These": [1, 2, 6, 22, 24], "To": [1, 2, 5, 8, 11, 16], "With": [6, 29, 30], "_": [11, 22], "__annotations__": [9, 14], "__dict__": [9, 14], "__doc__": [9, 14], "__init__": [7, 8, 9, 14, 16, 17, 22], "__module__": [9, 14], "__weakref__": [9, 14], "_d": 22, "_is_thai_and_not_num": 14, "_token": 17, "aa": 22, "ab": 23, "abbr_en": 6, "abbr_th": 6, "abbrevi": [6, 16, 22, 30], "abbreviation_to_full_text": [22, 30], "about": [5, 6, 7, 11, 16, 22, 27, 30, 31], "abov": 22, "above_vowel": 22, "ac": [13, 14, 16], "academ": 16, "access": [6, 18, 20], "accident": 22, "accommod": 30, "accord": [6, 9, 13, 14, 17, 22], "account": [16, 22], "accur": [20, 22, 30], "accuraci": [2, 14, 17, 25], "achiev": 25, "acl": 11, "aclweb": 24, "acoust": 16, "activ": [6, 16], "actual": 22, "ad": [17, 22], "adapt": 17, "add": [17, 22], "add_year": 22, "addit": [2, 17, 20], "addition": 20, "address": 17, "adher": [9, 22], "adj": 16, "adject": 16, "adp": 16, "adposit": 16, "adv": 16, "advanc": [13, 14, 17, 30], "adverb": 16, "adverbi": 16, "advi": 16, "advis": 31, "advn": 16, "advp": 16, "ae": 22, "aek": 9, "affirm": 16, "after": [6, 16, 17, 22], "against": 28, "agre": 31, "ah": 22, "ai": 23, "aid": [10, 22], "aj": 16, "aksonhan": 0, "aksonhan_to_curr": 0, "al": [17, 23], "algorithm": [10, 13, 14, 15, 16, 17], "alik": 13, "all": [9, 14, 15, 17, 22, 30, 31], "allow": [1, 8, 13, 16, 17, 20, 22], "almost": 22, "along": 17, "alphabet": [13, 20, 22, 30], "alreadi": 6, "also": [6, 7, 15, 17, 30], "altern": [1, 20], "alwai": 22, "am": 22, "ambigu": [17, 25], "amd64": 30, "among": 17, "amount": 22, "an": [0, 6, 7, 10, 14, 17, 20, 22, 25, 29, 31], "analysi": [2, 9, 10, 17, 22], "analyz": [5, 9, 11, 13], "ancient": 26, "ani": [6, 14, 16, 17, 31], "anno": 22, "annot": 16, "answer": [7, 11], "anthologi": 24, "anyon": 2, "apach": [26, 31], "aphasia": 17, "api": 6, "appear": 15, "appl": 22, "appli": [5, 11, 17, 22], "applic": [1, 2, 7, 8, 13, 24, 25, 31], "approach": [1, 13, 17, 20, 30], "appropri": 8, "approxim": [13, 22], "ar": [1, 2, 6, 8, 13, 14, 15, 16, 17, 18, 20, 22, 23, 24, 25, 30, 31], "arab": 22, "arabic_digit_to_thai_digit": 22, "architectur": 30, "archiv": 22, "arguabl": 29, "around": 14, "art": 14, "arthit": 26, "articl": 16, "artifici": 6, "arxiv": [16, 23], "ascend": 22, "asia": 22, "asian": 29, "ask": 27, "assert": 10, "assess": 2, "asset": 1, "assign": 14, "assist": [2, 6, 20, 22, 25], "associ": [7, 16], "astrologi": 13, "att": 23, "attacut": [17, 28, 30], "attribut": [9, 14, 16, 17, 31], "audienc": 20, "audio": 13, "augment": [26, 30], "author": 17, "automat": 30, "aux": 16, "auxiliari": 16, "av": 16, "avail": [1, 6, 13, 16, 23, 28], "averag": 16, "avocado": 10, "avoid": 17, "awar": 25, "ax": 16, "a\u02d0": 20, "b": [16, 22], "backward": 17, "bact": 6, "badli": 6, "baht": 22, "bahttext": 22, "balanc": 17, "bangkok": 22, "bangkokhealth": 16, "bank": 22, "base": [1, 6, 7, 8, 10, 11, 12, 13, 14, 15, 17, 20, 22, 23, 25], "base_word": 6, "basi": [29, 31], "basic": [9, 11, 13, 14, 23], "becaus": [22, 29], "been": 6, "befor": [9, 16, 22, 24, 30], "begin": [8, 16, 22], "behavior": 22, "beij": 17, "being": 22, "bela": 7, "belong": [16, 22], "below": 22, "below_vowel": 22, "benchmark": [10, 23, 26, 28, 30], "benefici": [14, 22], "bert": [11, 17], "best": 29, "better": 30, "between": [6, 9, 11, 13, 16, 17, 19], "biggest": 29, "bigram": [6, 15], "bill": 5, "bit": 30, "blackboard": [16, 17], "blackboard_ud": 16, "bmsacr": 6, "boil": 29, "bool": [6, 8, 9, 10, 14, 16, 17, 20, 22], "boolean": [9, 14], "boonkwan": 16, "boriboon": 16, "both": [9, 13, 17, 22, 29], "boundari": 17, "bpemb_wv": 1, "break": 17, "breakiter": 6, "broken": 17, "br\u00fcckner": 13, "bsd": 22, "buddhist": 22, "build": [16, 25, 30], "built": [12, 23, 30], "bundl": 6, "c": [6, 22, 23, 30], "calcul": 22, "calendar": 22, "call": [8, 13, 15, 22, 30], "callabl": [6, 14], "can": [2, 5, 6, 7, 9, 11, 13, 14, 15, 17, 18, 22, 24, 25, 26, 27, 28, 29, 30], "candid": 14, "canin": 17, "cannot": [10, 22], "capabl": [1, 8, 11, 13, 19, 23], "captur": 29, "cardin": 16, "care": [15, 22], "case": [14, 17, 20], "cat": 22, "catalog": [6, 28], "categor": 10, "caus": 22, "cc": [6, 16, 31], "cc0": 31, "cconj": 16, "central": 1, "centuri": 22, "certainli": 22, "cfqc": 16, "ch": 22, "chakri": 22, "challeng": [5, 29], "chanc": 17, "chang": [17, 22], "chaovavanich": [6, 17, 26], "chapter": 22, "char": [11, 22], "char_level": 28, "charact": [6, 9, 14, 17, 20, 22], "characterist": 22, "charin": 26, "charun": 16, "chat": 26, "chatbot": 8, "check": [9, 10, 14, 22], "check_aek_too": 9, "check_karu_lahu": 9, "check_klon": 9, "check_marttra": 9, "check_sara": 9, "checker": [9, 14], "children": 22, "chines": 29, "choic": [14, 17], "choos": [14, 15, 16, 17, 20, 22], "chormai": 26, "chosen": 8, "chula": [13, 14], "chulalongkorn": 13, "chumpolsathien": 17, "chumpolsathien_2020": 17, "chunk": 16, "chunk_pars": 16, "cite": [13, 17, 23, 26], "cl": 16, "clariti": 22, "class": [7, 8, 9, 14, 16, 17, 22], "classic": 9, "classif": [21, 22, 29, 30], "classifi": [16, 26], "claus": 17, "clause_token": 17, "clean": 22, "clir": 13, "clock": 22, "close": 22, "closest": 14, "cltv": 16, "cluster": [5, 17], "clusters_str": 5, "cmtr": 16, "cnit": 16, "co": [20, 22], "code": [13, 17, 18, 22, 31], "coher": 8, "colab": [17, 23], "collat": 22, "collect": [2, 6, 10, 16, 18, 22], "colloc": 17, "com": [6, 7, 10, 16, 17, 22, 23], "combin": [13, 17], "come": 6, "comma": 29, "command": [26, 30], "comment": 6, "common": [6, 16, 17, 22, 31], "commun": [6, 17, 22], "compar": 16, "comparison": 13, "compat": [1, 22], "compil": [20, 30], "complet": 15, "complianc": 31, "compon": [1, 5, 7, 9, 11, 14, 17, 20, 22, 30], "comprehens": [17, 20, 23], "compress": 13, "comput": [6, 15, 22], "concepnet": 6, "concept": [5, 17], "conceptu": 22, "condit": 31, "config": 30, "configur": 14, "conjunct": 16, "conll": 11, "conllu": 11, "connect": 6, "connector": 29, "consecut": [8, 15], "consid": [6, 9, 16], "consider": 6, "consist": [6, 8, 22], "conson": [0, 22], "constrain": 17, "construct": 7, "contain": [1, 6, 16, 17, 18, 22, 24, 25], "content": [8, 22], "context": [5, 8, 16, 22, 25, 29], "contigu": 17, "continu": 17, "contributor": [6, 18], "conveni": 8, "convent": 22, "convers": [20, 22], "convert": [0, 13, 16, 20, 22], "convert_year": 22, "coordin": 16, "cop": 11, "copi": [6, 20, 31], "copyright": 31, "core": [7, 9, 11, 25], "coref": 26, "corefer": 30, "coreference_resolut": [5, 30], "corpora": [6, 16, 21, 24, 31], "corpu": [8, 14, 15, 16, 17, 22, 26, 28, 30, 31], "correct": [9, 22, 25], "correctli": [14, 22], "correctly_tokenised_word": 28, "corrector": [14, 22], "correspond": [7, 9, 16, 22], "cos_sim": 25, "could": [6, 17, 22, 30], "count": 22, "count_thai_char": 22, "counter": 22, "countries_th": 6, "countthai": 22, "covid": 5, "cp": 13, "cp36": 30, "cp36m": 30, "cpe": 15, "cplusplu": 22, "cpu": [5, 23, 25, 30], "creat": [8, 10, 11, 15, 16, 17, 18, 22, 29, 30, 31], "creation": [8, 9], "creativ": 31, "credit": [6, 17], "crf": [16, 17], "crfcut": [17, 28], "crfsuit": 30, "criteria": 22, "critic": 7, "cross": [13, 17], "crucial": [2, 5, 22, 25], "ctime": 22, "cuda": [5, 7], "cue": 22, "cultur": 22, "currenc": 22, "current": [0, 2, 14, 22, 30], "custom": [14, 17, 20, 22], "custom_dict": [14, 17, 25], "custom_dict_japanese_nam": 17, "custom_dictionari": 17, "custom_token": 25, "custom_words_list": 17, "customiz": 14, "cut": [17, 21], "cvbl": 16, "d": [6, 22], "dai": 22, "dangl": 22, "data": [1, 6, 8, 14, 18, 22, 24, 28, 30], "databas": [1, 6, 30], "dataset": [6, 17, 18, 28, 31], "datatim": 22, "date": [16, 22], "datetim": 22, "datetime_obj": 22, "db": 6, "dcnm": 16, "ddac": 16, "ddan": 16, "ddaq": 16, "ddbq": 16, "de": 29, "dead": [9, 22], "dead_syllable_as_aek": 9, "deal": [5, 25], "deberta": 11, "decid": 29, "decim": [17, 22], "decreas": 14, "dedic": [5, 9, 19, 20, 31], "deep": [20, 21], "deepcut": [17, 28], "default": [5, 6, 8, 11, 13, 14, 15, 16, 17, 18, 20, 22, 30], "default_db": 6, "default_word_dict_tri": 17, "defaultdict": 6, "defin": [15, 17], "definit": [16, 25], "degre": 29, "delimit": 22, "demonstr": 16, "deni": 30, "depend": [11, 16, 30], "dependency_pars": 30, "deprec": 22, "deriv": 11, "descend": [14, 22], "design": [1, 2, 5, 6, 8, 9, 13, 14, 17, 18, 20, 22, 25], "det": 16, "detail": [1, 6, 10, 16, 23, 24, 28, 30], "detect": [10, 11, 17, 22], "detector": 22, "determin": [16, 22, 25], "detoken": 17, "dev": 6, "develop": [1, 2, 13, 18, 22, 30], "devic": [5, 6, 7, 25], "dhanon": 16, "diac": 16, "diacrit": 22, "diaq": 16, "dibq": 16, "dict": [5, 6, 7, 14, 16, 17, 20, 22, 25], "dict_filt": 14, "dict_item": 14, "dict_sourc": [17, 22], "dict_tri": [6, 17, 22], "dictionari": [6, 14, 15, 17, 20, 22, 25], "die": 22, "differ": [5, 15, 16, 17, 19, 29], "digit": 22, "digit_to_text": 22, "direct": 22, "directli": [18, 28, 30], "directori": [6, 18, 30], "disambigu": [6, 25], "discard": 6, "discours": 16, "discuss": 24, "displai": 22, "display_thai_char": 22, "dist": [6, 18], "distanc": [14, 25], "distil": 17, "distribut": [22, 30, 31], "divers": 1, "diversif": 1, "diversifi": 1, "divid": 17, "dl": 6, "do": [6, 22, 29], "doc": [17, 22], "document": [1, 2, 6, 15, 17, 22, 24, 31], "doe": [16, 18, 22, 29, 30], "doesn": [6, 16], "domain": [17, 22, 31], "domini": 22, "donm": 16, "doubl": 22, "down": [0, 22, 29], "download": [18, 28, 30], "downstream": 2, "drive": 17, "dt_obj": 22, "due": 22, "duplic": [6, 8, 22], "dynasti": 22, "e": [6, 15, 16, 17, 22], "each": [1, 6, 14, 15, 16, 17, 22, 30], "eaff": 16, "eas": 22, "easi": 29, "easier": 22, "ed": 22, "edg": 21, "edit": [6, 14], "edu": 30, "effect": [5, 6, 15, 20], "effici": [17, 18, 22], "effort": 30, "either": 31, "eitt": 16, "el": [26, 30], "el_scor": 7, "electron": 22, "elimin": 22, "email": 16, "embed": [1, 17], "emoji": 22, "emoji_to_thai": 22, "empir": 26, "empti": [6, 22, 25], "en": [6, 22], "enabl": [1, 8, 13, 18], "encapsul": 17, "encod": [13, 17, 22], "encompass": 18, "end": [6, 16, 17, 22, 29], "eng": 13, "eng_to_thai": 22, "engin": [11, 13, 14, 29, 30], "english": [1, 6, 9, 10, 13, 20, 22], "enhanc": [1, 14, 17, 22, 24, 25], "enrich": 1, "ensembl": 17, "ensur": [9, 18, 20, 22, 24, 25], "entir": [10, 14], "entiti": [5, 7, 16, 17, 23, 30], "entity_typ": 16, "entropi": 17, "environ": [18, 24, 30], "eo": 29, "epitran": 20, "equal": [16, 20], "equip": 9, "equival": 22, "era": 22, "errno": [6, 30], "error": 14, "esolut": 30, "especi": 22, "essenti": [6, 7, 17, 18, 22, 24], "esupar": [11, 30], "et": [17, 23], "etc": [29, 30], "etcc": 17, "even": 29, "everi": [14, 22], "everyth": 30, "exact": [6, 16], "exactli": 14, "exampl": [0, 1, 2, 5, 6, 10, 13, 14, 15, 16, 17, 18, 20, 22, 25, 28, 29, 30], "excel": 22, "except": 31, "exclud": [16, 22], "exclude_stopword": 22, "executor": 30, "exist": [6, 14, 18, 30], "expand": [14, 22], "expand_maiyamok": 22, "expens": 15, "explicit": 24, "explicitli": 17, "explor": [1, 23], "exponenti": 17, "expos": 18, "express": [5, 16, 29, 31], "extend": [8, 14], "extens": [14, 22], "extern": 18, "extra": 30, "extra1": 30, "extra2": 30, "extra_id_0": 15, "extract": [17, 22], "extract_keyword": 15, "extrem": 29, "f": [9, 17, 22], "face": 29, "facebook": [6, 17], "facilit": [1, 8, 22], "fail": [14, 30], "fall": 22, "fallback_engin": 20, "fals": [6, 8, 9, 10, 16, 17, 20, 22, 30], "famili": 6, "familiar": 20, "family_names_th": 6, "faq": 26, "fast": [22, 30], "faster": 17, "featur": [17, 20, 22], "feb": 23, "femal": 6, "field": [22, 29], "file": [6, 17, 22, 28, 30, 31], "fileid": 17, "filenam": 6, "filenotfounderror": 6, "filter": [14, 15, 17], "final": 15, "financi": 22, "find": [6, 9, 13, 14, 21, 22, 30], "find_all_seg": 17, "find_keyword": 22, "fine": [17, 21, 23], "first": [14, 15, 22], "fit": 22, "five": 22, "fix": [22, 30], "fixn": 16, "fixv": 16, "flexibl": 20, "float": [8, 14, 17, 22, 25], "fmt": 22, "fn": 28, "focus": [20, 22], "follow": [1, 2, 5, 8, 11, 16, 17, 22, 23, 26, 29], "follow_vowel": 22, "forc": 6, "form": [9, 16, 20, 22], "format": [6, 10, 16, 17, 20, 22], "forward": 17, "found": [6, 14, 22], "foundat": 24, "four": 22, "fp": 28, "free": 22, "freebsd": 22, "french": 29, "freq": 14, "frequenc": [6, 8, 14, 15, 16, 22], "frequent": 27, "friendli": 22, "from": [0, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 25, 28, 29, 30], "front": 22, "frozenset": 6, "full": [18, 22, 30], "func": [14, 15], "function": [6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 23, 24, 25, 28, 30], "fundament": [2, 11, 14, 17, 20, 22], "further": [1, 6, 17, 23], "futur": 2, "fx": 16, "g": [6, 15, 17], "g2p": [20, 28], "gate": 5, "gen": 8, "gener": [1, 14, 17, 20, 22, 26, 30], "gensim": 24, "get": [6, 7, 17, 25, 26, 28, 30], "get_el": 7, "get_full_data_path": 18, "get_ner": 16, "get_pythainlp_data_path": 18, "get_pythainlp_path": 18, "get_sens": 25, "gist": 17, "github": [7, 11, 17, 22, 23, 26, 27], "give": 22, "given": [6, 11, 13, 14, 15, 16, 18, 22, 25], "global": [20, 22], "gnu": 22, "goeswith": 11, "gohlk": 30, "goldberg": 24, "good": 30, "googl": [17, 23], "got": 22, "govern": 31, "gpu": 23, "gram": 8, "grammar": 17, "grammarli": 14, "grammat": 11, "graph": [6, 7, 17], "graphem": 20, "great": 17, "greater": 15, "greet": 6, "group": 6, "guid": 22, "guidelin": [1, 2, 16], "h": [20, 22], "ha": [6, 10, 16, 22, 29], "habit": 29, "han": [5, 17], "han_solo": 17, "handbook": 22, "handl": [9, 22], "handle_karun_sound_sil": 9, "hard": 29, "have": [6, 22, 29, 30], "head": 11, "hejira": 22, "hello": 6, "help": [5, 6, 11, 17, 22, 28], "here": [5, 7, 8, 9, 11], "heurist": [10, 17], "hidden": 22, "high": 22, "highest": [14, 15], "highli": 15, "highlight": 20, "histor": [22, 29], "historian": 22, "hitoshi": 16, "home": [6, 30], "homonym": 13, "hood": 15, "hope": 6, "hour": 22, "how": [5, 7, 8, 9, 11, 14, 20, 30], "html": [16, 22], "http": [6, 7, 10, 13, 14, 16, 17, 20, 22, 23, 24, 30, 31], "huggingfac": [11, 20], "human": 22, "hunspel": 14, "h\u0101phyntr": 20, "i": [0, 1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 29, 30, 31], "icu": [6, 17, 20, 29, 30], "icu_vers": 30, "icubrk_th": 6, "id": 6, "idea": 25, "identif": [10, 22], "identifi": [5, 10, 11, 14, 17, 22], "idn": 22, "idna": 22, "ignor": [15, 22], "ignore_char": 22, "ij": 16, "illustr": 6, "impact": 2, "imper": 16, "implement": [13, 14, 17, 22], "impli": 31, "import": [0, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 25, 29], "improv": [1, 2, 6, 14, 17, 22], "in_dict": 17, "includ": [1, 2, 6, 7, 8, 11, 15, 16, 17, 20, 22, 23, 29, 31], "incorpor": 2, "incorrect": 22, "incorrectli": 22, "incur": 14, "indefinit": 16, "independ": 22, "index": 26, "indic": [14, 16, 20, 22, 29], "individu": [17, 22], "info": [16, 28], "inform": [5, 6, 7, 11, 13, 17, 22, 30, 31], "initi": [8, 9, 14, 17], "inner": 18, "input": [5, 6, 8, 9, 11, 14, 15, 17, 20, 22, 28], "inrut": 17, "insepar": 17, "insid": 16, "insight": 18, "instal": [24, 26], "instanc": [5, 9, 14, 15, 16, 22], "instanti": 17, "instantiatetd": 22, "instead": [6, 22], "institut": [17, 20], "int": [6, 8, 9, 13, 14, 15, 16, 17, 22], "integ": 22, "integr": 1, "intellig": 6, "intend": [18, 22, 23], "intention": 22, "interest": 2, "interim": 22, "interject": 16, "intermedi": 16, "intern": [17, 18, 20, 22, 30, 31], "internation": 22, "internet": [6, 23], "interpret": 25, "interrog": 16, "intersect": 14, "intj": 16, "invalu": [2, 20, 22], "invis": 22, "involv": [11, 25], "io": 26, "iob": 16, "ip": 17, "ipa": [20, 22, 30], "ipa_to_rtg": 22, "is_khave": 9, "is_native_thai": 10, "is_poetri": 9, "is_sumpu": 9, "isa": 6, "isahara": 16, "iscit": 17, "ismiddlecut": 17, "iso": 20, "iso_11940": 20, "issu": [20, 29], "isthai": 22, "isthaichar": 22, "item": 22, "itemsview": 14, "iter": [6, 14, 15, 16, 17, 22], "its": [9, 18, 22, 23, 25], "itself": 14, "ix": 22, "j": [20, 22], "ja": 6, "jakkrit": 17, "jan": 23, "jantrakulchai": 23, "japan": [6, 16], "japanes": 29, "javascript": 22, "jcmp": 16, "jcrg": 16, "jeeragon": 17, "jitkrittum": 17, "join": [17, 18], "join_broken_num": 17, "joiner": 22, "journal": [16, 20], "jsbr": 16, "json": 6, "just": [14, 22], "k": [15, 22], "k_type": 9, "kai": 22, "kanchanawan": 20, "kanyanat": 16, "karun": 9, "kedmane": 22, "keep": [6, 14, 17, 18], "keep_whitespac": 17, "kei": [7, 14, 22], "keyboard": 22, "keyphras": 15, "keyphrase_ngram_rang": 15, "keyword": [17, 22], "khamyo": 22, "khave": 26, "kind": [6, 17, 31], "king": [13, 22], "kl": 22, "kluai": 22, "kluaj": 22, "kmutt": 15, "knowledg": [6, 7, 17], "known": [7, 14, 20, 29], "ko": 22, "koichiyasuoka": 11, "korakot": [6, 17, 26], "kosawat": 16, "kriengket": 16, "krit": 16, "kucut": 6, "kv": 9, "l": [22, 23], "label": [6, 16, 28], "lack": 29, "lalita": 26, "lambda": 6, "lang": 22, "languag": [1, 2, 5, 6, 7, 8, 9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 29, 31], "larg": [15, 17, 21, 24], "latin": 20, "latticestr": 17, "law": [16, 31], "layout": 22, "la\u02d0": 22, "lc_time": 22, "lead": 1, "lead_vowel": 22, "learn": [10, 17, 20, 21], "learnt": 30, "leenoi": 16, "len": 16, "length": [7, 13, 14, 22], "less": [15, 29], "letter": [20, 29], "level": [11, 22], "levi": 24, "lexic": [1, 6], "lfd": 30, "lib": [6, 18], "libc": 22, "librari": [7, 17, 18, 19, 22, 24, 26, 29, 30], "licens": [6, 26], "light": 18, "like": [13, 14, 16, 29, 30], "limit": [17, 31], "limkonchotiwat": 26, "limmaneepraserth": 17, "line": [6, 22, 26, 30], "ling": 14, "lingual": 17, "linguist": [16, 22, 24], "link": [5, 7, 17, 22], "linked_ent": 7, "linux": 22, "list": [5, 6, 7, 8, 9, 11, 14, 15, 16, 17, 22, 25, 29], "list_text": 7, "list_to_str": 17, "list_word": 14, "live": 22, "lk82": 28, "ll": 21, "lm": 1, "load": 24, "load_engin": 16, "local": [6, 18, 22, 28], "locat": [16, 18, 22, 30], "logic": 22, "long": [17, 22], "longest": [6, 17, 28], "longestmatchtoken": 17, "look": [14, 20, 30], "lookup": [20, 22], "lorchirachoonkul": 13, "lot": 29, "low": 22, "lowphansirikul": [23, 26], "lowphansirikul_2021": 23, "lst20": 16, "luantangsrisuk": 16, "m": [20, 22, 23], "m6h": 22, "maat2": 20, "machin": [19, 30], "maco": 22, "mai": [15, 16, 17, 18, 22, 30, 31], "main": 17, "mainli": 18, "maintain": 26, "maiyamok": 22, "maj": 22, "make": [1, 2, 6, 13, 14, 16, 17, 19, 20, 22, 24, 29], "male": 6, "man": 22, "man3": 22, "manag": [13, 17, 18, 22, 28], "mani": [17, 22], "manner": 22, "manpages_iphoneo": 22, "manual": 22, "map": [1, 16], "mappingproxi": [9, 14], "mark": [16, 17, 22, 29], "master": 13, "mastersthesi": 17, "match": [13, 16, 17, 22], "max_keyword": 15, "max_len": 14, "maxim": 17, "maximum": [14, 15, 17], "ma\u02d0t3": 20, "md_score": 7, "mean": [6, 11, 15, 22, 25, 30], "meaning": 17, "meant": 22, "measur": [16, 25], "mechan": [17, 18], "media": 17, "member": 6, "mention": 7, "metacpan": 22, "metaphon": 13, "metasound": 28, "method": [1, 2, 8, 9, 10, 14, 17, 20, 26], "metric": [2, 14], "microsecond": 22, "microsoft": [22, 30], "mid": 22, "middle_cut": 17, "min_df": 15, "min_freq": 14, "min_len": [14, 22], "mini": 17, "minimum": [14, 15, 22], "minut": 22, "miscellan": 18, "mistak": 22, "ml": 30, "mm": 17, "mmcut": 17, "mode": 30, "model": [1, 5, 6, 7, 8, 11, 12, 15, 16, 17, 20, 21, 23, 25, 30, 31], "model_nam": [5, 7], "modif": [6, 22], "modifi": 22, "modul": [1, 2, 5, 7, 10, 26], "monei": [16, 22], "monetari": 22, "month": 22, "monthika": 16, "mood": 16, "more": [6, 8, 10, 14, 17, 20, 22, 24, 30, 31], "more_word": 6, "morphem": 26, "mors": 22, "morse_decod": 22, "morse_encod": 22, "morse_text": 22, "most": [14, 15, 17, 25, 29], "mpnet": 25, "mt5": [15, 30], "multi": [17, 29], "multi_cut": 17, "multiel": 7, "multilingu": [6, 25], "multipl": [1, 17, 20, 22], "myz7nzar7dmw": 17, "n": [6, 8, 15, 20, 22, 23], "nakhun": 17, "nakhunchumpolsathien": 17, "name": [6, 7, 8, 9, 11, 13, 15, 16, 17, 18, 22, 23, 30], "name_en": 6, "name_th": 6, "named_ent": 16, "naoto": 16, "naphasia": 17, "nation": [6, 8, 14, 16], "nativ": [10, 16, 22, 29], "natur": [2, 5, 6, 7, 11, 17, 19, 22, 23, 24, 25, 26, 29], "navig": 6, "nbi": 6, "ncmn": [11, 16], "ncnm": 16, "ncsec98": 13, "ne": 16, "necessari": [8, 9], "nectec": 22, "nectec_to_ipa": 22, "need": [6, 17, 20, 24, 25, 30], "neg": 16, "negat": [6, 16], "negations_th": 6, "nel": 7, "ner": 16, "nercut": 17, "nest": 16, "net": 22, "network": 6, "neural": 17, "new": [1, 10, 17, 22, 29, 30], "newlin": [17, 22], "newmm": [6, 15, 17, 28, 29], "next": [8, 14], "ngzxj15rkwjnwozlot32fqborbx": 17, "niggahita": 10, "nighit": 10, "nikhahit": 22, "nitaya": 20, "nitsuwat": 17, "nlbl": 16, "nlp": [1, 2, 5, 17, 24, 25, 26, 29], "nlpo3": [17, 30], "nltk": 6, "nn": 16, "nner": 16, "node": [6, 22, 30], "nomin": 16, "non": [10, 14, 20, 22], "non_thai": 22, "none": [6, 9, 11, 14, 15, 16, 17, 22], "nonm": 16, "nonthaburi": 6, "normal": [15, 16, 22], "norvig": 14, "note": [2, 15, 16, 17, 22, 30], "notebook": [17, 23, 26, 31], "noth": 22, "noun": [11, 16], "novel": 13, "now": [16, 22], "now_reign_year": 22, "np": 16, "nprp": 16, "nrpsc": 16, "nsubj": 11, "nttl": 16, "nu": 16, "num": 16, "num_to_thaiword": 22, "number": [8, 14, 15, 16, 22], "numer": [16, 17, 22], "numpi": 24, "nutanong": 23, "nw": 28, "n\u0e1b\u0e01\u0e15": 17, "n\u0e1c": 17, "n\u0e41\u0e25\u0e30\u0e44\u0e14": 17, "o": [16, 20], "obj": 11, "object": [9, 14, 15, 17, 22, 25], "obtain": [13, 18, 31], "obvious": 30, "occurr": [14, 22], "offer": [1, 2, 8, 9, 11, 13, 17, 18, 20], "offici": [1, 2, 20], "offset": 7, "often": 29, "omc": 6, "omer": 24, "omit": 17, "one": [14, 15, 17, 22, 30], "onli": [13, 15, 16, 17, 22, 30], "onnx": 20, "ontologi": 13, "open": [1, 6, 17, 22, 26], "openbsd": 22, "oper": [18, 22], "optim": 30, "option": [5, 6, 11, 13, 15, 16, 17, 20, 22, 30], "orchid": 16, "orchid_ud": 16, "orchidpp": 16, "order": [6, 14, 16, 22], "ordin": 16, "org": [6, 16, 22, 23, 24, 31], "organ": [16, 24], "orig_word": 6, "origin": [1, 17, 22], "oscar": 8, "oskut": [17, 30], "oss": 26, "other": [5, 6, 15, 16, 20, 22, 29, 31], "otherwis": [6, 16, 17, 22], "out": [6, 15, 17, 20, 22, 29], "output": [0, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 25], "output_str": 8, "outsid": 16, "overcom": 29, "overview": 24, "p": [16, 20, 22], "pa": 16, "packag": [1, 6, 18, 29, 30], "pad": 22, "page": [22, 26], "pair": 22, "pali": 10, "palingoon": 22, "paludkong": 17, "paper": [13, 23], "para": 17, "paragraph": [9, 17], "paragraph_threshold": 17, "paragraph_token": 17, "parallel": 16, "param": [6, 16, 20], "paramet": [0, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 20, 22, 25], "paraphras": 25, "pars": [16, 22, 26, 30], "parser": 11, "parsing_result": 11, "part": [1, 6, 8, 16, 17, 22, 23, 28], "particl": 16, "particularli": [1, 13, 20, 25], "pass": [5, 22], "path": [6, 17, 18, 22, 28, 30], "path_to_custom_dictionari": 17, "patiroop": 17, "patorn": 17, "pattarawat": 26, "pattern": 17, "pdf": 13, "pdmn": 16, "peerat": 26, "peopl": 6, "percentag": 22, "perform": [1, 6, 11, 23, 25, 29, 30], "period": 29, "permiss": [30, 31], "permissionerror": 30, "person": 16, "person_names_female_th": 6, "person_names_male_th": 6, "peter": 14, "phaholphinyo": 16, "phapn": 20, "phapphayon": 20, "phatthiyaphaibun": [17, 26], "phayathaibert": 26, "phone": 16, "phonem": [20, 22], "phonet": [13, 17, 20, 22, 30], "php": 22, "phrase": [16, 17, 20, 22], "phrombut": 16, "phunspel": [14, 30], "pick": 15, "pip": 30, "pivot": 18, "place": 22, "plai": [2, 7, 18], "platform": 22, "pleas": [1, 2, 6, 15, 23, 26, 31], "pn": 14, "pntr": 16, "po": [1, 11, 16, 28], "pod": 22, "poem": 9, "poem_text": 9, "poetic": 9, "poetri": 9, "point": [17, 22, 24], "pois": 29, "polpanuma": [23, 26], "pomm": 29, "ponrawe": 17, "pornpimon": 22, "port": 14, "pos_tag": 16, "pos_tag_s": 16, "posit": [6, 17, 22], "posix": 22, "possibl": [1, 14, 17, 22], "possibli": 14, "post": [6, 16, 17], "postype2wordnet": 1, "potato": 29, "power": [1, 8, 9, 14, 21, 22], "pp": [16, 17], "ppr": [11, 16], "pr": 16, "prachya": 16, "practic": 20, "practition": [1, 24], "prasitjutrakul": 13, "prayut": 13, "pre": [11, 14, 16, 17, 24, 30], "preced": [8, 16], "precis": [17, 22, 25, 28], "predict": 8, "predominantli": 10, "prefer": 13, "prefix": [16, 22], "prel": 16, "preposit": 16, "preprocess": 22, "present": [17, 22], "pretrain": [11, 23], "preval": 22, "previou": 8, "primari": [5, 9, 25], "primarili": [6, 18], "principl": 9, "print": [0, 5, 6, 7, 8, 9, 11, 16, 17, 22, 25], "prob": [8, 14], "probabilist": 8, "probabl": [8, 14], "problem": [22, 29, 30], "proceed": 26, "process": [1, 2, 5, 6, 7, 11, 13, 14, 17, 18, 19, 20, 22, 23, 24, 25, 26, 29, 30], "produc": 15, "project": [26, 31], "pron": [11, 16], "prong": 29, "pronoun": [5, 16], "pronounc": 20, "pronunci": [13, 20, 22], "proofread": 14, "proper": 16, "properli": 22, "properti": 13, "propn": 16, "proport": 22, "propos": [13, 17], "prosper": 6, "provid": [1, 2, 5, 6, 8, 9, 11, 13, 14, 17, 19, 20, 22, 24, 25], "provinc": 16, "pth": 6, "pu": 16, "puan": 20, "public": [6, 20, 24, 26, 31], "publish": 20, "pud": 16, "punc": 16, "punct": 16, "punctuat": [16, 22], "purpos": [18, 22], "put": 22, "py": 30, "pyicu": [17, 20, 30], "pythainlp": [27, 28, 29, 30, 31], "pythainlp_data_dir": [18, 30], "pythainlp_read_mod": 30, "python": [14, 17, 22, 26, 29, 30], "python3": [6, 18], "pythonlib": 30, "pytorch": 20, "p\u02b0": 20, "p\u02b0a\u02d0pjanot": 20, "q": 30, "q312": 7, "q484876": 7, "qualit": 2, "qualiti": 1, "quantifi": 22, "quantit": 16, "question": [6, 7, 11, 27], "quick": [22, 29], "qwerti": 22, "r": [6, 15, 17, 22], "rama": 22, "rang": [9, 20], "rank": 22, "rattanakosin": 22, "raw": 22, "re": 22, "reach": 6, "read": [6, 7, 10, 11, 27, 30], "readabl": [14, 22], "recal": 28, "recent": 29, "recogn": [16, 22], "recognit": [16, 23, 30], "recommend": [15, 30], "reconstruct": 17, "reduc": 17, "refer": [1, 5, 6, 15], "refin": 17, "regex": 17, "regular": 24, "reign": 22, "reign_year": 22, "reign_year_to_ad": 22, "rejoin": 17, "rel": [6, 16, 22], "relat": [2, 6], "relatedto": 6, "relationship": [5, 6, 11], "releas": 31, "relev": 15, "reli": [17, 22], "reliabl": [10, 14], "remain": 6, "remov": [14, 22], "remove_dangl": 22, "remove_dup_spac": 22, "remove_repeat_vowel": 22, "remove_tone_ipa": 22, "remove_tonemark": 22, "remove_zw": 22, "render": [20, 22], "reorder": 22, "reorder_vowel": 22, "repeat": 22, "repetit": [15, 22], "replac": 22, "repositori": [17, 23], "repres": [6, 11, 22], "represent": [1, 13, 17, 20, 22, 24], "requir": [6, 14, 15, 20, 24, 30, 31], "research": [1, 2, 17, 22, 24, 29], "resolv": 25, "resourc": [1, 6, 18, 19, 22, 24], "respect": 16, "respons": [7, 14], "result": [9, 11, 14, 16, 22, 28], "retain": 22, "retriev": [7, 13, 18], "return": [0, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 25], "revers": [17, 22], "revis": 6, "revised_word": 6, "rhyme": [9, 22], "rise": 22, "rm": 28, "roberta": 11, "robust": 22, "role": [2, 7, 18], "roman": [20, 30], "root": [6, 10, 11, 18, 29], "royal": [6, 20, 22], "royin": 20, "rpre": 16, "rtg": [20, 22], "rtype": [6, 20], "rule": [9, 17, 22, 29], "run": [5, 7, 17, 25], "runtim": 20, "rust": 17, "sa": [6, 22], "saa4": 20, "safe": 17, "safe_mod": 17, "samant": 20, "samat": 20, "same": [5, 17], "sampl": 28, "samsonj": 22, "sara": 22, "sarayut": 17, "satang": 22, "save": [6, 28], "sa\u02d05": 20, "sa\u02d0ma\u02d0rot": 20, "school": 17, "sconj": 16, "score": 22, "script": 22, "scrollto": 17, "search": [13, 14, 22, 26], "second": [6, 22], "section": [9, 17, 20], "secur": 22, "see": [6, 17, 20, 22, 25, 30, 31], "seed": 8, "seem": 29, "seen": 6, "sefr": 17, "sefr_cut": 17, "segment": [6, 17, 29], "select": [8, 14, 15, 17, 22], "semant": [6, 25], "sens": [6, 25, 29], "sense_label": 6, "sent": [6, 16, 17, 22, 28], "sent_token": [15, 17], "sentenc": [8, 11, 14, 15, 16, 22, 25, 29], "sentence_1": 17, "sentence_2": 17, "sentencepiec": 17, "sententi": 16, "sep": 13, "separ": [17, 28], "sequenc": [8, 22], "serv": [20, 22], "server": 6, "set": [2, 6, 14, 16, 17, 20, 22, 29, 30], "set_tokenize_engin": 17, "set_tokenizer_engin": 17, "setlocal": 22, "setup": 30, "sever": 8, "share": 6, "shed": 18, "short": 22, "should": [9, 20, 22, 29], "show": [6, 16], "show_pronunci": 20, "side": 30, "sign": 22, "signific": [20, 22], "significantli": 2, "silenc": 9, "silent": 9, "similar": [13, 14, 22, 24, 25, 29], "simpl": [7, 8, 10, 20, 22], "simpli": 22, "sinc": 22, "singapor": 26, "singl": [8, 14, 17], "sitthaa": 16, "size": 17, "skill": 30, "small": 15, "smaller": 17, "smallest": 17, "smooth": 18, "snae": 13, "so": [15, 30], "social": 17, "societi": [6, 16], "softwar": [26, 31], "solo": 17, "solut": 22, "somchai": 13, "some": [17, 22, 28, 30], "sornlertlamvanich": 16, "sort": [14, 22], "sound": [9, 22], "sound_syl": 22, "soundex": [26, 28], "sourc": [0, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 25, 26, 28, 30, 31], "space": [16, 22, 29], "spaceaft": 11, "spacy_thai": [11, 30], "span": 16, "spars": 24, "speaker": 20, "special": [20, 22], "specif": [13, 17, 20, 21, 22, 23, 31], "specifi": [15, 16, 18, 30], "speech": [1, 6, 16, 22, 23, 28], "speed": 23, "spell": [0, 9, 17, 20, 22, 26, 30], "spell_syl": 22, "spell_word": 22, "spj": 13, "split": 17, "split_into_sent": 17, "spm": [11, 23], "spooner": 20, "spyll": 14, "src": 22, "ssg": [17, 30], "stabl": 30, "stack": 17, "standard": [13, 14, 20, 22], "start": [6, 22, 26], "start_seq": 8, "statist": 13, "stativ": 16, "status": 22, "step": [5, 8, 11], "still": [0, 14, 22], "stop": 15, "stop_word": 15, "stopword": [6, 22], "stopwords_th": 6, "store": 30, "str": [0, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 25], "straightforward": 22, "strategi": 17, "strftime": 22, "string": [6, 8, 13, 17, 20, 22], "strip": [6, 9], "strptime": 22, "strrftime": 22, "structur": [9, 11, 16, 22], "style": 17, "subordin": 16, "subword": [1, 11, 23, 28, 29], "subword_token": 17, "successfulli": 6, "suffix": 22, "suit": 20, "suitabl": [9, 13, 22, 25, 30], "sum": 15, "summar": [17, 26, 30], "summari": 15, "sumonma": 22, "suntorntip": 26, "supnithi": 16, "supot": 17, "suppli": 17, "support": [6, 16, 17, 22, 30], "sure": 22, "surfacetext": 6, "suriyawongkul": 26, "suwanvisat": 13, "syllabl": [6, 9, 11, 17, 22, 28, 30], "syllable_length": 22, "syllable_open_close_detector": 22, "syllable_token": 17, "syllables_th": 6, "symbol": 22, "symposium": 17, "symspel": 14, "symspellpi": [14, 30], "synonym": [1, 6], "system": [5, 13, 20, 22, 29, 30], "t": [6, 9, 15, 16, 20, 22], "t1": [6, 8], "t10": 6, "t2": 8, "t3": 8, "tab": 6, "tabl": 16, "tackl": 5, "tag": [1, 7, 11, 23, 26, 28], "tag_provinc": 16, "tagg": 28, "tagger": 11, "tailor": 22, "takahashi": 16, "take": [6, 8, 16, 22, 30], "target": 22, "task": [1, 2, 5, 6, 7, 10, 11, 13, 14, 17, 19, 20, 21, 22, 23, 24, 25, 29], "tcc": 17, "tcc_p": 17, "tcc_po": 17, "tdtb": 16, "team": 26, "technic": 30, "techniqu": [1, 2, 13, 17, 21, 29], "technologi": 17, "techo": 17, "ted": 17, "tensor": 22, "term": [6, 9, 29], "terr": 29, "test": [6, 28], "text": [1, 2, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 19, 20, 21, 22, 25, 28, 29, 30], "text_1": 17, "text_2": 17, "text_to_arabic_digit": 22, "text_to_num": 22, "text_to_thai_digit": 22, "textaug": 30, "textbook": [6, 8], "textual": [1, 22], "th": [6, 11, 13, 14, 16, 22], "th_blackboard": 11, "th_th": 22, "thai": [0, 1, 2, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 20, 22, 23, 24, 25, 26, 28, 29, 30], "thai2fit": 30, "thai2fit_wv": 28, "thai2rom": [20, 30], "thai2rom_onnx": 20, "thai2transform": 23, "thai2vec": 8, "thai_dict": 25, "thai_digit": 22, "thai_digit_to_arabic_digit": 22, "thai_nner": 16, "thai_stopword": 15, "thai_strftim": 22, "thai_strptim": 22, "thai_to_eng": 22, "thai_word": 17, "thai_word_tone_detector": 22, "thaidigit": 22, "thaig2p": 20, "thaig2p_v2": 20, "thailand": [6, 13, 16, 20, 22], "thailand_provinces_th": 6, "thainametagg": 16, "thainer": [16, 28], "thainer14": 16, "thainlp": [6, 28, 30], "thaisentencesegmentor": 17, "thaisum": 17, "thaisumcut": 17, "thaitext": 13, "thaiword_to_d": 22, "thaiword_to_num": 22, "thaiword_to_tim": 22, "than": [15, 17], "thanathip": 26, "thatphithakkul": 22, "theeramunkong": 17, "thei": [5, 14, 16, 17, 18, 20, 22], "them": [15, 17, 21, 22, 29, 30], "themselv": 22, "theoret": 24, "thepchai": 16, "thesi": [6, 13], "thi": [1, 5, 6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 23, 24, 25, 29, 30, 31], "thing": 30, "those": 22, "three": [8, 16], "through": 18, "thu": 16, "thwiki_lm": 6, "thwiki_model_lstm": 6, "ti": 22, "time": [16, 17, 22, 30], "time_data": 22, "time_to_thaiword": 22, "timeout": 6, "tini": 17, "tis620_to_utf8": 22, "titl": [16, 17], "tltk": [14, 16, 17, 20], "tltk_g2p": 20, "tltk_ipa": 20, "tn": 28, "tnc": [8, 14, 16], "tnc_freq": 6, "to_idna": 22, "todai": 0, "tok8kicsj": 22, "token": [6, 8, 11, 14, 15, 16, 23, 25, 26, 28, 29, 30], "tokenizer_engin": 15, "tokens_po": 16, "tomorrow": 22, "tonal": [9, 22], "tone": 22, "tone_detector": 22, "tonemark": 22, "too": 9, "tool": [2, 5, 8, 9, 10, 14, 17, 19, 20, 21, 22, 25, 26, 30], "toolkit": [9, 16, 20], "toolset": 1, "top": 22, "top_k": 22, "total": 28, "total_words_in_ref_sampl": 28, "total_words_in_sampl": 28, "tp": 28, "train": [6, 8, 11, 17, 21, 24, 29], "training_data": 6, "transcript": [20, 22], "transform": [22, 23, 25], "transformers_ud": [11, 30], "transformersud": 11, "translat": [9, 22, 25, 26, 29, 30], "transliter": [6, 13, 22, 26, 30], "travel": 22, "treasur": 22, "tree": 11, "treebank": [16, 17], "trie": [6, 17, 22], "trigram": 6, "trove": 22, "true": [6, 8, 9, 10, 16, 17, 20, 22, 30], "trueplookpanya": 10, "try": [22, 30], "ttc": 8, "ttc_freq": [6, 18], "tud": 16, "tune": [17, 21, 23], "tupl": [6, 14, 15, 16, 22, 25], "tutori": 26, "two": [0, 8, 9, 10, 15, 16, 22, 29, 30], "txt": [6, 17, 18, 28], "txtt": 17, "type": [0, 5, 6, 7, 8, 9, 10, 11, 13, 14, 16, 17, 18, 20, 22, 25, 30], "typo": 22, "tzinfo": 22, "u": 22, "uci": 30, "ud": [11, 16], "ud_goeswith": 11, "udom83": 28, "udomcharoenchaikit": 26, "udompanich": 13, "ulmfit": [26, 30], "umlfit": 30, "uncas": 23, "under": [15, 30, 31], "underlin": 24, "underscor": 22, "understand": [1, 5, 6, 18, 22, 25, 29], "unexpect": 22, "unicod": [17, 20, 22, 30], "unicodedata": 22, "unigram": [6, 15], "union": [6, 7, 9, 11, 16, 17, 22], "uniqu": [1, 20, 22], "unit": [15, 16, 17, 22], "univers": [11, 13, 16, 21, 31], "universaldepend": 16, "unix": 22, "unless": 31, "unsupervis": 25, "unwant": 22, "up": [1, 20], "upgrad": 30, "upo": 11, "upon": [12, 23], "url": [6, 16], "us": [0, 1, 2, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 22, 24, 25, 26, 28, 29, 31], "usag": 1, "user": [6, 8, 9, 13, 17, 18, 22, 28], "user1": 28, "usr": [6, 18], "utenpattanun": 17, "utf": [17, 22], "util": [2, 8, 9, 10, 14, 17, 18, 20, 23, 26, 30], "uua": 22, "v": 22, "v1": [5, 20], "v2": [11, 16, 20, 25], "v6": 14, "vact": 16, "valid": [9, 14], "valu": [6, 8, 14, 16, 17, 22], "valuabl": [1, 14, 17, 18, 19, 22, 24], "vari": 15, "variabl": [18, 30], "variat": [1, 17], "varieti": 1, "variou": [1, 2, 6, 7, 8, 13, 17, 20, 22, 23, 24], "vatt": 16, "vector": [13, 24, 29, 30], "verb": [11, 16], "verbal": 16, "verif": 9, "verifi": 9, "versatil": [17, 20, 22], "version": [1, 6, 16, 30, 31], "vichit": 13, "view": 22, "virach": 16, "visibl": 22, "vistec": 23, "visual": [22, 30], "vital": [18, 22], "vocaburai": 17, "vol": 16, "vorapon": 16, "vote": 6, "vowel": [0, 9, 22], "vp": [13, 16], "vsta": [11, 16], "vv": 16, "w": [15, 17, 22, 28], "w1": 10, "w14": 24, "w2": 10, "w2p": 20, "wa": [13, 17, 22], "wai": 8, "wait": 17, "wanchanberta": 14, "wanchanberta_thai_grammarli": 14, "wangchanberta": [16, 17, 26, 30], "wangchanglm": 30, "wannaphong": [17, 20, 26], "wanne": 13, "want": [5, 6, 8, 11, 22], "warn": 22, "warranti": 31, "we": [6, 16, 22, 25, 30], "websit": 26, "weekdai": 22, "weight": 6, "welcom": 21, "well": 6, "western": 22, "wheel": 30, "when": [1, 5, 15, 22, 25, 29], "where": [18, 21, 22, 25, 29, 30], "whether": [10, 14, 20], "which": [1, 6, 9, 11, 13, 14, 15, 17, 18, 20, 22, 24], "while": 18, "whitespac": [6, 17, 22], "whl": 30, "who": 22, "whose": 14, "wide": 20, "width": 22, "wiki": 22, "wiki_lm_lstm": 6, "wikidata": 7, "wikiparsec": 6, "wikipedia": [11, 22], "wiktionari": [6, 25], "win32": 30, "window": 30, "wisesight": 28, "within": [1, 5, 7, 14, 16, 18, 25, 30], "without": [14, 16, 22, 31], "wittawat": 17, "word": [0, 2, 6, 8, 9, 10, 11, 13, 14, 15, 16, 20, 22, 24, 25, 28, 29, 30], "word1": 9, "word2": 9, "word2vec": 1, "word_detoken": 17, "word_level": 28, "word_list": 22, "word_token": [15, 17, 29], "word_vector": 26, "wordlist": 6, "wordnet": [1, 30], "words_th": 6, "words_to_num": 22, "work": [1, 6, 9, 13, 14, 17, 18, 22, 24], "workshop": 26, "would": [16, 17, 29], "wrapper": [14, 16, 17], "write": [0, 14, 17, 22, 29, 31], "wrong": 22, "wrongli": 17, "wsd": [26, 30], "wtp": 17, "wtpsplitax": 17, "www": [6, 10, 13, 14, 16, 22, 24, 30, 31], "x": [16, 22], "x0b": 22, "x0c0123456789": 22, "xitgmlwmp": 22, "xl": 15, "xn": 22, "xvae": 16, "xvam": 16, "xvbb": 16, "xvbm": 16, "xvmm": 16, "xx": 16, "xxl": 15, "xxx": 30, "y": 22, "yamok": 22, "year": [17, 22], "yet": [6, 18, 22], "yoav": 24, "you": [1, 2, 5, 6, 7, 8, 11, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31], "your": [1, 6, 17, 20, 24, 25, 26, 30], "yuanghirun": 17, "zero": [22, 31], "zip": 16, "zoneinfo": 22, "zwjp": 22, "zwsp": 22, "\u00e3\u00e3\u00e1": 22, "\u00e3\u00e7": 22, "\u00e3\u00f0": 22, "\u00ed\u00f8\u00b5\u00ea\u00f2\u00eb": 22, "\u0101m\u0101rt": 20, "\u0e01": [0, 6, 13, 14, 15, 16, 17, 20, 22, 25, 28, 29], "\u0e01\u0e01": [6, 25], "\u0e01\u0e01\u0e02\u0e19\u0e32\u0e01": 6, "\u0e01\u0e02\u0e23\u0e30\u0e20\u0e32\u0e29\u0e32\u0e44\u0e17\u0e22\u0e17": 13, "\u0e01\u0e04\u0e33\u0e1e": 13, "\u0e01\u0e08\u0e33\u0e04": 28, "\u0e01\u0e14\u0e14": 6, "\u0e01\u0e15": [5, 6], "\u0e01\u0e19": [15, 16], "\u0e01\u0e1b": 28, "\u0e01\u0e20\u0e32\u0e29\u0e32\u0e16": 29, "\u0e01\u0e20\u0e32\u0e29\u0e32\u0e1a": 17, "\u0e01\u0e21": 16, "\u0e01\u0e23": [5, 6, 7, 15, 16, 28], "\u0e01\u0e23\u0e21\u0e1e\u0e23\u0e30\u0e19\u0e40\u0e23\u0e28\u0e23\u0e27\u0e23\u0e24\u0e17\u0e18": 15, "\u0e01\u0e23\u0e21\u0e1e\u0e23\u0e30\u0e19\u0e40\u0e23\u0e28\u0e27\u0e23\u0e24\u0e17": 15, "\u0e01\u0e23\u0e21\u0e27": 16, "\u0e01\u0e23\u0e2d\u0e1a": [6, 9, 25], "\u0e01\u0e23\u0e30\u0e17": 28, "\u0e01\u0e23\u0e30\u0e17\u0e23\u0e27\u0e07\u0e2d": 22, "\u0e01\u0e23\u0e30\u0e1a": [6, 14], "\u0e01\u0e23\u0e30\u0e1b": 14, "\u0e01\u0e25": [16, 22], "\u0e01\u0e25\u0e21": 29, "\u0e01\u0e27": [9, 16], "\u0e01\u0e29": 13, "\u0e01\u0e29\u0e13": 22, "\u0e01\u0e29\u0e23": 22, "\u0e01\u0e29\u0e23\u0e25\u0e30\u0e15": 20, "\u0e01\u0e29\u0e23\u0e2b": 0, "\u0e01\u0e29\u0e23\u0e41\u0e25\u0e30": 22, "\u0e01\u0e29\u0e32\u0e04": 17, "\u0e01\u0e2a\u0e1a\u0e32\u0e22\u0e21\u0e32\u0e01": 5, "\u0e01\u0e2b\u0e23\u0e2d": 15, "\u0e01\u0e30": 28, "\u0e01\u0e30\u0e1b": 14, "\u0e01\u0e32": [6, 17, 22, 28], "\u0e01\u0e32\u0e0d\u0e08\u0e19\u0e1a": 6, "\u0e01\u0e32\u0e22\u0e19": 22, "\u0e01\u0e32\u0e23": [6, 16, 17, 22, 28], "\u0e01\u0e32\u0e23\u0e13": [14, 22], "\u0e01\u0e32\u0e23\u0e17\u0e33\u0e07\u0e32\u0e19": 28, "\u0e01\u0e32\u0e23\u0e40\u0e0a": 9, "\u0e01\u0e32\u0e23\u0e40\u0e25": 6, "\u0e01\u0e32\u0e23\u0e41\u0e1e\u0e17\u0e22": 16, "\u0e01\u0e32\u0e23\u0e41\u0e2a\u0e14\u0e07": 17, "\u0e01\u0e32\u0e23\u0e43\u0e0a": 13, "\u0e01\u0e32\u0e25": 22, "\u0e01\u0e32\u0e25\u0e40\u0e27\u0e25\u0e32": 22, "\u0e01\u0e32\u0e2a": 22, "\u0e01\u0e32\u0e2a\u0e32\u0e21\u0e19\u0e32\u0e17": 22, "\u0e01\u0e33\u0e21": 16, "\u0e01\u0e33\u0e25": 16, "\u0e01\u0e33\u0e41\u0e1e\u0e07\u0e40\u0e1e\u0e0a\u0e23": 16, "\u0e01\u0e40\u0e09": 28, "\u0e01\u0e40\u0e14": 15, "\u0e01\u0e43\u0e19\u0e02": 28, "\u0e02": [6, 16, 17, 22], "\u0e02\u0e13\u0e30": 6, "\u0e02\u0e19\u0e21\u0e0a": 17, "\u0e02\u0e2d\u0e07": [16, 17], "\u0e02\u0e2d\u0e07\u0e01\u0e32\u0e23\u0e1e": 17, "\u0e02\u0e2d\u0e07\u0e40\u0e02\u0e32": 5, "\u0e02\u0e2d\u0e07\u0e40\u0e08": 15, "\u0e02\u0e2d\u0e07\u0e40\u0e23\u0e32\u0e19": 22, "\u0e02\u0e2d\u0e07\u0e41\u0e02": 15, "\u0e02\u0e2d\u0e2d\u0e20": 17, "\u0e02\u0e32": 16, "\u0e04": [8, 10, 13, 14, 16, 17, 22, 25, 28], "\u0e04\u0e04\u0e33\u0e40\u0e2d\u0e01\u0e42\u0e17": 9, "\u0e04\u0e0a\u0e40\u0e2a\u0e19": 15, "\u0e04\u0e0b": 5, "\u0e04\u0e19": [11, 16, 22], "\u0e04\u0e19\u0e08": 9, "\u0e04\u0e19\u0e14": [11, 22], "\u0e04\u0e19\u0e25\u0e30\u0e04\u0e23": 22, "\u0e04\u0e19\u0e46\u0e19\u0e01": 22, "\u0e04\u0e23": [8, 14, 16, 22], "\u0e04\u0e25": [14, 16], "\u0e04\u0e27\u0e1a\u0e04": 15, "\u0e04\u0e27\u0e23": [16, 28], "\u0e04\u0e27\u0e32\u0e21": [16, 17], "\u0e04\u0e27\u0e32\u0e21\u0e23": 5, "\u0e04\u0e27\u0e32\u0e21\u0e41\u0e1b\u0e25\u0e01\u0e41\u0e22\u0e01\u0e41\u0e25\u0e30": 17, "\u0e04\u0e27\u0e32\u0e21\u0e41\u0e1b\u0e25\u0e01\u0e41\u0e22\u0e01\u0e41\u0e25\u0e30\u0e1e": 17, "\u0e04\u0e2b": 10, "\u0e04\u0e2d": 22, "\u0e04\u0e30": 22, "\u0e04\u0e33": 28, "\u0e04\u0e33\u0e44\u0e17\u0e22\u0e41\u0e17": 10, "\u0e04\u0e40\u0e23": 17, "\u0e07": [6, 9, 13, 14, 15, 16, 17, 22, 28], "\u0e07\u0e02\u0e19\u0e21\u0e2b\u0e27\u0e32\u0e19\u0e43\u0e19\u0e15\u0e33\u0e19\u0e32\u0e19\u0e17": 15, "\u0e07\u0e04": [0, 10], "\u0e07\u0e04\u0e30\u0e19\u0e2d\u0e07": 9, "\u0e07\u0e04\u0e32\u0e23": 22, "\u0e07\u0e07\u0e32\u0e19\u0e41\u0e25\u0e30\u0e04\u0e27\u0e32\u0e21\u0e23": 15, "\u0e07\u0e08\u0e33\u0e1e\u0e27\u0e01\u0e02\u0e19\u0e21\u0e40\u0e04": 25, "\u0e07\u0e16\u0e19\u0e19\u0e1e\u0e23\u0e30\u0e2d\u0e32\u0e17": 15, "\u0e07\u0e17\u0e33\u0e15": 8, "\u0e07\u0e19": [15, 22], "\u0e07\u0e1a\u0e32\u0e17\u0e16": 22, "\u0e07\u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22": 22, "\u0e07\u0e1b\u0e27\u0e07\u0e21\u0e32": 17, "\u0e07\u0e1e": 22, "\u0e07\u0e1f": 22, "\u0e07\u0e23": 22, "\u0e07\u0e23\u0e16\u0e40\u0e21\u0e25": 22, "\u0e07\u0e23\u0e2d\u0e22\u0e2a": 22, "\u0e07\u0e2a": [16, 28], "\u0e07\u0e2b\u0e21": 28, "\u0e07\u0e2b\u0e21\u0e14": [16, 22], "\u0e07\u0e2b\u0e23": 15, "\u0e07\u0e2d\u0e1a\u0e02\u0e19\u0e21\u0e04": 25, "\u0e07\u0e2d\u0e22": 15, "\u0e07\u0e32": 28, "\u0e07\u0e32\u0e19": [22, 25, 28], "\u0e07\u0e40\u0e01\u0e15": 14, "\u0e07\u0e40\u0e04\u0e23\u0e32\u0e30\u0e2b": 17, "\u0e07\u0e40\u0e17\u0e1e": 5, "\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23": [6, 15], "\u0e07\u0e40\u0e17\u0e1e\u0e40\u0e1b": 7, "\u0e07\u0e40\u0e25": 11, "\u0e07\u0e40\u0e2a": 9, "\u0e07\u0e40\u0e2d": 9, "\u0e07\u0e42\u0e22\u0e04": 10, "\u0e07\u0e43\u0e04\u0e23": 17, "\u0e07\u0e43\u0e2a": 15, "\u0e07\u0e43\u0e2a\u0e40\u0e1b": 15, "\u0e07\u0e44\u0e25": 9, "\u0e08": [0, 5, 7, 13, 16, 17, 22, 28], "\u0e08\u0e01\u0e01": 0, "\u0e08\u0e07": 16, "\u0e08\u0e08": [13, 22], "\u0e08\u0e1e\u0e23\u0e30\u0e08": 15, "\u0e08\u0e1e\u0e23\u0e30\u0e08\u0e2d\u0e21\u0e40\u0e01\u0e25": 15, "\u0e08\u0e23": [10, 16], "\u0e08\u0e2d\u0e07": 9, "\u0e08\u0e30": 17, "\u0e08\u0e30\u0e17\u0e33\u0e43\u0e2b": 15, "\u0e08\u0e30\u0e21\u0e32\u0e19": 22, "\u0e08\u0e32\u0e01": 16, "\u0e08\u0e33\u0e19\u0e27\u0e19": [16, 22], "\u0e08\u0e33\u0e25\u0e2d\u0e07": 6, "\u0e09": [9, 16, 17, 28], "\u0e0a": [13, 14, 15, 16, 17, 22, 25], "\u0e0a\u0e01\u0e32\u0e23\u0e1b": 22, "\u0e0a\u0e01\u0e32\u0e25\u0e1b": 22, "\u0e0a\u0e22": 13, "\u0e0a\u0e2a\u0e21": 15, "\u0e0a\u0e32\u0e27\u0e0a": 28, "\u0e0b": [15, 16, 22], "\u0e0d": [13, 16], "\u0e0d\u0e08\u0e23": 10, "\u0e0d\u0e0a": 16, "\u0e0d\u0e0a\u0e32": 14, "\u0e0d\u0e0d\u0e32": 14, "\u0e0d\u0e28": 6, "\u0e0d\u0e2b\u0e32": 14, "\u0e0d\u0e2b\u0e32\u0e22": 28, "\u0e0d\u0e40\u0e15": 15, "\u0e0d\u0e43\u0e19\u0e01\u0e32\u0e23\u0e2a\u0e23": 6, "\u0e10\u0e18\u0e23\u0e23\u0e21\u0e19": 16, "\u0e10\u0e32\u0e19": 10, "\u0e12": 17, "\u0e12\u0e19": 6, "\u0e12\u0e19\u0e18\u0e23\u0e23\u0e21": 15, "\u0e12\u0e19\u0e32\u0e01\u0e32\u0e23": 17, "\u0e13": [16, 17], "\u0e13\u0e10\u0e32\u0e19": 10, "\u0e13\u0e2b": 13, "\u0e13\u0e32": 16, "\u0e14": [11, 14, 15, 16, 17, 22, 28], "\u0e14\u0e16": 15, "\u0e14\u0e17": 16, "\u0e14\u0e19\u0e32\u0e17": 22, "\u0e14\u0e1a\u0e32\u0e17\u0e16": 22, "\u0e14\u0e1b\u0e01\u0e15": 17, "\u0e14\u0e1b\u0e23\u0e30\u0e0a\u0e32\u0e0a\u0e19\u0e14": 22, "\u0e14\u0e1e\u0e25": 15, "\u0e14\u0e21\u0e1e\u0e32\u0e13": 13, "\u0e14\u0e25": [6, 22], "\u0e14\u0e25\u0e32\u0e19\u0e2a": 22, "\u0e14\u0e2b\u0e19": 25, "\u0e14\u0e2d": [13, 22], "\u0e14\u0e2d\u0e01\u0e44\u0e21": 9, "\u0e14\u0e32\u0e27\u0e40\u0e23": 6, "\u0e14\u0e40\u0e01": 22, "\u0e14\u0e41\u0e25": 15, "\u0e14\u0e42\u0e17\u0e29": 15, "\u0e14\u0e42\u0e17\u0e29\u0e15": 15, "\u0e14\u0e46": 15, "\u0e15": [6, 10, 13, 14, 15, 16, 17, 22, 25, 28], "\u0e15\u0e22": [15, 22], "\u0e15\u0e23": 22, "\u0e15\u0e23\u0e20\u0e32\u0e1a": 14, "\u0e15\u0e23\u0e20\u0e32\u0e1e": 14, "\u0e15\u0e23\u0e30\u0e01": 6, "\u0e15\u0e23\u0e40\u0e08": 15, "\u0e15\u0e27\u0e32": 22, "\u0e15\u0e2a\u0e32\u0e2b\u0e01\u0e23\u0e23\u0e21": 22, "\u0e15\u0e2a\u0e33\u0e2b\u0e23": 25, "\u0e15\u0e2d\u0e19": 16, "\u0e15\u0e2d\u0e25\u0e2e": 16, "\u0e15\u0e30\u0e27": 10, "\u0e15\u0e32": 29, "\u0e15\u0e32\u0e01": 29, "\u0e15\u0e33\u0e2b\u0e19": 15, "\u0e16": [15, 16, 22, 29], "\u0e16\u0e27": 6, "\u0e16\u0e2d\u0e14\u0e40\u0e2a": 20, "\u0e17": [15, 16, 17, 22, 28], "\u0e17\u0e14\u0e2a\u0e2d\u0e1a": 16, "\u0e17\u0e14\u0e2a\u0e2d\u0e1a\u0e19\u0e32\u0e22\u0e27\u0e23\u0e23\u0e13\u0e1e\u0e07\u0e29": 16, "\u0e17\u0e14\u0e2a\u0e2d\u0e1a\u0e20\u0e32\u0e29\u0e32\u0e44\u0e17\u0e22": 22, "\u0e17\u0e14\u0e2a\u0e2d\u0e1a\u0e23\u0e30\u0e1a\u0e1a\u0e40\u0e27\u0e25\u0e32": 16, "\u0e17\u0e17": 16, "\u0e17\u0e22\u0e32\u0e19": 13, "\u0e17\u0e22\u0e32\u0e25": [6, 13], "\u0e17\u0e22\u0e32\u0e28\u0e32\u0e2a\u0e15\u0e23": 16, "\u0e17\u0e2d\u0e07": 9, "\u0e17\u0e2d\u0e07\u0e08": 16, "\u0e17\u0e2d\u0e07\u0e2d": 6, "\u0e17\u0e2d\u0e40\u0e23": 15, "\u0e17\u0e32\u0e07": 16, "\u0e17\u0e33": 28, "\u0e17\u0e33\u0e01\u0e32\u0e23\u0e28": 17, "\u0e17\u0e33\u0e07\u0e32\u0e19": 16, "\u0e17\u0e33\u0e07\u0e32\u0e19\u0e44\u0e14": 15, "\u0e17\u0e33\u0e40\u0e19": 15, "\u0e17\u0e33\u0e40\u0e1b": 25, "\u0e17\u0e33\u0e43\u0e2b": 15, "\u0e17\u0e41\u0e2d\u0e1b\u0e40\u0e1b": 7, "\u0e18": [15, 22], "\u0e18\u0e07_\u0e44\u0e17\u0e22": 22, "\u0e18\u0e19\u0e32\u0e04\u0e32\u0e23\u0e41\u0e2b": 22, "\u0e18\u0e23\u0e23\u0e21\u0e14\u0e32": 16, "\u0e19": [0, 5, 6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 20, 22, 28, 29], "\u0e191": 17, "\u0e19\u0e01": [16, 22], "\u0e19\u0e04\u0e19\u0e14": 11, "\u0e19\u0e04\u0e27": 17, "\u0e19\u0e04\u0e33\u0e44\u0e17\u0e22\u0e15\u0e32\u0e21\u0e40\u0e2a": 13, "\u0e19\u0e08": 22, "\u0e19\u0e08\u0e33\u0e19\u0e27\u0e19": 22, "\u0e19\u0e0a": [9, 25], "\u0e19\u0e0a\u0e2d\u0e1a\u0e01": 9, "\u0e19\u0e0b": 7, "\u0e19\u0e14": 22, "\u0e19\u0e15\u0e23\u0e07": 14, "\u0e19\u0e15\u0e23\u0e1a": 14, "\u0e19\u0e17": [15, 16, 17, 22], "\u0e19\u0e17\u0e23": [6, 13, 16, 22], "\u0e19\u0e18": [6, 13, 22], "\u0e19\u0e19": 10, "\u0e19\u0e19\u0e17\u0e1a": 6, "\u0e19\u0e1a": [6, 15, 16], "\u0e19\u0e1b": [15, 22], "\u0e19\u0e1b\u0e23\u0e30\u0e18\u0e32\u0e19\u0e18": 16, "\u0e19\u0e21": 28, "\u0e19\u0e21\u0e23\u0e14\u0e01\u0e15\u0e01\u0e17\u0e2d\u0e14\u0e21\u0e32\u0e16": 15, "\u0e19\u0e21\u0e32\u0e08\u0e32\u0e01\u0e1c\u0e25\u0e07\u0e32\u0e19\u0e27": 17, "\u0e19\u0e22": [22, 28], "\u0e19\u0e22\u0e32\u0e22\u0e19": 17, "\u0e19\u0e23\u0e30\u0e22\u0e30": 17, "\u0e19\u0e23\u0e32": 20, "\u0e19\u0e27\u0e32\u0e04\u0e21": 22, "\u0e19\u0e2a\u0e01": 15, "\u0e19\u0e2a\u0e19\u0e32\u0e19": 16, "\u0e19\u0e2a\u0e32\u0e21\u0e1e": 22, "\u0e19\u0e2b\u0e01\u0e23": 22, "\u0e19\u0e2b\u0e01\u0e23\u0e2d\u0e22\u0e2a": 22, "\u0e19\u0e2b\u0e19": 22, "\u0e19\u0e2b\u0e23": 15, "\u0e19\u0e2b\u0e32\u0e0a": 13, "\u0e19\u0e2d": [20, 22], "\u0e19\u0e2d\u0e19": 17, "\u0e19\u0e2d\u0e23": 14, "\u0e19\u0e2d\u0e30\u0e44\u0e23\u0e17": 15, "\u0e19\u0e2d\u0e32\u0e01\u0e32\u0e23": 17, "\u0e19\u0e2d\u0e32\u0e01\u0e32\u0e23\u0e1c": 17, "\u0e19\u0e2d\u0e32\u0e17": 22, "\u0e19\u0e2d\u0e32\u0e2b\u0e32\u0e23\u0e0d": 22, "\u0e19\u0e30": 16, "\u0e19\u0e30\u0e04\u0e23": 22, "\u0e19\u0e32": 17, "\u0e19\u0e32\u0e01\u0e32\u0e23": 17, "\u0e19\u0e32\u0e04\u0e21": [17, 22], "\u0e19\u0e32\u0e07\u0e1b\u0e23\u0e30\u0e19\u0e2d\u0e21": 16, "\u0e19\u0e32\u0e17": 22, "\u0e19\u0e32\u0e19\u0e32": 22, "\u0e19\u0e32\u0e19\u0e32\u0e32\u0e32": 22, "\u0e19\u0e32\u0e22": [5, 16], "\u0e19\u0e32\u0e22\u0e01": 16, "\u0e19\u0e32\u0e22\u0e19": 22, "\u0e19\u0e32\u0e22\u0e27\u0e23\u0e23\u0e13\u0e1e\u0e07\u0e29": 16, "\u0e19\u0e32\u0e23": 20, "\u0e19\u0e32\u0e2c": 22, "\u0e19\u0e40\u0e0b": 8, "\u0e19\u0e40\u0e17\u0e2d\u0e23": [14, 25], "\u0e19\u0e40\u0e1f": 28, "\u0e19\u0e40\u0e21": 7, "\u0e19\u0e40\u0e25": 25, "\u0e19\u0e40\u0e27": 17, "\u0e19\u0e40\u0e2a\u0e32\u0e23": 22, "\u0e19\u0e41\u0e1b\u0e14\u0e23": 22, "\u0e19\u0e41\u0e2d\u0e25\u0e1e": 22, "\u0e19\u0e42\u0e0b": 17, "\u0e19\u0e42\u0e14\u0e27\u0e2a": 16, "\u0e19\u0e43\u0e08\u0e17": 15, "\u0e19\u0e43\u0e08\u0e2a": 15, "\u0e19\u0e43\u0e19\u0e04\u0e33": 28, "\u0e19\u0e43\u0e19\u0e1e\u0e23\u0e30\u0e1a\u0e32\u0e17\u0e2a\u0e21\u0e40\u0e14": 15, "\u0e19\u0e44\u0e01": 9, "\u0e19\u0e44\u0e1b\u0e1b\u0e23\u0e30\u0e0a": 17, "\u0e1a": [0, 8, 13, 14, 15, 16, 17, 22, 28, 29], "\u0e1a551": 13, "\u0e1a5515": 13, "\u0e1a55150": 13, "\u0e1a931900": 13, "\u0e1ae419": 13, "\u0e1a\u0e01\u0e32\u0e23\u0e2b\u0e21": 17, "\u0e1a\u0e02": 25, "\u0e1a\u0e02\u0e2d\u0e07\u0e1e\u0e23\u0e30\u0e40\u0e08": 15, "\u0e1a\u0e04": 13, "\u0e1a\u0e07\u0e07\u0e04\u0e1a\u0e1a": 0, "\u0e1a\u0e08": 22, "\u0e1a\u0e08\u0e2d\u0e07": 9, "\u0e1a\u0e0a": 6, "\u0e1a\u0e14": 15, "\u0e1a\u0e17\u0e04\u0e27\u0e32\u0e21\u0e19": 17, "\u0e1a\u0e19": [16, 25], "\u0e1a\u0e19\u0e16\u0e19\u0e19\u0e1e\u0e23\u0e30\u0e2d\u0e32\u0e17": 15, "\u0e1a\u0e20": 17, "\u0e1a\u0e21\u0e2d\u0e1a\u0e2b\u0e21\u0e32\u0e22\u0e43\u0e2b": 17, "\u0e1a\u0e23": 14, "\u0e1a\u0e25": 22, "\u0e1a\u0e25\u0e23\u0e32\u0e0a\u0e18\u0e32\u0e19": 6, "\u0e1a\u0e27": 5, "\u0e1a\u0e2a\u0e2d\u0e07": 22, "\u0e1a\u0e2a\u0e2d\u0e07\u0e19\u0e32\u0e2c": 22, "\u0e1a\u0e32\u0e07": 16, "\u0e1a\u0e32\u0e07\u0e01": 5, "\u0e1a\u0e32\u0e07\u0e04\u0e19\u0e16": 28, "\u0e1a\u0e32\u0e17": [16, 17, 22], "\u0e1a\u0e32\u0e23": 16, "\u0e1a\u0e40\u0e01": [22, 25], "\u0e1a\u0e40\u0e08": 22, "\u0e1a\u0e40\u0e0a": 8, "\u0e1a\u0e40\u0e2d": 22, "\u0e1a\u0e42\u0e15": 15, "\u0e1b": [13, 14, 16, 22], "\u0e1b223": 13, "\u0e1b3e54": 13, "\u0e1b775300": 13, "\u0e1b\u0e01\u0e15": 17, "\u0e1b\u0e04\u0e27\u0e32\u0e21\u0e20\u0e32\u0e29\u0e32\u0e44\u0e17\u0e22\u0e42\u0e14\u0e22\u0e43\u0e0a": 6, "\u0e1b\u0e14": 16, "\u0e1b\u0e17\u0e32": 10, "\u0e1b\u0e23": 14, "\u0e1b\u0e23\u0e30\u0e01\u0e32\u0e23\u0e2b\u0e19": 6, "\u0e1b\u0e23\u0e30\u0e08\u0e33\u0e43\u0e19\u0e23\u0e30\u0e14": 17, "\u0e1b\u0e23\u0e30\u0e17": 15, "\u0e1b\u0e23\u0e30\u0e18\u0e32\u0e19\u0e32\u0e18": 16, "\u0e1b\u0e23\u0e30\u0e21\u0e32\u0e13": 16, "\u0e1b\u0e23\u0e32\u0e08": 16, "\u0e1c": [16, 17, 28], "\u0e1c\u0e21": [5, 11, 16, 28], "\u0e1c\u0e21\u0e23": 5, "\u0e1c\u0e21\u0e40\u0e1b": 11, "\u0e1c\u0e25": 28, "\u0e1d": 16, "\u0e1d\u0e32": 17, "\u0e1e": [6, 11, 13, 15, 16, 17, 22, 28], "\u0e1e\u0e07\u0e29": 16, "\u0e1e\u0e0d\u0e32\u0e40\u0e08": 15, "\u0e1e\u0e19\u0e18": 13, "\u0e1e\u0e23": 22, "\u0e1e\u0e23\u0e30\u0e2d\u0e07\u0e04": 15, "\u0e1e\u0e23\u0e30\u0e40\u0e08": 15, "\u0e1e\u0e24": 22, "\u0e1e\u0e24\u0e28\u0e08": 22, "\u0e1e\u0e25\u0e40\u0e2d\u0e01": 16, "\u0e1e\u0e27\u0e01": 16, "\u0e1e\u0e27\u0e01\u0e40\u0e23\u0e32": 17, "\u0e1e\u0e27\u0e01\u0e40\u0e23\u0e32\u0e23": 17, "\u0e1e\u0e2d\u0e14": 16, "\u0e1e\u0e30": 20, "\u0e1e\u0e32\u0e01": 28, "\u0e1e\u0e32\u0e1a": 20, "\u0e1f": [22, 28], "\u0e1f\u0e23\u0e2a\u0e1f": 22, "\u0e1f\u0e40\u0e27\u0e2d\u0e23": 8, "\u0e20": [6, 16], "\u0e20\u0e32": 28, "\u0e20\u0e32\u0e04": 17, "\u0e20\u0e32\u0e1e\u0e22\u0e19\u0e15\u0e23": 20, "\u0e20\u0e32\u0e1e\u0e27\u0e32\u0e14": 17, "\u0e20\u0e32\u0e29\u0e32": [17, 29], "\u0e20\u0e32\u0e29\u0e32\u0e16": 29, "\u0e21": [5, 6, 9, 13, 14, 15, 16, 17, 22, 28], "\u0e21\u0e01\u0e23\u0e32\u0e04\u0e21": 22, "\u0e21\u0e01\u0e32\u0e23\u0e40\u0e1b\u0e25": 15, "\u0e21\u0e0a\u0e19\u0e42\u0e04\u0e01\u0e22\u0e32\u0e27\u0e2b\u0e25\u0e32\u0e22\u0e04\u0e19\u0e44\u0e14": 28, "\u0e21\u0e1b\u0e17\u0e32": 10, "\u0e21\u0e20\u0e32\u0e1e": 22, "\u0e21\u0e22": 22, "\u0e21\u0e2b\u0e32\u0e27": [6, 13], "\u0e21\u0e2d": 22, "\u0e21\u0e30\u0e19\u0e32\u0e27": 14, "\u0e21\u0e30\u0e21": 10, "\u0e21\u0e32": [16, 22], "\u0e21\u0e32\u0e01": [16, 22], "\u0e21\u0e32\u0e08\u0e32\u0e01": 5, "\u0e21\u0e32\u0e14": 20, "\u0e21\u0e40\u0e02": 15, "\u0e21\u0e40\u0e1b": 15, "\u0e21\u0e40\u0e21": 17, "\u0e21\u0e41\u0e23\u0e01": 17, "\u0e21\u0e41\u0e23\u0e01\u0e02\u0e2d\u0e07": 17, "\u0e21\u0e41\u0e23\u0e01\u0e41\u0e25": 5, "\u0e22": [6, 8, 13, 14, 15, 16, 17, 22, 28], "\u0e22\u0e01\u0e2d\u0e32\u0e04\u0e32\u0e23\u0e2b\u0e25": 15, "\u0e22\u0e01\u0e44": 14, "\u0e22\u0e07": [6, 13, 16, 22], "\u0e22\u0e07\u0e20\u0e32\u0e29\u0e32\u0e44\u0e17\u0e22\u0e40\u0e1b": 20, "\u0e22\u0e07\u0e2a\u0e15\u0e32\u0e07\u0e04": 11, "\u0e22\u0e07\u0e2b\u0e21\u0e32": 9, "\u0e22\u0e07\u0e2d": 13, "\u0e22\u0e07\u0e40\u0e2b\u0e21": 13, "\u0e22\u0e0a": 28, "\u0e22\u0e13\u0e23\u0e07\u0e04": 15, "\u0e22\u0e17": 17, "\u0e22\u0e18\u0e23\u0e23\u0e21\u0e28\u0e32\u0e2a\u0e15\u0e23": 6, "\u0e22\u0e19": [6, 17, 20], "\u0e22\u0e19\u0e02\u0e2d\u0e07\u0e40\u0e23\u0e32\u0e19": 22, "\u0e22\u0e19\u0e2a": 17, "\u0e22\u0e19\u0e40\u0e1b": 17, "\u0e22\u0e19\u0e41\u0e1b\u0e25\u0e07": 15, "\u0e22\u0e19\u0e41\u0e1b\u0e25\u0e07\u0e15": 15, "\u0e22\u0e1a\u0e17": 15, "\u0e22\u0e1e\u0e23\u0e30\u0e1a\u0e32\u0e17\u0e2a\u0e21\u0e40\u0e14": 15, "\u0e22\u0e23": 9, "\u0e22\u0e27": 16, "\u0e22\u0e27\u0e30\u0e15": 15, "\u0e22\u0e30": 15, "\u0e22\u0e32\u0e20\u0e23\u0e13": 10, "\u0e22\u0e43\u0e19\u0e04\u0e27\u0e32\u0e21\u0e1a\u0e01\u0e1e\u0e23": 17, "\u0e22\u0e44\u0e1e\u0e1a": 16, "\u0e23": [5, 6, 8, 13, 14, 15, 16, 17, 28, 29], "\u0e23100": 13, "\u0e231000": 13, "\u0e23100000": 13, "\u0e23\u0e13\u0e01\u0e32\u0e23": 13, "\u0e23\u0e23": [0, 22], "\u0e23\u0e2d\u0e14": 16, "\u0e23\u0e30\u0e0a": 13, "\u0e23\u0e30\u0e1a": 5, "\u0e23\u0e30\u0e1a\u0e1a": 16, "\u0e23\u0e32": [17, 20], "\u0e23\u0e32\u0e0a\u0e27\u0e07\u0e28": 17, "\u0e25": [6, 7, 13, 16, 17], "\u0e25100": 13, "\u0e25\u0e02\u0e2d\u0e07\u0e1c": 25, "\u0e25\u0e04\u0e04\u0e19\u0e40\u0e01": 9, "\u0e25\u0e04\u0e0a\u0e40\u0e2a\u0e19": 15, "\u0e25\u0e08\u0e2d\u0e21\u0e40\u0e01\u0e25": 15, "\u0e25\u0e1b\u0e27": 15, "\u0e25\u0e21": 29, "\u0e25\u0e22": 16, "\u0e25\u0e30": 16, "\u0e25\u0e32\u0e22\u0e25": 22, "\u0e25\u0e32\u0e27": 6, "\u0e27": [5, 9, 13, 14, 15, 16, 17, 22, 28], "\u0e27330000": 28, "\u0e274000": 28, "\u0e27\u0e01": 9, "\u0e27\u0e02": 22, "\u0e27\u0e07": 10, "\u0e27\u0e17": 13, "\u0e27\u0e19": [15, 16, 17, 22], "\u0e27\u0e19\u0e17": 15, "\u0e27\u0e1a\u0e17": 6, "\u0e27\u0e22\u0e17\u0e33\u0e43\u0e2b": 15, "\u0e27\u0e23": 14, "\u0e27\u0e23\u0e23\u0e13": [13, 16, 28], "\u0e27\u0e23\u0e23\u0e13\u0e01\u0e23\u0e23\u0e21": 17, "\u0e27\u0e25\u0e30\u0e01": 15, "\u0e27\u0e2d": 22, "\u0e27\u0e2d\u0e1a\u0e43\u0e2b": 25, "\u0e27\u0e32": 17, "\u0e27\u0e40\u0e15\u0e2d\u0e23": 25, "\u0e27\u0e40\u0e1b": 8, "\u0e27\u0e40\u0e2d\u0e07": 16, "\u0e27\u0e42\u0e1b\u0e23\u0e14\u0e40\u0e01\u0e25": 15, "\u0e27\u0e42\u0e21\u0e07": 16, "\u0e27\u0e46": 16, "\u0e28": [6, 15, 16, 17, 22], "\u0e28\u0e23": 15, "\u0e29": [6, 7, 15], "\u0e29\u0e10\u0e32\u0e19": 10, "\u0e29\u0e20": 6, "\u0e29\u0e41\u0e25\u0e30": 15, "\u0e29\u0e41\u0e25\u0e30\u0e44\u0e21": 15, "\u0e2a": [5, 10, 14, 15, 16, 17, 22, 28], "\u0e2a\u0e14": [6, 8], "\u0e2a\u0e15\u0e32\u0e07\u0e04": 22, "\u0e2a\u0e19": 16, "\u0e2a\u0e19\u0e32\u0e21": 16, "\u0e2a\u0e20\u0e32\u0e1e": 28, "\u0e2a\u0e20\u0e32\u0e1e\u0e01\u0e32\u0e23\u0e08": 28, "\u0e2a\u0e21": 16, "\u0e2a\u0e22": 16, "\u0e2a\u0e23": [10, 15], "\u0e2a\u0e23\u0e23": 9, "\u0e2a\u0e23\u0e23\u0e40\u0e1e\u0e0a\u0e0d": 0, "\u0e2a\u0e23\u0e30": 0, "\u0e2a\u0e27": [6, 8], "\u0e2a\u0e27\u0e22": 16, "\u0e2a\u0e27\u0e22\u0e07\u0e32\u0e21": 9, "\u0e2a\u0e2d\u0e07": [16, 22], "\u0e2a\u0e2d\u0e07\u0e1e": 22, "\u0e2a\u0e2d\u0e07\u0e23": 22, "\u0e2a\u0e2d\u0e07\u0e25": 22, "\u0e2a\u0e2d\u0e07\u0e42\u0e21\u0e07\u0e40\u0e0a": 22, "\u0e2a\u0e32": 20, "\u0e2a\u0e32\u0e21": 16, "\u0e2a\u0e32\u0e21\u0e32\u0e23\u0e16": [10, 20], "\u0e2a\u0e32\u0e27": 9, "\u0e2a\u0e33\u0e2b\u0e23": 16, "\u0e2b": [15, 16, 17, 22], "\u0e2b\u0e01\u0e42\u0e21\u0e07\u0e04\u0e23": 22, "\u0e2b\u0e19": [16, 22], "\u0e2b\u0e19\u0e2d\u0e07\u0e04\u0e32\u0e22": 16, "\u0e2b\u0e21": [17, 22, 28], "\u0e2b\u0e21\u0e32": 9, "\u0e2b\u0e21\u0e32\u0e0a": 9, "\u0e2b\u0e21\u0e32\u0e22\u0e16": 15, "\u0e2b\u0e23": [15, 16], "\u0e2b\u0e25": 13, "\u0e2b\u0e25\u0e1a\u0e20": 16, "\u0e2b\u0e25\u0e32\u0e22": 16, "\u0e2b\u0e25\u0e32\u0e22\u0e1b": 28, "\u0e2b\u0e27\u0e32\u0e19": 14, "\u0e2b\u0e32\u0e01": 16, "\u0e2b\u0e32\u0e23": 15, "\u0e2c\u0e32": 16, "\u0e2c\u0e32\u0e25\u0e07\u0e01\u0e23\u0e13": 13, "\u0e2d": [0, 5, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 22, 28], "\u0e2d\u0e01\u0e1b\u0e23\u0e30\u0e42\u0e22\u0e04\u0e2a\u0e33\u0e04": 6, "\u0e2d\u0e02\u0e19\u0e21\u0e0a\u0e19": 25, "\u0e2d\u0e02\u0e2d\u0e07\u0e40\u0e2b\u0e25\u0e27": 15, "\u0e2d\u0e04": 13, "\u0e2d\u0e07": [6, 16, 17, 28], "\u0e2d\u0e07\u0e01\u0e32\u0e23\u0e04": 25, "\u0e2d\u0e07\u0e08\u0e32\u0e01": 16, "\u0e2d\u0e07\u0e0a\u0e32\u0e27\u0e1a": 11, "\u0e2d\u0e07\u0e17": [17, 28], "\u0e2d\u0e07\u0e2b\u0e25\u0e27\u0e07\u0e02\u0e2d\u0e07\u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22": 7, "\u0e2d\u0e07\u0e40\u0e18": 9, "\u0e2d\u0e07\u0e40\u0e1e\u0e25\u0e07": 16, "\u0e2d\u0e07\u0e40\u0e2a": 13, "\u0e2d\u0e07\u0e44\u0e21": 15, "\u0e2d\u0e08": 13, "\u0e2d\u0e08\u0e33\u0e19\u0e27\u0e19\u0e17": 22, "\u0e2d\u0e14": 15, "\u0e2d\u0e16": [17, 22], "\u0e2d\u0e18\u0e07\u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22": 22, "\u0e2d\u0e19": [9, 16], "\u0e2d\u0e19\u0e01": [9, 13, 16], "\u0e2d\u0e19\u0e1c\u0e21\u0e01": 22, "\u0e2d\u0e19\u0e41\u0e01": 15, "\u0e2d\u0e1a": [16, 28], "\u0e2d\u0e1a\u0e40\u0e04\u0e22\u0e40\u0e1b": 7, "\u0e2d\u0e1b\u0e1b": 20, "\u0e2d\u0e1e": 28, "\u0e2d\u0e21": [8, 25], "\u0e2d\u0e21\u0e32\u0e40\u0e23": 15, "\u0e2d\u0e21\u0e32\u0e43\u0e19\u0e23": 15, "\u0e2d\u0e21\u0e41\u0e0b\u0e21\u0e2a": 15, "\u0e2d\u0e22": [15, 16, 17, 22], "\u0e2d\u0e22\u0e1a\u0e32\u0e17\u0e16": 22, "\u0e2d\u0e22\u0e2a": 22, "\u0e2d\u0e22\u0e41\u0e1b\u0e14\u0e2a": 22, "\u0e2d\u0e23": 15, "\u0e2d\u0e27": [15, 17], "\u0e2d\u0e2a\u0e32\u0e22\u0e21\u0e2d\u0e0d": 15, "\u0e2d\u0e2b\u0e21": 9, "\u0e2d\u0e2d\u0e01\u0e40\u0e2a": 13, "\u0e2d\u0e30": [0, 17], "\u0e2d\u0e30\u0e40\u0e1f\u0e40\u0e0b": 17, "\u0e2d\u0e30\u0e44\u0e23": 16, "\u0e2d\u0e32": [17, 22], "\u0e2d\u0e32\u0e01\u0e32\u0e23": 17, "\u0e2d\u0e32\u0e04\u0e32\u0e23": 16, "\u0e2d\u0e32\u0e2b\u0e32\u0e23": [15, 16], "\u0e2d\u0e32\u0e2b\u0e32\u0e23\u0e08\u0e30\u0e15": 15, "\u0e2d\u0e32\u0e40\u0e1a\u0e30": 17, "\u0e2d\u0e41\u0e21": 28, "\u0e2f\u0e25\u0e2f": 15, "\u0e30": 16, "\u0e32": [6, 15, 16, 22, 28], "\u0e32\u0e01": 16, "\u0e32\u0e01\u0e24\u0e14\u0e32\u0e20": 15, "\u0e32\u0e07": [15, 16, 28], "\u0e32\u0e07\u0e01": 28, "\u0e32\u0e07\u0e01\u0e27": 17, "\u0e32\u0e07\u0e01\u0e32\u0e22": 15, "\u0e32\u0e07\u0e01\u0e32\u0e22\u0e40\u0e08\u0e23": 15, "\u0e32\u0e07\u0e01\u0e32\u0e22\u0e41\u0e25": 15, "\u0e32\u0e07\u0e02\u0e27\u0e32\u0e07\u0e41\u0e15": 17, "\u0e32\u0e07\u0e15\u0e33\u0e2b\u0e19": 15, "\u0e32\u0e07\u0e1b\u0e01\u0e15": 15, "\u0e32\u0e07\u0e41\u0e25\u0e30\u0e2a\u0e20\u0e32\u0e1e\u0e01\u0e32\u0e23\u0e17\u0e33\u0e07\u0e32\u0e19": 28, "\u0e32\u0e07\u0e43\u0e14": 17, "\u0e32\u0e07\u0e44\u0e23": 16, "\u0e32\u0e07\u0e46": [15, 16], "\u0e32\u0e08\u0e2d\u0e21\u0e21\u0e32\u0e23\u0e14\u0e32": 15, "\u0e32\u0e08\u0e2d\u0e21\u0e21\u0e32\u0e23\u0e14\u0e32\u0e01\u0e25": 15, "\u0e32\u0e0a": 15, "\u0e32\u0e17\u0e2d\u0e07": 9, "\u0e32\u0e19": [13, 16], "\u0e32\u0e19\u0e01\u0e33\u0e25": 11, "\u0e32\u0e19\u0e02\u0e2d\u0e07\u0e40\u0e08": 15, "\u0e32\u0e19\u0e1a\u0e32\u0e17": 16, "\u0e32\u0e19\u0e21\u0e32": 28, "\u0e32\u0e19\u0e2a": 22, "\u0e32\u0e19\u0e2a\u0e2d\u0e07\u0e2b\u0e21": 22, "\u0e32\u0e19\u0e2a\u0e32\u0e21\u0e41\u0e2a\u0e19\u0e2b\u0e01\u0e23": 22, "\u0e32\u0e19\u0e40\u0e01": 17, "\u0e32\u0e1a\u0e23\u0e21\u0e27\u0e07\u0e28": 15, "\u0e32\u0e1a\u0e32\u0e17": 22, "\u0e32\u0e1a\u0e32\u0e17\u0e19": 22, "\u0e32\u0e1e": 15, "\u0e32\u0e1e\u0e23\u0e30\u0e22\u0e32\u0e21\u0e2b\u0e32\u0e42\u0e22\u0e18\u0e32": 15, "\u0e32\u0e1e\u0e23\u0e30\u0e22\u0e32\u0e21\u0e2b\u0e32\u0e42\u0e22\u0e18\u0e32\u0e19\u0e23\u0e32\u0e18": 15, "\u0e32\u0e21": 16, "\u0e32\u0e22": [16, 22], "\u0e32\u0e22\u0e2d\u0e2d\u0e01": 28, "\u0e32\u0e22\u0e42\u0e21\u0e07\u0e04\u0e23": 22, "\u0e32\u0e23": [14, 22], "\u0e32\u0e23\u0e32\u0e0a\u0e01\u0e32\u0e23\u0e44\u0e14": 17, "\u0e32\u0e27\u0e2d\u0e22\u0e32\u0e01\u0e01": 22, "\u0e32\u0e2a": [15, 22], "\u0e32\u0e2b": 22, "\u0e32\u0e2b\u0e23": 28, "\u0e32\u0e2d": 16, "\u0e32\u0e2d\u0e22": [15, 16, 22], "\u0e32\u0e2f": 15, "\u0e32\u0e40\u0e08": 15, "\u0e32\u0e40\u0e1b": 15, "\u0e32\u0e41\u0e02": 15, "\u0e32\u0e42\u0e21\u0e07\u0e40\u0e0a": 16, "\u0e32\u0e43\u0e2b\u0e21": 17, "\u0e32\u0e46": 16, "\u0e33\u0e40\u0e2a\u0e21\u0e2d": 16, "\u0e33\u0e41\u0e02": 15, "\u0e40\u0e01": [15, 16, 17, 22], "\u0e40\u0e01\u0e2d\u0e27": 9, "\u0e40\u0e02": [5, 16, 17], "\u0e40\u0e02\u0e15\u0e1e\u0e23\u0e30\u0e19\u0e04\u0e23": 15, "\u0e40\u0e02\u0e32": 16, "\u0e40\u0e02\u0e32\u0e01\u0e33\u0e25": 25, "\u0e40\u0e02\u0e32\u0e0a": 9, "\u0e40\u0e04": 29, "\u0e40\u0e04\u0e22": 16, "\u0e40\u0e04\u0e22\u0e17\u0e33\u0e21\u0e32\u0e43\u0e19\u0e2d\u0e14": 17, "\u0e40\u0e04\u0e2d\u0e23": 28, "\u0e40\u0e07": 17, "\u0e40\u0e08": 15, "\u0e40\u0e08\u0e23": [13, 15], "\u0e40\u0e0a": [15, 16], "\u0e40\u0e0a\u0e2d\u0e23": 16, "\u0e40\u0e14": [14, 15], "\u0e40\u0e15": 6, "\u0e40\u0e16\u0e2d\u0e30": 16, "\u0e40\u0e17": 16, "\u0e40\u0e18\u0e2d": [15, 16], "\u0e40\u0e19": [14, 16, 25], "\u0e40\u0e1a\u0e30": 17, "\u0e40\u0e1b": [11, 15, 16, 17, 22], "\u0e40\u0e1c": 28, "\u0e40\u0e1c\u0e0a": 16, "\u0e40\u0e1e": [6, 13, 16], "\u0e40\u0e1e\u0e22\u0e19": 14, "\u0e40\u0e1e\u0e23\u0e32\u0e30\u0e27": [15, 16], "\u0e40\u0e1e\u0e25": 14, "\u0e40\u0e1e\u0e25\u0e07": 14, "\u0e40\u0e1f\u0e40\u0e0b": 17, "\u0e40\u0e21": [16, 22], "\u0e40\u0e23": [6, 9, 16, 17], "\u0e40\u0e23\u0e32": [16, 17, 29], "\u0e40\u0e23\u0e32\u0e23": 29, "\u0e40\u0e23\u0e32\u0e40\u0e25": 17, "\u0e40\u0e25": [16, 17], "\u0e40\u0e25\u0e02": 22, "\u0e40\u0e25\u0e22": 16, "\u0e40\u0e27": 25, "\u0e40\u0e27\u0e25\u0e32": [16, 22], "\u0e40\u0e28\u0e29": 16, "\u0e40\u0e2a": [14, 16, 22, 28], "\u0e40\u0e2a\u0e17\u0e2d\u0e46": 16, "\u0e40\u0e2a\u0e32": 15, "\u0e40\u0e2a\u0e32\u0e44\u0e1f\u0e1f": 15, "\u0e40\u0e2b": 16, "\u0e40\u0e2b\u0e15": [14, 22, 28], "\u0e40\u0e2b\u0e15\u0e01\u0e32\u0e23\u0e13": 14, "\u0e40\u0e2b\u0e21": [9, 16, 22], "\u0e40\u0e2b\u0e23\u0e2d": 16, "\u0e40\u0e2d": [9, 16], "\u0e40\u0e2d\u0e01": 22, "\u0e40\u0e2d\u0e07": 9, "\u0e40\u0e2d\u0e2d": [9, 16], "\u0e40\u0e40\u0e1b\u0e25\u0e01": 22, "\u0e41\u0e01": 16, "\u0e41\u0e04\u0e19\u0e32\u0e14\u0e32": 6, "\u0e41\u0e04\u0e1b": 16, "\u0e41\u0e15": [6, 16, 25], "\u0e41\u0e19": 15, "\u0e41\u0e1a\u0e19": 25, "\u0e41\u0e1a\u0e1a": 16, "\u0e41\u0e1a\u0e1a\u0e08\u0e33\u0e25\u0e2d\u0e07\u0e41\u0e1a\u0e1a\u0e25\u0e33\u0e14": 6, "\u0e41\u0e1b": 17, "\u0e41\u0e1b\u0e14": 22, "\u0e41\u0e1b\u0e14\u0e19\u0e32\u0e2c": 22, "\u0e41\u0e1b\u0e14\u0e42\u0e21\u0e07\u0e2a": 22, "\u0e41\u0e1b\u0e25\u0e01": [17, 22], "\u0e41\u0e21": 16, "\u0e41\u0e21\u0e27": [8, 9, 16, 22], "\u0e41\u0e21\u0e27\u0e17\u0e33\u0e2d\u0e30\u0e44\u0e23\u0e15\u0e2d\u0e19\u0e2b": 16, "\u0e41\u0e21\u0e27\u0e40\u0e27\u0e25\u0e32\u0e19\u0e30\u0e19": 8, "\u0e41\u0e21\u0e27\u0e44\u0e21": 8, "\u0e41\u0e22": 17, "\u0e41\u0e22\u0e01": 17, "\u0e41\u0e23": 17, "\u0e41\u0e23\u0e07": 14, "\u0e41\u0e23\u0e07\u0e07\u0e32\u0e19": 28, "\u0e41\u0e23\u0e07\u0e07\u0e32\u0e19\u0e01\u0e30\u0e14": 28, "\u0e41\u0e25": [9, 25], "\u0e41\u0e25\u0e30": [13, 16, 17, 22, 28], "\u0e41\u0e25\u0e30\u0e01\u0e32\u0e23\u0e41\u0e2a\u0e14\u0e07\u0e07": 17, "\u0e41\u0e25\u0e30\u0e40\u0e02\u0e32": 5, "\u0e41\u0e25\u0e30\u0e40\u0e02\u0e32\u0e44\u0e14": 17, "\u0e41\u0e25\u0e30\u0e40\u0e08": 15, "\u0e41\u0e25\u0e30\u0e40\u0e1b": 15, "\u0e41\u0e25\u0e30\u0e44\u0e14": 17, "\u0e41\u0e2a\u0e19\u0e2a\u0e14\u0e43\u0e2a": 9, "\u0e41\u0e2a\u0e19\u0e41\u0e1b\u0e14\u0e2b\u0e21": 22, "\u0e41\u0e2d": 22, "\u0e41\u0e2d\u0e1a": 14, "\u0e41\u0e2d\u0e25\u0e08": 6, "\u0e42\u0e04": 16, "\u0e42\u0e04\u0e42\u0e23\u0e19": 16, "\u0e42\u0e0b": 17, "\u0e42\u0e14\u0e22\u0e19": 6, "\u0e42\u0e14\u0e22\u0e1b\u0e01\u0e15": 16, "\u0e42\u0e14\u0e22\u0e40\u0e23": 16, "\u0e42\u0e17": 22, "\u0e42\u0e19": 16, "\u0e42\u0e1b\u0e23\u0e41\u0e01\u0e23\u0e21": 17, "\u0e42\u0e1b\u0e23\u0e41\u0e01\u0e23\u0e21\u0e01\u0e32\u0e23\u0e2a": 13, "\u0e42\u0e1b\u0e23\u0e41\u0e01\u0e23\u0e21\u0e04\u0e2d\u0e21\u0e1e": 25, "\u0e42\u0e21": 6, "\u0e42\u0e21\u0e07": 16, "\u0e42\u0e21\u0e19": 6, "\u0e42\u0e21\u0e1a": 6, "\u0e42\u0e22\u0e04": 10, "\u0e42\u0e23\u0e04\u0e23\u0e30\u0e1a\u0e32\u0e14": 16, "\u0e42\u0e23\u0e07\u0e40\u0e23": 22, "\u0e42\u0e23\u0e07\u0e41\u0e23\u0e21\u0e02\u0e2d\u0e07\u0e40\u0e23\u0e32\u0e19": 22, "\u0e42\u0e23\u0e21\u0e32\u0e40\u0e19": 6, "\u0e42\u0e25\u0e01\u0e23": 16, "\u0e42\u0e25\u0e40\u0e21\u0e15\u0e23": 16, "\u0e42\u0e2d": [16, 29], "\u0e42\u0e2d\u0e1a\u0e23": 7, "\u0e42\u0e2d\u0e1a\u0e32\u0e21\u0e32": 16, "\u0e42\u0e2d\u0e1a\u0e32\u0e21\u0e32\u0e40\u0e1b": 16, "\u0e42\u0e2d\u0e1e": 16, "\u0e42\u0e2d\u0e40\u0e04": [17, 29], "\u0e42\u0e2d\u0e40\u0e04\u0e1a": [17, 29], "\u0e43\u0e01\u0e25": 22, "\u0e43\u0e04\u0e23": 16, "\u0e43\u0e0a": [9, 16, 22, 25], "\u0e43\u0e15": 16, "\u0e43\u0e19": [16, 22, 28], "\u0e43\u0e19\u0e01\u0e32\u0e23\u0e17\u0e33\u0e07\u0e32\u0e19": 25, "\u0e43\u0e19\u0e17\u0e32\u0e07\u0e2d": 25, "\u0e43\u0e19\u0e23": [15, 22], "\u0e43\u0e19\u0e2a\u0e27\u0e19": 11, "\u0e43\u0e2b": [15, 16], "\u0e43\u0e2b\u0e21": 16, "\u0e44\u0e01": 22, "\u0e44\u0e07": 6, "\u0e44\u0e14": [5, 8, 9, 16, 17, 22], "\u0e44\u0e17\u0e22": 16, "\u0e44\u0e17\u0e22\u0e40\u0e2d": 22, "\u0e44\u0e1b": [6, 16], "\u0e44\u0e1e\u0e1a": 16, "\u0e44\u0e1f\u0e1f": 15, "\u0e44\u0e1f\u0e25": 14, "\u0e44\u0e21": [6, 16, 17, 22, 28], "\u0e44\u0e21\u0e40\u0e04": 16, "\u0e44\u0e2b\u0e19": 16, "\u0e44\u0e2b\u0e21": 16, "\u0e46": [15, 22, 25], "\u0e50": 22, "\u0e51": [6, 22], "\u0e51\u0e50": 22, "\u0e51\u0e52\u0e53": 22, "\u0e52": 22, "\u0e52\u0e55": 22, "\u0e53": 22, "\u0e54": 22, "\u0e54\u0e50\u0e50": 22, "\u0e55": 22, "\u0e55\u0e59": 22, "\u0e58": 22, "\u0e59": 22}, "titles": ["pythainlp.ancient", "pythainlp.augment", "pythainlp.benchmarks", "pythainlp.chat", "pythainlp.classify", "pythainlp.coref", "pythainlp.corpus", "pythainlp.el", "pythainlp.generate", "pythainlp.khavee", "pythainlp.morpheme", "pythainlp.parse", "pythainlp.phayathaibert", "pythainlp.soundex", "pythainlp.spell", "pythainlp.summarize", "pythainlp.tag", "pythainlp.tokenize", "pythainlp.tools", "pythainlp.translate", "pythainlp.transliterate", "pythainlp.ulmfit", "pythainlp.util", "pythainlp.wangchanberta", "pythainlp.word_vector", "pythainlp.wsd", "PyThaiNLP documentation", "FAQ", "Command Line", "Getting Started", "Installation", "License"], "titleterms": {"addit": 1, "all_lemma_nam": 6, "all_synset": 6, "ancient": 0, "audio_vector": 13, "augment": 1, "benchmark": 2, "bigram": 8, "bigram_word_freq": 6, "bpembaug": 1, "chat": 3, "citat": 26, "class": 1, "classifi": 4, "command": 28, "conceptnet": 6, "configur": 30, "coref": 5, "corefer": 5, "corpu": 6, "correct": 14, "correct_s": 14, "countri": 6, "custom_lemma": 6, "default_spell_check": 14, "definit": 6, "depend": 24, "dependency_pars": 11, "document": 26, "download": 6, "edg": 6, "el": 7, "engin": [15, 16, 17, 20], "entitylink": 7, "evalu": 2, "exampl": [7, 8, 9, 11], "extract": 15, "faq": [27, 30], "fasttextaug": 1, "find_badword": 6, "find_synonym": 6, "function": [1, 2, 5], "gen_sent": 8, "gener": 8, "get": 29, "get_corpu": 6, "get_corpus_as_i": 6, "get_corpus_db": 6, "get_corpus_db_detail": 6, "get_corpus_default_db": 6, "get_corpus_path": 6, "get_transliteration_dict": 6, "indic": 26, "instal": 30, "introduct": [1, 2, 5], "keybert": 15, "keyword": 15, "khave": 9, "khaveeverifi": 9, "lang": 6, "lch_similar": 6, "lemma": 6, "lemma_from_kei": 6, "level": 17, "licens": 31, "line": 28, "lk82": 13, "ltw2vaug": 1, "metasound": 13, "modul": [0, 6, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25], "morphem": 10, "morphi": 6, "norvigspellcheck": 14, "note": 26, "notebook": 29, "oscar": 6, "packag": 26, "pars": 11, "path_similar": 6, "perceptron": 16, "phayathaibert": 12, "prayut_and_somchaip": 13, "provinc": 6, "pythainlp": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26], "qualiti": 2, "refer": [13, 14, 16, 20, 22, 23, 24, 26], "remov": 6, "resolut": 5, "revise_newmm_default_wordset": 6, "revise_wordset": 6, "runtim": 30, "sentenc": 17, "sound": 13, "soundex": 13, "spell": 14, "spell_sent": 14, "start": 29, "subword": 17, "summar": 15, "synset": 6, "tabl": 26, "tag": 16, "tagger": 16, "textaug": 1, "th_en_translit": 6, "thai2fit": 8, "thai2fitaug": 1, "thai2transformersaug": 1, "thai_dict": 6, "thai_family_nam": 6, "thai_female_nam": 6, "thai_male_nam": 6, "thai_neg": 6, "thai_orst_word": 6, "thai_stopword": 6, "thai_syl": 6, "thai_synonym": 6, "thai_word": 6, "thai_wsd_dict": 6, "tnc": 6, "token": [2, 17], "tool": 18, "translat": 19, "transliter": 20, "trigram": 8, "trigram_word_freq": 6, "ttc": 6, "tutori": 29, "udom83": 13, "ulmfit": 21, "unigram": [8, 16], "unigram_word_freq": 6, "usag": [2, 5, 8, 11], "util": [6, 22], "wangchanberta": 23, "wangchanglm": 8, "word": 17, "word2audio": 13, "word2vecaug": 1, "word_approxim": 13, "word_freq": 6, "word_vector": 24, "wordnet": 6, "wordnetaug": 1, "wsd": 25, "wup_similar": 6}})