[ https://issues.apache.org/jira/browse/TIKA-3340?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17320414#comment-17320414 ]
Hudson commented on TIKA-3340: ------------------------------ UNSTABLE: Integrated in Jenkins build Tika » tika-main-jdk8 #194 (See [https://ci-builds.apache.org/job/Tika/job/tika-main-jdk8/194/]) Tika's OpenNLPDetector now covers 148 languages and language-script pairs (TIKA-3340). (tallison: [https://github.com/apache/tika/commit/5610d1e956b73b45e9f55604bee6bf4784edba55]) * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/xho * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/lao * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/ben-rom * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/gug * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/lin * (delete) tika-eval/tika-eval-core/src/main/resources/common_tokens/sun * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/zho-trad * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/yor * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/amh * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/nso * (delete) tika-eval/tika-eval-core/src/main/resources/common_tokens/azj * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/tel-rom * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/kur * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/yid * (edit) tika-langdetect/tika-langdetect-opennlp/src/main/java/org/apache/tika/langdetect/opennlp/OpenNLPDetector.java * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/gom * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/asm * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/gla * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/mhr * (edit) tika-langdetect/tika-langdetect-commons/pom.xml * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/srd * (edit) 
tika-eval/tika-eval-core/src/main/java/org/apache/tika/eval/core/tokens/CommonTokenCountManager.java * (edit) tika-eval/tika-eval-app/src/main/java/org/apache/tika/eval/app/tools/LeipzigHelper.java * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/kin * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/hau * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/ckb * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/tsn * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/tam-rom * (delete) tika-langdetect/tika-langdetect-opennlp/src/main/resources/opennlp_langdetect_model_20190626.bin * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/ful * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/khm * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/new * (edit) tika-eval/tika-eval-core/src/test/java/org/apache/tika/eval/core/langid/LangIdTest.java * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/zho-simp * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/lug * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/ori * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/ibo * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/hat * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/urd-rom * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/orm * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/div * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/roh * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/bih * (delete) tika-eval/tika-eval-core/src/main/resources/common_tokens/plt * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/tuk * (edit) CHANGES.txt * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/knn * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/ssw * (edit) 
tika-eval/tika-eval-core/src/main/resources/common_tokens/uig * (edit) tika-eval/tika-eval-app/src/test/java/org/apache/tika/eval/app/SimpleComparerTest.java * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/mya-zaw * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/wol * (edit) tika-langdetect/tika-langdetect-opennlp/src/test/java/org/apache/tika/langdetect/opennlp/OpenNLPDetectorTest.java * (edit) tika-eval/tika-eval-core/src/main/resources/common_tokens/snd * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/mya * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/hin-rom * (add) tika-eval/tika-eval-core/src/main/resources/common_tokens/quz > LanguageProfile for Myanmar > --------------------------- > > Key: TIKA-3340 > URL: https://issues.apache.org/jira/browse/TIKA-3340 > Project: Tika > Issue Type: Improvement > Components: languageidentifier > Reporter: Arky > Priority: Major > Fix For: 2.0.0 > > Attachments: 20210401-model.report.txt, 20210413.report.txt, > lang_comparisons.xlsx, table-summarized-truncated.txt.gz > > > A language profile for detecting Myanmar/Burmese (my). -- This message was sent by Atlassian Jira (v8.3.4#803005)