{"created":"2020-09-01T14:41:26.286938+00:00","id":4400,"links":{},"metadata":{"_buckets":{"deposit":"4d422375-0949-4d34-8553-ee97eefeabab"},"_deposit":{"id":"4400","owners":[],"pid":{"revision_id":0,"type":"recid","value":"4400"},"status":"published"},"_oai":{"id":"oai:meral.edu.mm:recid/4400","sets":["1582963302567:1597824273898"]},"communities":["ucsy"],"item_1583103067471":{"attribute_name":"Title","attribute_value_mlt":[{"subitem_1551255647225":"A Study of Myanmar Word Segmentation Schemes for Statistical Machine Translation","subitem_1551255648112":"en_US"}]},"item_1583103085720":{"attribute_name":"Description","attribute_value_mlt":[{"interim":"Myanmar sentences are written as contiguous sequences of syllables with no characters delimiting the words. In statistical machine translation (SMT), word segmentation is a necessary step for languages that do not naturally delimit words. Myanmar is a low-resource language and therefore it is difficult to develop a good word segmentation tool based on machine learning techniques. In this paper, we examine various word segmentation schemes and their effect on the translation from Myanmar to seven other languages. We performed experiments based on character segmentation, syllable segmentation, human lexical/phrasal segmentation, and unsupervised/supervised word segmentation. The results show that the highest quality machine translation was attained with syllable segmentation, and we found this effect to be greatest for translation into subject-object-verb (SOV) structured languages such as Japanese and Korean. Approaches based on machine learning were unable to match this performance for most language pairs, and we believe this was due to the lack of linguistic resources. 
However, a machine learning approach that extended syllable segmentation produced promising results and we expect this can be developed into a viable method as more data becomes available in the future."}]},"item_1583103108160":{"attribute_name":"Keywords","attribute_value":[]},"item_1583103120197":{"attribute_name":"Files","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_access","date":[{"dateType":"Available","dateValue":"2019-10-23"}],"displaytype":"preview","filename":"11125.pdf","filesize":[{"value":"775 Kb"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"url":"https://meral.edu.mm/record/4400/files/11125.pdf"},"version_id":"eb018365-1112-421f-a7cd-c88131dabd91"}]},"item_1583103131163":{"attribute_name":"Journal articles","attribute_value_mlt":[{"subitem_issue":"","subitem_journal_title":"Eleventh International Conference On Computer Applications (ICCA 2013)","subitem_pages":"","subitem_volume":""}]},"item_1583103147082":{"attribute_name":"Conference papers","attribute_value_mlt":[{"subitem_acronym":"","subitem_c_date":"","subitem_conference_title":"","subitem_part":"","subitem_place":"","subitem_session":"","subitem_website":""}]},"item_1583103211336":{"attribute_name":"Books/reports/chapters","attribute_value_mlt":[{"subitem_book_title":"","subitem_isbn":"","subitem_pages":"","subitem_place":"","subitem_publisher":""}]},"item_1583103233624":{"attribute_name":"Thesis/dissertations","attribute_value_mlt":[{"subitem_awarding_university":"","subitem_supervisor(s)":[{"subitem_supervisor":""}]}]},"item_1583105942107":{"attribute_name":"Authors","attribute_value_mlt":[{"subitem_authors":[{"subitem_authors_fullname":"Thu, Ye Kyaw"},{"subitem_authors_fullname":"Finch, Andrew"},{"subitem_authors_fullname":"Sagisaka, Yoshinori"},{"subitem_authors_fullname":"Sumita, Eiichiro"}]}]},"item_1583108359239":{"attribute_name":"Upload 
type","attribute_value_mlt":[{"interim":"Publication"}]},"item_1583108428133":{"attribute_name":"Publication type","attribute_value_mlt":[{"interim":"Article"}]},"item_1583159729339":{"attribute_name":"Publication date","attribute_value":"2013-02-26"},"item_1583159847033":{"attribute_name":"Identifier","attribute_value":"http://onlineresource.ucsy.edu.mm/handle/123456789/2335"},"item_title":"A Study of Myanmar Word Segmentation Schemes for Statistical Machine Translation","item_type_id":"21","owner":"1","path":["1597824273898"],"publish_date":"2019-10-23","publish_status":"0","recid":"4400","relation_version_is_last":true,"title":["A Study of Myanmar Word Segmentation Schemes for Statistical Machine Translation"],"weko_creator_id":"1","weko_shared_id":-1},"updated":"2021-12-13T01:53:07.217305+00:00"}