{"created":"2020-09-01T09:58:08.603371+00:00","id":3336,"links":{},"metadata":{"_buckets":{"deposit":"2e1b75ff-1ed1-4106-a9e9-6841b725d39e"},"_deposit":{"id":"3336","owners":[],"pid":{"revision_id":0,"type":"recid","value":"3336"},"status":"published"},"_oai":{"id":"oai:meral.edu.mm:recid/3336","sets":["1582963302567:1597824273898"]},"communities":["ucsy"],"item_1583103067471":{"attribute_name":"Title","attribute_value_mlt":[{"subitem_1551255647225":"Informative Content Extraction for Web Page using Text Density and Visionbased Page Segmentation (VIPS) Algorithm Integration","subitem_1551255648112":"en"}]},"item_1583103085720":{"attribute_name":"Description","attribute_value_mlt":[{"interim":"Web pages consist of not only actual content, but also other elements such as branding banners, navigational elements, advertisements, copyright etc. Irrelevant content in the Web page is treated as noisy content. This noisy content is typically not related to the main subjects of the webpages. A method is necessary to extract the informative content and discard the noisy content from Web pages. This system is used an integration of textual and visual importance features to extract the informative contents from Web pages. Initially a web page is converted into Document Object Model (DOM) tree. For each node in the DOM tree, textual and visual importance is calculated. Textual importance and visual importance is combined to form hybrid density. DensitySum is calculated and used in content extraction algorithm to extract the informative content from Web pages. The algorithm is tested with various web domains and styles of web pages. 
Performance of web content extraction is obtained by calculating precision and recall."}]},"item_1583103108160":{"attribute_name":"Keywords","attribute_value":[]},"item_1583103120197":{"attribute_name":"Files","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_access","date":[{"dateType":"Available","dateValue":"2019-07-19"}],"displaytype":"preview","filename":"248_PDFsam_PSC_final proof.pdf","filesize":[{"value":"238 Kb"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"url":"https://meral.edu.mm/record/3336/files/248_PDFsam_PSC_final proof.pdf"},"version_id":"cd139772-13ab-4cc6-81fb-6c2d7ec46c2d"}]},"item_1583103131163":{"attribute_name":"Journal articles","attribute_value_mlt":[{"subitem_issue":"","subitem_journal_title":"Eighth Local Conference on Parallel and Soft Computing","subitem_pages":"","subitem_volume":""}]},"item_1583103147082":{"attribute_name":"Conference papers","attribute_value_mlt":[{"subitem_acronym":"","subitem_c_date":"","subitem_conference_title":"","subitem_part":"","subitem_place":"","subitem_session":"","subitem_website":""}]},"item_1583103211336":{"attribute_name":"Books/reports/chapters","attribute_value_mlt":[{"subitem_book_title":"","subitem_isbn":"","subitem_pages":"","subitem_place":"","subitem_publisher":""}]},"item_1583103233624":{"attribute_name":"Thesis/dissertations","attribute_value_mlt":[{"subitem_awarding_university":"","subitem_supervisor(s)":[{"subitem_supervisor":""}]}]},"item_1583105942107":{"attribute_name":"Authors","attribute_value_mlt":[{"subitem_authors":[{"subitem_authors_fullname":"Mon, Ei Phyu Phyu"},{"subitem_authors_fullname":"Yuzana"}]}]},"item_1583108359239":{"attribute_name":"Upload type","attribute_value_mlt":[{"interim":"Publication"}]},"item_1583108428133":{"attribute_name":"Publication type","attribute_value_mlt":[{"interim":"Article"}]},"item_1583159729339":{"attribute_name":"Publication 
date","attribute_value":"2017-12-27"},"item_1583159847033":{"attribute_name":"Identifier","attribute_value":"http://onlineresource.ucsy.edu.mm/handle/123456789/1097"},"item_title":"Informative Content Extraction for Web Page using Text Density and Visionbased Page Segmentation (VIPS) Algorithm Integration","item_type_id":"21","owner":"1","path":["1597824273898"],"publish_date":"2019-07-19","publish_status":"0","recid":"3336","relation_version_is_last":true,"title":["Informative Content Extraction for Web Page using Text Density and Visionbased Page Segmentation (VIPS) Algorithm Integration"],"weko_creator_id":"1","weko_shared_id":-1},"updated":"2021-12-13T00:32:53.203733+00:00"}