{"created":"2023-05-15T14:24:32.810350+00:00","id":3072,"links":{},"metadata":{"_buckets":{"deposit":"813fbe1e-2545-4f33-a9ce-cf20d37ad586"},"_deposit":{"created_by":3,"id":"3072","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"3072"},"status":"published"},"_oai":{"id":"oai:repository.ninjal.ac.jp:00003072","sets":["320:454"]},"author_link":["10357","10356","10355","10358","10360","10361","10362","10359"],"item_10001_biblio_info_7":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2020-02-15","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"2","bibliographicPageEnd":"161","bibliographicPageStart":"152","bibliographicVolumeNumber":"61","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌"}]}]},"item_10001_description_24":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_description":"首都大学東京","subitem_description_type":"Other"},{"subitem_description":"首都大学東京","subitem_description_type":"Other"},{"subitem_description":"国立国語研究所","subitem_description_type":"Other"},{"subitem_description":"首都大学東京","subitem_description_type":"Other"}]},"item_10001_description_25":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_description":"Tokyo Metropolitan University","subitem_description_type":"Other"},{"subitem_description":"Tokyo Metropolitan University","subitem_description_type":"Other"},{"subitem_description":"The National Institute for Japanese Language and Linguistics","subitem_description_type":"Other"},{"subitem_description":"Tokyo Metropolitan University","subitem_description_type":"Other"}]},"item_10001_description_26":{"attribute_name":"抄録(英)","attribute_value_mlt":[{"subitem_description":"In this study, we propose a method to detect sentence boundaries for modern Japanese texts using machine learning. For modern Japanese texts, sentence boundaries are not explicitly marked so that human annotation is inevitable, but the annotation process is far from complete due to enormous number of materials. Therefore, we propose a method to detect sentence boundaries using machine learning. The main contribution of this study is that this method can support the annotation task as a primary annotation. We also show that the accuracy of morphological analysis can be improved by performing sentence boundary detection. Moreover, this is the first work to detect sentence boundaries targeting modern Japanese texts by using modern Japanese data for model training and comparing multiple machine learning methods.","subitem_description_type":"Other"}]},"item_10001_description_5":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"本稿では,機械学習を用いて近代の歴史的資料に対して文境界を検出する手法を提案する.近代の歴史的資料は明確な文境界が必ずしも存在しないため,これまで人手作業による文境界の付与が行われてきたが,膨大な資料に対してなかなか作業が進んでいない現状がある.そこで我々は機械学習を用いて文境界を検出する手法を提案する.この手法により膨大な量の資料に対して文境界の一次的なアノテーションを施すことができることに加えて,形態素解析の精度を向上させたことが本研究の貢献である.また,モデルの訓練に日本語の近代語のデータを使用して,複数の機械学習手法を比較して近代の歴史的資料を対象とした文境界推定を行うのは本研究が初めてである.","subitem_description_type":"Abstract"}]},"item_10001_publisher_8":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会"}]},"item_10001_relation_11":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_relation_type_id":{"subitem_relation_type_id_text":" AN00116647","subitem_relation_type_select":"NCID"}}]},"item_10001_relation_17":{"attribute_name":"関連サイト","attribute_value_mlt":[{"subitem_relation_name":[{"subitem_relation_name_text":"http://id.nii.ac.jp/1001/00203040/"}],"subitem_relation_type_id":{"subitem_relation_type_id_text":"http://id.nii.ac.jp/1001/00203040/","subitem_relation_type_select":"URI"}}]},"item_10001_source_id_9":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7764","subitem_source_identifier_type":"ISSN"}]},"item_access_right":{"attribute_name":"アクセス権","attribute_value_mlt":[{"subitem_access_right":"metadata only access","subitem_access_right_uri":"http://purl.org/coar/access_right/c_14cb"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"白井, 良介"},{"creatorName":"シライ, リョウスケ","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"松村, 雪桜"},{"creatorName":"マツムラ, ユキオ","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"小木曽, 智信"},{"creatorName":"オギソ, トシノブ","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"小町, 守"},{"creatorName":"コマチ, マモル","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Shirai, Ryosuke","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Matsumura, Yukio","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Ogiso, Toshinobu","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Komachi, Mamoru","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"[特集:人文科学とコンピュータ] 近代文語","subitem_subject_scheme":"Other"},{"subitem_subject":"文境界推定","subitem_subject_scheme":"Other"},{"subitem_subject":"近代語コーパス","subitem_subject_scheme":"Other"},{"subitem_subject":"UniDic","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"journal article","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"近代の歴史的資料を対象とした機械学習による文境界推定","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"近代の歴史的資料を対象とした機械学習による文境界推定"},{"subitem_title":"Machine Learning-based Sentence Boundary Detection for Modern Japanese Texts","subitem_title_language":"en"}]},"item_type_id":"10001","owner":"3","path":["454"],"pubdate":{"attribute_name":"公開日","attribute_value":"2020-11-12"},"publish_date":"2020-11-12","publish_status":"0","recid":"3072","relation_version_is_last":true,"title":["近代の歴史的資料を対象とした機械学習による文境界推定"],"weko_creator_id":"3","weko_shared_id":3},"updated":"2023-05-15T15:11:27.820989+00:00"}