{"created":"2023-05-15T14:23:23.462655+00:00","id":1530,"links":{},"metadata":{"_buckets":{"deposit":"41a401d3-4be8-455a-a42f-8ad482b4ac75"},"_deposit":{"created_by":3,"id":"1530","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"1530"},"status":"published"},"_oai":{"id":"oai:repository.ninjal.ac.jp:00001530","sets":["245:246"]},"author_link":["4747","4714"],"item_10003_biblio_info_32":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2017","bibliographicIssueDateType":"Issued"},"bibliographicPageEnd":"143","bibliographicPageStart":"133","bibliographicVolumeNumber":"2","bibliographic_titles":[{"bibliographic_title":"言語資源活用ワークショップ発表論文集"},{"bibliographic_title":"Proceedings of Language Resources Workshop","bibliographic_titleLang":"en"}]}]},"item_10003_description_27":{"attribute_name":"会議概要(会議名, 開催地, 会期, 主催者等)","attribute_value_mlt":[{"subitem_description":"会議名: 言語資源活用ワークショップ2017, 開催地: 国立国語研究所, 会期: 2017年9月5日-6日, 主催: 国立国語研究所 コーパス開発センター","subitem_description_type":"Other"}]},"item_10003_description_29":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"自然言語処理の分野では多言語かつ言語横断的な言語研究が盛んに取り組まれている。その言語横断的な言語研究の取り組みとしてUniversal Dependencies(UD)がある。UDでは品詞や係り受け構造の標準・スキーマを定め,多言語のコーパスを提供している。本論文では,日本語コーパスである現代日本語書き言葉均衡コーパス(BCCWJ)をUDのスキーマへと変換したコーパスについて紹介をする。BCCWJでは日本語における文節単位の係り受け情報がすでに付与されている。この係り受け構造を基にしてUDへと変換するプログラムの開発を行った。しかし,文節単位はUDの単語単位には沿っていない。そのため,BCCWJで提供されている短単位と長単位というふたつの言語単位を単語の単位をして認定したコーパスを構築する。短単位と長単位についてUDのスキーマに当てはめた場合,どのような係り受け構造ができるのかを示す。","subitem_description_type":"Abstract"}]},"item_10003_description_43":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10003_description_51":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_description":"国立国語研究所","subitem_description_type":"Other"},{"subitem_description":"国立国語研究所","subitem_description_type":"Other"}]},"item_10003_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.15084/00001514","subitem_identifier_reg_type":"JaLC"}]},"item_10003_publisher_45":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"国立国語研究所"}]},"item_10003_relation_40":{"attribute_name":"関連サイト","attribute_value_mlt":[{"subitem_relation_name":[{"subitem_relation_name_text":"言語資源活用ワークショップ2017"}],"subitem_relation_type_id":{"subitem_relation_type_id_text":"http://pj.ninjal.ac.jp/corpus_center/lrw2017.html","subitem_relation_type_select":"URI"}}]},"item_10003_version_type_44":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"大村, 舞"},{"creatorName":"オオムラ, マイ","creatorNameLang":"ja-Kana"},{"creatorName":"OMURA, Mai","creatorNameLang":"en"}],"nameIdentifiers":[{},{}]},{"creatorNames":[{"creatorName":"浅原, 正幸"},{"creatorName":"アサハラ, マサユキ","creatorNameLang":"ja-Kana"},{"creatorName":"ASAHARA, Masayuki","creatorNameLang":"en"}],"nameIdentifiers":[{},{},{}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2019-02-15"}],"displaytype":"detail","filename":"LRW-2017-16-P-B-6.pdf","filesize":[{"value":"572.2 kB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"LRW-2017-16-P-B-6.pdf","url":"https://repository.ninjal.ac.jp/record/1530/files/LRW-2017-16-P-B-6.pdf"},"version_id":"9a88c9e3-f67f-4790-9560-d2f8a881f4c2"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"現代日本語書き言葉均衡コーパス(BCCWJ)","subitem_subject_scheme":"Other"},{"subitem_subject":"Balanced Corpus of Contemporary Written Japanese (BCCWJ)","subitem_subject_language":"en","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"conference paper","resourceuri":"http://purl.org/coar/resource_type/c_5794"}]},"item_title":"現代日本語書き言葉均衡コーパスのUniversal Dependencies","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"現代日本語書き言葉均衡コーパスのUniversal Dependencies"},{"subitem_title":"Universal Dependencies Annotation for 'Balanced Corpus of Contemporary Written Japanese'","subitem_title_language":"en"}]},"item_type_id":"10003","owner":"3","path":["246"],"pubdate":{"attribute_name":"公開日","attribute_value":"2018-03-20"},"publish_date":"2018-03-20","publish_status":"0","recid":"1530","relation_version_is_last":true,"title":["現代日本語書き言葉均衡コーパスのUniversal Dependencies"],"weko_creator_id":"3","weko_shared_id":-1},"updated":"2023-05-16T10:23:54.920436+00:00"}