{"created":"2023-05-15T14:23:22.084277+00:00","id":1502,"links":{},"metadata":{"_buckets":{"deposit":"fcc46882-b5e6-477d-b0b7-a8492711c1e9"},"_deposit":{"created_by":3,"id":"1502","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"1502"},"status":"published"},"_oai":{"id":"oai:repository.ninjal.ac.jp:00001502","sets":["245:244"]},"author_link":["4471"],"item_10003_biblio_info_32":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2017","bibliographicIssueDateType":"Issued"},"bibliographicPageEnd":"316","bibliographicPageStart":"307","bibliographicVolumeNumber":"1","bibliographic_titles":[{"bibliographic_title":"言語資源活用ワークショップ発表論文集"},{"bibliographic_title":"Proceedings of Language Resources Workshop","bibliographic_titleLang":"en"}]}]},"item_10003_description_27":{"attribute_name":"会議概要(会議名, 開催地, 会期, 主催者等)","attribute_value_mlt":[{"subitem_description":"会議名: 言語資源活用ワークショップ2016, 開催地: 国立国語研究所, 会期: 2017年3月7日-8日, 主催: 国立国語研究所 コーパス開発センター","subitem_description_type":"Other"}]},"item_10003_description_29":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"「政財界」「国内外」などの漢字 3 字で構成される「略熟語」と呼ばれる形式は,先行研究が少なく実態が明らかでない。国語辞書にも掲載されることが少ない。本発表では,現代日本語にはどのような略熟語が存在するかを『現代日本語書き言葉均衡コーパス』(以下,BCCWJ)と『分類語彙表』を使って自動的に抽出することを試みた。具体的には,BCCWJから,前後が非漢字という条件で漢字 3 文字連続を抜き出し,それらを構成する漢語の頻度および分類語彙表における意味番号を付与したデータを作成した。そこから,出現頻度が一定以上で,構成要素となる漢語の分類番号が一致するものとして 874 語を抽出した。内訳は「政財界」タイプ 656 語,「国内外」タイプ 297 語,重複が 79 語であった。目視で確認したところ,抽出された 3 字漢語には,略熟語でないものも多く,精度を高めるにはさらに別の条件が必要であることが分かった.","subitem_description_type":"Abstract"}]},"item_10003_description_43":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10003_description_51":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_description":"国立国語研究所","subitem_description_type":"Other"}]},"item_10003_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.15084/00001486","subitem_identifier_reg_type":"JaLC"}]},"item_10003_publisher_45":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"国立国語研究所"}]},"item_10003_relation_40":{"attribute_name":"関連サイト","attribute_value_mlt":[{"subitem_relation_name":[{"subitem_relation_name_text":"言語資源活用ワークショップ2016"}],"subitem_relation_type_id":{"subitem_relation_type_id_text":"http://pj.ninjal.ac.jp/corpus_center/lrw2016.html","subitem_relation_type_select":"URI"}}]},"item_10003_version_type_44":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"山崎, 誠"},{"creatorName":"ヤマザキ, マコト","creatorNameLang":"ja-Kana"},{"creatorName":"YAMAZAKI, Makoto","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"4471","nameIdentifierScheme":"WEKO"},{"nameIdentifier":"30182489","nameIdentifierScheme":"e-Rad","nameIdentifierURI":"https://nrid.nii.ac.jp/ja/nrid/1000030182489"},{"nameIdentifier":"YAMAZAKI_Makoto","nameIdentifierScheme":"researchmap","nameIdentifierURI":"https://researchmap.jp/YAMAZAKI_Makoto"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2019-02-15"}],"displaytype":"detail","filename":"LRW-2016-36-P-D-1.pdf","filesize":[{"value":"524.7 kB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"LRW-2016-36-P-D-1.pdf","url":"https://repository.ninjal.ac.jp/record/1502/files/LRW-2016-36-P-D-1.pdf"},"version_id":"35ae57fd-6c5d-47d4-926f-c8268e6788c7"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"分類語彙表","subitem_subject_scheme":"Other"},{"subitem_subject":"現代日本語書き言葉均衡コーパス(BCCWJ)","subitem_subject_scheme":"Other"},{"subitem_subject":"Word List by Semantic Principles","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"Balanced Corpus of Contemporary Written Japanese (BCCWJ)","subitem_subject_language":"en","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"conference paper","resourceuri":"http://purl.org/coar/resource_type/c_5794"}]},"item_title":"『現代日本語書き言葉均衡コーパス』と『分類語彙表』を利用した漢字3文字略熟語の抽出","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"『現代日本語書き言葉均衡コーパス』と『分類語彙表』を利用した漢字3文字略熟語の抽出"},{"subitem_title":"Extraction of Clipped Compounds Comprised of Three Character Sino-Japanese Using “Balanced Corpus of Contemporary Written Japanese” and “Word List by Semantic Principles” ","subitem_title_language":"en"}]},"item_type_id":"10003","owner":"3","path":["244"],"pubdate":{"attribute_name":"公開日","attribute_value":"2018-03-20"},"publish_date":"2018-03-20","publish_status":"0","recid":"1502","relation_version_is_last":true,"title":["『現代日本語書き言葉均衡コーパス』と『分類語彙表』を利用した漢字3文字略熟語の抽出"],"weko_creator_id":"3","weko_shared_id":-1},"updated":"2023-05-16T10:25:13.155139+00:00"}