{"created":"2023-05-15T14:23:23.506009+00:00","id":1531,"links":{},"metadata":{"_buckets":{"deposit":"65838edd-5c2c-4b66-a216-a13848fd23e4"},"_deposit":{"created_by":3,"id":"1531","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"1531"},"status":"published"},"_oai":{"id":"oai:repository.ninjal.ac.jp:00001531","sets":["245:246"]},"author_link":["5741","5742"],"item_10003_biblio_info_32":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2017","bibliographicIssueDateType":"Issued"},"bibliographicPageEnd":"153","bibliographicPageStart":"144","bibliographicVolumeNumber":"2","bibliographic_titles":[{"bibliographic_title":"言語資源活用ワークショップ発表論文集"},{"bibliographic_title":"Proceedings of Language Resources Workshop","bibliographic_titleLang":"en"}]}]},"item_10003_description_27":{"attribute_name":"会議概要(会議名, 開催地, 会期, 主催者等)","attribute_value_mlt":[{"subitem_description":"会議名: 言語資源活用ワークショップ2017, 開催地: 国立国語研究所, 会期: 2017年9月5日-6日, 主催: 国立国語研究所 コーパス開発センター","subitem_description_type":"Other"}]},"item_10003_description_29":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"国立国語研究所で構築している短単位自動解析用辞書『UniDic』は,現在,形態素解析器MeCab専用の解析用辞書として使用・公開を行なっている.しかし解析用UniDicで使用しているCRF素性テンプレートは,MeCab用の他の辞書(『IPA辞書』,『Juman辞書』)に比べ,行数が多く,学習後のモデルファイルのサイズ(素性数)も他より大きなものとなっている.そこで今回,現代語用の解析用『UniDic』のCRF素性テンプレートの再検討を行ない,より少メモリかつ,これまでとほぼ同等の性能の解析用辞書を実現した.","subitem_description_type":"Abstract"}]},"item_10003_description_43":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10003_description_51":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_description":"国立国語研究所","subitem_description_type":"Other"}]},"item_10003_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.15084/00001515","subitem_identifier_reg_type":"JaLC"}]},"item_10003_publisher_45":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"国立国語研究所"}]},"item_10003_relation_40":{"attribute_name":"関連サイト","attribute_value_mlt":[{"subitem_relation_name":[{"subitem_relation_name_text":"言語資源活用ワークショップ2017"}],"subitem_relation_type_id":{"subitem_relation_type_id_text":"http://pj.ninjal.ac.jp/corpus_center/lrw2017.html","subitem_relation_type_select":"URI"}}]},"item_10003_version_type_44":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"岡, 照晃"},{"creatorName":"オカ, テルアキ","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{"nameIdentifier":"5741","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"OKA, Teruaki","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"5742","nameIdentifierScheme":"WEKO"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2019-02-15"}],"displaytype":"detail","filename":"LRW-2017-17-O-B-1.pdf","filesize":[{"value":"555.3 kB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"LRW-2017-17-O-B-1.pdf","url":"https://repository.ninjal.ac.jp/record/1531/files/LRW-2017-17-O-B-1.pdf"},"version_id":"2e51edfd-d00c-40d2-a6eb-b0f84f14dbd7"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"UniDic","subitem_subject_scheme":"Other"},{"subitem_subject":"現代日本語書き言葉均衡コーパス(BCCWJ)","subitem_subject_scheme":"Other"},{"subitem_subject":"日本語話し言葉コーパス(CSJ)","subitem_subject_scheme":"Other"},{"subitem_subject":"UniDic","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"Balanced Corpus of Contemporary Written Japanese (BCCWJ)","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"Corpus of Spontaneous Japanese (CSJ)","subitem_subject_language":"en","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"conference paper","resourceuri":"http://purl.org/coar/resource_type/c_5794"}]},"item_title":"CRF素性テンプレートの見直しによるモデルサイズを軽量化した解析用UniDic : unidic-cwj-2.2.0とunidic-csj-2.2.0","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"CRF素性テンプレートの見直しによるモデルサイズを軽量化した解析用UniDic : unidic-cwj-2.2.0とunidic-csj-2.2.0"}]},"item_type_id":"10003","owner":"3","path":["246"],"pubdate":{"attribute_name":"公開日","attribute_value":"2018-03-20"},"publish_date":"2018-03-20","publish_status":"0","recid":"1531","relation_version_is_last":true,"title":["CRF素性テンプレートの見直しによるモデルサイズを軽量化した解析用UniDic : unidic-cwj-2.2.0とunidic-csj-2.2.0"],"weko_creator_id":"3","weko_shared_id":-1},"updated":"2023-05-16T10:23:54.586256+00:00"}