{"created":"2023-05-15T14:24:09.583547+00:00","id":2558,"links":{},"metadata":{"_buckets":{"deposit":"f64369aa-5cc1-4eb0-8176-3b26683c1fa2"},"_deposit":{"created_by":3,"id":"2558","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"2558"},"status":"published"},"_oai":{"id":"oai:repository.ninjal.ac.jp:00002558","sets":["38:371"]},"author_link":["8549","8550","8551","8548"],"item_10002_biblio_info_40":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2020-01","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"18","bibliographicPageEnd":"91","bibliographicPageStart":"77","bibliographic_titles":[{"bibliographic_title":"国立国語研究所論集"},{"bibliographic_title":"NINJAL Research Papers","bibliographic_titleLang":"en"}]}]},"item_10002_description_34":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_description":"国立国語研究所 コーパス開発センター 非常勤研究員","subitem_description_type":"Other"},{"subitem_description":"明治大学","subitem_description_type":"Other"}]},"item_10002_description_35":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_description":"Adjunct Researcher, Center for Corpus Development, NINJAL","subitem_description_type":"Other"},{"subitem_description":"Meiji University\n","subitem_description_type":"Other"}]},"item_10002_description_36":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"日本語の大規模コーパスへの網羅的・体系的な語義情報付与を目的として,語義の体系的な分類を示す大規模な現代日本語のシソーラス『分類語彙表増補改訂版データベース』の見出しと,各種大規模コーパスの構築に利用されている電子化辞書UniDicの見出し(語彙素)との同語関係による対応を表す表形式データの構築を行った。同語判別の作業は分類語彙表・UniDic両者の見出しの表記・読み・類の対応に基づいて人手により行い,その結果,『分類語彙表』の64,759見出しとUniDicの50,795語彙素との同語関係による多対多の対応を表す「分類語彙表番号-UniDic語彙素番号対応表」を構築した。本対応表を活用して大規模コーパスへの網羅的な語義情報付与作業が始まっており,また,形態素解析結果に分類語彙表番号を付与する機能を実装した形態素解析ツールも開発された。一方で,本格的な大規模コーパスへの語義情報の網羅的付与に向けて,対応表の拡張や多義語の語義選択といった課題への対処も必要である。","subitem_description_type":"Abstract"}]},"item_10002_description_37":{"attribute_name":"抄録(英)","attribute_value_mlt":[{"subitem_description":"In this study, we have constructed an alignment table between 'Word List by Semantic Principles (revised and enlarged edition)' (hereafter WLSP) and UniDic to develop large-scale Japanese corpora which is comprehensively annotated with systematic word senses. WLSP is an extensive contemporary Japanese thesaurus with systematic semantic categories. UniDic is a vast lexicon used for Japanese morphological analysis and is utilized in the development of large-scale Japanese corpora. The alignment table defines n-to-n same word relations between 64,759 WLSP entries and 50,795 UniDic lexemes. These relations were manually verified based on scripts, readings, and classes of the WLSP entries and the UniDic lexemes. The development of word-sense annotated Japanese corpora has commenced with the use of the table. A Japanese morphological analysis tool to annotate word-sense was also developed with the table. Meanwhile, for a full-scale development of word-sense annotated Japanese corpora, it is necessary that problems, such as enlargement of the table and identification of word senses in corpora are effectively dealt with.","subitem_description_type":"Other"}]},"item_10002_description_51":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10002_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.15084/00002542","subitem_identifier_reg_type":"JaLC"}]},"item_10002_publisher_39":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"国立国語研究所"}]},"item_10002_source_id_41":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2186-134X","subitem_source_identifier_type":"ISSN"},{"subitem_source_identifier":"2186-1358","subitem_source_identifier_type":"ISSN"}]},"item_10002_source_id_44":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA12536262","subitem_source_identifier_type":"NCID"}]},"item_10002_version_type_52":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"近藤, 明日子"}],"nameIdentifiers":[{"nameIdentifier":"8548","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"田中, 牧郎"}],"nameIdentifiers":[{"nameIdentifier":"8549","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"KONDO, Asuko","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"8550","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"TANAKA, Makiro","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"8551","nameIdentifierScheme":"WEKO"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2020-01-15"}],"displaytype":"detail","filename":"papers1804.pdf","filesize":[{"value":"723.6 kB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"papers1804.pdf","url":"https://repository.ninjal.ac.jp/record/2558/files/papers1804.pdf"},"version_id":"72723e13-9339-465c-9d3c-1a5e6b5831bf"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"分類語彙表","subitem_subject_scheme":"Other"},{"subitem_subject":"UniDic","subitem_subject_scheme":"Other"},{"subitem_subject":"対応表","subitem_subject_scheme":"Other"},{"subitem_subject":"大規模日本語コーパス","subitem_subject_scheme":"Other"},{"subitem_subject":"語義情報付与","subitem_subject_scheme":"Other"},{"subitem_subject":"'Word List by Semantic Principles'","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"UniDic","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"alignment table","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"large-scale Japanese corpus","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"word-sense annotation","subitem_subject_language":"en","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"departmental bulletin paper","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"「分類語彙表番号-UniDic語彙素番号対応表」の構築","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"「分類語彙表番号-UniDic語彙素番号対応表」の構築"},{"subitem_title":"Construction of an Alignment Table between 'Word List by Semantic Principles' and UniDic","subitem_title_language":"en"}]},"item_type_id":"10002","owner":"3","path":["371"],"pubdate":{"attribute_name":"公開日","attribute_value":"2020-01-15"},"publish_date":"2020-01-15","publish_status":"0","recid":"2558","relation_version_is_last":true,"title":["「分類語彙表番号-UniDic語彙素番号対応表」の構築"],"weko_creator_id":"3","weko_shared_id":-1},"updated":"2023-05-15T15:33:39.869181+00:00"}