{"created":"2023-05-15T14:23:56.859292+00:00","id":2238,"links":{},"metadata":{"_buckets":{"deposit":"399bf5c7-3e03-4054-8deb-382c6abdac53"},"_deposit":{"created_by":3,"id":"2238","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"2238"},"status":"published"},"_oai":{"id":"oai:repository.ninjal.ac.jp:00002238","sets":["38:315"]},"author_link":["7565","7566"],"item_10002_biblio_info_40":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2019-07","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"17","bibliographicPageEnd":"34","bibliographicPageStart":"15","bibliographic_titles":[{"bibliographic_title":"国立国語研究所論集"},{"bibliographic_title":"NINJAL Research Papers","bibliographic_titleLang":"en"}]}]},"item_10002_description_34":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_description":"国立国語研究所 研究系 音声言語研究領域","subitem_description_type":"Other"}]},"item_10002_description_35":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_description":"Spoken Language Division, Research Department, NINJAL","subitem_description_type":"Other"}]},"item_10002_description_36":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"本論文では,『Webデータに基づく複合動詞用例データベース』の構築方法を示し,構築結果を評価する。用例データベースの構築目的は,複合動詞とその構成動詞間の関係を分析することとし,複合動詞の用例,語構成,格解析結果に加え,構成動詞の用例,格解析結果を収録する。本構築手法では,必要な量の用例を確保するために個々の動詞専用のWebコーパスを作成し,Webコーパスの構築量を削減するために漸進的に用例データベースを構築する。この際,用例データベースに登録する複合動詞は,Webから収集可能な量を基準として,半自動的に収集される。本手法により収集した複合動詞は3371語,用例数(中央値)は1173例であった。この結果は,岩波国語辞典収録語の約77.2%をカバーする。本手法の評価として,約2.1億語の汎用Webコーパスから収集した用例集合と比較し,幅広い生起確率を持つ複合動詞1829語に対して,用例を1000例以上収集できることを確認した。また,汎用コーパスから抽出した用例集合の格要素の分布とのコサイン類似度は,複合動詞0.878,単一動詞0.919となった。この結果は,本手法により収集した用例の分布が,汎用コーパスと類似しており,用例収集の偏りが抑制されていることを示唆する。","subitem_description_type":"Abstract"}]},"item_10002_description_37":{"attribute_name":"抄録(英)","attribute_value_mlt":[{"subitem_description":"This paper presents a method of constructing a database of Japanese compound verb examples, and evaluates the database. The objective of constructing this database is to analyze the relationship between Japanese compound and component verbs. Whether to include a compound verb in the database is determined semi-automatically by the number of examples that can be extracted from these Web corpora. The actual database that resulted from this method consists of 3371 compound verbs (median number of examples per verb = 1173). It covers 77.2% of the relevant entry words in the Iwanami Japanese language dictionary. A comparison with a general-purpose Web corpus shows that this method enabled to collect more than 1000 examples for 1829 compound verbs with a wide range of probability of occurrence. The average cosine similarity between the distributions of case-marked elements in the database examples and in those extracted from the Web corpus is 0.878 for compound verbs. Therefore, this result suggests that the bias of examples is controlled.","subitem_description_type":"Other"}]},"item_10002_description_51":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10002_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.15084/00002222","subitem_identifier_reg_type":"JaLC"}]},"item_10002_publisher_39":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"国立国語研究所"}]},"item_10002_source_id_41":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2186-134X","subitem_source_identifier_type":"ISSN"},{"subitem_source_identifier":"2186-1358","subitem_source_identifier_type":"ISSN"}]},"item_10002_source_id_44":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA12536262","subitem_source_identifier_type":"NCID"}]},"item_10002_version_type_52":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"山口, 昌也"},{"creatorName":"ヤマグチ, マサヤ","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"YAMAGUCHI, Masaya","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2019-07-25"}],"displaytype":"detail","filename":"papers1702.pdf","filesize":[{"value":"1.2 MB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"papers1702.pdf","url":"https://repository.ninjal.ac.jp/record/2238/files/papers1702.pdf"},"version_id":"b130daf4-ad96-43e6-a2d5-f7fca49ab9c0"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"日本語複合動詞","subitem_subject_scheme":"Other"},{"subitem_subject":"用例データベース","subitem_subject_scheme":"Other"},{"subitem_subject":"Webコーパス","subitem_subject_scheme":"Other"},{"subitem_subject":"Japanese compound verb","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"example database","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"web corpus","subitem_subject_language":"en","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"departmental bulletin paper","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"『Webデータに基づく複合動詞用例データベース』の構築と評価","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"『Webデータに基づく複合動詞用例データベース』の構築と評価"},{"subitem_title":"Construction and Evaluation of \"Database of Japanese Compound Verb Examples Based on Web Pages\"","subitem_title_language":"en"}]},"item_type_id":"10002","owner":"3","path":["315"],"pubdate":{"attribute_name":"公開日","attribute_value":"2019-07-25"},"publish_date":"2019-07-25","publish_status":"0","recid":"2238","relation_version_is_last":true,"title":["『Webデータに基づく複合動詞用例データベース』の構築と評価"],"weko_creator_id":"3","weko_shared_id":-1},"updated":"2023-05-15T15:45:56.399902+00:00"}