{"created":"2023-05-15T14:23:23.549625+00:00","id":1532,"links":{},"metadata":{"_buckets":{"deposit":"dc4b5a42-e258-40cd-b03d-c7f0a5bcb5de"},"_deposit":{"created_by":3,"id":"1532","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"1532"},"status":"published"},"_oai":{"id":"oai:repository.ninjal.ac.jp:00001532","sets":["245:246"]},"author_link":["4750"],"item_10003_biblio_info_32":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2017","bibliographicIssueDateType":"Issued"},"bibliographicPageEnd":"163","bibliographicPageStart":"154","bibliographicVolumeNumber":"2","bibliographic_titles":[{"bibliographic_title":"言語資源活用ワークショップ発表論文集"},{"bibliographic_title":"Proceedings of Language Resources Workshop","bibliographic_titleLang":"en"}]}]},"item_10003_description_27":{"attribute_name":"会議概要(会議名, 開催地, 会期, 主催者等)","attribute_value_mlt":[{"subitem_description":"会議名: 言語資源活用ワークショップ2017, 開催地: 国立国語研究所, 会期: 2017年9月5日-6日, 主催: 国立国語研究所 コーパス開発センター","subitem_description_type":"Other"}]},"item_10003_description_29":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"大量のデータを集めやすい母語話者コーパスと異なり,学習者コーパスでは,集められる標本数に物理的な制約がある。ここで問題となるのは,調査対象とする言語項目ごとに,どの程度の標本数を集めればある程度安定した結果が得られるかということである。内外の主要な学習者コーパスは,学習者の国(母語)ごとにモジュール構成を取っているが,1モジュール当たりの標本数は,作文コーパスの場合,ICLE(英語・作文)で243-982,ICNALE(英語・作文)で200-800,日本語学習者作文コーパス(日本語・作文)で144-160また,発話コーパスの場合, 
LINDSEI(英語・インタビュー発話)で50-53,ICNALE(英語・独話)で200-600,I-JAS(日本語・インタビュー発話等)で50となっており,コーパスごとに大きな差がある。本論では,I-JASの母語話者および学習者データを用い,分析するサンプル数を変化させた場合の基本的言語指標値の変化を概観し,その収束のポイントを検討する。","subitem_description_type":"Abstract"}]},"item_10003_description_43":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10003_description_51":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_description":"神戸大学","subitem_description_type":"Other"}]},"item_10003_description_53":{"attribute_name":"抄録(英)","attribute_value_mlt":[{"subitem_description":"The number of samples collected in learner corpora is generally small in comparison to native speaker corpora, but the extent to which the limited sample size influences the reliability of learner corpus studies has not yet been wholly elucidated. Therefore, we extracted short writing pieces from the International Corpus of Japanese as a Second Language (I-JAS) and prepared text sets of different sizes (n = 10, n = 20, n = 30, n = 40, and n = 50) for Chinese and Korean learners of Japanese as well as Japanese native speakers. We then examined the difference ratios observed across five kinds of text sets with a focus on basic linguistic indices, such as the total number of tokens per texts, and frequencies of punctuation marks, nouns and verbs, and conjugation forms of verbs. 
Our analyses show that the influence of sample size is not as strong as generally expected, and that discussion of learners’ L2 production with a relatively smaller corpus data could be rationalized to some extent.","subitem_description_type":"Other"}]},"item_10003_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.15084/00001516","subitem_identifier_reg_type":"JaLC"}]},"item_10003_publisher_45":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"国立国語研究所"}]},"item_10003_relation_40":{"attribute_name":"関連サイト","attribute_value_mlt":[{"subitem_relation_name":[{"subitem_relation_name_text":"言語資源活用ワークショップ2017"}],"subitem_relation_type_id":{"subitem_relation_type_id_text":"http://pj.ninjal.ac.jp/corpus_center/lrw2017.html","subitem_relation_type_select":"URI"}}]},"item_10003_version_type_44":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"石川, 慎一郎"},{"creatorName":"イシカワ, シンイチロウ","creatorNameLang":"ja-Kana"},{"creatorName":"ISHIKAWA, Shin'ichiro","creatorNameLang":"en"}],"nameIdentifiers":[{},{}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2019-02-15"}],"displaytype":"detail","filename":"LRW-2017-18-O-B-2.pdf","filesize":[{"value":"944.9 
kB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"LRW-2017-18-O-B-2.pdf","url":"https://repository.ninjal.ac.jp/record/1532/files/LRW-2017-18-O-B-2.pdf"},"version_id":"0cb41586-0432-4c0e-bdf3-cdf006ddeaf1"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"多言語母語の日本語学習者横断コーパス(I-JAS)","subitem_subject_scheme":"Other"},{"subitem_subject":"International Corpus of Japanese as a Second Language (I-JAS)","subitem_subject_language":"en","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"conference paper","resourceuri":"http://purl.org/coar/resource_type/c_5794"}]},"item_title":"学習者コーパス研究における標本数の問題","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"学習者コーパス研究における標本数の問題"},{"subitem_title":"A Reconsideration of the Needed Sample Size in Learner Corpus Studies","subitem_title_language":"en"}]},"item_type_id":"10003","owner":"3","path":["246"],"pubdate":{"attribute_name":"公開日","attribute_value":"2018-03-20"},"publish_date":"2018-03-20","publish_status":"0","recid":"1532","relation_version_is_last":true,"title":["学習者コーパス研究における標本数の問題"],"weko_creator_id":"3","weko_shared_id":-1},"updated":"2023-05-16T10:23:53.779738+00:00"}