WEKO3
アイテム
{"_buckets": {"deposit": "c5a8784d-dad5-4c01-854f-d65a74a6a489"}, "_deposit": {"created_by": 3, "id": "492", "owners": [3], "pid": {"revision_id": 0, "type": "depid", "value": "492"}, "status": "published"}, "_oai": {"id": "oai:repository.ninjal.ac.jp:00000492", "sets": ["61"]}, "author_link": ["6445", "6446"], "item_10002_biblio_info_40": {"attribute_name": "書誌情報", "attribute_value_mlt": [{"bibliographicIssueDates": {"bibliographicIssueDate": "2011-11", "bibliographicIssueDateType": "Issued"}, "bibliographicIssueNumber": "2", "bibliographicPageEnd": "106", "bibliographicPageStart": "91", "bibliographic_titles": [{"bibliographic_title": "国立国語研究所論集"}, {"bibliographic_title": "NINJAL Research Papers", "bibliographic_titleLang": "en"}]}]}, "item_10002_description_34": {"attribute_name": "著者所属", "attribute_value_mlt": [{"subitem_description": "国立国語研究所 コーパス開発センター 非常勤研究員", "subitem_description_type": "Other"}]}, "item_10002_description_35": {"attribute_name": "著者所属(英)", "attribute_value_mlt": [{"subitem_description": "Adjunct Researcher, Center for Corpus Development, National Institute for Japanese Language and Linguistics", "subitem_description_type": "Other"}]}, "item_10002_description_36": {"attribute_name": "抄録", "attribute_value_mlt": [{"subitem_description": "中古和文において,どこからどこまでを一語と認めるかという語認定には,従来明確な尺度がなく,既存の辞書の見出し語をあたっても,立項基準は感覚的・主観的なものであると言わざるを得ない。語と語の結びつきの強さ(コロケーション強度)を具体的な数値で示すダイス係数を取り上げ,「名詞+あり/なし/よし/あし」の組み合わせを例に,語認定の一つの客観的基準として,ダイス係数が有効であることを論じた。", "subitem_description_type": "Abstract"}]}, "item_10002_description_37": {"attribute_name": "抄録(英)", "attribute_value_mlt": [{"subitem_description": "It has long been a serious problem for researchers of Early Middle Japanese to determine whether a set phrase like kai-nashi should be classified as one word or a combination of separate words. There is no definite criterion, and some phrases are listed in dictionaries as a word while others are neglected, all depending on the judgment of the editor. 
In this paper, the Dice coefficient is introduced as a solution. The Dice coefficient is an index for estimating collocation strength, i.e., how strongly two words are connected with each other. In combination with a morphological analysis dictionary (Chuko-Wabun UniDic), the Dice coefficient works as one criterion for word identification.", "subitem_description_type": "Other"}]}, "item_10002_description_51": {"attribute_name": "フォーマット", "attribute_value_mlt": [{"subitem_description": "application/pdf", "subitem_description_type": "Other"}]}, "item_10002_identifier_registration": {"attribute_name": "ID登録", "attribute_value_mlt": [{"subitem_identifier_reg_text": "10.15084/00000483", "subitem_identifier_reg_type": "JaLC"}]}, "item_10002_publisher_39": {"attribute_name": "出版者", "attribute_value_mlt": [{"subitem_publisher": "国立国語研究所"}]}, "item_10002_source_id_41": {"attribute_name": "ISSN", "attribute_value_mlt": [{"subitem_source_identifier": "2186-134X", "subitem_source_identifier_type": "ISSN"}, {"subitem_source_identifier": "2186-1358", "subitem_source_identifier_type": "ISSN"}]}, "item_10002_source_id_44": {"attribute_name": "書誌レコードID", "attribute_value_mlt": [{"subitem_source_identifier": "AA12536262", "subitem_source_identifier_type": "NCID"}]}, "item_10002_title_29": {"attribute_name": "タイトル(ヨミ)", "attribute_value_mlt": [{"subitem_title": "コロケーション キョウド オ モチイタ チュウコゴ ノ ゴ ニンテイ"}]}, "item_10002_version_type_52": {"attribute_name": "著者版フラグ", "attribute_value_mlt": [{"subitem_version_resource": "http://purl.org/coar/version/c_970fb48d4fbd8a85", "subitem_version_type": "VoR"}]}, "item_creator": {"attribute_name": "著者", "attribute_type": "creator", "attribute_value_mlt": [{"creatorNames": [{"creatorName": "須永, 哲矢"}, {"creatorName": "スナガ, テツヤ", "creatorNameLang": "ja-Kana"}], "nameIdentifiers": [{"nameIdentifier": "6445", "nameIdentifierScheme": "WEKO"}]}, {"creatorNames": [{"creatorName": "SUNAGA, Tetsuya", "creatorNameLang": "en"}], "nameIdentifiers": 
[{"nameIdentifier": "6446", "nameIdentifierScheme": "WEKO"}]}]}, "item_files": {"attribute_name": "ファイル情報", "attribute_type": "file", "attribute_value_mlt": [{"accessrole": "open_date", "date": [{"dateType": "Available", "dateValue": "2019-02-20"}], "displaytype": "detail", "download_preview_message": "", "file_order": 0, "filename": "papers0205.pdf", "filesize": [{"value": "967.7 kB"}], "format": "application/pdf", "future_date_message": "", "is_thumbnail": false, "licensetype": "license_free", "mimetype": "application/pdf", "size": 967700.0, "url": {"label": "papers0205.pdf", "url": "https://repository.ninjal.ac.jp/record/492/files/papers0205.pdf"}, "version_id": "9c26495d-2b13-403b-b0fd-4fdd6399216b"}]}, "item_keyword": {"attribute_name": "キーワード", "attribute_value_mlt": [{"subitem_subject": "形態素解析辞書", "subitem_subject_scheme": "Other"}, {"subitem_subject": "中古語", "subitem_subject_scheme": "Other"}, {"subitem_subject": "コロケーション強度", "subitem_subject_scheme": "Other"}, {"subitem_subject": "ダイス係数", "subitem_subject_scheme": "Other"}, {"subitem_subject": "morphological analysis dictionary", "subitem_subject_language": "en", "subitem_subject_scheme": "Other"}, {"subitem_subject": "Early Middle Japanese", "subitem_subject_language": "en", "subitem_subject_scheme": "Other"}, {"subitem_subject": "collocation strength", "subitem_subject_language": "en", "subitem_subject_scheme": "Other"}, {"subitem_subject": "Dice coefficient", "subitem_subject_language": "en", "subitem_subject_scheme": "Other"}]}, "item_language": {"attribute_name": "言語", "attribute_value_mlt": [{"subitem_language": "jpn"}]}, "item_resource_type": {"attribute_name": "資源タイプ", "attribute_value_mlt": [{"resourcetype": "departmental bulletin paper", "resourceuri": "http://purl.org/coar/resource_type/c_6501"}]}, "item_title": "コロケーション強度を用いた中古語の語認定", "item_titles": {"attribute_name": "タイトル", "attribute_value_mlt": [{"subitem_title": "コロケーション強度を用いた中古語の語認定"}, {"subitem_title": "Word Identification in Early 
Middle Japanese Using Collocation Strength", "subitem_title_language": "en"}]}, "item_type_id": "10002", "owner": "3", "path": ["61"], "permalink_uri": "https://doi.org/10.15084/00000483", "pubdate": {"attribute_name": "公開日", "attribute_value": "2015-10-30"}, "publish_date": "2015-10-30", "publish_status": "0", "recid": "492", "relation": {}, "relation_version_is_last": true, "title": ["コロケーション強度を用いた中古語の語認定"], "weko_shared_id": -1}
コロケーション強度を用いた中古語の語認定
https://doi.org/10.15084/00000483
https://doi.org/10.15084/00000483 a408862e-cf32-4747-a14c-cc5f0ae69196
名前 / ファイル | ライセンス | アクション |
---|---|---|
papers0205.pdf (967.7 kB) | | |
Item type | 紀要論文 / Departmental Bulletin Paper(1) | |||||
---|---|---|---|---|---|---|
公開日 | 2015-10-30 | |||||
タイトル | ||||||
タイトル | コロケーション強度を用いた中古語の語認定 | |||||
タイトル | ||||||
言語 | en | |||||
タイトル | Word Identification in Early Middle Japanese Using Collocation Strength | |||||
言語 | ||||||
言語 | jpn | |||||
キーワード | ||||||
主題Scheme | Other | |||||
主題 | 形態素解析辞書 | |||||
キーワード | ||||||
主題Scheme | Other | |||||
主題 | 中古語 | |||||
キーワード | ||||||
主題Scheme | Other | |||||
主題 | コロケーション強度 | |||||
キーワード | ||||||
主題Scheme | Other | |||||
主題 | ダイス係数 | |||||
キーワード | ||||||
言語 | en | |||||
主題Scheme | Other | |||||
主題 | morphological analysis dictionary | |||||
キーワード | ||||||
言語 | en | |||||
主題Scheme | Other | |||||
主題 | Early Middle Japanese | |||||
キーワード | ||||||
言語 | en | |||||
主題Scheme | Other | |||||
主題 | collocation strength | |||||
キーワード | ||||||
言語 | en | |||||
主題Scheme | Other | |||||
主題 | Dice coefficient | |||||
資源タイプ | ||||||
資源タイプ識別子 | http://purl.org/coar/resource_type/c_6501 | |||||
資源タイプ | departmental bulletin paper | |||||
ID登録 | ||||||
ID登録 | 10.15084/00000483 | |||||
ID登録タイプ | JaLC | |||||
著者 | 須永, 哲矢 / SUNAGA, Tetsuya | |||||
著者所属 | ||||||
内容記述タイプ | Other | |||||
内容記述 | 国立国語研究所 コーパス開発センター 非常勤研究員 | |||||
著者所属(英) | ||||||
内容記述タイプ | Other | |||||
内容記述 | Adjunct Researcher, Center for Corpus Development, National Institute for Japanese Language and Linguistics | |||||
抄録 | ||||||
内容記述タイプ | Abstract | |||||
内容記述 | 中古和文において,どこからどこまでを一語と認めるかという語認定には,従来明確な尺度がなく,既存の辞書の見出し語をあたっても,立項基準は感覚的・主観的なものであると言わざるを得ない。語と語の結びつきの強さ(コロケーション強度)を具体的な数値で示すダイス係数を取り上げ,「名詞+あり/なし/よし/あし」の組み合わせを例に,語認定の一つの客観的基準として,ダイス係数が有効であることを論じた。 | |||||
抄録(英) | ||||||
内容記述タイプ | Other | |||||
内容記述 | It has long been a serious problem for researchers of Early Middle Japanese to determine whether a set phrase like kai-nashi should be classified as one word or a combination of separate words. There is no definite criterion, and some phrases are listed in dictionaries as a word while others are neglected, all depending on the judgment of the editor. In this paper, the Dice coefficient is introduced as a solution. The Dice coefficient is an index for estimating collocation strength, i.e., how strongly two words are connected with each other. In combination with a morphological analysis dictionary (Chuko-Wabun UniDic), the Dice coefficient works as one criterion for word identification. | |||||
出版者 | ||||||
出版者 | 国立国語研究所 | |||||
書誌情報 | 国立国語研究所論集 en : NINJAL Research Papers 号 2, p. 91-106, 発行日 2011-11 | |||||
ISSN | ||||||
収録物識別子タイプ | ISSN | |||||
収録物識別子 | 2186-134X | |||||
ISSN | ||||||
収録物識別子タイプ | ISSN | |||||
収録物識別子 | 2186-1358 | |||||
書誌レコードID | ||||||
収録物識別子タイプ | NCID | |||||
収録物識別子 | AA12536262 | |||||
フォーマット | ||||||
内容記述タイプ | Other | |||||
内容記述 | application/pdf | |||||
著者版フラグ | ||||||
出版タイプ | VoR | |||||
出版タイプResource | http://purl.org/coar/version/c_970fb48d4fbd8a85 |