{"created":"2021-03-01T06:16:57.635648+00:00","id":420,"links":{},"metadata":{"_buckets":{"deposit":"635dd94d-c158-428d-8389-fbb314c9a1c1"},"_deposit":{"id":"420","owners":[],"pid":{"revision_id":0,"type":"depid","value":"420"},"status":"published"},"_oai":{"id":"oai:repository.dl.itc.u-tokyo.ac.jp:00000420","sets":["12:13","9:10:15"]},"item_2_alternative_title_1":{"attribute_name":"その他のタイトル","attribute_value_mlt":[{"subitem_alternative_title":"A System for Constructing a Synonym Dictionaty"}]},"item_2_biblio_info_7":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2008-04","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"2","bibliographicPageEnd":"58","bibliographicPageStart":"39","bibliographicVolumeNumber":"15","bibliographic_titles":[{"bibliographic_title":"自然言語処理"}]}]},"item_2_description_13":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_2_description_5":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"同義語の同定は,情報検索,テキストマイニングなどのテキスト処理を行う上で必要な作業である.同義語辞書を作成することにより,テキスト処理の効率や精度の向上を期待できる.特定分野における文書には,専門の表現が多く用いられており,その中には,分野独特の同義語が多量に含まれている.例えば,日本語の航空分野では,漢字・ひらがなだけでなく,カタカナ,アルファベット,およびそれらの略語が同義語として用いられている.この分野の同義語は,汎用の辞書に登録されていないものが多く,既存の辞書を使用できないので,辞書を新たに作成する必要がある.また,辞書作成後も常に新しい語が発生するので,辞書の定期的な更新が必要となるが,それを人手で行うのは大変な作業である.本論文では,同義語辞書作成を半自動化するシステムを提案する,システムは,クエリが与えられると意味的に同じ候補語を提示する.辞書作成者は,その中から同義語を選択して,辞書登録を行うことができる.候補語のクエリに対する類似度は,同義語の周辺に出現する語の頻度情報を文脈情報とし,その余弦から計算する.文脈情報のみでは十分な精度が得られない場合,既知の同義語を知識としてシステムに与えることにより,文脈語の正規化を行い,精度を向上できることを確認した.実験は,航空分野の日本語のレポートを対象とし,システムの評価には平均精度を用いて行い,満足できる結果が得られた.","subitem_description_type":"Abstract"},{"subitem_description":"To identify a synonym is a necessary procedure for text processing such as information retrieval and text mining. We can expect to improve the proficiency and performance in text processing by constructing a synonym dictionary. 
Same words might possibly be used as a different meaning if the target field differs, so a synonym dictionary has to be constructed for each field. In some fields in Japanese, such as in aviation, synonym nouns include kanji/hiragana, katakana, alphabet and their abbreviations. Many of these words are not registered in a general dictionary. In addition, as new words always come to be used, the dictionary update is a big issue. In this paper, we propose a system for constructing a synonym dictionary. The system will return synonym candidates on the descending order of similarity against a query. A synonym can be easily registered in a dictionary by looking the synonym candidates generated by the proposed system. We define a context information as words frequency appearing around a target word. Then a similarity is calculated by cosine measure using context information. We confirmed that the system performance was remarkably improved by providing the system with known synonym set to make context word nominalization, especially when the performance was low. 
We experimentally evaluated the system performance by aviation safety reports in Japanese and evaluated it by average precision, and got promising results.","subitem_description_type":"Abstract"}]},"item_2_full_name_3":{"attribute_name":"著者別名","attribute_value_mlt":[{"nameIdentifiers":[{"nameIdentifier":"106374","nameIdentifierScheme":"WEKO"}],"names":[{"name":"TERADA, AKIRA"}]},{"nameIdentifiers":[{"nameIdentifier":"106375","nameIdentifierScheme":"WEKO"}],"names":[{"name":"YOSHIDA, MINORU"}]},{"nameIdentifiers":[{"nameIdentifier":"106376","nameIdentifierScheme":"WEKO"}],"names":[{"name":"NAKAGAWA, HIROSHI"}]}]},"item_2_publisher_20":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"言語処理学会"}]},"item_2_source_id_10":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10472659","subitem_source_identifier_type":"NCID"}]},"item_2_source_id_8":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"13407619","subitem_source_identifier_type":"ISSN"}]},"item_2_subject_15":{"attribute_name":"日本十進分類法","attribute_value_mlt":[{"subitem_subject":"007","subitem_subject_scheme":"NDC"}]},"item_2_text_21":{"attribute_name":"出版者別名","attribute_value_mlt":[{"subitem_text_value":"The Association for Natural Language Processing"}]},"item_2_text_4":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"(株)日本航空インターナショナル"},{"subitem_text_value":"東京大学情報基盤センター"},{"subitem_text_value":"Japan Airlines Co., Ltd."},{"subitem_text_value":"Information Technology Center,The University of Tokyo"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"寺田, 昭"}],"nameIdentifiers":[{"nameIdentifier":"106371","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"吉田, 稔"}],"nameIdentifiers":[{"nameIdentifier":"106372","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"中川, 
裕志"}],"nameIdentifiers":[{"nameIdentifier":"106373","nameIdentifierScheme":"WEKO"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2017-06-26"}],"displaytype":"detail","filename":"v15n2_03.pdf","filesize":[{"value":"1.5 MB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"v15n2_03.pdf","url":"https://repository.dl.itc.u-tokyo.ac.jp/record/420/files/v15n2_03.pdf"},"version_id":"754eca26-b53d-481d-8c89-d4a5eb634aa4"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"同義語","subitem_subject_scheme":"Other"},{"subitem_subject":"文脈情報","subitem_subject_scheme":"Other"},{"subitem_subject":"辞書作成","subitem_subject_scheme":"Other"},{"subitem_subject":"文脈語の正規化","subitem_subject_scheme":"Other"},{"subitem_subject":"Synonym","subitem_subject_scheme":"Other"},{"subitem_subject":"Context information","subitem_subject_scheme":"Other"},{"subitem_subject":"Constructing a dictionary","subitem_subject_scheme":"Other"},{"subitem_subject":"Context word nominalization","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"journal article","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"同義語辞書作成支援システム","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"同義語辞書作成支援システム"}]},"item_type_id":"2","owner":"1","path":["13","15"],"pubdate":{"attribute_name":"公開日","attribute_value":"2009-12-15"},"publish_date":"2009-12-15","publish_status":"0","recid":"420","relation_version_is_last":true,"title":["同義語辞書作成支援システム"],"weko_creator_id":"1","weko_shared_id":null},"updated":"2022-12-19T03:41:13.407142+00:00"}