WEKO3
アイテム
{"_buckets": {"deposit": "081a8436-3e59-44ff-904c-7b0ff5f3d032"}, "_deposit": {"id": "3419", "owners": [], "pid": {"revision_id": 0, "type": "depid", "value": "3419"}, "status": "published"}, "_oai": {"id": "oai:repository.dl.itc.u-tokyo.ac.jp:00003419", "sets": ["234", "262"]}, "item_7_alternative_title_1": {"attribute_name": "その他のタイトル", "attribute_value_mlt": [{"subitem_alternative_title": "情報の公共性に基づくMicroblog記事の分類"}]}, "item_7_biblio_info_7": {"attribute_name": "書誌情報", "attribute_value_mlt": [{"bibliographicIssueDates": {"bibliographicIssueDate": "2012-03-22", "bibliographicIssueDateType": "Issued"}, "bibliographic_titles": [{}]}]}, "item_7_date_granted_25": {"attribute_name": "学位授与年月日", "attribute_value_mlt": [{"subitem_dategranted": "2012-03-22"}]}, "item_7_degree_name_20": {"attribute_name": "学位名", "attribute_value_mlt": [{"subitem_degreename": "修士(情報理工学)"}]}, "item_7_description_5": {"attribute_name": "抄録", "attribute_value_mlt": [{"subitem_description": "Microblog, especially Twitter today has become an important tool to propagate public information among Internet users. The content of Twitter is an extraordinarily large number of small textual messages, posted by millions of users, at random or in response to perceived events or situations. However, messages of Twitter (tweets) cover so many categories including news, spam and others that it\u0027s difficult to provide public information directly. Since the traditional search cannot meet demands of tweets of some category, we aim to classify tweets automatically into defined categories to help users search. In our paper, we focus on approaches of collecting a corpus automatically for training classifiers. We proposed two approaches that are based on typical Twitter user accounts and based on Twitter lists using label propagation respectively. Using the corpora, we built classifiers, which are able to determine news, commercial and private tweets. 
Experiments evaluations show our proposed techniques are effective. In our search, we worked with Japanese, but the proposed approaches can be used with any other language.", "subitem_description_type": "Abstract"}]}, "item_7_full_name_3": {"attribute_name": "著者別名", "attribute_value_mlt": [{"nameIdentifiers": [{"nameIdentifier": "8213", "nameIdentifierScheme": "WEKO"}], "names": [{"name": "鄭, 洪光"}]}]}, "item_7_select_21": {"attribute_name": "学位", "attribute_value_mlt": [{"subitem_select_item": "master"}]}, "item_7_subject_13": {"attribute_name": "日本十進分類法", "attribute_value_mlt": [{"subitem_subject": "007", "subitem_subject_scheme": "NDC"}]}, "item_7_text_24": {"attribute_name": "研究科・専攻", "attribute_value_mlt": [{"subitem_text_value": "情報理工学系研究科電子情報学専攻"}]}, "item_7_text_36": {"attribute_name": "資源タイプ", "attribute_value_mlt": [{"subitem_text_value": "Thesis"}]}, "item_7_text_4": {"attribute_name": "著者所属", "attribute_value_mlt": [{"subitem_text_value": "東京大学大学院情報理工学系研究科電子情報学専攻"}, {"subitem_text_value": "Department of Information and Communication Engineering, Graduate School of Information Science and Technology, The University of Tokyo"}]}, "item_creator": {"attribute_name": "著者", "attribute_type": "creator", "attribute_value_mlt": [{"creatorNames": [{"creatorName": "Zheng, Hongguang"}], "nameIdentifiers": [{"nameIdentifier": "8212", "nameIdentifierScheme": "WEKO"}]}]}, "item_files": {"attribute_name": "ファイル情報", "attribute_type": "file", "attribute_value_mlt": [{"accessrole": "open_date", "date": [{"dateType": "Available", "dateValue": "2017-05-31"}], "displaytype": "detail", "download_preview_message": "", "file_order": 0, "filename": "48106424.pdf", "filesize": [{"value": "1.3 MB"}], "format": "application/pdf", "future_date_message": "", "is_thumbnail": false, "licensetype": "license_free", "mimetype": "application/pdf", "size": 1300000.0, "url": {"label": "48106424.pdf", "url": "https://repository.dl.itc.u-tokyo.ac.jp/record/3419/files/48106424.pdf"}, 
"version_id": "c6c80104-d39f-4358-9a1a-e63cfdae1cdd"}]}, "item_keyword": {"attribute_name": "キーワード", "attribute_value_mlt": [{"subitem_subject": "Twitter", "subitem_subject_scheme": "Other"}, {"subitem_subject": "Classification", "subitem_subject_scheme": "Other"}, {"subitem_subject": "Label propagation", "subitem_subject_scheme": "Other"}]}, "item_language": {"attribute_name": "言語", "attribute_value_mlt": [{"subitem_language": "eng"}]}, "item_resource_type": {"attribute_name": "資源タイプ", "attribute_value_mlt": [{"resourcetype": "thesis", "resourceuri": "http://purl.org/coar/resource_type/c_46ec"}]}, "item_title": "Classification of Microblog Posts Based on Information Publicness", "item_titles": {"attribute_name": "タイトル", "attribute_value_mlt": [{"subitem_title": "Classification of Microblog Posts Based on Information Publicness"}]}, "item_type_id": "7", "owner": "1", "path": ["234", "262"], "permalink_uri": "http://hdl.handle.net/2261/51760", "pubdate": {"attribute_name": "公開日", "attribute_value": "2012-05-30"}, "publish_date": "2012-05-30", "publish_status": "0", "recid": "3419", "relation": {}, "relation_version_is_last": true, "title": ["Classification of Microblog Posts Based on Information Publicness"], "weko_shared_id": null}
Classification of Microblog Posts Based on Information Publicness
http://hdl.handle.net/2261/51760
http://hdl.handle.net/2261/51760 478963dc-34c4-414a-bc38-190d71e2994b
名前 / ファイル | ライセンス | アクション |
---|---|---|
48106424.pdf (1.3 MB) | | |
Item type | 学位論文 / Thesis or Dissertation(1) | |||||
---|---|---|---|---|---|---|
公開日 | 2012-05-30 | |||||
タイトル | ||||||
タイトル | Classification of Microblog Posts Based on Information Publicness | |||||
言語 | ||||||
言語 | eng | |||||
キーワード | ||||||
主題 | Twitter | |||||
主題Scheme | Other | |||||
キーワード | ||||||
主題 | Classification | |||||
主題Scheme | Other | |||||
キーワード | ||||||
主題 | Label propagation | |||||
主題Scheme | Other | |||||
資源タイプ | ||||||
資源 | http://purl.org/coar/resource_type/c_46ec | |||||
タイプ | thesis | |||||
その他のタイトル | ||||||
その他のタイトル | 情報の公共性に基づくMicroblog記事の分類 | |||||
著者 | Zheng, Hongguang | |||||
著者別名 | ||||||
識別子 | 8213 | |||||
識別子Scheme | WEKO | |||||
姓名 | 鄭, 洪光 | |||||
著者所属 | ||||||
著者所属 | 東京大学大学院情報理工学系研究科電子情報学専攻 | |||||
著者所属 | ||||||
著者所属 | Department of Information and Communication Engineering, Graduate School of Information Science and Technology, The University of Tokyo | |||||
Abstract | ||||||
内容記述タイプ | Abstract | |||||
内容記述 | Microblog, especially Twitter today has become an important tool to propagate public information among Internet users. The content of Twitter is an extraordinarily large number of small textual messages, posted by millions of users, at random or in response to perceived events or situations. However, messages of Twitter (tweets) cover so many categories including news, spam and others that it's difficult to provide public information directly. Since the traditional search cannot meet demands of tweets of some category, we aim to classify tweets automatically into defined categories to help users search. In our paper, we focus on approaches of collecting a corpus automatically for training classifiers. We proposed two approaches that are based on typical Twitter user accounts and based on Twitter lists using label propagation respectively. Using the corpora, we built classifiers, which are able to determine news, commercial and private tweets. Experiments evaluations show our proposed techniques are effective. In our search, we worked with Japanese, but the proposed approaches can be used with any other language. | |||||
書誌情報 | 発行日 2012-03-22 | |||||
日本十進分類法 | ||||||
主題 | 007 | |||||
主題Scheme | NDC | |||||
学位名 | ||||||
学位名 | 修士(情報理工学) | |||||
学位 | ||||||
値 | master | |||||
研究科・専攻 | ||||||
情報理工学系研究科電子情報学専攻 | ||||||
学位授与年月日 | ||||||
学位授与年月日 | 2012-03-22 |