{"created":"2025-01-18T23:13:09.205467+00:00","updated":"2025-01-22T08:50:43.116196+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00047747","sets":["1164:4179:4180:4186"]},"path":["4186"],"owner":"1","recid":"47747","title":["blog分類のための半教師有り学習"],"pubdate":{"attribute_name":"公開日","attribute_value":"2008-01-22"},"_buckets":{"deposit":"476f0066-f673-4d83-95d6-afb3b65593ed"},"_deposit":{"id":"47747","pid":{"type":"depid","value":"47747","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"blog分類のための半教師有り学習","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"blog分類のための半教師有り学習"},{"subitem_title":"Semi-supervised Learning for Blog Classification","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2008-01-22","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京工業大学"},{"subitem_text_value":"東京工業大学"},{"subitem_text_value":"東京工業大学"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Tokyo Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Tokyo Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Tokyo Institute of Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/47747/files/IPSJ-NL08183009.pdf"},"date":[{"dateType":"Available","dateValue":"2010-01-22"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-NL08183009.pdf","filesize":[{"value":"727.9 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"23"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"a8640f59-cbed-42cf-a3ea-289059fb9907","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2008 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"池田, 大介"},{"creatorName":"高村, 大也"},{"creatorName":"奥村, 学"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Daisuke, IKEDA","creatorNameLang":"en"},{"creatorName":"Hiroya, TAKAMURA","creatorNameLang":"en"},{"creatorName":"Manabu, OKUMURA","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10115061","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"blog著者の属性推定など,教師有り学習を用いblogを分類する研究がなされている.ラベルの無いblogであれば容易に収集が可能であるが,正解ラベル付きのblogは一般に高価である.そこで,本研究では半教師有り学習によるblog分類手法を提案する.blog中の各エントリはスタイルや内容が共通している.本研究ではこれに着目し,各エントリがどのblogに属していたか, という補助問題を解くことにより,blogのスタイルやコンテンツと言った各blogに固有の特徴をモデル化する.この情報を利用することで, 目的の分類問題の精度を向上させることができる.本手法を用いた, いくつかの分類タスクでの実験結果についても報告する.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"Classifying blogs, e.g. identifying bloggers' gender or age, is one of the most interesting problems in blog analysis today. Although it is usually solved by applying supervised learning techniques, it is not always easy to collect labeled blogs enough to train an accurate classifier. To the contrary, we can collect a huge amount of blogs that have no labels. In this paper, therefore, we propose a semi-supervised learning method for blog classification in order to incorporate unlabeled data into supervised learning. We assume that the entries from the same blog have the same characteristics. With this assumption, our method captures the characteristics of each blog, such as writing styles, and uses it to improve classification accuracy.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"66","bibliographic_titles":[{"bibliographic_title":"情報処理学会研究報告自然言語処理(NL)"}],"bibliographicPageStart":"59","bibliographicIssueDates":{"bibliographicIssueDate":"2008-01-22","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"4(2008-NL-183)","bibliographicVolumeNumber":"2008"}]},"relation_version_is_last":true,"weko_creator_id":"1"},"id":47747,"links":{}}