{"updated":"2025-01-22T12:21:34.708441+00:00","links":{},"id":40583,"created":"2025-01-18T23:07:39.686549+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00040583","sets":["1164:3500:3546:3549"]},"path":["3549"],"owner":"1","recid":"40583","title":["WWWページの自動分類 NDCの分類体系とYahooのカテゴリを使った分類"],"pubdate":{"attribute_name":"公開日","attribute_value":"1999-05-17"},"_buckets":{"deposit":"5650cd65-ea30-4003-8f3b-b12244373d4d"},"_deposit":{"id":"40583","pid":{"type":"depid","value":"40583","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"WWWページの自動分類 NDCの分類体系とYahooのカテゴリを使った分類","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"WWWページの自動分類 NDCの分類体系とYahooのカテゴリを使った分類"},{"subitem_title":"Automatic Classification of World Wide Web Pages","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"1999-05-17","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"亜細亜大学"},{"subitem_text_value":"慶應義塾大学大学院"},{"subitem_text_value":"作新学院女子短大"},{"subitem_text_value":"鉄道総合技術研究所"},{"subitem_text_value":"慶應義塾大学文学部"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Asia University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Library and Information Science, Keio University","subitem_text_language":"en"},{"subitem_text_value":"Sakushin Gakuin Women's Junior College","subitem_text_language":"en"},{"subitem_text_value":"Railway Technical Research Institute","subitem_text_language":"en"},{"subitem_text_value":"School of Library and Information Science Keio 
University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/40583/files/IPSJ-FI99054015.pdf"},"date":[{"dateType":"Available","dateValue":"2001-05-17"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-FI99054015.pdf","filesize":[{"value":"703.6 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"39"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"673d3320-40a1-471c-92f6-59151fc05b58","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 1999 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"安形, 輝"},{"creatorName":"石田, 栄美"},{"creatorName":"久野, 高志"},{"creatorName":"野末, 道子"},{"creatorName":"上田, 修一"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Teru, Agata","creatorNameLang":"en"},{"creatorName":"Emi, Ishida","creatorNameLang":"en"},{"creatorName":"Takashi, Kuno","creatorNameLang":"en"},{"creatorName":"Michiko, Nozue","creatorNameLang":"en"},{"creatorName":"Shuichi, 
Ueda","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10114171","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"インターネットの発展とともにWebページ数は急速に増加し,国内だけで2000万ページに達しているとみられる。人手による選択と分類によるディレクトリ型では,増え続ける量を管理できないことが予想され,ロボットが網羅的にWebページを自動収集するロボット型では,内容の乏しいページが大量に出力される。そこでWebページを巡回するロボットに各ページの自動判断機能を持たせる必要があり,これは,不要ページの除去,ページ群の判定,有用性の判定,それに分類という手順になる。Webページの標本を元にその特徴を調査して,有用性についての目安を示した。さらに,文字列から形態素解析により抽出した語に相対頻度により重み付けする手法とn-gramにより文字列を抽出しベクトル空間型モデルによる情報検索を応用した手法によって,webページの自動分類を行った。なお,分類体系としては,『日本十進分類法』,Yahoo! Japanで用いられているカテゴリを用いた。さらに,比較のために,外部の分類体系としてCSJインデックスの分類表を用いた。","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"The amount of World Wide Web (WWW) pages has grown dramatically over the last few years with the growth of internet. It is estimated that there are currently over 18 million WWW pages in Japan. In order to satisfy the requirement for new search engines for WWW pages, it is necessary to develop automatic mechanisms for the deletion of less important pages, the identification of identical pages, judgement of usefulness of pages, and classification. In order to classify WWW pages in Japanese, experiments of classification using NDC, Yahoo! categories, and CSJ index as classification scheme were conducted. 
We present two classification algorithms based on relative frequencies of terms and information retrieval technique using vector-space model.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"120","bibliographic_titles":[{"bibliographic_title":"情報処理学会研究報告情報学基礎(FI)"}],"bibliographicPageStart":"113","bibliographicIssueDates":{"bibliographicIssueDate":"1999-05-17","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"39(1999-FI-054)","bibliographicVolumeNumber":"1999"}]},"relation_version_is_last":true,"weko_creator_id":"1"}}