{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00235071","sets":["1164:3206:11566:11671"]},"path":["11671"],"owner":"44499","recid":"235071","title":["Retrieval-Augmented Multi-Floor Building Image Generation"],"pubdate":{"attribute_name":"公開日","attribute_value":"2024-06-22"},"_buckets":{"deposit":"ff524f12-bc80-4cf4-a160-765f9bcc25c0"},"_deposit":{"id":"235071","pid":{"type":"depid","value":"235071","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"Retrieval-Augmented Multi-Floor Building Image Generation","author_link":["641805","641806","641802","641807","641804","641803"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Retrieval-Augmented Multi-Floor Building Image Generation"},{"subitem_title":"Retrieval-Augmented Multi-Floor Building Image Generation","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"CG一般セッション","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2024-06-22","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"Japan Advanced Institute of Science and Technology"},{"subitem_text_value":"Japan Advanced Institute of Science and Technology"},{"subitem_text_value":"Japan Advanced Institute of Science and Technology"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Japan Advanced Institute of Science and Technology","subitem_text_language":"en"},{"subitem_text_value":"Japan Advanced Institute of Science and Technology","subitem_text_language":"en"},{"subitem_text_value":"Japan Advanced Institute of Science and Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/235071/files/IPSJ-CG24194003.pdf","label":"IPSJ-CG24194003.pdf"},"date":[{"dateType":"Available","dateValue":"2026-06-22"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-CG24194003.pdf","filesize":[{"value":"4.0 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"28"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"6b69964f-edc1-4c49-8af4-7599b5a97b4d","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Zhengyang, Wang"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Hao, Jin"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Haoran, Xie"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Zhengyang, Wang","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Hao, Jin","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Haoran, Xie","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10100541","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8949","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"Demand for generating building images from text prompts grows, despite recent advances in diffusion models greatly enhancing image quality. The current generative models struggle with controlling the number of floors. To this end, we propose a retrieval-augmented framework for generating building images with provided floor count using a diffusion model. Initially, the text prompts with the provided floor count to retrieve the most suitable image from a building image database. Then, we adopted a multi-level structure detection algorithm to obtain a sketch from the matched image to ensure structural consistency. Finally, the building image with the desired floor count and style is generated by diffusion model, guided by the detected building sketch. Our proposed framework enables accurate control over the floor count in building image synthesis. We demonstrate the robustness and scalability of generating building images with a specific floor count from text prompts.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"Demand for generating building images from text prompts grows, despite recent advances in diffusion models greatly enhancing image quality. The current generative models struggle with controlling the number of floors. To this end, we propose a retrieval-augmented framework for generating building images with provided floor count using a diffusion model. Initially, the text prompts with the provided floor count to retrieve the most suitable image from a building image database. Then, we adopted a multi-level structure detection algorithm to obtain a sketch from the matched image to ensure structural consistency. Finally, the building image with the desired floor count and style is generated by diffusion model, guided by the detected building sketch. Our proposed framework enables accurate control over the floor count in building image synthesis. We demonstrate the robustness and scalability of generating building images with a specific floor count from text prompts.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"4","bibliographic_titles":[{"bibliographic_title":"研究報告コンピュータグラフィックスとビジュアル情報学（CG）"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2024-06-22","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"3","bibliographicVolumeNumber":"2024-CG-194"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":235071,"updated":"2025-01-19T09:37:05.647072+00:00","links":{},"created":"2025-01-19T01:37:03.965615+00:00"}