{"id":"https://openalex.org/W4389501290","doi":"https://doi.org/10.48550/arxiv.2312.04326","title":"iDesigner: A High-Resolution and Complex-Prompt Following Text-to-Image Diffusion Model for Interior Design","display_name":"iDesigner: A High-Resolution and Complex-Prompt Following Text-to-Image Diffusion Model for Interior Design","publication_year":2023,"publication_date":"2023-12-07","ids":{"openalex":"https://openalex.org/W4389501290","doi":"https://doi.org/10.48550/arxiv.2312.04326"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2312.04326","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.04326","pdf_url":"https://arxiv.org/pdf/2312.04326","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2312.04326","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108691724","display_name":"Ruyi Gan","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gan, Ruyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087450445","display_name":"Xiao\u2010Jun Wu","orcid":"https://orcid.org/0000-0002-0310-5778"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Xiaojun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102402775","display_name":"Junyu Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Junyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024080570","display_name":"Yuanhe Tian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Yuanhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047880537","display_name":"Dixiang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Dixiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101794936","display_name":"Ziwei Wu","orcid":"https://orcid.org/0000-0003-3999-4367"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Ziwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111089828","display_name":"Renliang Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Renliang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100652633","display_name":"Chang Liu","orcid":"https://orcid.org/0000-0002-1213-9814"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Chang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100628333","display_name":"Jiaxing Zhang","orcid":"https://orcid.org/0000-0002-1324-6486"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jiaxing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048283341","display_name":"Pingjian Zhang","orcid":"https://orcid.org/0000-0002-9087-4494"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Pingjian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100573313","display_name":"Yan Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5108691724"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14254","display_name":"Digital Media and Visual Art","score":0.8439000248908997,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14254","display_name":"Digital Media and Visual Art","score":0.8439000248908997,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7537648677825928},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5815528035163879},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5546624660491943},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.5385317802429199},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.48372796177864075},{"id":"https://openalex.org/keywords/resolution","display_name":"Resolution (logic)","score":0.4741760492324829},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44629722833633423},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.42374560236930847},{"id":"https://openalex.org/keywords/anime","display_name":"Anime","score":0.4159639775753021},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3686143159866333},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07643929123878479}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7537648677825928},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5815528035163879},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5546624660491943},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.5385317802429199},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.48372796177864075},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.4741760492324829},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44629722833633423},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.42374560236930847},{"id":"https://openalex.org/C118130439","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Anime","level":2,"score":0.4159639775753021},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3686143159866333},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07643929123878479},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2312.04326","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.04326","pdf_url":"https://arxiv.org/pdf/2312.04326","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2312.04326","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2312.04326","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2312.04326","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.04326","pdf_url":"https://arxiv.org/pdf/2312.04326","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2075421999","https://openalex.org/W4241725891","https://openalex.org/W4247978692","https://openalex.org/W592941694","https://openalex.org/W4200085573","https://openalex.org/W4296571029","https://openalex.org/W2098776115","https://openalex.org/W4248856211","https://openalex.org/W2270259880","https://openalex.org/W2056165575"],"abstract_inverted_index":{"With":[0],"the":[1,29,57,69,97,110,122,125,146,156,165,169,172],"open-sourcing":[2],"of":[3,21,124,149,158,171],"text-to-image":[4,75],"models":[5,22,45,76],"(T2I)":[6],"such":[7,33,49],"as":[8,34,50,87,89,153],"stable":[9,13],"diffusion":[10,14],"(SD)":[11],"and":[12,61,105,113,119,138,179],"XL":[15],"(SD-XL),":[16],"there":[17,41],"is":[18,54],"an":[19],"influx":[20],"fine-tuned":[23],"in":[24,35,46,66,109,116],"specific":[25],"domains":[26],"based":[27],"on":[28,121,164],"open-source":[30,126],"SD":[31],"model,":[32],"anime,":[36],"character":[37],"portraits,":[38],"etc.":[39],"However,":[40],"are":[42,80],"few":[43],"specialized":[44],"certain":[47],"domains,":[48],"interior":[51,78],"design,":[52,67],"which":[53,175],"attributed":[55],"to":[56,82,95,144,154],"complex":[58],"textual":[59],"descriptions":[60],"detailed":[62],"visual":[63],"elements":[64],"inherent":[65],"alongside":[68],"necessity":[70],"for":[71,77],"adaptable":[72],"resolution.":[73],"Therefore,":[74],"design":[79,93,111],"required":[81],"have":[83],"outstanding":[84],"prompt-following":[85,147],"capabilities,":[86],"well":[88],"iterative":[90],"collaboration":[91],"with":[92,135],"professionals":[94],"achieve":[96],"desired":[98],"outcome.":[99],"In":[100],"this":[101],"paper,":[102],"we":[103],"collect":[104],"optimize":[106],"text-image":[107],"data":[108],"field":[112],"continue":[114],"training":[115],"both":[117],"English":[118],"Chinese":[120],"basis":[123],"CLIP":[127,142],"model.":[128],"We":[129],"also":[130],"proposed":[131,173],"a":[132],"fine-tuning":[133],"strategy":[134],"curriculum":[136],"learning":[137,140],"reinforcement":[139],"from":[141],"feedback":[143],"enhance":[145],"capabilities":[148],"our":[150],"approach":[151],"so":[152],"improve":[155],"quality":[157],"image":[159],"generation.":[160],"The":[161],"experimental":[162],"results":[163,178],"collected":[166],"dataset":[167],"demonstrate":[168],"effectiveness":[170],"approach,":[174],"achieves":[176],"impressive":[177],"outperforms":[180],"strong":[181],"baselines.":[182]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2023-12-09T00:00:00"}
