{"id":"https://openalex.org/W4403792098","doi":"https://doi.org/10.1145/3664647.3680734","title":"DreamBooth++: Boosting Subject-Driven Generation via Region-Level References Packing","display_name":"DreamBooth++: Boosting Subject-Driven Generation via Region-Level References Packing","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403792098","doi":"https://doi.org/10.1145/3664647.3680734"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680734","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680734","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021809717","display_name":"Zhongyi Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhongyi Fan","raw_affiliation_strings":["Beijing Institute of Technology, Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0000-7053-1438","affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology, Beijing, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103163232","display_name":"Zixin Yin","orcid":"https://orcid.org/0000-0002-2129-9182"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zixin Yin","raw_affiliation_strings":["State Key Lab of Software Development Environment, Beihang University, Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2129-9182","affiliations":[{"raw_affiliation_string":"State Key Lab of Software Development Environment, Beihang University, Beijing, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431040","display_name":"Gang Li","orcid":"https://orcid.org/0000-0001-9520-0141"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Li","raw_affiliation_strings":["University of the Chinese Academy of Sciences &amp; Institute of Software, Chinese Academy of Sciences, Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9520-0141","affiliations":[{"raw_affiliation_string":"University of the Chinese Academy of Sciences &amp; Institute of Software, Chinese Academy of Sciences, Beijing, Beijing, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074672983","display_name":"Yibing Zhan","orcid":"https://orcid.org/0000-0003-3180-0484"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yibing Zhan","raw_affiliation_strings":["JD Explore Academy, Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3180-0484","affiliations":[{"raw_affiliation_string":"JD Explore Academy, Beijing, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015126222","display_name":"Heliang Zheng","orcid":"https://orcid.org/0000-0003-2220-3880"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heliang Zheng","raw_affiliation_strings":["University of Science and Technology of China, Hefei, Anhui, China"],"raw_orcid":"https://orcid.org/0000-0003-2220-3880","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, Anhui, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5021809717"],"corresponding_institution_ids":["https://openalex.org/I125839683"],"apc_list":null,"apc_paid":null,"fwci":0.6008,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.80209546,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"11013","last_page":"11021"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.8674432039260864},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6438398361206055},{"id":"https://openalex.org/keywords/subject","display_name":"Subject (documents)","score":0.45495808124542236},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4275969862937927},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.11127841472625732}],"concepts":[{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.8674432039260864},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6438398361206055},{"id":"https://openalex.org/C2777855551","wikidata":"https://www.wikidata.org/wiki/Q12310021","display_name":"Subject (documents)","level":2,"score":0.45495808124542236},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4275969862937927},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.11127841472625732}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3680734","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680734","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2962785568","https://openalex.org/W3159481202","https://openalex.org/W4212774754","https://openalex.org/W4281661987","https://openalex.org/W4310380119","https://openalex.org/W4312933868","https://openalex.org/W4380559233","https://openalex.org/W4386072096","https://openalex.org/W4389334989","https://openalex.org/W4390871953","https://openalex.org/W4390873195","https://openalex.org/W4390874393","https://openalex.org/W4400573550","https://openalex.org/W4402753775","https://openalex.org/W4402774219"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2125652721","https://openalex.org/W1540371141","https://openalex.org/W4231274751","https://openalex.org/W1549363203","https://openalex.org/W2154063878","https://openalex.org/W2556012038","https://openalex.org/W1489772951"],"abstract_inverted_index":{"DreamBooth":[0],"has":[1],"demonstrated":[2],"significant":[3],"potential":[4],"in":[5,10,173],"subject-driven":[6,174],"text-to-image":[7],"generation,":[8],"especially":[9],"scenarios":[11],"requiring":[12],"precise":[13],"preservation":[14],"of":[15,37,59,77],"a":[16,34,47,68,75,81,115,123,132],"subject's":[17],"appearance.":[18],"However,":[19],"it":[20],"still":[21],"suffers":[22],"from":[23],"inefficiency":[24],"and":[25,57,92,139,171],"requires":[26],"extensive":[27],"iterative":[28],"training":[29,49,155],"to":[30,52,95,143,168],"customize":[31],"concepts":[32],"using":[33],"small":[35],"set":[36,76],"reference":[38,78],"images.":[39],"To":[40],"address":[41],"these":[42],"issues,":[43],"we":[44,89,130],"introduce":[45],"DreamBooth++,":[46],"region-level":[48,69],"strategy":[50,156],"designed":[51],"significantly":[53,84,165],"improve":[54],"the":[55,140,145,160],"efficiency":[56],"effectiveness":[58],"learning":[60],"specific":[61],"subjects.":[62],"In":[63],"particular,":[64],"our":[65,137,154],"approach":[66],"employs":[67],"data":[70],"re-formulation":[71],"technique":[72],"that":[73,153],"packs":[74],"images":[79],"into":[80],"single":[82,116,124],"sample,":[83],"reducing":[85],"computational":[86],"costs.":[87],"Moreover,":[88],"adapt":[90],"convolution":[91],"self-attention":[93],"layers":[94],"ensure":[96],"their":[97,105],"processings":[98],"are":[99],"restricted":[100],"within":[101,114,122],"individual":[102],"regions.":[103],"Thus":[104],"operational":[106],"scope":[107],"(i.e.,":[108],"receptive":[109],"field)":[110],"can":[111],"be":[112],"preserved":[113],"subject,":[117],"avoiding":[118],"generating":[119],"multiple":[120],"sub-images":[121],"image.":[125],"Last":[126],"but":[127,163],"not":[128,157],"least,":[129],"design":[131],"text-guided":[133],"prior":[134],"regularization":[135],"between":[136],"model":[138],"pretrained":[141],"one":[142],"preserve":[144],"original":[146],"semantic":[147],"generation":[148],"ability.":[149],"Comprehensive":[150],"experiments":[151],"demonstrate":[152],"only":[158],"accelerates":[159],"subject-learning":[161],"process":[162],"also":[164],"boosts":[166],"fidelity":[167],"both":[169],"subject":[170],"prompts":[172],"generation.":[175]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
