{"id":"https://openalex.org/W6891862403","doi":"https://doi.org/10.48550/arxiv.2503.12590","title":"Personalize Anything for Free with Diffusion Transformer","display_name":"Personalize Anything for Free with Diffusion Transformer","publication_year":2025,"publication_date":"2025-03-16","ids":{"openalex":"https://openalex.org/W6891862403","doi":"https://doi.org/10.48550/arxiv.2503.12590"},"language":"en","primary_location":{"id":"doi:10.48550/arxiv.2503.12590","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2503.12590","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2503.12590","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Feng, Haoran","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Feng, Haoran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Huang, Zehuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Zehuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Li, Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Lin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Lv, Hairong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lv, Hairong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Sheng, Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sheng, Lu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8895999789237976,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8895999789237976,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.01119999960064888,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.010499999858438969,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.554099977016449},{"id":"https://openalex.org/keywords/personalization","display_name":"Personalization","score":0.48910000920295715},{"id":"https://openalex.org/keywords/compatibility","display_name":"Compatibility (geochemistry)","score":0.40880000591278076},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4049000144004822},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.36570000648498535},{"id":"https://openalex.org/keywords/encapsulation","display_name":"Encapsulation (networking)","score":0.3573000133037567},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.3393000066280365}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6870999932289124},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.554099977016449},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.48910000920295715},{"id":"https://openalex.org/C2778648169","wikidata":"https://www.wikidata.org/wiki/Q967768","display_name":"Compatibility (geochemistry)","level":2,"score":0.40880000591278076},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4049000144004822},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3903000056743622},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.36570000648498535},{"id":"https://openalex.org/C81147070","wikidata":"https://www.wikidata.org/wiki/Q1172449","display_name":"Encapsulation (networking)","level":2,"score":0.3573000133037567},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3564000129699707},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3393000066280365},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3334999978542328},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3246000111103058},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.2906000018119812},{"id":"https://openalex.org/C20574231","wikidata":"https://www.wikidata.org/wiki/Q844605","display_name":"Backward compatibility","level":2,"score":0.28349998593330383},{"id":"https://openalex.org/C184297639","wikidata":"https://www.wikidata.org/wiki/Q177765","display_name":"Biometrics","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.2578999996185303},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.2513999938964844},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2503.12590","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2503.12590","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2503.12590","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2503.12590","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.4054510295391083}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Personalized":[0],"image":[1,74,90],"generation":[2,91],"aims":[3],"to":[4,73,117],"produce":[5],"images":[6],"of":[7,44,53],"user-specified":[8],"concepts":[9],"while":[10,17,148],"enabling":[11],"flexible":[12],"editing.":[13,75,131],"Recent":[14],"training-free":[15,85],"approaches,":[16],"exhibit":[18],"higher":[19],"computational":[20],"efficiency":[21],"than":[22],"training-based":[23],"methods,":[24],"struggle":[25],"with":[26,32,51],"identity":[27,137],"preservation,":[28],"applicability,":[29],"and":[30,106,112,129,139],"compatibility":[31],"diffusion":[33],"transformers":[34],"(DiTs).":[35],"In":[36],"this":[37,78],"paper,":[38],"we":[39,80],"uncover":[40],"the":[41],"untapped":[42],"potential":[43],"DiT,":[45],"where":[46],"simply":[47],"replacing":[48],"denoising":[49],"tokens":[50],"those":[52],"a":[54,84,150],"reference":[55],"subject":[56,59,101],"achieves":[57,88],"zero-shot":[58],"reconstruction.":[60],"This":[61],"simple":[62],"yet":[63],"effective":[64],"feature":[65],"injection":[66,105],"technique":[67],"unlocks":[68],"diverse":[69],"scenarios,":[70],"from":[71],"personalization":[72],"Building":[76],"upon":[77],"observation,":[79],"propose":[81],"\\textbf{Personalize":[82],"Anything},":[83],"framework":[86],"that":[87,99],"personalized":[89],"in":[92,136],"DiT":[93],"through:":[94],"1)":[95],"timestep-adaptive":[96],"token":[97],"replacement":[98],"enforces":[100],"consistency":[102],"via":[103],"early-stage":[104],"enhances":[107],"flexibility":[108],"through":[109],"late-stage":[110],"regularization,":[111],"2)":[113],"patch":[114],"perturbation":[115],"strategies":[116],"boost":[118],"structural":[119],"diversity.":[120],"Our":[121,141],"method":[122],"seamlessly":[123],"supports":[124],"layout-guided":[125],"generation,":[126],"multi-subject":[127],"personalization,":[128],"mask-controlled":[130],"Evaluations":[132],"demonstrate":[133],"state-of-the-art":[134],"performance":[135],"preservation":[138],"versatility.":[140],"work":[142],"establishes":[143],"new":[144],"insights":[145],"into":[146],"DiTs":[147],"delivering":[149],"practical":[151],"paradigm":[152],"for":[153],"efficient":[154],"personalization.":[155]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
