{"id":"https://openalex.org/W4400222237","doi":"https://doi.org/10.48550/arxiv.2406.20085","title":"Auto Cherry-Picker: Learning from High-quality Generative Data Driven by Language","display_name":"Auto Cherry-Picker: Learning from High-quality Generative Data Driven by Language","publication_year":2024,"publication_date":"2024-06-28","ids":{"openalex":"https://openalex.org/W4400222237","doi":"https://doi.org/10.48550/arxiv.2406.20085"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2406.20085","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.20085","pdf_url":"https://arxiv.org/pdf/2406.20085","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2406.20085","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100769172","display_name":"Yicheng Chen","orcid":"https://orcid.org/0000-0002-2531-8002"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Yicheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089900108","display_name":"Xiangtai Li","orcid":"https://orcid.org/0000-0002-0550-8247"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xiangtai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101546249","display_name":"Yining Li","orcid":"https://orcid.org/0000-0002-6552-9250"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yining","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101629056","display_name":"Yanhong Zeng","orcid":"https://orcid.org/0000-0003-3596-5163"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Yanhong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024765927","display_name":"Jianzong Wu","orcid":"https://orcid.org/0009-0007-4559-7970"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Jianzong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100645854","display_name":"Xiangyu Zhao","orcid":"https://orcid.org/0000-0003-2926-4416"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Xiangyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5038149192","display_name":"Kai Chen","orcid":"https://orcid.org/0000-0003-4160-1024"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Kai","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100769172"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9520000219345093,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9520000219345093,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9258000254631042,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6287121772766113},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6092177033424377},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6014909148216248},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.47771167755126953},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4772745966911316},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4067673981189728}],"concepts":[{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6287121772766113},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6092177033424377},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6014909148216248},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.47771167755126953},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4772745966911316},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4067673981189728},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2406.20085","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.20085","pdf_url":"https://arxiv.org/pdf/2406.20085","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2406.20085","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2406.20085","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2406.20085","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.20085","pdf_url":"https://arxiv.org/pdf/2406.20085","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W3204019825","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W4287117424","https://openalex.org/W4387506531","https://openalex.org/W4238433571","https://openalex.org/W3174044702","https://openalex.org/W2967848559"],"abstract_inverted_index":{"Diffusion":[0],"models":[1,19],"can":[2,160],"generate":[3,108],"realistic":[4],"and":[5,42,69,79,124,149,177,198],"diverse":[6],"images,":[7],"potentially":[8],"facilitating":[9],"data":[10,28,36,87,114],"availability":[11],"for":[12,92,188,194],"data-intensive":[13],"perception":[14,68,197],"tasks.":[15,182,200],"However,":[16],"leveraging":[17],"these":[18,48],"to":[20,66,76,107,128],"boost":[21,136],"performance":[22,137,164,178],"on":[23,82,154],"downstream":[24,155,181],"tasks":[25,156],"with":[26,34,146],"synthetic":[27,39,133],"poses":[29],"several":[30],"challenges,":[31],"including":[32],"aligning":[33],"real":[35,86],"distribution,":[37],"scaling":[38],"sample":[40,77],"volumes,":[41],"ensuring":[43],"their":[44],"quality.":[45,130],"To":[46],"bridge":[47],"gaps,":[49],"we":[50,100,170],"present":[51],"\\textbf{A}uto":[52],"\\textbf{C}herry-\\textbf{P}icker":[53],"(ACP),":[54],"a":[55,118,172],"novel":[56],"framework":[57],"that":[58,158],"generates":[59],"high-quality":[60,134],"cross-modality":[61],"training":[62],"samples":[63,135],"at":[64],"scale":[65],"augment":[67],"multi-modal":[70],"training.":[71],"ACP":[72,159],"first":[73],"uses":[74],"LLMs":[75],"descriptions":[78],"layouts":[80],"based":[81],"object":[83],"combinations":[84],"from":[85],"priors,":[88],"eliminating":[89],"the":[90,112,163,186,192],"need":[91],"ground":[93],"truth":[94],"image":[95],"captions":[96],"or":[97],"annotations.":[98],"Next,":[99],"use":[101],"an":[102],"off-the-shelf":[103],"controllable":[104],"diffusion":[105],"model":[106],"multiple":[109],"images.":[110],"Then,":[111],"generated":[113],"are":[115],"refined":[116],"using":[117],"comprehensively":[119],"designed":[120],"metric,":[121],"Composite":[122],"Layout":[123],"Image":[125],"Score":[126],"(CLIS),":[127],"ensure":[129],"Our":[131],"customized":[132],"in":[138,142,180],"various":[139,195],"scenarios,":[140],"especially":[141],"addressing":[143],"challenges":[144],"associated":[145],"long-tailed":[147],"distribution":[148],"imbalanced":[150],"datasets.":[151],"Experiment":[152],"results":[153],"demonstrate":[157],"significantly":[161],"improve":[162],"of":[165],"existing":[166],"models.":[167],"In":[168],"addition,":[169],"find":[171],"positive":[173],"correlation":[174],"between":[175],"CLIS":[176],"gains":[179],"This":[183],"finding":[184],"shows":[185],"potential":[187],"evaluation":[189],"metrics":[190],"as":[191],"role":[193],"visual":[196],"MLLM":[199]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
