{"id":"https://openalex.org/W4403346595","doi":"https://doi.org/10.48550/arxiv.2410.05605","title":"CodeDPO: Aligning Code Models with Self Generated and Verified Source Code","display_name":"CodeDPO: Aligning Code Models with Self Generated and Verified Source Code","publication_year":2024,"publication_date":"2024-10-08","ids":{"openalex":"https://openalex.org/W4403346595","doi":"https://doi.org/10.48550/arxiv.2410.05605"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2410.05605","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.05605","pdf_url":"https://arxiv.org/pdf/2410.05605","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2410.05605","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062231043","display_name":"Kechi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Kechi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100447682","display_name":"Ge Li","orcid":"https://orcid.org/0000-0002-5828-0186"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Ge","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069159185","display_name":"Yihong Dong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Yihong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100735418","display_name":"Jingjing Xu","orcid":"https://orcid.org/0000-0003-1082-2262"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jingjing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100666960","display_name":"Jun Zhang","orcid":"https://orcid.org/0000-0002-2189-3966"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023217345","display_name":"Jing Su","orcid":"https://orcid.org/0000-0001-7962-0648"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Jing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044332717","display_name":"Yongfei Liu","orcid":"https://orcid.org/0000-0002-0261-8651"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yongfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5049100391","display_name":"Zhi Jin","orcid":"https://orcid.org/0000-0003-1087-226X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Zhi","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5062231043"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9810000061988831,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9729999899864197,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.7026751041412354},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6137175559997559},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.531046450138092},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.46326807141304016}],"concepts":[{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.7026751041412354},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6137175559997559},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.531046450138092},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.46326807141304016},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2410.05605","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.05605","pdf_url":"https://arxiv.org/pdf/2410.05605","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2410.05605","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2410.05605","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2410.05605","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.05605","pdf_url":"https://arxiv.org/pdf/2410.05605","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4403346595.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W4402327032","https://openalex.org/W3081644756"],"abstract_inverted_index":{"Code":[0],"generation":[1,62,197],"models":[2,25],"have":[3],"shown":[4],"significant":[5,175],"potential":[6],"for":[7,203],"programming":[8],"tasks.":[9],"However,":[10],"existing":[11,183],"training":[12],"methods":[13],"like":[14],"supervised":[15],"fine-tuning":[16],"face":[17],"key":[18,66],"limitations:":[19],"they":[20,37],"do":[21,36],"not":[22],"effectively":[23,38],"teach":[24],"to":[26,63,119,182],"prioritize":[27],"correct":[28],"over":[29],"incorrect":[30],"solutions":[31],"in":[32,177,195,208],"ambiguous":[33],"situations,":[34],"nor":[35],"optimize":[39],"the":[40,44,131,191],"runtime":[41],"efficiency":[42,180],"of":[43,134,168,193],"generated":[45],"code.":[46],"To":[47],"address":[48],"these":[49],"challenges,":[50],"we":[51],"propose":[52],"CodeDPO,":[53],"a":[54,76,82,140,200],"framework":[55],"that":[56,85,98,112,188],"integrates":[57],"preference":[58,68,142,157,206],"learning":[59],"into":[60],"code":[61,67,70,90,104,111,136,141,196,205],"improve":[64],"two":[65],"factors:":[69],"correctness":[71,147,178],"and":[72,88,91,110,148,153,179,198,211],"efficiency.":[73,149],"CodeDPO":[74,150,173,189],"employs":[75],"novel":[77],"dataset":[78,144],"construction":[79],"method,":[80],"utilizing":[81],"self-generation-and-validation":[83],"mechanism":[84],"simultaneously":[86],"generates":[87],"evaluates":[89],"test":[92,99],"cases.":[93],"The":[94],"underlying":[95],"assumption":[96],"is":[97,116,151],"cases":[100],"executable":[101],"by":[102],"multiple":[103],"snippets":[105],"provide":[106],"more":[107,114,117,209],"reliable":[108],"validation,":[109],"passes":[113],"tests":[115],"likely":[118],"be":[120],"correct.":[121],"Through":[122,165],"this":[123],"self-validation":[124],"process,":[125],"our":[126],"PageRank-inspired":[127],"algorithm":[128],"iteratively":[129],"updates":[130],"ranking":[132],"score":[133],"each":[135],"snippet,":[137],"ultimately":[138],"creating":[139],"optimization":[143,158,207],"based":[145],"on":[146,162],"flexible":[152],"scalable,":[154],"generating":[155],"diverse":[156],"data":[159],"without":[160],"depending":[161],"external":[163],"resources.":[164],"comprehensive":[166],"evaluations":[167],"five":[169],"widely":[170],"used":[171],"benchmarks,":[172],"demonstrates":[174],"improvements":[176],"compared":[181],"methods.":[184],"Our":[185],"experiments":[186],"prove":[187],"enhances":[190],"capabilities":[192],"LLMs":[194],"provides":[199],"robust":[201],"foundation":[202],"conducting":[204],"complex":[210],"challenging":[212],"real-world":[213],"scenarios.":[214]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
