{"id":"https://openalex.org/W4416608663","doi":"https://doi.org/10.48550/arxiv.2505.23013","title":"Scalable Complexity Control Facilitates Reasoning Ability of LLMs","display_name":"Scalable Complexity Control Facilitates Reasoning Ability of LLMs","publication_year":2025,"publication_date":"2025-05-29","ids":{"openalex":"https://openalex.org/W4416608663","doi":"https://doi.org/10.48550/arxiv.2505.23013"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2505.23013","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.23013","pdf_url":"https://arxiv.org/pdf/2505.23013","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2505.23013","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113196540","display_name":"Liangkai Hang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Hang, Liangkai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050535359","display_name":"Junjie Yao","orcid":"https://orcid.org/0000-0003-4683-1494"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yao, Junjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025402450","display_name":"Zhiwei Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Zhiwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100783476","display_name":"Tianyi Chen","orcid":"https://orcid.org/0000-0003-3477-1439"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Tianyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058858848","display_name":"Yang Chen","orcid":"https://orcid.org/0000-0003-3935-8109"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Diao, Rongjie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Diao, Rongjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085065115","display_name":"Hezhou Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Hezhou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101345522","display_name":"Pengxiao Lin","orcid":"https://orcid.org/0009-0003-4926-8577"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Pengxiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100688549","display_name":"Zhiwei Wang","orcid":"https://orcid.org/0000-0003-4895-050X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhiwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100430968","display_name":"Cheng Xu","orcid":"https://orcid.org/0000-0001-8075-2867"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Cheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084678300","display_name":"Zhongwang Zhang","orcid":"https://orcid.org/0009-0006-4202-8556"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zhongwang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021783051","display_name":"Zhangchen Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Zhangchen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100390299","display_name":"Zhiyu Li","orcid":"https://orcid.org/0000-0003-1666-9115"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zhiyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Lin, Zehao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Zehao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100438001","display_name":"Kai Chen","orcid":"https://orcid.org/0000-0003-2587-6028"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Kai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090294171","display_name":"Feiyu Xiong","orcid":"https://orcid.org/0000-0002-1456-2202"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiong, Feiyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100680351","display_name":"Yaoyu Zhang","orcid":"https://orcid.org/0000-0003-2540-5314"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yaoyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064737794","display_name":"E Weinan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"E, Weinan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082412135","display_name":"Hongkang Yang","orcid":"https://orcid.org/0000-0003-4938-6445"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Hongkang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5002236438","display_name":"Zhi\u2010Qin John Xu","orcid":"https://orcid.org/0000-0003-0627-3520"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Zhi-Qin John","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":20,"corresponding_author_ids":["https://openalex.org/A5113196540"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3440000116825104,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3440000116825104,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.08860000222921371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.06949999928474426,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.8754000067710876},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.673799991607666},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5450999736785889},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.4950000047683716},{"id":"https://openalex.org/keywords/constant","display_name":"Constant (computer programming)","score":0.4555000066757202},{"id":"https://openalex.org/keywords/exponent","display_name":"Exponent","score":0.43459999561309814}],"concepts":[{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.8754000067710876},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.673799991607666},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6640999913215637},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5536999702453613},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5450999736785889},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.4950000047683716},{"id":"https://openalex.org/C2777027219","wikidata":"https://www.wikidata.org/wiki/Q1284190","display_name":"Constant (computer programming)","level":2,"score":0.4555000066757202},{"id":"https://openalex.org/C2780388253","wikidata":"https://www.wikidata.org/wiki/Q5421508","display_name":"Exponent","level":2,"score":0.43459999561309814},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40400001406669617},{"id":"https://openalex.org/C311688","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Time complexity","level":2,"score":0.40290001034736633},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.39430001378059387},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.3515999913215637},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3188999891281128},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3116999864578247},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.30079999566078186}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2505.23013","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.23013","pdf_url":"https://arxiv.org/pdf/2505.23013","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2505.23013","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2505.23013","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2505.23013","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.23013","pdf_url":"https://arxiv.org/pdf/2505.23013","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1339871232","display_name":null,"funder_award_id":"92270001","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G377228980","display_name":null,"funder_award_id":"12371511","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416608663.pdf","grobid_xml":"https://content.openalex.org/works/W4416608663.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"reasoning":[1],"ability":[2],"of":[3,49,69,81,95,124],"large":[4],"language":[5],"models":[6,71],"(LLMs)":[7],"has":[8],"been":[9],"rapidly":[10],"advancing":[11],"in":[12,17,104],"recent":[13],"years,":[14],"attracting":[15],"interest":[16],"more":[18],"fundamental":[19],"approaches":[20],"that":[21,30,88,113],"can":[22],"reliably":[23],"enhance":[24],"their":[25],"generalizability.":[26],"This":[27,59],"work":[28],"demonstrates":[29],"model":[31,54,106],"complexity":[32,78,114],"control,":[33],"conveniently":[34],"implementable":[35],"by":[36,64],"adjusting":[37],"the":[38,46,66,83,98,121],"initialization":[39,84,91],"rate":[40,92],"and":[41,56,107],"weight":[42],"decay":[43],"coefficient,":[44],"improves":[45],"scaling":[47,99],"law":[48,100],"LLMs":[50],"consistently":[51],"over":[52],"varying":[53],"sizes":[55],"data":[57,108],"sizes.":[58,109],"gain":[60],"is":[61,116],"further":[62],"illustrated":[63],"comparing":[65],"benchmark":[67],"performance":[68],"2.4B":[70],"pretrained":[72],"on":[73],"1T":[74],"tokens":[75],"with":[76],"different":[77],"hyperparameters.":[79],"Instead":[80],"fixing":[82],"std,":[85],"we":[86],"found":[87],"a":[89,117],"constant":[90],"(the":[93],"exponent":[94],"std)":[96],"enables":[97],"to":[101],"descend":[102],"faster":[103],"both":[105],"These":[110],"results":[111],"indicate":[112],"control":[115],"promising":[118],"direction":[119],"for":[120],"continual":[122],"advancement":[123],"LLMs.":[125]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
