{"id":"https://openalex.org/W4389983223","doi":"https://doi.org/10.48550/arxiv.2312.10547","title":"Advancing RAN Slicing with Offline Reinforcement Learning","display_name":"Advancing RAN Slicing with Offline Reinforcement Learning","publication_year":2023,"publication_date":"2023-12-16","ids":{"openalex":"https://openalex.org/W4389983223","doi":"https://doi.org/10.48550/arxiv.2312.10547"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2312.10547","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.10547","pdf_url":"https://arxiv.org/pdf/2312.10547","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2312.10547","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100435639","display_name":"Kun Yang","orcid":"https://orcid.org/0000-0002-6782-6689"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yang, Kun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032337158","display_name":"Shu\u2010ping Yeh","orcid":"https://orcid.org/0000-0001-5255-2681"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yeh, Shu-ping","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091343342","display_name":"Menglei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Menglei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114101923","display_name":"Jerry Sydir","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sydir, Jerry","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100780399","display_name":"Jing Yang","orcid":"https://orcid.org/0000-0002-6820-9156"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Jing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5016749653","display_name":"Cong Shen","orcid":"https://orcid.org/0000-0002-3148-4453"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Cong","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100435639"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12791","display_name":"Full-Duplex Wireless Communications","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12791","display_name":"Full-Duplex Wireless Communications","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8998162150382996},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8038552403450012},{"id":"https://openalex.org/keywords/slicing","display_name":"Slicing","score":0.6787248849868774},{"id":"https://openalex.org/keywords/radio-access-network","display_name":"Radio access network","score":0.6266640424728394},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.6258519887924194},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5860109329223633},{"id":"https://openalex.org/keywords/ran","display_name":"Ran","score":0.578575611114502},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5744185447692871},{"id":"https://openalex.org/keywords/online-and-offline","display_name":"Online and offline","score":0.45149916410446167},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4262961745262146},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27656418085098267},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.23625615239143372},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.15576747059822083},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.11650636792182922},{"id":"https://openalex.org/keywords/base-station","display_name":"Base station","score":0.10149228572845459}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8998162150382996},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8038552403450012},{"id":"https://openalex.org/C2776190703","wikidata":"https://www.wikidata.org/wiki/Q488148","display_name":"Slicing","level":2,"score":0.6787248849868774},{"id":"https://openalex.org/C106365562","wikidata":"https://www.wikidata.org/wiki/Q3078360","display_name":"Radio access network","level":4,"score":0.6266640424728394},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.6258519887924194},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5860109329223633},{"id":"https://openalex.org/C160704184","wikidata":"https://www.wikidata.org/wiki/Q18031028","display_name":"Ran","level":2,"score":0.578575611114502},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5744185447692871},{"id":"https://openalex.org/C2780102126","wikidata":"https://www.wikidata.org/wiki/Q10928179","display_name":"Online and offline","level":2,"score":0.45149916410446167},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4262961745262146},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27656418085098267},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.23625615239143372},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.15576747059822083},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.11650636792182922},{"id":"https://openalex.org/C68649174","wikidata":"https://www.wikidata.org/wiki/Q1379116","display_name":"Base station","level":2,"score":0.10149228572845459},{"id":"https://openalex.org/C207029474","wikidata":"https://www.wikidata.org/wiki/Q384018","display_name":"Mobile station","level":3,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2312.10547","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.10547","pdf_url":"https://arxiv.org/pdf/2312.10547","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2312.10547","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2312.10547","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2312.10547","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.10547","pdf_url":"https://arxiv.org/pdf/2312.10547","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4389983223.pdf","grobid_xml":"https://content.openalex.org/works/W4389983223.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3018338683","https://openalex.org/W3037103914","https://openalex.org/W2981227129","https://openalex.org/W4315630224","https://openalex.org/W2902151128","https://openalex.org/W4383173632","https://openalex.org/W104163691","https://openalex.org/W2436923341","https://openalex.org/W4381187802","https://openalex.org/W4294306393"],"abstract_inverted_index":{"Dynamic":[0],"radio":[1],"resource":[2],"management":[3],"(RRM)":[4],"in":[5,12,45,151,160],"wireless":[6],"networks":[7],"presents":[8],"significant":[9,89],"challenges,":[10],"particularly":[11],"the":[13,83,120,134,146],"context":[14],"of":[15,123,145,148],"Radio":[16],"Access":[17],"Network":[18],"(RAN)":[19],"slicing.":[20],"This":[21],"technology,":[22],"crucial":[23],"for":[24,136],"catering":[25],"to":[26,65,81,129,153],"varying":[27],"user":[28],"requirements,":[29,156],"often":[30],"grapples":[31],"with":[32],"complex":[33],"optimization":[34],"scenarios.":[35,164],"Existing":[36],"Reinforcement":[37],"Learning":[38],"(RL)":[39],"approaches,":[40],"while":[41],"achieving":[42],"good":[43],"performance":[44],"RAN":[46,84,162],"slicing,":[47],"typically":[48],"rely":[49],"on":[50],"online":[51],"algorithms":[52],"or":[53,63],"behavior":[54],"cloning.":[55],"These":[56],"methods":[57],"necessitate":[58],"either":[59],"continuous":[60],"environmental":[61,138],"interactions":[62],"access":[64],"high-quality":[66],"datasets,":[67,110],"hindering":[68],"their":[69],"practical":[70],"deployment.":[71],"Towards":[72],"addressing":[73],"these":[74],"limitations,":[75],"this":[76],"paper":[77],"introduces":[78],"offline":[79,101,124,149],"RL":[80,102,150],"solving":[82],"slicing":[85,163],"problem,":[86],"marking":[87],"a":[88,111],"shift":[90],"towards":[91],"more":[92],"feasible":[93],"and":[94],"adaptive":[95],"RRM":[96],"methods.":[97],"We":[98],"demonstrate":[99],"how":[100],"can":[103],"effectively":[104],"learn":[105],"near-optimal":[106],"policies":[107],"from":[108],"sub-optimal":[109],"notable":[112],"advancement":[113],"over":[114],"existing":[115],"practices.":[116],"Our":[117],"research":[118],"highlights":[119],"inherent":[121],"flexibility":[122],"RL,":[125],"showcasing":[126],"its":[127,158],"ability":[128],"adjust":[130],"policy":[131],"criteria":[132],"without":[133],"need":[135],"additional":[137],"interactions.":[139],"Furthermore,":[140],"we":[141],"present":[142],"empirical":[143],"evidence":[144],"efficacy":[147],"adapting":[152],"various":[154],"service-level":[155],"illustrating":[157],"potential":[159],"diverse":[161]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
