{"id":"https://openalex.org/W4313447760","doi":"https://doi.org/10.48550/arxiv.2212.14883","title":"Online Statistical Inference for Contextual Bandits via Stochastic Gradient Descent","display_name":"Online Statistical Inference for Contextual Bandits via Stochastic Gradient Descent","publication_year":2022,"publication_date":"2022-12-30","ids":{"openalex":"https://openalex.org/W4313447760","doi":"https://doi.org/10.48550/arxiv.2212.14883"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2212.14883","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.14883","pdf_url":"https://arxiv.org/pdf/2212.14883","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2212.14883","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Chang, Xiangyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chang, Xiangyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100329997","display_name":"Xi Chen","orcid":"https://orcid.org/0000-0002-9049-9452"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Xi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082916568","display_name":"Zehua Lai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lai, Zehua","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100317919","display_name":"Li He","orcid":"https://orcid.org/0000-0003-4729-0415"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, He","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liu, Zhihong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zhihong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100341419","display_name":"Yichen Zhang","orcid":"https://orcid.org/0000-0002-6925-0775"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yichen","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12879","display_name":"Distributed Sensor Networks and Detection Algorithms","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.6819646954536438},{"id":"https://openalex.org/keywords/statistical-inference","display_name":"Statistical inference","score":0.6383125185966492},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.6200023293495178},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.6035553812980652},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5812689661979675},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5032727122306824},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4934948682785034},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.46390292048454285},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.44585609436035156},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.43970930576324463},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.415894478559494},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24574270844459534},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.17968440055847168},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.13317853212356567}],"concepts":[{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.6819646954536438},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.6383125185966492},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.6200023293495178},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.6035553812980652},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5812689661979675},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5032727122306824},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4934948682785034},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.46390292048454285},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.44585609436035156},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.43970930576324463},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.415894478559494},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24574270844459534},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.17968440055847168},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.13317853212356567},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2212.14883","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.14883","pdf_url":"https://arxiv.org/pdf/2212.14883","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:doi:10.6084/m9.figshare.31211937","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Dataset"},{"id":"doi:10.48550/arxiv.2212.14883","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2212.14883","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2212.14883","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.14883","pdf_url":"https://arxiv.org/pdf/2212.14883","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.8199999928474426,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W137830373","https://openalex.org/W3000984192","https://openalex.org/W4206903459","https://openalex.org/W2754816816","https://openalex.org/W4366280654","https://openalex.org/W3160167280","https://openalex.org/W4231621013","https://openalex.org/W4362706668","https://openalex.org/W3008318776","https://openalex.org/W2041416246"],"abstract_inverted_index":{"With":[0],"the":[1,8,27,71,76,80,88,92,108,121,127,131,145],"fast":[2],"development":[3],"of":[4,31,39,70,79,120],"big":[5],"data,":[6],"learning":[7],"optimal":[9],"decision":[10,58],"rule":[11],"by":[12],"recursively":[13],"updating":[14],"it":[15],"and":[16,50,74,124],"making":[17],"online":[18,28,49],"decisions":[19],"has":[20],"been":[21],"easier":[22],"than":[23],"before.":[24],"We":[25,42,65,101,115],"study":[26],"statistical":[29],"inference":[30],"model":[32],"parameters":[33],"in":[34,110,130],"a":[35,44,111,117,135],"contextual":[36],"bandit":[37],"framework":[38,46],"sequential":[40],"decision-making.":[41],"propose":[43],"general":[45],"for":[47],"an":[48,104],"adaptive":[51,146],"data":[52,147],"collection":[53],"environment":[54],"that":[55,126],"can":[56],"update":[57],"rules":[59],"via":[60,97],"weighted":[61],"stochastic":[62,72],"gradient":[63,73],"descent.":[64],"allow":[66],"different":[67],"weighting":[68],"schemes":[69],"establish":[75],"asymptotic":[77,89],"normality":[78],"parameter":[81],"estimator.":[82],"Our":[83],"proposed":[84,122],"estimator":[85,123],"significantly":[86],"improves":[87],"efficiency":[90],"over":[91],"previous":[93],"averaged":[94],"SGD":[95,142],"approach":[96],"inverse":[98],"probability":[99],"weights.":[100],"also":[102],"conduct":[103],"optimality":[105],"analysis":[106],"on":[107],"weights":[109],"linear":[112],"regression":[113],"setting.":[114],"provide":[116],"Bahadur":[118,132],"representation":[119,133],"show":[125],"remainder":[128],"term":[129],"entails":[134],"slower":[136],"convergence":[137],"rate":[138],"compared":[139],"to":[140,144],"classical":[141],"due":[143],"collection.":[148]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
