{"id":"https://openalex.org/W1929309940","doi":"https://doi.org/10.1609/aaai.v27i1.8546","title":"Data-Efficient Generalization of Robot Skills with Contextual Policy Search","display_name":"Data-Efficient Generalization of Robot Skills with Contextual Policy Search","publication_year":2013,"publication_date":"2013-06-29","ids":{"openalex":"https://openalex.org/W1929309940","doi":"https://doi.org/10.1609/aaai.v27i1.8546","mag":"1929309940"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v27i1.8546","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v27i1.8546","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/8546/8405","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/8546/8405","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014691067","display_name":"Andras Kupcsik","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Andras Kupcsik","raw_affiliation_strings":["National University of Singapore","Dept. of Electrical & Computer Engineering National University of Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"Dept. of Electrical & Computer Engineering National University of Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001763022","display_name":"Marc Peter Deisenroth","orcid":"https://orcid.org/0000-0003-1503-680X"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marc Deisenroth","raw_affiliation_strings":["Technische Universit\u00e4t Darmstadt","Intelligent Autonomous Systems Lab, Technische Unversit\u00e4t Darmstadt#TAB#"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Darmstadt","institution_ids":["https://openalex.org/I31512782"]},{"raw_affiliation_string":"Intelligent Autonomous Systems Lab, Technische Unversit\u00e4t Darmstadt#TAB#","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071367253","display_name":"Jan Peters","orcid":"https://orcid.org/0000-0002-5266-8091"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jan Peters","raw_affiliation_strings":["Technische Universit\u00e4t Darmstadt","Intelligent Autonomous Systems Lab, Technische Unversit\u00e4t Darmstadt#TAB#"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Darmstadt","institution_ids":["https://openalex.org/I31512782"]},{"raw_affiliation_string":"Intelligent Autonomous Systems Lab, Technische Unversit\u00e4t Darmstadt#TAB#","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110467801","display_name":"Gerhard Neumann","orcid":"https://orcid.org/0000-0002-5483-4225"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gerhard Neumann","raw_affiliation_strings":["Technische Universit\u00e4t Darmstadt","Intelligent Autonomous Systems Lab, Technische Unversit\u00e4t Darmstadt#TAB#"],"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Darmstadt","institution_ids":["https://openalex.org/I31512782"]},{"raw_affiliation_string":"Intelligent Autonomous Systems Lab, Technische Unversit\u00e4t Darmstadt#TAB#","institution_ids":["https://openalex.org/I31512782"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5014691067"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":11.6324,"has_fulltext":true,"cited_by_count":91,"citation_normalized_percentile":{"value":0.98770177,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"27","issue":"1","first_page":"1401","last_page":"1407"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6915207505226135},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.690563976764679},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6880786418914795},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.6489987969398499},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6481649875640869},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6451987028121948},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6365375518798828},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.553298830986023},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5402881503105164},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5031773447990417},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1279301643371582},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09764325618743896}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6915207505226135},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.690563976764679},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6880786418914795},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.6489987969398499},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6481649875640869},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6451987028121948},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6365375518798828},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.553298830986023},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5402881503105164},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5031773447990417},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1279301643371582},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09764325618743896},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1609/aaai.v27i1.8546","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v27i1.8546","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/8546/8405","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:eprints.lincoln.ac.uk:25777","is_oa":true,"landing_page_url":null,"pdf_url":"http://eprints.lincoln.ac.uk/id/eprint/25777/1/Kupcsik_AAAI_2013.pdf","source":{"id":"https://openalex.org/S4377196275","display_name":"Lincoln Repository (University of Lincoln)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I51532219","host_organization_name":"University of Lincoln","host_organization_lineage":["https://openalex.org/I51532219"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"},{"id":"pmh:oai:spiral.imperial.ac.uk:10044/1/12278","is_oa":true,"landing_page_url":"http://www.aaai.org/Press/Proceedings/aaai13.php","pdf_url":"http://hdl.handle.net/10044/1/12278","source":{"id":"https://openalex.org/S4306401396","display_name":"Spiral (Imperial College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I47508984","host_organization_name":"Imperial College London","host_organization_lineage":["https://openalex.org/I47508984"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"27th AAAI Conference","raw_type":"Conference Paper"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.369.5227","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.369.5227","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.ias.informatik.tu-darmstadt.de/uploads/Publications/Kupcsik_AAAI_2013.pdf","raw_type":"text"},{"id":"pmh:oai:escidoc.org:escidoc:1910025","is_oa":false,"landing_page_url":"http://hdl.handle.net/11858/00-001M-0000-0015-3AA0-7","pdf_url":null,"source":{"id":"https://openalex.org/S7407052962","display_name":"Max Planck Digital Library","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferenceObject"},{"id":"pmh:oai:figshare.com:article/24361288","is_oa":true,"landing_page_url":"https://figshare.com/articles/journal_contribution/Data-efficient_generalization_of_robot_skills_with_contextual_policy_search/24361288","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1609/aaai.v27i1.8546","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v27i1.8546","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/8546/8405","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1929309940.pdf","grobid_xml":"https://content.openalex.org/works/W1929309940.grobid-xml"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W1499669280","https://openalex.org/W1520597402","https://openalex.org/W1746819321","https://openalex.org/W1952489873","https://openalex.org/W1982803779","https://openalex.org/W2012392077","https://openalex.org/W2016765487","https://openalex.org/W2042882799","https://openalex.org/W2099768828","https://openalex.org/W2111967991","https://openalex.org/W2117629901","https://openalex.org/W2119717200","https://openalex.org/W2123967136","https://openalex.org/W2125612430","https://openalex.org/W2130105540","https://openalex.org/W2132602063","https://openalex.org/W2139053308","https://openalex.org/W2139769245","https://openalex.org/W2140135625","https://openalex.org/W2149860990","https://openalex.org/W2211399972","https://openalex.org/W2554830522","https://openalex.org/W2591436094","https://openalex.org/W3103503690","https://openalex.org/W4211049957","https://openalex.org/W4230563027","https://openalex.org/W4237733001","https://openalex.org/W6629804754","https://openalex.org/W6629881138","https://openalex.org/W6640954454","https://openalex.org/W6646105485","https://openalex.org/W6653435097","https://openalex.org/W6674989108","https://openalex.org/W6676560026"],"related_works":["https://openalex.org/W4233452137","https://openalex.org/W2961085424","https://openalex.org/W4290792893","https://openalex.org/W4254857216","https://openalex.org/W405964254","https://openalex.org/W2045758229","https://openalex.org/W4231626925","https://openalex.org/W2962829499","https://openalex.org/W2398963826","https://openalex.org/W2263237444"],"abstract_inverted_index":{"In":[0],"robotics,":[1],"controllers":[2],"make":[3],"the":[4,17,20,26,37,54,88,105,147],"robot":[5,21,55,89],"solve":[6],"a":[7,10,44,57,113,153],"task":[8,33],"within":[9],"specific":[11],"context.":[12],"The":[13],"context":[14,59],"can":[15,120],"describe":[16],"objectives":[18],"of":[19,25,85,87,107],"or":[22],"physical":[23],"properties":[24],"environment":[27],"and":[28,60,165],"is":[29,128],"always":[30],"specified":[31],"before":[32],"execution.":[34],"To":[35],"generalize":[36],"controller":[38],"to":[39,145,160],"multiple":[40],"contexts,":[41],"we":[42,141],"follow":[43],"hierarchical":[45,109],"approach":[46,118,127],"for":[47,56,69,135],"policy":[48,52,63,78,95,116],"learning:":[49],"A":[50],"lower-level":[51],"controls":[53],"given":[58],"an":[61,82],"upper-level":[62,72,124,148],"generalizes":[64],"among":[65],"contexts.":[66],"Current":[67],"approaches":[68,97],"learning":[70,108,131,157],"such":[71],"policies":[73],"are":[74,98],"based":[75,100,129],"on":[76,130,163],"model-free":[77],"search,":[79],"which":[80],"require":[81],"excessive":[83],"number":[84],"interactions":[86],"with":[90],"its":[91],"environment.":[92],"More":[93],"data-efficient":[94],"search":[96,117],"model":[99],"but,":[101],"thus":[102],"far,":[103],"without":[104],"capability":[106],"policies.":[110,125],"We":[111],"propose":[112],"new":[114],"model-based":[115],"that":[119],"also":[121],"learn":[122],"contextual":[123],"Our":[126,150],"probabilistic":[132],"forward":[133],"models":[134],"long-term":[136],"predictions.":[137],"Using":[138],"these":[139],"predictions,":[140],"use":[142],"information-theoretic":[143],"insights":[144],"improve":[146],"policy.":[149],"method":[151],"achieves":[152],"substantial":[154],"improvement":[155],"in":[156],"speed":[158],"compared":[159],"existing":[161],"methods":[162],"simulated":[164],"real":[166],"robotic":[167],"tasks.":[168]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":14},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":9},{"year":2016,"cited_by_count":12},{"year":2015,"cited_by_count":11},{"year":2014,"cited_by_count":10},{"year":2013,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
