{"id":"https://openalex.org/W4392933178","doi":"https://doi.org/10.48550/arxiv.2403.10290","title":"Offline Goal-Conditioned Reinforcement Learning for Shape Control of Deformable Linear Objects","display_name":"Offline Goal-Conditioned Reinforcement Learning for Shape Control of Deformable Linear Objects","publication_year":2024,"publication_date":"2024-03-15","ids":{"openalex":"https://openalex.org/W4392933178","doi":"https://doi.org/10.48550/arxiv.2403.10290"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2403.10290","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.10290","pdf_url":"https://arxiv.org/pdf/2403.10290","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2403.10290","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013485773","display_name":"Rita Laezza","orcid":"https://orcid.org/0000-0003-3791-065X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Laezza, Rita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063622879","display_name":"Mohammadreza Shetab-Bushehri","orcid":"https://orcid.org/0000-0003-3243-3305"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shetab-Bushehri, Mohammadreza","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017806461","display_name":"Gabriel Arslan Waltersson","orcid":"https://orcid.org/0000-0001-6775-0584"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Waltersson, Gabriel Arslan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102824837","display_name":"Erol \u00d6zg\u00fcr","orcid":"https://orcid.org/0000-0001-5946-1213"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"\u00d6zg\u00fcr, Erol","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048178604","display_name":"Youcef Mezouar","orcid":"https://orcid.org/0000-0001-8138-3928"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mezouar, Youcef","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5066684950","display_name":"Yiannis Karayiannidis","orcid":"https://orcid.org/0000-0001-5129-342X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Karayiannidis, Yiannis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5013485773"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11245","display_name":"Advanced Numerical Analysis Techniques","score":0.8659999966621399,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11245","display_name":"Advanced Numerical Analysis Techniques","score":0.8659999966621399,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.8424000144004822,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11115","display_name":"Topology Optimization in Engineering","score":0.8141000270843506,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6639262437820435},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.6019135117530823},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4872090220451355},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.47819140553474426},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36909788846969604},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2937259078025818},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.07915270328521729}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6639262437820435},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.6019135117530823},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4872090220451355},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.47819140553474426},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36909788846969604},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2937259078025818},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.07915270328521729}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2403.10290","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.10290","pdf_url":"https://arxiv.org/pdf/2403.10290","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2403.10290","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2403.10290","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2403.10290","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.10290","pdf_url":"https://arxiv.org/pdf/2403.10290","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6294219032","display_name":null,"funder_award_id":"869855","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8869864247","display_name":null,"funder_award_id":"2022-06725","funder_id":"https://openalex.org/F4320322581","funder_display_name":"Vetenskapsr\u00e5det"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320322327","display_name":"Knut och Alice Wallenbergs Stiftelse","ror":"https://ror.org/004hzzk67"},{"id":"https://openalex.org/F4320322581","display_name":"Vetenskapsr\u00e5det","ror":"https://ror.org/03zttf063"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291"],"abstract_inverted_index":{"Deformable":[0,76],"objects":[1],"present":[2],"several":[3],"challenges":[4],"to":[5,22,33,67,111,113,115,126,135,149,176],"the":[6,13,18,82,128,139,144,151,156,164,171],"field":[7],"of":[8,12,74,84,130,146,158],"robotic":[9],"manipulation.":[10],"One":[11],"tasks":[14,54],"that":[15,170],"best":[16,152],"encapsulates":[17],"difficulties":[19],"arising":[20],"due":[21],"non-rigid":[23],"behavior":[24,161],"is":[25,174],"shape":[26,71],"control,":[27],"which":[28,133],"requires":[29],"driving":[30],"an":[31,61,96],"object":[32],"a":[34,69,75,92,104,178,182],"desired":[35],"shape.":[36],"While":[37],"shape-servoing":[38,179],"methods":[39],"have":[40],"been":[41],"shown":[42],"successful":[43],"in":[44,53,181],"contexts":[45],"with":[46,55,138],"approximately":[47],"linear":[48],"behavior,":[49],"they":[50],"can":[51],"fail":[52],"more":[56],"complex":[57],"dynamics.":[58],"We":[59,99,142],"investigate":[60],"alternative":[62],"approach,":[63],"using":[64],"offline":[65,106],"RL":[66,107],"solve":[68],"planar":[70],"control":[72],"problem":[73],"Linear":[77],"Object":[78],"(DLO).":[79],"To":[80],"evaluate":[81,143],"effect":[83,157],"material":[85],"properties,":[86],"two":[87],"DLOs":[88],"are":[89,124],"tested":[90],"namely":[91],"soft":[93],"rope":[94],"and":[95,109,121,154],"elastic":[97],"cord.":[98],"frame":[100],"this":[101],"task":[102],"as":[103],"goal-conditioned":[105],"problem,":[108],"aim":[110],"learn":[112],"generalize":[114],"unseen":[116],"goal":[117],"shapes.":[118],"Data":[119],"collection":[120],"augmentation":[122,147],"procedures":[123],"proposed":[125,172],"limit":[127],"amount":[129,145],"experimental":[131],"data":[132],"needs":[134],"be":[136],"collected":[137],"real":[140],"robot.":[141],"needed":[148],"achieve":[150],"results,":[153],"test":[155],"regularization":[159],"through":[160],"cloning":[162],"on":[163],"TD3+BC":[165],"algorithm.":[166],"Finally,":[167],"we":[168],"show":[169],"approach":[173],"able":[175],"outperform":[177],"baseline":[180],"curvature":[183],"inversion":[184],"experiment.":[185]},"counts_by_year":[],"updated_date":"2026-05-08T15:41:06.802602","created_date":"2025-10-10T00:00:00"}
