{"id":"https://openalex.org/W4403928605","doi":"https://doi.org/10.48550/arxiv.2409.19745","title":"PEAR: Position-Embedding-Agnostic Attention Re-weighting Enhances Retrieval-Augmented Generation with Zero Inference Overhead","display_name":"PEAR: Position-Embedding-Agnostic Attention Re-weighting Enhances Retrieval-Augmented Generation with Zero Inference Overhead","publication_year":2024,"publication_date":"2024-09-29","ids":{"openalex":"https://openalex.org/W4403928605","doi":"https://doi.org/10.48550/arxiv.2409.19745"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2409.19745","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.19745","pdf_url":"https://arxiv.org/pdf/2409.19745","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2409.19745","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101628586","display_name":"Tao Tan","orcid":"https://orcid.org/0000-0002-5573-1105"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tan, Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027496845","display_name":"Yining Qian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Yining","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102818141","display_name":"Ang Lv","orcid":"https://orcid.org/0000-0002-8027-2270"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lv, Ang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078451082","display_name":"Hongzhan Lin","orcid":"https://orcid.org/0000-0002-4111-8334"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Hongzhan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008052971","display_name":"Songhao Wu","orcid":"https://orcid.org/0009-0007-2736-206X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Songhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100616757","display_name":"Yongbo Wang","orcid":"https://orcid.org/0000-0001-8424-0527"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yongbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115695115","display_name":"Feng Wang","orcid":"https://orcid.org/0000-0003-3036-6735"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Feng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066199440","display_name":"Jingtong Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Jingtong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051310672","display_name":"Xin Lu","orcid":"https://orcid.org/0000-0001-6470-8022"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5083150735","display_name":"Rui-Jun Yan","orcid":"https://orcid.org/0000-0001-6362-6340"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Rui","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5101628586"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9855999946594238,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.96670001745224,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7386342287063599},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6526381969451904},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6106144785881042},{"id":"https://openalex.org/keywords/zero","display_name":"Zero (linguistics)","score":0.5571766495704651},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.5481763482093811},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5220665335655212},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.4327007532119751},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4269874095916748},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3341570794582367},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.08265763521194458},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.04684045910835266}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7386342287063599},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6526381969451904},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6106144785881042},{"id":"https://openalex.org/C2780813799","wikidata":"https://www.wikidata.org/wiki/Q3274237","display_name":"Zero (linguistics)","level":2,"score":0.5571766495704651},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.5481763482093811},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5220665335655212},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.4327007532119751},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4269874095916748},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3341570794582367},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.08265763521194458},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.04684045910835266},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2409.19745","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.19745","pdf_url":"https://arxiv.org/pdf/2409.19745","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2409.19745","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2409.19745","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2409.19745","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.19745","pdf_url":"https://arxiv.org/pdf/2409.19745","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2180954594","https://openalex.org/W2052835778","https://openalex.org/W2049003611","https://openalex.org/W2127804977","https://openalex.org/W2108418243","https://openalex.org/W164103134","https://openalex.org/W2040545019","https://openalex.org/W2787352659","https://openalex.org/W1970611213","https://openalex.org/W4206560911"],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"enhanced":[4],"with":[5,70,108],"retrieval-augmented":[6],"generation":[7],"(RAG)":[8],"have":[9],"introduced":[10],"a":[11,76,130],"new":[12],"paradigm":[13],"for":[14],"web":[15],"search.":[16],"However,":[17],"the":[18,65,89,99,126,132,151,162],"limited":[19],"context":[20,34,66,81,91],"awareness":[21,35,67,92],"of":[22,68,101,161,186,208],"LLMs":[23,69],"degrades":[24],"their":[25,106,143],"performance":[26],"on":[27,75,80,125],"RAG":[28,95,147,202],"tasks.":[29,203],"Existing":[30],"methods":[31],"to":[32,50,122,136,145,156],"enhance":[33],"are":[36,48,134,154],"often":[37],"inefficient,":[38],"incurring":[39],"time":[40],"or":[41,189],"memory":[42,187],"overhead":[43,183],"during":[44],"inference,":[45,150],"and":[46,198],"many":[47],"tailored":[49],"specific":[51,163],"position":[52,209],"embeddings.":[53],"In":[54],"this":[55],"paper,":[56],"we":[57,83,104],"propose":[58],"Position-Embedding-Agnostic":[59],"attention":[60],"Re-weighting":[61],"(PEAR),":[62],"which":[63,87],"enhances":[64],"zero":[71,180],"inference":[72,182,190],"overhead.":[73],"Specifically,":[74],"proxy":[77,127],"task":[78,164],"focused":[79],"copying,":[82],"first":[84],"detect":[85],"heads":[86],"suppress":[88,146],"models'":[90],"thereby":[93,141],"diminishing":[94],"performance.":[96,148],"To":[97],"weaken":[98],"impact":[100],"these":[102,120,158],"heads,":[103,159],"re-weight":[105,157],"outputs":[107],"learnable":[109],"coefficients.":[110],"The":[111],"LLM":[112],"(with":[113],"frozen":[114],"parameters)":[115],"is":[116,206],"optimized":[117,135,152],"by":[118],"adjusting":[119],"coefficients":[121,133,153],"minimize":[123],"loss":[124],"task.":[128],"As":[129],"result,":[131],"values":[137],"less":[138],"than":[139],"one,":[140],"reducing":[142],"tendency":[144],"During":[149],"fixed":[155],"regardless":[160],"at":[165],"hand.":[166],"Our":[167],"proposed":[168],"PEAR":[169],"offers":[170],"two":[171],"major":[172],"advantages":[173],"over":[174],"previous":[175],"approaches:":[176],"(1)":[177],"It":[178,205],"introduces":[179],"additional":[181],"in":[184,196],"terms":[185],"usage":[188],"time,":[191],"while":[192],"outperforming":[193],"competitive":[194],"baselines":[195],"accuracy":[197],"efficiency":[199],"across":[200],"various":[201],"(2)":[204],"independent":[207],"embedding":[210],"algorithms,":[211],"ensuring":[212],"broader":[213],"applicability.":[214]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2024-11-01T00:00:00"}
