{"id":"https://openalex.org/W7083825230","doi":"https://doi.org/10.48550/arxiv.2509.24101","title":"BTC-SAM: Leveraging LLMs for Generation of Bias Test Cases for Sentiment Analysis Models","display_name":"BTC-SAM: Leveraging LLMs for Generation of Bias Test Cases for Sentiment Analysis Models","publication_year":2025,"publication_date":"2025-09-28","ids":{"openalex":"https://openalex.org/W7083825230","doi":"https://doi.org/10.48550/arxiv.2509.24101"},"language":"en","primary_location":{"id":"doi:10.48550/arxiv.2509.24101","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.24101","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2509.24101","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Kardkovacs, Zsolt T.","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kardkovacs, Zsolt T.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Djennane, Lynda","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Djennane, Lynda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Field, Anna","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Field, Anna","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Benatallah, Boualem","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Benatallah, Boualem","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Gaci, Yacine","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gaci, Yacine","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Casati, Fabio","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Casati, Fabio","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Gaaloul, Walid","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gaaloul, Walid","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T13001","display_name":"Restraint-Related Deaths","score":0.6223000288009644,"subfield":{"id":"https://openalex.org/subfields/2711","display_name":"Emergency Medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T13001","display_name":"Restraint-Related Deaths","score":0.6223000288009644,"subfield":{"id":"https://openalex.org/subfields/2711","display_name":"Emergency Medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T14106","display_name":"Environmental and Sediment Control","score":0.09870000183582306,"subfield":{"id":"https://openalex.org/subfields/2308","display_name":"Management, Monitoring, Policy and Law"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10376","display_name":"Suicide and Self-Harm Studies","score":0.08340000361204147,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.6118000149726868},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.5497000217437744},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4814000129699707},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.4388999938964844},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4032999873161316},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.3409000039100647}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6258999705314636},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.6118000149726868},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.5497000217437744},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.527999997138977},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5270000100135803},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4814000129699707},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45320001244544983},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.4388999938964844},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4032999873161316},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.35749998688697815},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.3409000039100647},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.32760000228881836},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.3125},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.303600013256073},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.27799999713897705},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26899999380111694},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.26089999079704285},{"id":"https://openalex.org/C2983427547","wikidata":"https://www.wikidata.org/wiki/Q93200","display_name":"Gender bias","level":2,"score":0.25920000672340393},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2509.24101","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.24101","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2509.24101","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.24101","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6403284668922424}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Sentiment":[0],"Analysis":[1],"(SA)":[2],"models":[3,25,92],"harbor":[4],"inherent":[5],"social":[6],"biases":[7,16],"that":[8,28,48,111],"can":[9,115],"be":[10],"harmful":[11],"in":[12,31,90,122],"real-world":[13],"applications.":[14],"These":[15],"are":[17],"identified":[18],"by":[19],"examining":[20],"the":[21,32,36,53,102,123],"output":[22],"of":[23,35,46,63,105],"SA":[24,91],"for":[26,87,101,137],"sentences":[27,47],"only":[29],"vary":[30],"identity":[33],"groups":[34],"subjects.":[37],"Constructing":[38],"natural,":[39],"linguistically":[40],"rich,":[41],"relevant,":[42],"and":[43,120],"diverse":[44],"sets":[45],"provide":[49,116],"sufficient":[50],"coverage":[51,130],"over":[52],"domain":[54,67],"is":[55],"expensive,":[56],"especially":[57],"when":[58],"addressing":[59],"a":[60,76],"wide":[61],"range":[62],"biases:":[64],"it":[65],"requires":[66],"experts":[68],"and/or":[69],"crowd-sourcing.":[70],"In":[71],"this":[72],"paper,":[73],"we":[74],"present":[75],"novel":[77],"bias":[78,88],"testing":[79,89],"framework,":[80],"BTC-SAM,":[81],"which":[82],"generates":[83],"high-quality":[84],"test":[85,106,124,129],"cases":[86],"with":[93],"minimal":[94],"specification":[95],"using":[96],"Large":[97],"Language":[98],"Models":[99],"(LLMs)":[100],"controllable":[103],"generation":[104],"sentences.":[107],"Our":[108],"experiments":[109],"show":[110],"relying":[112],"on":[113],"LLMs":[114],"high":[117],"linguistic":[118],"variation":[119],"diversity":[121],"sentences,":[125],"thereby":[126],"offering":[127],"better":[128],"compared":[131],"to":[132],"base":[133],"prompting":[134],"methods":[135],"even":[136],"previously":[138],"unseen":[139],"biases.":[140]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
