{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,2]],"date-time":"2025-08-02T16:51:25Z","timestamp":1754153485737,"version":"3.41.2"},"reference-count":50,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T00:00:00Z","timestamp":1750204800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T00:00:00Z","timestamp":1750204800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100008899","name":"University of South Carolina","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100008899","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,6,18]]},"DOI":"10.1109\/ichi64645.2025.00049","type":"proceedings-article","created":{"date-parts":[[2025,7,22]],"date-time":"2025-07-22T18:00:50Z","timestamp":1753207250000},"page":"251-260","source":"Crossref","is-referenced-by-count":0,"title":["Automated Reddit Data Annotation with Large Language Models"],"prefix":"10.1109","author":[{"given":"Sai","family":"Vuruma","sequence":"first","affiliation":[{"name":"University of South Carolina,HI3 Tech Lab,Columbia,SC,USA"}]},{"given":"Dezhi","family":"Wu","sequence":"additional","affiliation":[{"name":"University of South Carolina,HI3 Tech Lab,Columbia,SC,USA"}]},{"given":"Saborny Sen","family":"Gupta","sequence":"additional","affiliation":[{"name":"University of South Carolina,HI3 Tech Lab,Columbia,SC,USA"}]},{"given":"Lucas","family":"Aust","sequence":"additional","affiliation":[{"name":"University of South Carolina,HI3 Tech Lab,Columbia,SC,USA"}]},{"given":"Valerie","family":"Lookingbill","sequence":"additional","affiliation":[{"name":"University of South Carolina,HI3 Tech Lab,Columbia,SC,USA"}]},{"given":"Wyatt","family":"Bellamy","sequence":"additional","affiliation":[{"name":"University of South Carolina,HI3 Tech Lab,Columbia,SC,USA"}]},{"given":"Yang","family":"Ren","sequence":"additional","affiliation":[{"name":"University of South Carolina,HI3 Tech Lab,Columbia,SC,USA"}]},{"given":"Erin","family":"Kasson","sequence":"additional","affiliation":[{"name":"Washington University,School of Medicine,St. Louis,MO,USA"}]},{"given":"Li-Shiun","family":"Chen","sequence":"additional","affiliation":[{"name":"Washington University,School of Medicine,St. Louis,MO,USA"}]},{"given":"Patricia","family":"Cavazos-Rehg","sequence":"additional","affiliation":[{"name":"Washington University,School of Medicine,St. Louis,MO,USA"}]},{"given":"Dian","family":"Hu","sequence":"additional","affiliation":[{"name":"University of Texas Health Science Center at Houston,MacWilliam School of Biomedical Informatics,Houston,TX,USA"}]},{"given":"Hongfang","family":"Liu","sequence":"additional","affiliation":[{"name":"University of Texas Health Science Center at Houston,MacWilliam School of Biomedical Informatics,Houston,TX,USA"}]},{"given":"Ming","family":"Huang","sequence":"additional","affiliation":[{"name":"University of Texas Health Science Center at Houston,MacWilliam School of Biomedical Informatics,Houston,TX,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.2196\/55177"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1542\/peds.2021-050164"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1177\/1179173X20945695"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.drugalcdep.2020.107886"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1136\/tobaccocontrol-2018-054432"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/j.pmedr.2017.02.026"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.2196\/28303"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1001\/jamapediatrics.2020.2348"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.2196\/13673"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.2196\/39460"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijmedinf.2021.104574"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1609\/icwsm.v8i1.14526"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1080\/08934215.2019.1607516"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijmedinf.2020.104223"},{"key":"ref15","article-title":"Gpt-4 as a twitter data annotator: Unraveling its performance on a stance classification task","author":"Liyanage","year":"2023","journal-title":"Authorea Preprints"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3639233.3639353"},{"article-title":"Chatgpt-4 outperforms experts and crowd workers in annotating political twitter messages with zero-shot learning","year":"2023","author":"T\u00f6rnberg","key":"ref17"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-emnlp.637"},{"key":"ref19","first-page":"1877","article-title":"Language models are few-shot learners","volume":"33","author":"Brown","year":"2020","journal-title":"Advances in neural information processing systems"},{"article-title":"Gpt-4 technical report","year":"2023","author":"Achiam","key":"ref20"},{"key":"ref21","first-page":"232","article-title":"Using large language models (llms) to extract evidence from pre-annotated social media data","volume-title":"Proceedings of the 9th Workshop on Computational Linguistics and Clinical Psychology (CLPsych 2024)","author":"Alhamed"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3543873.3587605"},{"article-title":"Automated annotation with generative ai requires validation","year":"2023","author":"Pangakis","key":"ref23"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3543873.3587368"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3594536.3595161"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.2196\/52499"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.626"},{"article-title":"From humans to machines: can chatgpt-like llms effectively replace human annotators in nlp tasks","volume-title":"Workshop Proceedings of the 17th International AAAI Conference on Web and Social Media","author":"Thapa","key":"ref28"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1098\/rsta.2023.0254"},{"key":"ref30","article-title":"NLTK sentence tokenizer"},{"key":"ref31","first-page":"2","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","volume-title":"Proceedings of naacL-HLT","volume":"1","author":"Kenton"},{"article-title":"Attention is all you need","year":"2023","author":"Vaswani","key":"ref32"},{"key":"ref33","first-page":"1746","article-title":"Convolutional neural networks for sentence classification","volume-title":"Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)","author":"Kim"},{"key":"ref34","doi-asserted-by":"crossref","DOI":"10.3115\/v1\/P14-1062","article-title":"A convolutional neural network for modelling sentences","author":"Kalchbrenner","year":"2014"},{"article-title":"A sensitivity analysis of (and practitioners\u2019 guide to) convolutional neural networks for sentence classification","year":"2016","author":"Zhang","key":"ref35"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/bfb0026683"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-34747-9_18"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1088\/1757-899X\/1098\/5\/052081"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICAICA50127.2020.9182555"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TR.2021.3087864"},{"article-title":"Gemini 1.5: Unlocking multimodal understanding across millions of tokens of context","year":"2024","author":"Reid","key":"ref41"},{"article-title":"Gemma 2: Improving open language models at a practical size","year":"2024","author":"Riviere","key":"ref42"},{"article-title":"Phi-3 technical report: A highly capable language model locally on your phone","year":"2024","author":"Abdin","key":"ref43"},{"article-title":"The llama 3 herd of models","year":"2024","author":"Dubey","key":"ref44"},{"article-title":"How well does gpt-4v (ision) adapt to distribution shifts? a preliminary investigation","year":"2023","author":"Han","key":"ref45"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW63382.2024.00780"},{"article-title":"Chain-of-thought prompting elicits reasoning in large language models","year":"2023","author":"Wei","key":"ref47"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1037\/10248-026"},{"article-title":"Tree of thoughts: Deliberate problem solving with large language models","year":"2023","author":"Yao","key":"ref49"},{"article-title":"Retrieval-augmented generation for knowledge-intensive nlp tasks","year":"2021","author":"Lewis","key":"ref50"}],"event":{"name":"2025 IEEE 13th International Conference on Healthcare Informatics (ICHI)","start":{"date-parts":[[2025,6,18]]},"location":"Rende, Italy","end":{"date-parts":[[2025,6,21]]}},"container-title":["2025 IEEE 13th International Conference on Healthcare Informatics (ICHI)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11081517\/11081519\/11081946.pdf?arnumber=11081946","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,23]],"date-time":"2025-07-23T04:56:30Z","timestamp":1753246590000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11081946\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,18]]},"references-count":50,"URL":"https:\/\/doi.org\/10.1109\/ichi64645.2025.00049","relation":{},"subject":[],"published":{"date-parts":[[2025,6,18]]}}}