Javascript is required
@article@book{1,title={World mental health report: {T}ransforming mental health for all},author={{World Health Organization}},year={2022}}.
@article{2,title={Global prevalence of past-year violence against children: {A} systematic review and minimum estimates},author={Hillis, S. and Mercy, J. and Amobi, A. and Kress, H.},journal={Pediatrics},volume={137},number={3},pages={e20154079},year={2016},doi={10.1542/peds.2015-4079},url={}}. [Crossref]
@article{3,title={Childhood adversities and adult psychiatric disorders in the national comorbidity survey replication {II}: {A}ssociations with persistence of {DSM-IV} disorders},author={McLaughlin, K. A. and Green, J. G. and Gruber, M. J. and Sampson, N. A. and Zaslavsky, A. M. and Kessler, R. C.},journal={Arch. Gen. Psychiatry.},volume={67},number={2},pages={124-132},year={2010},doi={10.1001/archgenpsychiatry.2009.187},url={}}. [Crossref]
@article{4,title={The consequences of the {COVID}-19 pandemic on mental health and implications for clinical practice},author={Fiorillo, A. and Gorwood, P.},journal={Eur. Psychiatry},volume={63},number={1},pages={e32},year={2020},doi={10.1192/j.eurpsy.2020.35},url={}}. [Crossref]
@article{5,title={Barriers to treatment for mental disorders in six countries of the {A}mericas: {A} regional report from the {World Mental Health Surveys}},author={Orozco, R. and Vigo, D. and Benjet, C. and Borges, G. and Aguilar-Gaxiola, S. and Andrade, L. H. and Cia, A. and Hwang, I. and Kessler, R. C. and Piazza, M. and others},journal={J. Affect. Disord.},volume={303},pages={273-285},year={2022},doi={10.1016/j.jad.2022.02.031},url={}}. [Crossref]
@article{6,title={A meta-analysis of mentalizing in anxiety disorders, obsessive-compulsive and related disorders, and trauma and stressor related disorders},author={Sloover, M. and van Est, L. A. C. and Janssen, P. G. J. and Hilbink, M. and van Ee, E.},journal={J. Anxiety Disord.},volume={92},pages={102641},year={2022},doi={10.1016/j.janxdis.2022.102641},url={}}. [Crossref]
@article{7,title={The epidemiology of {DSM-5} posttraumatic stress disorder in the {U}nited {S}tates: {R}esults from the National Epidemiologic Survey on Alcohol and Related Conditions-III},author={Goldstein, R. B. and Smith, S. M. and Chou, S. P. and Saha, T. D. and Jung, J. and Zhang, H. T. and Pickering, R. P. and Huang, B. J. and Grant, B. F.},journal={Soc. Psychiatry Psychiatr. Epidemiol.},volume={51},number={8},pages={1137-1148},year={2016},doi={10.1007/s00127-016-1208-5},url={}}. [Crossref]
@article{8,title={{ELIZA}—{A} computer program for the study of natural language communication between man and machine},author={Weizenbaum, J.},journal={Commun. ACM},volume={9},number={1},pages={36-45},year={1966},doi={10.1145/365153.365168},url={}}. [Crossref]
@article{9,title={The {PRISMA} statement for reporting systematic reviews and meta-analyses of studies that evaluate health care interventions: {E}xplanation and elaboration},author={Liberati, A. and Altman, D. G. and Tetzlaff, J. and Mulrow, C. and Gøtzsche, P. C. and Ioannidis, J. P. and Clarke, M. and Devereaux, P. J. and Kleijnen, J. and Moher, D.},journal={Ann. Intern. Med.},volume={151},number={4},pages={W65-W94},year={2009},doi={10.7326/0003-4819-151-4-200908180-00136},url={}}. [Crossref]
@article{10,title={Software survey: {VOS}viewer, a computer program for bibliometric mapping},author={van Eck, N. J. and Waltman, L.},journal={Scientometrics},volume={84},pages={523-538},year={2009},doi={10.1007/s11192-009-0146-3},url={}}. [Crossref]
@article{11,title={The {PRISMA} 2020 statement: {A}n updated guideline for reporting systematic reviews},author={Page, M. J. and McKenzie, J. E. and Bossuyt, P. M. and Boutron, I. and Hoffmann, T. C. and Mulrow, C. D. and Shamseer, L. and Tetzlaff, J. M. and Akl, E. A. and Brennan, S. E. and others},journal={BMJ},volume={372},year={2021},doi={10.1136/bmj.n71},url={}}. [Crossref]
@article{12,title={Preliminary guideline for reporting bibliometric reviews of the biomedical literature ({BIBLIO}): {A} minimum requirements},author={Montazeri, A. and Mohammadi, S. and Hesari, P. M. and Ghaemi, M. and Riazi, H. and Sheikhi-Mobarakeh, Z.},journal={Syst. Rev.},volume={12},number={1},pages={239},year={2023},doi={10.1186/s13643-023-02410-2},url={}}. [Crossref]
@article{13,title={Coauthorship networks and patterns of scientific collaboration},author={Newman, M. E. J.},journal={Proceedings of the National Academy of Sciences},volume={101},pages={5200-5205},year={2004},doi={10.1073/PNAS.0307545100},url={}}. [Crossref]
@article{14,title={Guidelines from the heritage field for the integration of landscape and heritage planning: {A} systematic literature review},author={Sánchez, M. L. and Cabrera, A. T. and Del Pulgar, M. L. G.},journal={Landsc. Urban. Plan.},volume={204},pages={103931},year={2021},doi={10.1016/j.landurbplan.2020.103931},url={}}@inproceedings{15,title={Distributed Representations of Words and Phrases and their Compositionality},author={Mikolov, T. and Sutskever, I. and Chen, K. and Corrado, G. S. and Dean, J.},journal={Advances in Neural Information Processing Systems(NIPS 2013)},volume={26},year={2013},url={https://proceedings.neurips.cc/paper_files/paper/2013/file/9aa42b31882ec039965f3c4923ce901b-Paper.pdf}}. [Crossref]
@article{16,title={From frequency to meaning: {V}ector space models of semantics},author={Turney, P. D. and Pantel, P.},journal={J. Artif. Intell. Res.},volume={37},pages={141-188},year={2010},doi={10.1613/jair.2934},url={}}. [Crossref]
@article{17,title={A survey of outlier detection methodologies},author={Hodge, V. J. and Austin, J.},journal={Artif. Intell. Rev.},volume={22},pages={85-126},year={2004},doi={10.1023/b:aire.0000045502.10941.a9},url={}}. [Crossref]
@article{18,title={Term-weighting approaches in automatic text retrieval},author={Salton, G. and Buckley, C.},journal={Inf. Process. Manag.},volume={24},number={5},pages={513-523},year={1988},doi={10.1016/0306-4573(88)90021-0},url={}}. [Crossref]
@article{19,title={N-gram-based text categorization},author={Cavnar, W. B. and Trenkle, J. M.},journal={Proceedings of SDAIR-94, 3rd annual symposium on document analysis and information retrieval},volume={161175},pages={14},year={1994}}.
@article{20,title={Word2{V}ec},author={Church, K. W.},journal={Nat. Lang. Eng.},volume={23},number={1},pages={155-162},year={2017},doi={10.1017/S1351324916000334},url={}}@inproceedings{21,title={Glo{V}e: {G}lobal Vectors for Word Representation},author={Pennington, J. and Socher, R. and Manning, C. D.},journal={Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP)},pages={1532-1543},year={2014},url={https://aclanthology.org/D14-1162.pdf}}@inproceedings{22,title={Text Classification Model Based on fast{T}ext},author={Yao, T. J. and Zhai, Z. G. and Gao, B. T.},journal={2020 IEEE International conference on artificial intelligence and information systems (ICAIIS)},pages={154-157},year={2020},doi={10.1109/ICAIIS49377.2020.9194939},url={https://doi.org/10.1109/ICAIIS49377.2020.9194939}}. [Crossref]
@article{23,title={A neural probabilistic language model},author={Bengio, Y. and Ducharme, R. and Vincent, P. and Jauvin, C.},journal={J. Mach. Learn. Res.},volume={3},pages={1137-1155},year={2003}}.
@article{24,title={Information Retrieval Based upon Latent Class Analysis},author={Baker, F. B.},journal={J. ACM},volume={9},number={4},pages={512-521},year={1962},doi={10.1145/321138.321148},url={}}. [Crossref]
@article{25,title={Latent Dirichlet allocation: {E}xtracting topics from software engineering data},author={Campbell, J. C. and Hindle, A. and Stroulia, E.},journal={The Art and Science of Analyzing Software Data},pages={139-159},year={2015},doi={10.1016/B978-0-12-411519-4.00006-9},url={}}. [Crossref]
@article{26,title={Text Representation for Sentiment Analysis: {F}rom Static to Dynamic},author={Gavali, P. M. and Shiragave, S. K.},journal={2023 3rd International Conference on Smart Data Intelligence (ICSMDI)},pages={99-105},year={2023},doi={10.1109/ICSMDI57622.2023.00025},url={}}. [Crossref]
@article{27,title={Context2{V}ec: {L}earning generic context embedding with bidirectional {LSTM}},author={Melamud, O. and Goldberger, J. and Dagan, I.},journal={Proceedings of the 20th SIGNLL conference on computational natural language learning},pages={51-61},year={2016},doi={10.18653/v1/k16-1006},url={}}@inproceedings{28,title={Contextualized context2{V}ec},author={Ashihara, K. and Kajiwara, T. and Arase, Y. and Uchida, S.},journal={Proceedings of the 5th Workshop on Noisy User-generated Text (W-NUT 2019)},pages={397-406},year={2019},doi={10.18653/V1/D19-5552},url={https://doi.org/10.18653/V1/D19-5552}}. [Crossref]
@article{29,title={Learned in translation: {C}ontextualized word vectors},author={McCann, B. and Bradbury, J. and Xiong, C. and Socher, R.},journal={Advances in Neural Information Processing Systems 30 (NIPS 2017)},year={2017},url={https://proceedings.neurips.cc/paper_files/paper/2017/file/20c86a628232a67e7bd46f76fba7ce12-Paper.pdf}}@incollection{30,title={Long Short-Term Memory},author={Graves, A.},booktitle={Supervised Sequence Labelling with Recurrent Neural Networks},publisher={Springer},pages={37-45},year={2012},doi={10.1007/978-3-642-24797-2_4},url={}}. [Crossref]
@article{31,title={Bidirectional recurrent neural networks},author={Schuster, M. and Paliwal, K. K.},journal={IEEE Trans. Signal Process.},volume={45},number={11},pages={2673-2681},year={1997}}@inproceedings{32,title={Attention is all you need},author={Vaswani, A. and Shazeer, N. and Parmar, N. and Uszkoreit, J. and Jones, L. and Gomez, A. N. and Kaiser, L. and Polosukhin, I.},booktitle={Advances in Neural Information Processing Systems (NIPS 2017)},volume={30},year={2017}}@inproceedings{33,title={Bert: {P}re-training of deep bidirectional transformers for language understanding},author={Devlin, J. and Chang, M. W. and Lee, K. and Toutanova, K.},booktitle={Proceedings of the 2019 conference of the North American chapter of the association for computational linguistics: human language technologies},pages={4171-4186},year={2019},doi={10.18653/v1/n19-1423},url={}}. [Crossref]
@article{34,title={Language models are unsupervised multitask learners},author={Radford, A. and Wu, J. and Child, R. and Luan, D. and Amodei, D. and Sutskever, I.},journal={OpenAI Blog},volume={1},number={8},pages={9},year={2019},url={https://storage.prod.researchhub.com/uploads/papers/2020/06/01/language-models.pdf}}.
@article{35,title={Screening for posttraumatic stress disorder using verbal features in self narratives: {A} text mining approach},author={He, Q. and Veldkamp, B. P. and de Vries, T.},journal={Psychiatry Res.},volume={198},number={3},pages={441-447},year={2012},doi={10.1016/j.psychres.2012.01.032},url={}}. [Crossref]
@article{36,title={Automated classification of psychotherapy note text: {I}mplications for quality assessment in {PTSD} care},author={Shiner, B. and D’Avolio, L. W. and Nguyen, T. M. and Zayed, M. H. and Watts, B. V. and Fiore, L.},journal={J. Eval. Clin. Pract.},volume={18},number={3},pages={698},year={2012},doi={10.1111/j.1365-2753.2011.01634.x},url={}}. [Crossref]
@article{37,title={{MedCat}: {A} framework for high level conceptualization of medical notes},author={Fodeh, S. J. and Zirkle, M. and Finch, R. and Reeves, J. and Erdos, C. and Brandt, C.},journal={2013 IEEE 13th International Conference on Data Mining Workshops},pages={274-280},year={2013},doi={10.1109/ICDMW.2013.89},url={}}. [Crossref]
@article{38,title={Measuring use of evidence based psychotherapy for posttraumatic stress disorder},author={Shiner, B. and D’Avolio, L. W. and Nguyen, T. M. and Zayed, M. H. and Young-Xu, Y. and Desai, R. A. and Schnurr, P. P. and Fiore, B. V. and Watts, B. V.},journal={Adm. Policy Ment. Health},volume={40},number={4},pages={311-318},year={2013},doi={10.1007/s10488-012-0421-0},url={}}. [Crossref]
@article{39,title={Automatic detection of psychological distress indicators and severity assessment in crisis hotline conversations},author={Pacula, M. and Meltzer, T. and Crystal, M. and Srivastava, A. and Marx, B.},journal={2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},pages={4863-4867},year={2014},doi={10.1109/ICASSP.2014.6854526},url={}}. [Crossref]
@article{40,title={Implementation of evidence-based psychotherapies for posttraumatic stress disorder in {VA} specialty clinics},author={Watts, B. V. and Shiner, B. and Zubkoff, L. and Carpenter-Song, E. and Ronconi, J. M. and Coldwell, C. M.},journal={Psychiatr. Serv.},volume={65},number={5},pages={648-653},year={2014},doi={10.1176/appi.ps.201300176},url={}}. [Crossref]
@article{41,title={Towards a differential diagnostic of {PTSD} using cognitive computing methods},author={Howard, N. and Jehel, L. and Arnal, R.},journal={2014 IEEE 13th International Conference on Cognitive Informatics and Cognitive Computing},pages={9-20},year={2014},doi={10.1109/ICCI-CC.2014.6921435},url={}}. [Crossref]
@article{42,title={Automated assessment of patients’ self-narratives for posttraumatic stress disorder screening using natural language processing and text mining},author={He, Q. and Veldkamp, B. P. and Glas, C. A. W. and de Vries, T.},journal={Assessment},volume={24},number={2},pages={157-172},year={2015},doi={10.1177/1073191115602551},url={}}. [Crossref]
@article{43,title={A pilot study of a heuristic algorithm for novel template identification from {VA} electronic medical record text},author={Redd, A. M. and Gundlapalli, A. V. and Divita, G. and Carter, M. E. and Tran, L. T. and Samore, M. H.},journal={J. Biomed. Inform.},volume={71},pages={S68-S76},year={2017},doi={10.1016/j.jbi.2016.07.019},url={}}. [Crossref]
@article{44,title={Predicting mental conditions based on “history of present illness” in psychiatric notes with deep neural networks},author={Tran, T. and Kavuluru, R.},journal={J. Biomed. Inform.},volume={75},pages={S138-S148},year={2017},doi={10.1016/j.jbi.2017.06.010},url={}}. [Crossref]
@article{45,title={Measuring use of evidence based psychotherapy for posttraumatic stress disorder in a large national healthcare system},author={Maguen, S. and Madden, E. and Patterson, O. V. and DuVall, S. L. and Goldstein, L. A. and Burkman, K. and Shiner, B.},journal={Adm. Policy Ment. Health},volume={45},number={4},pages={519-529},year={2018},doi={10.1007/S10488-018-0850-5},url={}}. [Crossref]
@article{46,title={Natural language processing tools for assessing progress and outcome of two veteran populations: {C}ohort study from a novel online intervention for posttraumatic growth},author={Norman, K. P. and Govindjee, A. and Norman, S. R. and Godoy, M. and Cerrone, D. W. and Kieschnick, W. and Kassler, W.},journal={JMIR Form. Res.},volume={4},number={e17424},year={2020},doi={10.2196/17424},url={}}. [Crossref]
@article{47,title={{LAXARY}: {A} trustworthy explainable {T}witter analysis model for post-traumatic stress disorder assessment},author={Alam, M. A. and Kapadia, D.},journal={2020 IEEE International Conference on Smart Computing (SMARTCOMP)},pages={308-313},year={2020},doi={10.1109/SMARTCOMP50058.2020.00069},url={}}. [Crossref]
@article{48,title={Evidence-based psychotherapy trends among posttraumatic stress disorder patients in a national healthcare system, 2001–2014},author={Maguen, S. and Holder, N. and Madden, E. and Li, Y. and Seal, K. H. and Neylan, T. C. and Lujan, O. V. and Patterson, S. L. and DuVall, B. and Shiner, B.},journal={Depress. Anxiety},volume={37},number={4},pages={356-364},year={2020},doi={10.1002/da.22983},url={}}. [Crossref]
@article{49,title={Multi-aspect transfer learning for detecting low resource mental disorders on social media},author={Uban, A. S. and Chulvi, B. and Rosso, P.},journal={Proceedings of the Thirteenth Language Resources and Evaluation Conference},pages={3202-3219},year={2022}}.
@article{50,title={Artificial intelligence language predictors of two-year trauma-related outcomes},author={Oltmanns, J. R. and Schwartz, H. A. and Ruggero, C. and Son, J. and Miao, M. and Waszczuk, S. A. P. and Clouston, E. J. and Bromet, B. J. and Luft, R. and Kotov, R.},journal={J. Psychiatr. Res.},volume={143},pages={239-245},year={2021},doi={10.1016/j.jpsychires.2021.09.015},url={}}. [Crossref]
@article{51,title={Improvements to {PTSD} quality metrics with natural language processing},author={Shiner, B. and Levis, M. and V. M. Dufort, O. V. and Patterson, B. V. and Watts, S. L. and DuVall, C. J. and Russ, S. and Maguen, B.},journal={J Eval. Clin. Pract.},volume={28},number={4},pages={520-530},year={2022},doi={10.1111/jep.13587},url={}}@inproceedings{52,title={Detecting and inoculating against {PTSD} in online forums and platforms},author={Shurafa, C.},booktitle={2021 8th International Conference on Behavioral and Social Computing (BESC)},pages={1-3},year={2021},doi={10.1109/BESC53957.2021.9635325},url={https://doi.org/10.1109/BESC53957.2021.9635325}}. [Crossref]
@article{53,title={Diagnosing post-traumatic stress disorder using electronic medical record data},author={Zafari, H. and Kosowan, L. and Zulkernine, F. and Signer, A.},journal={Health Inform. J.},volume={27},number={4},year={2021},doi={10.1177/14604582211053259},url={}}@inproceedings{54,title={Child abuse mental symptom prediction model using machine learning techniques},author={Elankeerthana, R. and Hanshiya, D. and Pranavajothi, A. and Shanmugapriya, S.},booktitle={2022 6th International Conference on Trends in Electronics and Informatics (ICOEI)},pages={1459-1465},year={2022},doi={10.1109/ICOEI53556.2022.9777138},url={https://doi.org/10.1109/ICOEI53556.2022.9777138}}. [Crossref]
@article{55,title={Detecting presence of {PTSD} using sentiment analysis from text data},author={Sawalha, J. and Yousefnezhad, M. and Shah, Z. and Brown, M. R. G. and Greenshaw, A. J. and Greiner, R.},journal={Front. Psychiatry},volume={12},pages={811392},year={2022},doi={10.3389/fpsyt.2021.811392},url={}}. [Crossref]
@article{56,title={Pan-Canadian electronic medical record diagnostic and unstructured text data for capturing {PTSD}: {R}etrospective observational study},author={Kosowan, L. and Singer, A. and Zulkernine, F. and Zafari, H. and Nesca, M. and Muthumuni, D.},journal={JMIR Med. Inform.},volume={10},number={12},pages={e41312},year={2022},doi={10.2196/41312},url={}}. [Crossref]
@article{57,title={Identifying women with postdelivery posttraumatic stress disorder using natural language processing of personal childbirth narratives},author={Bartal, A. and Jagodnik, K. M. and Chan, S. J. and Babu, M. S. and Dekel, S.},journal={Am. J. Obstet. Gynecol. MFM},volume={5},number={3},pages={100834},year={2023},doi={10.1016/j.ajogmf.2022.100834},url={}}. [Crossref]
@article{58,title={Dynamic suicide topic modelling: {D}eriving population-specific, psychosocial and time-sensitive suicide risk variables from electronic health record psychotherapy notes},author={Levis, M. and Levy, J. and Dufort, V. and Russ, C. J. and Shiner, B.},journal={Clin. Psychol. Psychother.},volume={30},number={4},pages={795-810},year={2023},doi={10.1002/cpp.2842},url={}}. [Crossref]
Search
Open Access
Review article

Natural Language Processing for PTSD Detection: A Systematic Review and Bibliometric Analysis

Engin Seven*,
Eylem Yucel
Department of Computer Engineering, Istanbul University—Cerrahpasa, 34320 Istanbul, Turkey
Acadlore Transactions on AI and Machine Learning
|
Volume 4, Issue 4, 2025
|
Pages 263-290
Received: 09-06-2025,
Revised: 11-14-2025,
Accepted: 11-23-2025,
Available online: 12-04-2025
View Full Article|Download PDF

Abstract:

Post-traumatic stress disorder (PTSD) has been recognized as a critical global mental health challenge, and the application of natural language processing (NLP) has emerged as a promising approach for its detection and management. In this study, a systematic review was conducted to evaluate the quality, quantity, and consistency of research investigating the role of NLP in PTSD detection. Through this process, prior research was consolidated, methodological gaps were identified, and a conceptual framework was formulated to guide future investigations. To complement the systematic review, a bibliometric analysis was performed to map the intellectual landscape, assess publication trends, and visualize research networks within this domain. The systematic review involved a structured search across ScienceDirect, IEEE Xplore, PubMed, and Web of Science, resulting in the retrieval of 328 records. After rigorous screening, 56 studies were included in the final synthesis. Separately, a bibliometric analysis was conducted on 4,138 publications obtained from the Web of Science database. The findings highlight that NLP methods not only enhance the detection of PTSD but also support the development of personalized treatment strategies. Ethical and security considerations were also identified as pressing concerns requiring further attention. The results of this study underscore the significance of NLP in advancing PTSD research and emphasize its potential to transform mental health services. By identifying trends, challenges, and opportunities, this study provides a foundation for future research aimed at strengthening the role of NLP in clinical practice and mental health policy.
Keywords: Post-traumatic stress disorder, Natural language processing, Health system, Systematic review, Bibliometric analysis

1. Introduction

The World Mental Health Report 2022 issued by the World Health Organization (WHO) highlights significant global disparities in mental health care systems and outcomes. It is estimated that one in every eight individuals worldwide experiences a mental health disorder [1]. Furthermore, individuals suffering from such disorders are at an increased risk of premature mortality. Among children aged 2 to 17, high levels of emotional, physical, and sexual violence have been reported, which significantly elevates the risk of developing mental disorders in later stages of life [2]. Childhood represents a critical period in which adverse experiences can shape emotional and psychological development. These adverse experiences are linked to a heightened risk of disorders such as depression, anxiety, and PTSD [3]. Mental health conditions also pose substantial social and economic burdens. For instance, the global economic cost of mental disorders was estimated at USD 2.5 trillion in 2010, with projections reaching nearly USD 5 trillion by 2030 [4]. Environmental and societal stressors, including natural disasters (e.g., earthquakes and floods) and human-made crises (e.g., terrorism), are recognized as major contributors to the onset of mental health issues. The COVID-19 pandemic further exacerbated this burden; mental health disorders such as PTSD, anxiety, and depression increased by approximately 25% during the first year of the outbreak, placing additional strain on healthcare infrastructures worldwide [5].

PTSD is a complex clinical condition characterized by symptoms, including hypervigilance, avoidance behaviors, cognitive and mood disturbances, and heightened physiological reactivity following a traumatic event [6]. Prevalence rates vary across populations and contexts; for example, a study conducted in the United States and Canada reported PTSD prevalence between 6\% and 9\% [7]. Untreated PTSD can significantly impair social functioning and lead to comorbid psychiatric or physical health conditions. Common symptoms include attention deficits, disrupted sleep, emotional dysregulation, and anger outbursts, which collectively contribute to poor quality of life and may escalate to suicidal ideation. NLP, a subfield of artificial intelligence (AI), has emerged as a promising tool for analyzing unstructured text data, including clinical notes, survey responses, and social media content. NLP encompasses technologies such as speech and emotion recognition, and semantic analysis. Its applications in healthcare are increasingly diverse, spanning radiology reports, biomedical terminology mapping, and physician documentation. One of the earliest examples of human-machine interaction via NLP is the ELIZA program developed in 1966 [8]. In modern implementations, NLP often integrates machine learning (ML) and deep learning (DL) to convert raw text into computable features for classification or prediction tasks. WHO’s 2022 report highlights significant global disparities in access to mental health services, particularly regarding limited availability of psychotherapy and shortages in trained professionals [1]. In this context, AI and NLP technologies have emerged as supportive tools for the early detection and monitoring of mental health symptoms, especially in resource-limited settings. This study aims to systematically review the current literature on how NLP techniques may contribute to addressing these systemic challenges in mental healthcare delivery.

The goal of this study is to systematically review and evaluate how NLP techniques have been employed to support the identification and classification of PTSD-related symptoms. This review also explores methodological trends, research gaps, and the potential integration of NLP-based tools into clinical workflows.

The research questions addressed in this study are as follows:

1. How have NLP techniques evolved specifically in the detection of PTSD?

2. What are the focal areas of NLP-based trauma research aimed at identifying PTSD?

3. Which NLP approaches have been used specifically for PTSD detection, and how were they applied?

4. What are the methodological challenges in using NLP for PTSD classification?

5. Can AI-based PTSD detection approaches be realistically integrated into healthcare systems?

The structure of this study is organized as follows: Section 2 outlines the methodology; Section 3 discusses PTSD and associated research methods; Section 4 reviews NLP methods used in PTSD-related studies; and Section 5 presents the results and discussion.

2. Research Methodology

In this systematic review, the primary objective was not to establish a direct diagnostic framework for PTSD using NLP techniques, but rather to assess the potential of NLP methods for detecting PTSD-related symptoms in unstructured text data. The focus was on identifying and extracting key symptoms and linguistic markers associated with PTSD, as reported in the literature. As such, the reviewed studies predominantly have utilized NLP for the detection and classification of PTSD symptoms rather than formal diagnostic assessment based on clinical criteria. The number of studies conducted in the field of mental health is increasing on a daily basis. A bibliometric analysis and systematic literature review in this field are anticipated to serve as a roadmap for researchers. A research project specifically focused on PTSD in the field of mental health can provide guidance on general trends, potential issues, and solutions. To this end, a bibliometric analysis can identify significant trends and gaps in the literature [9]. In order to achieve this objective, a comprehensive and systematic analysis of a substantial corpus of studies was conducted. This analysis generated a map of the trends and latest developments. The general process of the literature review in this study is illustrated in Figure 1.

Figure 1. Literature review process
2.1 Bibliometric Analysis Method

One of the earliest bibliometric analysis studies was conducted in the 1950s [9]. The bibliometric analysis of publications, including articles, papers and books on a specific subject, allowed for the identification of emerging trends, collaborations and research components. Furthermore, it was employed to examine the intellectual structure of a subject area that is of interest to researchers. The existence of extensive databases such as Scopus and Web of Science has greatly enhanced the accessibility of a vast array of publications. Consequently, researchers have been able to conduct bibliometric analysis on big data in a more effective manner. The field of NLP has undergone significant advancements over the past decade. These developments have resulted in the production of a substantial corpus of articles, papers, and books. It is therefore evident that there is a growing need for bibliometric analysis in the field of NLP. Selecting the most appropriate parameters for a bibliometric analysis within a specific field is a crucial aspect of the process. To illustrate, the number of citations can be employed to determine the relative importance of each publication. Furthermore, the citation network between publications can be employed to analyze relationships between publications, thereby identifying the most influential articles in the field of interest. Additionally, data regarding the countries in which the publications are concentrated can be obtained. Bibliometric analysis encompasses a vast publication network within the applied database, and thus the collected information can be presented graphically. In this study, VOSViewer was utilized for the visual representation of the bibliometric network [10].

2.2 PRISMA Method

The Preferred Reporting Items for Systematic Reviews and Meta-Analyses (PRISMA) 2020 guidelines provide an updated framework for reporting systematic reviews and meta-analyses [11]. The systematic review method is a frequently employed approach for empirically evaluating, developing a critical perspective, and summarizing data collected by researchers. Systematic reviews assist in determining future research priorities. Additionally, systematic reviews facilitate the synthesis of information about a research field and identify potential issues that may emerge in the future by utilizing the information obtained.

Following the PRISMA 2020 guideline, the article selection process was updated to provide detailed counts at each stage. Specifically, during the title and abstract screening, 198 articles were excluded due to irrelevance to PTSD or NLP. At the full-text assessment stage, 35 articles were excluded, primarily because they were reviews, did not apply NLP methods directly, or treated PTSD as a secondary topic.

3. Research Methodology for PTSD

Two research methods were selected for the examination and analysis of studies on the detection of PTSD using NLP methods. These are bibliometric analysis and a systematic literature review method, respectively.

3.1 Bibliometric Analysis and Results

This bibliometric analysis was conducted in accordance with the Guideline for Reporting Bibliometric Reviews of the Biomedical Literature (BIBLIO) [12] which outlines minimum reporting standards for bibliometric reviews in biomedical literature. The guideline was followed to structure the processes of database selection, search strategy development, inclusion/exclusion criteria definition, data extraction, performance analysis, and science mapping. In particular, the Web of Science database was selected, and search strategies were designed based on keywords (Table 1). The analysis covered aspects such as publication trends, country-wise distributions, co-authorship patterns, citation counts, institutional productivity, keyword co-occurrence, and document-based bibliographic coupling.

Table 1. Search criteria for NLP in computer science
DatabaseResearch ScopeKeywordsLanguage
Web of ScienceArticles, papers, book chapters, inprogress documents, review articles, and early access items published between 2012 and May 2024(“natural language processing” OR “Transformers” OR “language models” OR “text analysis”) AND (“healthcare” OR “electronic health records” OR “unstructured data”)English

In the initial phase of this study, the bibliometric analysis method was employed. This approach enabled us to examine the trends in the utilization of NLP in the domain of health. The bibliometric analysis method entails the examination of publications sourced from pertinent databases on research within a particular field. It entails the analysis, mapping and visualization of these publications under specific parameters, thereby providing guidance for researchers regarding the field under investigation (Wallin, 2005). In the course of this research on the use of NLP in the detection of PTSD, the requisite information for the research query was gathered and the requisite analysis was conducted. To this end, the Web of Science database was used, which is one of the leading databases of abstracts and citations of major peer-reviewed publications, including journal articles, conference proceedings, books, and book chapters. A search was conducted in May 2024 utilizing the keywords outlined in Table 1. A total of 4,138 results were obtained from the research conducted by selecting all fields, including the title, author, and publication title. The corpus comprises 2,873 articles, 498 ongoing documents, 446 review articles, 143 early access items, 81 meeting abstracts, 72 editorial materials and 25 book chapters published between May 2012 and 2024. The data obtained from the study was subjected to evaluation under a number of different headings, including those relating to the increase in published material, the number of publications produced by individual countries, an analysis of the number of authors contributing to each publication, an analysis of the number of times each author has been cited, an analysis of the most productive organizations, an investigation into the co-occurrence of keywords, and a document-based bibliographic matching exercise.

For the bibliometric analysis, the Web of Science database was chosen over Scopus. This decision was made because Web of Science offers more standardized citation metadata, higher consistency in author and institutional affiliations, and strong compatibility with visualization tools such as VOSviewer. Although Scopus has broader coverage, it contains more duplicates and heterogeneous document types, which may compromise the precision of bibliometric mapping. Moreover, previous bibliometric guidelines (e.g., BIBLIO) frequently recommend Web of Science as the primary source for systematic bibliometric reviews in biomedical fields.

In this study, a comprehensive search strategy was developed to identify publications related to the use of NLP in the detection of PTSD. The search was performed in the Web of Science database in May 2024. The following keywords were used: “post-traumatic stress disorder” “PTSD” “natural language processing” and “NLP”. These terms were combined using Boolean operators (AND, OR) to create the final search string. The search was conducted across all fields, including title, author, keywords, and abstract. A total of 4,138 documents were retrieved using this strategy, covering the period from May 2012 to May 2024. The inclusion and exclusion criteria below were applied during the selection of documents. The inclusion criteria were (i) publications written in English; (ii) documents categorized as articles, review papers, conference papers, or book chapters; and (iii) studies addressing the use of NLP in the context of PTSD. The exclusion criteria were (i) publications not written in English; (ii) documents such as editorials, meeting abstracts, letters, or commentaries; and (iii) studies not directly addressing the relationship between PTSD and NLP.

3.1.1 Publication increase

Based on the documents obtained from the Web of Science database, 4,138 documents published in the field of NLP and health since 2012 were classified according to years. As seen in Figure 2, 212 documents were accessed in 2012 and more than 700 documents were published by May 2024. It is seen that the interest of researchers working in this field increases with each passing year. Rapid developments in AI have increased the possibilities of using this technology in the field of healthcare.

Figure 2. Annual publication numbers
3.1.2 Publication numbers by country

The distribution of more than 4,000 documents taken from the Web of Science database by country was examined. The most common country in these distributions is the United States. Figure 3 shows the distribution of the ten countries that published the most documents. Based on these publication numbers, it is seen that the United States is focusing on AI studies in the field of health. Pioneering studies have been carried out by the United States on the use of NLP in the healthcare sector.

Figure 3. Number of publications by country

In addition, it is seen that the United Kingdom and China have contributed to the developments in this field with over 300 publications. The United States, on the other hand, published seven times more documents. A cross-validation between the bibliometric and systematic review findings reveals a strong degree of consistency. Countries that ranked highest in publication output in the bibliometric analysis, such as the United States and the United Kingdom, also contributed the majority of high-quality studies included in the systematic review, often relying on Diagnostic and Statistical Manual of Mental Disorders, Fifth Edition (DSM-5) criteria and advanced NLP methodologies. In contrast, some countries such as China, while highly productive in bibliometric counts, were less represented in the systematic review due to stricter methodological inclusion criteria. This comparison highlights both convergence and divergence across the two analyses, thereby strengthening the reliability of the conclusions of this study.

3.1.3 Co-authorship analysis

The act of co-authorship represents a tangible expression of scientific collaboration within a particular field of study. In the context of academic publishing, co-authorship refers to a publication where two or more individuals contribute to the work together [13]. It encourages academic creativity and improves the quality of scholarly work by providing a forum for the exchange of ideas and knowledge among authors. Using VOSviewer, a joint author analysis was conducted based on the criteria shown in Figure 4. Hongfang Liu is identified as one of the most prolific collaborative authors in this field, with 69 documents. The top 10 authors in the field are presented in Table 2.

Figure 4. Graphical representation of the co-authorship analysis
Table 2. Search criteria for NLP in computer science
Author NameDocuments
Liu, Hongfang69
Stewart, Robert42
Xu, Hua36
Sohn, Sunghwan33
Zhou, Li32
Cai, Tianxi31
Zhang, Rui28
Wang, Yanshan27
Fu, Sunyang26
Topaz, Maxim26
3.1.4 Author citation analysis

An author citation analysis enables the relationship between studies in the relevant field to be identified. Researchers employ citations to establish a connection between their own studies and those in the existing literature, thereby facilitating their own contributions to the field. This approach allows the connections between studies on a given subject and between authors to be revealed [14]. A citation analysis was conducted on 4,138 documents retrieved from the Web of Science database. The most frequently cited author is Hongfang Liu, with 1,521 citations. The list of the most cited authors is presented in Table 3. Despite having only two publications, authors such as Katherina Chou and Greg Corrado have a high citation count of 1,291. Using VOSviewer, a joint author citation analysis was conducted based on the criteria shown in Figure 5.

Figure 5. Map of the author citation analysis
Table 3. Search criteria for NLP in computer science
AuthorsCitation Counts
Liu, Hongfang1,521
Chou, Katherine1,291
Corrado, Greg1,291
Cui, Claire1,291
Dean, Jeff1,291
Depristo, Mark1,276
Esteva, Andre1,276
Kuleshov, Volodymyr1,276
Ramsundar, Bharath1,276
Robicquet, Alexandre1,276
Thrun, Sebastian1,276
3.1.5 Most productive organizations

Vosviewer was used to examine 4,138 documents retrieved using the relevant keywords. The organizations that support researchers in this field were listed. Table 4 shows the top ten organizations according to the number of documents. Harvard Med School is the most supportive institution, with 165 documents in this field. It has been observed that Mayo Clinic College of Medicine and Science allocates large amounts of resources to researchers on this subject.

In total, there are 3,266 organizations that support researchers in this field. While some of these organizations have published only one document, some have published 100 or more documents. Figure 6 also shows the map of all organizations.

Table 4. Search criteria for NLP in computer science

Establishment

Document

Citation Number

Harvard Med. Sch.

165

2,380

Mayo Clin.

141

2,837

Brigham & Women’s Hosp

112

2,641

Univ. Utah

111

1,797

Massachusetts Gen. Hosp.

102

2,869

Vanderbilt Univ.

102

2,137

Stanford Univ.

96

2,894

Kings Coll London

91

1,648

Columbia Univ.

78

1,899

Univ. Penn

72

1,490

Figure 6. Graph of productive organizations
3.1.6 Co-occurrence of keywords

Keywords are employed by researchers to provide a concise summary of their studies. The combination of keywords serves to guide researchers in their exploration of a given research field. Furthermore, the use of keywords has been shown to enhance the likelihood of an author being recognized within their respective field of expertise. In this study, the term “natural language processing” was identified as the most frequently occurring keyword, with a total of 1,655 repetitions. Table 5 shows the list of the most used keywords. Figure 7 presents a map illustrating the frequency of occurrence of keywords across 3,667 documents.

Table 5. Search criteria for NLP in computer science
KeywordsNumber of Co-occurrences
natural language processing1,655
machine learning545
electronic health records509
deep learning336
artificial intelligence264
text mining136
NLP104
sentiment analysis103
COVID-1990
Figure 7. Co-occurrence of keywords in PTSD-related NLP studies
3.1.7 Document-based bibliographic matching

The analysis is conducted by examining the intertextual relationships between the documents. The referencing technique employed in a given document can be classified into two main categories: bibliographic coupling and co-citation. Bibliographic matching refers to the practice of citing the same publication in two different sources, whereas co-citation denotes the referencing of two distinct publications in a single source. The list of documents that received the highest number of bibliographic matching citations among the 3,667 documents is presented in Table 6. The document by Estava (2019) has been cited by 1,276 different documents. In addition, the document by Jiang (2017) is expected to guide researchers working in this field by citing 1,150 different documents. A map of all documents is given in Figure 8.

Table 6. Search criteria for NLP in computer science
ReferenceNumber of Citations
Esteva (2019)1,276
Jiang (2017)1,150
Lundervold (2019)869
Ting (2019b)525
Dharmage (2019)492
Lala (2020)466
Zhang (2013d)433
Lee (2018b)380
Gould (2015)364
Wang (2018e)334
Perera (2016)310
Figure 8. Bibliographic matching map of top-cited PTSD NLP studies
3.1.8 Limitations

This study has certain limitations. Firstly, the analysis was limited to publications indexed in the Web of Science database, potentially excluding relevant studies listed in other academic databases such as Scopus, PubMed, or IEEE Xplore. Secondly, only publications written in English were included, which may have led to the omission of significant research published in other languages. Finally, while bibliometric indicators such as citation counts and co-authorship analysis provide valuable quantitative insights, they may not fully capture the qualitative impact or methodological quality of the included publications.

3.2 Comprehensive Review of Advanced NLP Techniques

This section outlines key NLP techniques used in computer science. To classify textual data, words must first be converted into numerical vectors. The second step involves interpreting these vectors, and the final step is the assessment of model performance using classification algorithms. This section is divided into three parts: text representation, neural network architectures, and pre-trained language models. Text representation refers to the process of making natural language texts processable by computers [13], which can only handle numerical vectors. Thus, text must be transformed into mathematically expressible forms. These methods fall into two main categories: discrete and continuous representations, mainly differing in how they preserve the size and structure of data. These vector formats allow for mathematical operations and similarity calculations between texts.

3.2.1 Discrete text representation

Digitizing text for computer processing is a key concern in digital humanities. Researchers have proposed various methods to address this. Discrete text representation converts documents of different lengths into fixed-length vectors [14], typically by indexing unique words as a dictionary. Each vector has the same length as the dictionary, marking present words with “1” and others with “0” Common methods include the bag-of-words model, Term Frequency-Inverse Document Frequency (TF-IDF), and n-gram. The sparsity of one-hot vectors led to the Bag of Words (BoW) model, where texts are represented by a matrix with rows for sentences and columns for unique words with dimensions depending on sentence count and vocabulary size [15].

TF-IDF is a statistical method used to assess word significance in a document [16]. Term Frequency (TF) reflects how often a word appears, while Inverse Document Frequency (IDF) shows its rarity across the corpus. Words with high TF and IDF scores are considered important. TF-IDF is widely applied in information retrieval, text classification, recommendation systems, and text mining. Another key method is n-gram representation, which splits text into sequences of n words (e.g., bigrams for two words and trigrams for three) [17]. This approach retains word order and context, making it valuable in language modeling, sentiment analysis, automatic classification, and recommendation systems.

3.2.2 Continuous text representation

Continuous text representation mathematically maps words into a high-dimensional vector space to preserve semantic similarity [18-20]. Models like Word to Vector (Word2Vec), Global Vectors for Word Representation (GloVe), and FastText learn these vectors from large text corpora, capturing meaning and context. This method is widely used in NLP tasks such as sentiment analysis, classification, and information retrieval [21]. Latent Semantic Analysis (LSA) identifies semantic relationships in texts by transforming a term-frequency matrix into a lower-dimensional space using Singular Value Decomposition (SVD) [22]. It enables grouping of semantically similar words and documents, but its limitations lead to the development of advanced methods like Word2Vec. LSA reduces a term-frequency matrix to a lower-dimensional space using SVD, grouping semantically related words and documents, though it has limitations that lead to more advanced models like Word2Vec [22]. Latent Dirichlet Allocation (LDA) is a probabilistic model that identifies hidden topics in document collections [23]. It assumes that documents are mixtures of topics, and words are linked to topics probabilistically, often using algorithms like Gibbs sampling to uncover thematic structures.

Word2Vec generates word embeddings that capture semantic relationships by training on large corpora [13]. It includes Continuous Bag of Words (CBOW), which predicts a word from its context, and Skip-gram, which predicts context from a word. These vectors place semantically similar words closer in space and are widely used in NLP tasks like classification and sentiment analysis. Dynamic word representation allows word embeddings to adapt over time and across contexts, addressing the limitations of static vectors [24]. This is crucial for analyzing rapidly evolving language use, such as on social media, where words like "cool" may shift in meaning depending on context. These models enhance language understanding by capturing temporal and contextual semantic shifts. Contextualized word embeddings, such as Context Vectors (CoVe), Embeddings from Language Models (ELMo), Generative Pre-trained Transformer (GPT), and Bidirectional Encoder Representations from Transformers (BERT), generate vectors that vary with context, reflecting a word’s meaning dynamically. These are typically trained on large-scale language modelling tasks to create context-sensitive representations [24].

Context2Vec builds on this by learning word or phrase representations based on their surrounding context, offering deeper insight than traditional fixed embeddings [25]. Context2Vec uses neural networks, often Recurrent Neural Network (RNN) or Transformer-based, to generate word embeddings that reflect immediate context [26]. For example, in “The bank is by the river”, it distinguishes between meanings of “bank” by analyzing surrounding words. This enhances performance in tasks like language modelling, sentiment analysis, and machine translation by capturing nuanced semantic relationships. CoVe, on the other hand, generates contextual embeddings using Bidirectional Long Short-Term Memory networks (BiLSTM) that process text in both directions [27]. This allows the model to consider both preceding and following words, producing richer word representations. CoVe has shown strong results in tasks like question answering, sentiment analysis, and named entity recognition by better capturing contextual meaning.

3.3 Neural Network Architectures

In recent years, there has been a notable increase in the utilization of artificial neural network models by researchers in the field of health-related text analysis. Amongst the most prevalent are Convolutional Neural Network (CNN), Long Short-Term Memory (LSTM), RNN and Transformer-based architectures.

3.3.1 CNN

Initially successful in image processing [27], CNNs have since proven highly effective in NLP. Designed to capture local patterns and dependencies in word sequences, CNNs apply convolution operations to extract key features from text. These operations help identify important structures, such as nearby word relationships. CNNs are widely used in NLP tasks like sentiment analysis, text classification, summarization, and language modeling, significantly enhancing structural understanding of textual data.

3.3.2 LSTM

LSTM networks, a type of RNN, were developed to address the vanishing gradient problem and capture long-term dependencies in sequences [28]. They feature internal memory cells and three gates of forget, input, and output that regulate information flow. These gates allow LSTM to retain or discard information as needed, enabling learning across longer contexts. LSTMs are widely used in NLP tasks such as machine translation, sentiment analysis, speech recognition, and text generation, where understanding sequence and context is critical. Their ability to model syntax, semantics, and discourse has significantly improved language modelling.

3.3.3 RNN

RNNs are designed to model sequential data by retaining an internal state and using feedback loops to capture temporal dependencies [29]. Unlike feedforward networks, RNNs process sequences recursively, making them suitable for tasks involving variable-length inputs. However, they face the vanishing gradient problem, which limits their ability to learn long-term dependencies. To address this, enhanced versions like LSTM and Gated Recurrent Unit (GRU) include gating mechanisms that improve information retention over longer sequences. RNNs are widely applied in NLP, time series analysis, and speech recognition, particularly in language modeling, translation, sentiment analysis, and entity recognition.

3.3.4 Transformer-based language models

Transformer-based models, introduced by [30], revolutionized NLP by replacing recurrent and convolutional layers with a self-attention mechanism. This allows them to capture long-range dependencies and process sequences in parallel, boosting efficiency. Models like BERT and GPT have achieved state-of-the-art results in tasks such as classification, question answering, and machine translation [31]. Pre-trained on large corpora, they offer strong linguistic representations adaptable to various applications. Their success has led to widespread use in academia and industry, enhancing NLP capabilities across numerous domains.

3.4 Systematic Literature Review and Results

This systematic review was conducted in accordance with the updated PRISMA 2020 guidelines. The study aimed to synthesize the current state of research on the use of AI and NLP in the detection of PTSD. A PRISMA 2020 flow diagram was used to document the screening process, and a completed PRISMA 2020 checklist was provided as supplementary material. This review did not include a quantitative meta-analysis. Therefore, no formal data extraction of statistical outcomes (e.g., sample sizes, confidence intervals, and effect sizes) was performed. Instead, a thematic and bibliometric synthesis approach was applied. Each eligible study was manually reviewed and coded using a structured extraction framework. The following key data items were recorded for each study: title, first author, publication year, database source, dataset type, target task (e.g., classification or detection of PTSD), applied NLP or AI techniques (e.g., RNN, LSTM, and BERT), language of the dataset, and study context (e.g., clinical or social media). This information was manually organized into an Excel spreadsheet and served as the basis for qualitative comparison and thematic categorization. As no meta-analysis was conducted, formal statistical tests for reporting bias (e.g., funnel plot analysis) and formal risk of bias tools such as the Revised Cochrane Risk of Bias Tool for Randomized Trials (RoB 2) or Risk Of Bias In Non-randomized Studies—of Interventions (ROBINS-I) were not applied. However, potential sources of methodological limitations such as small sample sizes, dataset imbalance, insufficient reporting, and domain specificity were noted qualitatively during the screening process. These factors were taken into account when evaluating the robustness of each study's findings.

Similarly, a formal certainty of evidence assessment tool such as Grading of Recommendations Assessment, Development and Evaluation (GRADE) was not utilized due to the absence of aggregate quantitative outcomes. Nonetheless, the overall reliability of included studies was considered based on the consistency of reported results, methodological transparency, and dataset characteristics (e.g., annotation quality, linguistic variability, and population representativeness). A systematic literature review is a type of review article that aims to identify evidence-based clinical effectiveness on a given problem in order to provide recommendations for the resolution of specific research topics. The objective of a systematic literature review is to synthesize existing research, identify gaps in the existing research landscape, produce a coherent report, and create a research framework. In this study, databases such as ScienceDirect, IEEE, Web of Science and PubMed were scanned. A systematic literature review was conducted in accordance with the PRISMA method and meta-analysis. The following steps were followed for the systematic literature review in the study:

Step 1: Identifying a research question.

Step 2: Determining the database to be researched.

Step 3: Identifying keywords.

Step 4: Review of title, abstract and keywords.

Step 5: Literature eligibility criteria (inclusion and exclusion criteria).

3.4.1 Keywords selection

A systematic literature review was conducted to determine research topics. These were evaluated in relation to PTSD and AI, and search terms were identified. The research terms are provided in the table. The research was conducted using these keywords in relevant databases. The selected keywords are given in Table 7.

The research was conducted using databases that had been previously identified through the application of a keyword selection process. The relevant keywords were determined to be “post-traumatic stress disorder,” “PTSD,” “natural language processing,” “recurrent neural network,” “RNN,” “NLP,” “language models,” and “Transformers.” The research text was created by combining the keywords into two groups. The resulting search string was as follows: (“post-traumatic stress disorder” OR “PTSD”) AND (“recurrent neural network” OR “RNN” OR “natural language processing” OR “NLP” OR “language models” OR “Transformers”).

Table 7. Search criteria for NLP in computer science
Keywords
post-traumatic stress disorder
PTSD
recurrent neural network
RNN
natural language processing
language model
Transformers
3.4.2 Research questions

A systematic literature review is a process that begins with the formulation of research questions. These questions serve to guide the investigation and facilitate the analysis of the subject matter. Table 8 illustrates the research questions and objectives associated with the detection of PTSD using NLP methods.

Table 8. Search criteria for NLP in computer science
NumberQuestionPurpose
1What are the challenges associated with the utilization of NLP for the classification of PTSD?Identifying the challenges experienced and determining solutions
2Can AI be used for the detection of PTSD in the healthcare system?Determining its impacts on the healthcare system
3What are the datasets used in PTSD detection? What are the challenges of these datasets?Evaluating the methods used based on specific criteria
4What are the AI techniques used in solving PTSD? What are the opportunities and challenges of these techniques in mental health disorder detection using NLP?Identifying the challenges and opportunities in mental health disorder detection using NLP techniques
3.4.3 Exclusion criteria and database results

a. Articles published before 2012 are not selected.

b. Articles that use PTSD disorder as a subheading of another disease are not selected.

c. Articles written in a language other than English are not selected.

Studies written in English were searched between January 2012 and May 2024 through ScienceDirect, IEEE, PubMed and Web of Science. Following the PRISMA guideline, 206 studies were identified from ScienceDirect, 12 from the IEEE database, 29 from PubMed, and 37 from Web of Science. A total of 328 documents were examined. The results obtained are shown in Table 9. The article selection process is shown in Figure 9. Although 29 records were initially retrieved from PubMed, only two articles met the inclusion criteria. Most PubMed results were clinical or biological studies not directly related to NLP, or general psychiatric research where PTSD was treated as a secondary aspect. In some cases, NLP was mentioned in the abstract, but a full-text review revealed insufficient application of NLP techniques for PTSD detection. Therefore, the low number of included articles is due to the characteristics of PubMed-indexed literature rather than overly strict selection, minimizing the risk of selection bias.

Table 9. Search criteria for NLP in computer science
Database NameNumber of Articles FoundNumber of Articles IncludedNumber of Excluded Articles
ScienceDirect24027213
IEEE1587
Web of Science441925
PubMed29227
Figure 9. Article selection process

4. NLP Methods Used in PTSD

A categorization and examination of NLP methods used in the detection of PTSD was conducted. Furthermore, an investigation was undertaken into the evolution of NLP methods between 2012 and 2024, with a particular focus on their utilization in the early detection of the disease.

4.1 Classification of NLP Techniques Used in PTSD

This analysis examines approaches used in research on PTSD by comparing NLP methods and techniques used in various studies. The results obtained are shown in Table 10.

Reference & NLP Techniques & Strengths & Weaknesses & Comparative performance / applicability\\

Reference & NLP Techniques & Strengths & Weaknesses & Comparative performance / applicability\\

[32] & Text mining, Support Vector Machine (SVM), Logistic Regression (LR), text cleaning, tokenization, lemmatization, and stop word removal & Effective at identifying PTSD features from narratives & Limited generalizability due to small sample size (159 narratives) & SVM and LR achieve moderate accuracy ($\sim$70–75\%) in small narrative datasets; good for pilot studies but not scalable \\

[33] & SVM, Naive Bayes (NB), text cleaning, tokenization, entity recognition, and sentiment analysis & Useful for quality assessment of therapy notes and automated classification & May not capture nuanced meanings in therapy notes & SVM generally outperforms NB in precision; suitable for structured text (therapy notes) but weaker in nuanced semantics \\

[34] & NLP, entity recognition, standardization, NB, and Decision Tree (DT) & Good for highlevel conceptualization of medical notes & Less effective for detailed text analysis and requires substantial manual labeling & NB and DT are simple, interpretable methods; effective for structured Electronic Health Records (EHR) data but weaker on unstructured text \\

[35] & LR, Random Forest (RF), text cleaning, data standardization, and NLP & Comprehensive analysis of psychotherapy usage & Limited by the specificity of the text data used (e.g., psychotherapy notes) & RF shows better generalization than LR on psychotherapy notes; LR remains robust with smaller, structured data \\

[36] & SVM, NB, text cleaning, speech recognition, language modeling, and data coding & Effective for real-time distress detection in crisis situations & Speech recognition accuracy may impact the results & SVM performs better than NB ($\sim$75\% F1) when ASR accuracy is high; applicable in real-time crisis systems \\

[37] & LR, NB, text cleaning, data standardization, and missing data analysis & Effective for assessing psychotherapy implementation in a clinical setting & May not generalize to non-Veterans Affairs (VA) settings or other types of psychotherapy & NB is faster for categorical data; LR is more robust with continuous data; both are limited to VA datasets \\

[38] & NN, SVM, text cleaning, data normalization, and statistical methods & Innovative use of cognitive computing methods for differential diagnosis & Complex methodology, potentially high computational requirements & NN$>$80\% F1 on clinical records; better than SVM in large datasets, but requires strong hardware \\

[39] & SVM, LR, text cleaning, tokenization, lemmatization, and stop word removal & Effective for automated PTSD screening from self-narratives & Limited by data diversity and sample size & SVM slightly outperforms LR in short self-narratives; accuracy $\sim$70–75\%, limited generalizability \\

[40] & Heuristic algorithms, DT, text cleaning, template extraction, and entity recognition & Useful for novel template identification from medical records & Pilot study, limited sample size (5,000 records) & Effective for exploratory tasks; low scalability and generalization \\

[41] & Deep Neural Network (DNN), CNN, text cleaning, NLP, and data normalization & Advanced neural network techniques, good for complex pattern recognition & Requires extensive computational resources and data normalization & CNN/DNN achieve $>$ 80–85\% accuracy in psychiatric notes; best for large text corpora and require GPUs \\

[42] & LR, NB, text cleaning, NLP, and data standardization & Large-scale analysis, applicable to a national healthcare system & Data quality and consistency issues across a large system & Both scale well; LR offers stability, NB is faster but less robust with noisy data \\

[43] & LR, NB, text cleaning, NLP, and data standardization & Comprehensive assessment of progress and outcomes in veterans & May not be applicable to non-veteran populations & Similar to [42]; applicability restricted to VA data \\

[44] & LR, SVM, text cleaning, sentiment analysis, and topic modeling & Focus on explainability and trustworthiness in Twitter analysis & Limited to Twitter data, which may not capture all aspects of PTSD & SVM handles sparse Twitter features better; LR is easier to interpret but less accurate \\

[45] & LR, NB, text cleaning, NLP, and data standardization & Longitudinal analysis over a significant time period & May be affected by changes in data collection methods over time & Stable over time but sensitive to changes in data capture; NB is simpler, LR is more robust \\

[46] & NB, DT, text cleaning, NLP, entity recognition, missing data analysis, data standardization, and data normalization & Comprehensive approach to psychiatric assessments, addressing various data quality issues & Limited by the quality of patient records and normalization processes & Useful in noisy records; DT is interpretable, NB is scalable but less accurate \\

[47] & NN, LR, text cleaning, NLP, and sentiment analysis & Advanced AI methods for predicting longterm outcomes, effective sentiment analysis & Requires substantial computational resources and highquality data & NN achieves $>$ 80\% F1 in longitudinal datasets; LR is less accurate but efficient on smaller sets \\

[48] & LR, RF, text cleaning, NLP, entity recognition, missing data analysis, data standardization, and text normalization & Comprehensive analysis of VA clinical notes, addressing multiple data quality issues & May not generalize beyond VA clinical settings, potential issues with data normalization & RF generally outperforms LR; both are sensitive to normalization quality \\

[49] & Social media analytics, text analysis, and emoji analysis & Interdisciplinary approach combining linguistics and cyber psychology, bilingual analysis (English and Arabic) & & Strong in exploratory social/cyber psychology; weak comparability with clinical data \\

[50] & CNN and BoW & Combining structured and text data, high interpretability, better handling of false positives & DL models are prone to overfitting, missing values need to be handled carefully & CNN achieves higher recall, BoW is more interpretable; CNN is $>$ 80\% in EHR but data hungry \\

[51] & LSTM, RF, survey data cleaning, missing data imputation, text normalization, and data labeling & Focus on a specific and important issue, effective for handling sequential data & Limited to a specific population and data type & LSTM is $>$ 80\% accuracy on sequence data; RF is stronger \\

[52] & SVM, NB, text cleaning, NLP, entity recognition, and text normalization & Large-scale data from national healthcare systems, effective for large-scale analysis & Data quality and consistency issues across a large system & SVM is generally more accurate; NB is faster but less robust with heterogeneous data \\

[53] & MentalBERT and processing of EMR data & High precision and recall in capturing PTSD from EMR data, combining structured and unstructured data. & Model performance may vary depending on data quality, requiring extensive preprocessing of EMR data. & BERT-based models have $>$ 85\% F1, state-of-the-art; strong but compute-intensive \\

[54] & ML modeling analysis and data mining & Personalized approach, focus on postpartum PTSD, presented at many conferences & Limited to women's health context, specific to birth experiences & Promising in postpartum data; not easily generalizable outside women's health \\

[55] & LDASeq (dynamic topic modelling) & Identification of time-sensitive suicide risk variables improved over the REACHVET model & Requires large data sets, may not generalize well to smaller cohorts & Works best in longitudinal VA datasets; not reliable for small cohorts \\

Vaswani et al. [32] proposed the use of TF-IDF and n-gram models, in conjunction with verbal feature analysis and text mining techniques, to effectively detect the symptoms of PTSD. While this approach is effective in detecting PTSD symptoms based on self-narratives, it is constrained to self-reported narratives alone. The MedCat framework, developed by Radford et al. [34], employed an ontology-based approach to conceptualize medical notes, thereby facilitating a high level of conceptualization and the interpretation of medical terms. However, there are some limitations to the applicability of this framework [48] examined the use of evidence-based psychotherapy through analysis of electronic medical records and treatment notes, utilizing word frequency analysis and text classification techniques. While this method provides information on evidence-based practices, it remains dependent on accurate documentation. Fodeh et al. [37] automatically classified psychotherapy note texts using SVM and LR techniques with the aid of algorithms in ML. However, with this technique offering an automatic, objective quality assessment method, accuracy in text classification, including comprehensiveness, should be guaranteed. Howard et al. [41] did research on cognitive computational methods for various diagnoses of PTSD, such as semantic analysis and pattern recognition techniques. While these methods offer more accurate diagnoses, they are not without difficulties in terms of complexity and applicability. Fodeh et al. [37] examined the implementation of evidence-based psychotherapies in VA specialty clinics, analyzing both electronic medical records and clinical notes. Although this approach does give an indication that evidence-based practices are effective, there is a need to ensure that such practices are sustainable and documented.

In the work of Pacula et al. [39], audio signal processing and text mining techniques were employed to automatically detect the signs of psychological distress in crisis line conversations. While this method detects symptoms with both speed and accuracy, crisis line conversations are inherently complex, posing a great challenge. Shiner et al. [38] used a DNN for the prediction of mental states from psychiatric notes and retrieved high accuracies with the use of both RNN and CNN models. However, such models require training on large amounts of data. Another novel approach was the heuristic algorithms to identify new patterns from VA text data obtained from electronic medical records; however, the algorithm’s applicability and generalizability are big challenges. In a nutshell, all these papers make a great contribution to the detection and analysis of PTSD, as well as other mental disorders, by applying different NLP techniques. Yet, each method has its strengths and weaknesses depending on the specific context in which it would be put to application, together with the dataset. Therefore, their combination and continuous improvement will go hand in glove with more comprehensive and accurate results.

Several of the reviewed studies in Section 4.1 incorporated internationally recognized standardized diagnostic tools for assessing PTSD. For instance, Shiner et al. [51] utilized both the PTSD Checklist for DSM-IV (PCL-IV) and the PCL-5 (aligned with DSM-5 criteria); Sawalha et al. [55] applied the PCL-C and discussed its correlation with Clinician-Administered PTSD Scale for DSM-5 (CAPS-5), the clinical gold standard; Bartal et al. [56] employed the PCL-5 for postnatal PTSD symptom evaluation. In addition, Zafari et al. [53] classified PTSD cases using the International Classification of Diseases, Ninth Revision, Clinical Modification (ICD-9-CM) code 309.81, and Shiner et al. [38] integrated structured clinical interviews such as CAPS, Structured Clinical Interview for DSM Disorders (SCID), the Diagnostic Interview Schedule, Fourth Edition (DIS-IV), and the Composite International Diagnostic Interview (CIDI). Although not all articles referenced ICD-11 directly, the continued use of ICD-9/10 across large health systems provides clinically valid diagnostic frameworks. Therefore, a significant portion of the analyzed literature demonstrates alignment with established diagnostic standards such as DSM and ICD, adequately supporting PTSD classification within this review context.

The included studies varied in their definition of PTSD symptoms. While the majority relied on DSM-based criteria (primarily DSM-5 in recent studies, with a smaller number using DSM-IV), several studies referred to ICD-10/11 classifications, and others employed validated symptom scales such as PCL or CAPS [57]. Although these approaches are broadly aligned, they are not identical, and this heterogeneity may introduce bias in the comparison of results. To mitigate this, this study explicitly reports the diagnostic frameworks used and emphasizes that future research should adopt standardized definitions, preferably DSM-5 or ICD-11, to ensure comparability across studies.

4.2 Datasets

A variety of datasets have been employed in research on NLP methods used to assess and treat PTSD. An in-depth examination of these datasets is essential to ascertain the efficacy of the methods, their potential applications, and the challenges encountered. The section below presents a summary of the key points regarding the datasets utilized in the articles referenced in Table 11.

Reference & Datasets Used & Data Type & Dataset Size & Dataset Accessibility\\

Reference & Datasets Used & Data Type & Dataset Size & Dataset Accessibility\\

[32] & Verbal features in self-narratives & Text & 159 narratives & Closed \\

[33] & Automated classification of psychotherapy note text & Text & 4,310 notes & Closed \\

[34] & High-level conceptualization of medical notes & Text & 10,000+ notes & Closed \\

[35] & Measuring use of evidence-based psychotherapy for PTSD & Text & 3,191 notes & Closed \\

[36] & Differential diagnosis of PTSD using cognitive computing methods & Text and clinical records & 1,000+ records & Closed \\

[37] & Crisis hotline conversations & Speech & 100 hours & Closed \\

[38] & Evidence-based psychotherapies in VA specialty clinics & Text & 1,000+ notes & Closed \\

[39] & “History of present illness” in psychiatric notes & Text & 3,000+ notes & Closed \\

[40] & Patients' self-narratives & Text & 200+ narratives & Closed \\

[41] & VA electronic medical record texts & Text & 5,000+ records & Closed \\

[42] & Evidence-based psychotherapy trends in a national healthcare system & Text & 19,000+ records & Closed \\

[43] & Evidence-based psychotherapy trends for PTSD in a national healthcare system & Text & 19,000+ records & Closed \\

[44] & Twitter analysis model for PTSD assessment & Social media data & 1,000,00 0+ tweets & Open \\

[45] & NLP tools for assessing veteran populations & Text & 10,000+ records & Closed \\

[46] & Psychiatric assessments and patient records & Text and clinical records & 2,000+ records & Closed \\

[47] & AI language predictors for two-year trauma-related outcomes & Text and clinical records & 4,000+ records & Closed \\

[48] & Social media data from online forums and platforms & Social media data & 500,000+ posts & Open \\

[49] & VA clinical notes & Text & 7,000+ notes & Closed \\

[50] & EHR data from the Manitoba Primary Care Research Network (MaPCReN) of primary care clinicians in Manitoba, Canada. & Text & 154,118 & closed \\

[51] & Child abuse mental symptom cases in India & Survey data & 1,000+ cases & Closed \\

[52] & Pan-Canadian EHR data were used & Short diagnostic text fields and free text encounter notes obtained from some regional networks & 56,795 & Processed with anonymization algorithms and accessible by certain researchers \\

[53] & Data from US national healthcare systems & Text & 25,000+ records & Closed \\

[54] & Used data from 1,127 postpartum women who participated in a research survey conducted during the COVID-19 pandemic & Participants' written accounts of their personal birth experiences, PTSD scales & 1,127 & Available by agreement \\

[55] & It included US VA patients diagnosed with PTSD between 2004 and 2013. & Psychotherapy notes, free text encounter notes & 568 & limited \\

Some studies [39-41] were conducted with patients' own narratives and clinical notes. These data include patients’ PTSD symptoms and the way they express their condition. Such data can be difficult to analyze due to the complexity of language and individual differences. However, NLP and text mining techniques can be used effectively to extract important features from these narratives. Shiner et al. [36] similarly measured the use of evidence-based treatment methods by analyzing clinical notes and psychotherapy texts. Some studies [34-40] were conducted with medical records and EHR data. These datasets contain large amounts of unstructured data and provide extensive information about patients' medical history. Processing such data may present challenges due to the volume and diversity of data, but NLP techniques can be used to extract meaningful information from the data. Studies were conducted with social media and other open-source data. Twitter data was used in the study by Vaswani et al. [32]. Social media data consists of information that users voluntarily share, and the data can reflect real-time emotional states. However, social media data has a high potential to be noisy and misleading, so it is important to use reliable and explainable models in analyzing the data. Some studies were conducted with psychotherapy notes and interviews. For example, psychotherapy notes and crisis line conversations were used [36-37]. Such data are valuable for understanding patients' treatment processes and responses because they involve direct patient-therapist interactions. However, the emotional content and context in the data must be interpreted correctly.

The predominance of closed datasets (e.g., EMR and VA clinical notes) in PTSD research raises challenges for reproducibility and comparability across studies. While such datasets ensure clinical validity, they are often inaccessible to independent researchers due to strict privacy regulations, limiting external validation and generalization of findings. In contrast, open data sources such as social media provide broader accessibility and support replicability, but they introduce challenges related to noise, context validity, and ethical concerns. A balanced approach is required: advanced anonymization techniques, federated learning, and secure data-sharing frameworks can help preserve patient privacy while enabling academic transparency. The establishment of controlled-access repositories with de-identified clinical data may also support reproducibility without compromising confidentiality.

The reliance on closed datasets such as VA clinical records may lead to selection bias, as these sources typically represent specific populations and limit generalization to broader contexts. Conversely, open datasets like Twitter and Reddit provide broader coverage and replicability, but raise ethical concerns (e.g., lack of informed consent) and methodological challenges due to noisy, unstructured, and culturally variable content. Another critical issue is data imbalance, since PTSD-positive cases are often underrepresented compared to negative or control samples. This imbalance can bias models toward majority classes and reduce sensitivity to true PTSD cases. Addressing this challenge requires the use of techniques such as data augmentation, resampling strategies such as Synthetic Minority Over-sampling Technique (SMOTE), cost-sensitive learning, and the integration of synthetic or multimodal data. Such strategies help mitigate bias, improve generalizability, and ensure more ethically robust PTSD detection systems.

4.3 Preprocessing Techniques

The use of NLP techniques and ML algorithms in PTSD research plays an important role in understanding patients’ conditions and improving treatment processes. Table 12 shows the datasets, pre-processing techniques, classification algorithms used, and the results obtained.

Reference & Used Datasets & Preprocessing Techniques & Classification Algorithms & Impact on PTSD Detection / Sensitivity\\

Reference & Used Datasets & Preprocessing Techniques & Classification Algorithms & Impact on PTSD Detection / Sensitivity\\

[32] & Automated classification of psychotherapy note text & Text cleaning, tokenization, entity recognition, and sentiment analysis & SVM and NB & Entity recognition and sentiment analysis improved affective feature extraction, leading to higher sensitivity in therapy notes \\

[33] & Verbal features in self-narratives & Text cleaning, tokenization, lemmatization, and stop word removal & SVM and LR & Lemmatization preserved linguistic meaning; excessive stop-word removal risked losing affective cues (e.g., negations) \\

[34] & Measuring use of evidence-based psychotherapy for PTSD & Text cleaning, NLP, and data standardization & LR and RF & Standardization improved comparability across records, critical for longitudinal consistency \\

[35] & High-level conceptualization of medical notes & Text cleaning, entity recognition, standardization, and text normalization & NB and DT & Entity recognition of trauma-related concepts improved detection; normalization reduced noise \\

[36] & Evidence-based psychotherapies in VA specialty clinics & Text cleaning, data standardization, and missing data analysis & LR and NB & Handling missing data ensured robust outcomes; preprocessing minimized false negatives \\

[37] & Crisis hotline conversations & Text cleaning, speech recognition, language modeling, and data coding & SVM and NB & ASR quality is critical; errors in speech recognition directly reduced PTSD detection sensitivity \\

[38] & Differential diagnosis of PTSD using cognitive computing methods & Text cleaning, data normalization, statistical methods, and data integration & NN and SVM & Normalization and integration improved comparability; NN showed better robustness to preprocessing noise \\

[39] & VA electronic medical record texts & Text cleaning, template extraction, entity recognition, and missing data analysis & Heuristic algorithms and DT & Template extraction improved structured feature capture; entity recognition boosted affective feature detection \\

[40] & Patients' selfnarratives & Text cleaning, tokenization, lemmatization, and stop word removal & SVM and LR & Similar to [32], lemmatization aided consistency, stopword removal sometimes removed emotional words \\

[41] & "History of present illness" in psychiatric notes & Text cleaning, NLP, data coding, and data normalization & DNN and CNN & Normalization essential for DNN/CNN; improved signal-to-noise ratio for affective features \\

[42] & Evidence-based psychotherapy trends in a national healthcare system & Text cleaning, NLP, and data standardization & LR and NB & Standardization critical for multicenter data; ensured stable feature extraction \\

[43] & NLP tools for assessing veteran populations & Text cleaning, NLP, and data standardization & LR and NB & Similar to [42], preprocessing stability improved longitudinal assessments \\

[44] & Twitter analysis model for PTSD assessment & Text cleaning, sentiment analysis, and topic modeling & LR and SVM & Sentiment analysis directly enhanced affective signal detection; noise in tweets remained a challenge \\

[45] & Evidence-based psychotherapy trends for PTSD in a national healthcare system & Text cleaning, NLP, and data standardization & LR and NB & Standardization key for large-scale VA datasets; reduced variability across facilities \\

[46] & EHR data from the MaPCReN & BoW, lemmatization, and TF-IDF & Multi-layered NN, and RF & Lemmatization and TF-IDF improved text vectorization; critical for sparse EHR data \\

[47] & VA clinical notes & Text cleaning, NLP, entity recognition, missing data analysis, data standardization, and text normalization & LR and RF & Entity recognition and normalization improved affective feature extraction and reduced false negatives \\

[48] & Social media data from online forums and platforms & Text cleaning, language detection, sentence and word tokenization, stop word removal, and sentiment analysis for labeling & SVM and NB & Sentiment analysis effective for PTSD signals; stop-word removal risked losing emotional cues \\

[49] & AI language predictors for twoyear trauma-related outcomes & Text cleaning, NLP, and sentiment analysis & NN and LR & Sentiment analysis crucial for affective feature extraction; improved long-term PTSD prediction \\

[50] & Psychiatric assessments and patient records & Text cleaning, NLP, entity recognition, missing data analysis, data standardization, and data normalization & NB and DT & Entity recognition + normalization improved affective extraction; missing data analysis increased robustness \\

[51] & Data from multiple clinical studies and trials & Data cleaning, missing data imputation, statistical normalization, data integration, and data coding and labeling & SVM and NN & Imputation stabilized datasets; normalization reduced bias, NN became more robust \\

[52] & Pan-Canadian EHR data & Stop words removed, special characters removed, and case editing, tokenization, removal of stop words, lemmatization, and TF-IDF & - & Stop-word removal simplified vectors, but risked affective word loss; lemmatization preserved semantics \\

[53] & Child abuse mental symptom cases in India & Survey data cleaning, missing data imputation, text normalization, and data labeling & LSTM and RF & Normalization and labeling essential for sequential data; LSTM performed best on preprocessed data \\

[54] & Data from US national healthcare systems & Text cleaning, NLP, entity recognition, and text normalization & SVM and NB & Entity recognition key for medical concept extraction; normalization improved crosssystem generalization \\

[55] & They provided brief written accounts of their birth experiences. & all-mpnet-base-v2, Deep Feed Forward Neural Network (DFNN), SentenceTransformers & DFNN & Transformer embeddings reduced reliance on preprocessing; better affective capture \\

[58] & US VA patients diagnosed with PTSD between 2004 and 2013. & Tokenization, removing stop words, removing symbols and punctuation, and converting all words to lowercase & Dynamic topic modelling and LDA & Tokenization essential for topic modeling; stop-word removal sometimes removed negations critical for PTSD features \\

The preprocessing techniques employed in these studies are essential for transforming raw text data into a format that is conducive to analysis. These techniques enhance the quality of the data, reducing noise and extracting meaningful information, which is essential for NLP and ML models to perform effectively. The selection of preprocessing techniques is contingent upon the characteristics of the data and the analytical objectives. For instance, in the context of clinical and medical studies, entity recognition and standardization are essential for the extraction and classification of medical terms. In the domain of social media analysis, sentiment analysis and topic modelling are crucial for understanding public opinion and detecting mental health conditions. In general, the judicious choice and implementation of preprocessing techniques are pivotal for the success of text analysis and ML projects.

5. Results and discussion

While this review underscores the potential of NLP techniques in identifying PTSD-related symptoms, it is crucial to delineate the distinction between symptom detection and diagnostic assessment. The studies reviewed herein employed NLP primarily for the identification of linguistic markers and symptomatology associated with PTSD. However, direct diagnostic classification using NLP remains a complex and evolving domain, requiring further validation through clinical datasets and standardized diagnostic tools (e.g., PCL-5, CAPS, and ICD-11). Consequently, this review does not claim that NLP techniques can independently diagnose PTSD but rather highlights their supplementary role in symptom detection and clinical assessment. PTSD is widely recognized as a significant mental health concern. This study was designed to examine the relationship between PTSD research and AI methods, with a particular focus on NLP. Systematic searches were conducted in four major databases: Web of Science, IEEE Xplore, ScienceDirect, and PubMed. The databases were subjected to a comprehensive examination through the application of systematic literature review and bibliometric analysis techniques. With regard to the bibliometric analysis, the Web of Science database was queried with the pertinent keywords, resulting in the retrieval of 4,138 documents. In the context of the systematic literature review, 328 documents were accessed through the use of relevant keywords across four databases, namely Web of Science, IEEE, ScienceDirect and PubMed. The systematic literature review was structured around four research questions, which are outlined in Table 8 (Chapter 3). The first of these, “What are the challenges associated with the utilization of NLP for the classification of PTSD?”, was addressed under the following thematic headings. The corresponding findings are presented in Table 13.

Table 10. Challenges encountered
Challenge CategoryDescription
Data quality and diversityClinical data is often of high quality, whereas data from unstructured sources like social media may have lower quality. This makes it challenging to accurately understand emotional and linguistic contexts.
Linguistic and contextual complexityVariations in language and contextual differences between data sources can make it difficult for NLP techniques to accurately capture emotional and traumatic expressions.
Data security and privacyHandling health data involves significant concerns regarding data security and privacy. Protecting data requires compliance with legal and ethical standards.
Lexical and semantic parsingHighlights the importance of semantic parsing and linguistic features in text. Semantic parsing can affect the accuracy of NLP models, especially as individuals use different linguistic expressions to describe trauma experiences, making the parsing process complex.

Challenges in detecting PTSD using NLP involve several factors, from data quality to the selection of algorithms. Major factors include data cleaning and standardization, linguistic and contextual complexities, dataset size and diversity, choice of classification algorithms, and semantic parsing. Future studies should focus on investigating various strategies and improvements for overcoming these challenges and developing more accurate and reliable NLP-based PTSD detection methods. As for the second research question, “To what extent is AI used in detecting PTSD within the healthcare system?”, the answers can be seen in Table 14.

Table 11. Health system integration
CriterionDescription
Early detection and interventionAI systems can quickly analyze large datasets to detect PTSD symptoms early, which can accelerate early intervention and treatment processes.
Big data analysisAI can process large datasets and identify emotional patterns. It can analyze data from sources such as social media and EHR.
Personalized treatment approachesAI can provide customized treatment recommendations based on individual data and past experiences, making treatment processes more effective.
Data quality and securityThe quality and security of health data are crucial. Concerns about data privacy and security can complicate the protection of personal information.

This holds a number of advantages with regard to health systems for the detection of PTSD using AI. The benefits it confers due to early diagnosis, scalability, personalized treatment, and holistic data analysis can help manage the condition more effectively. However, challenges such as data quality, accuracy of algorithms, cultural and linguistic barriers, and ethical issues also exist. Overcoming these challenges will grant new frontiers of leveraging AI systems into healthcare applications safely and more reliably. As for another question, “What are the datasets used in PTSD detection? What are the challenges of these datasets?”, the answers are shown in Table 15.

The datasets for diagnosing PTSD are full of challenges. EHR consists of patients' medical histories and treatment processes. However, while analyzing these datasets, the main challenges found were those related to a lack of data standards, incomplete data, and data security. Crisis hotline conversations have other issues, which involve personal information protection and diversity in language accommodation. In contrast, social media data is marked by linguistic variations and noisy data that hamper proper classification and analysis. Similarly, psychiatric notes are also linguistically and contextually diverse, which may impact the effectiveness of NLP techniques. All these datasets have other challenges, such as data anonymization and protection of personal information. These challenges may cause problems in most ways of carrying out AI, especially NLP-based methods, for PTSD and highly underline careful processing and standardization of data. Beyond general considerations, the ethical challenges of applying NLP to PTSD data are unique and multi-layered. First, trauma narratives expose both researchers and clinicians to the risk of secondary trauma, underlining the need for careful curation, anonymization, and support mechanisms. Second, algorithmic transparency is critical: PTSD detection tools must provide explainable outputs so that clinicians and patients understand the basis of risk assessments. Third, mining social media data for PTSD research raises issues of informed consent, user privacy, and the potential re-exposure of individuals to trauma content. Although open data enhance replicability, ethical safeguards such as anonymization, adherence to platform policies, and privacy-preserving methods (e.g., differential privacy and federated learning) are essential. Finally, clinical data such as EMR and VA records demand strict data governance and advanced security protocols, as breaches may have severe consequences for vulnerable populations. These considerations highlight that ethical design is not peripheral but central to NLP applications in PTSD. As for the fourth and final question, "What are the AI techniques employed in the treatment of post-PTSD? What are the opportunities and challenges presented by these techniques?", the answers are shown in Table 16.

Table 12. Dataset challenges
DatasetDescriptionChallenges
EHRRecords containing patients' medical histories, treatment processes, and symptoms.Non-standardized data, missing data, data security and privacy issues.
Crisis hotline conversationsCalls and conversations during crisis situations.Protection of personal information, data anonymization, and diversity in spoken language.
Social media dataMessages and posts collected from social media platforms.Variability in data quality, linguistic variation, and lack of context.
Psychiatric notesNotes written by psychiatrists about patients.Linguistic and contextual diversity, and lack of standardized data.
Medical notes and reportsVarious medical reports and notes about patients.Data heterogeneity, and missing or ambiguous labels.
Twitter and Reddit dataMessages and comments from users on social media.Data noise, linguistic complexity, and mislabeling.
Table 13. Opportunities and challenges of AI techniques used for PTSD
AI techniqueUsageOpportunitiesChallenges
NLPAnalysis of patient reports, psychiatry notes, and social media data.Extracting meaningful information from large datasets, and developing early warning systemsData heterogeneity, linguistic variations, contextual differences, and protection of personal data.
MLSymptom prediction and classification.Learning capacity from large datasets, and accurate symptom classification.Data quality and quantity, model interpretability, and generalization ability.
DLExtracting complex features from text and speech data.Capturing complex symptom models and high performance on large datasets.High computational power and data requirements and model interpretability issues.
Probabilistic modelsIdentifying latent topics and semantic structures.Understanding hidden structures and topics in data, and meaningful representation of texts.Data preprocessing, hyperparameter tuning, and interpretability of results.

Application of AI techniques shows great promise in detecting and treating PTSD, though it is not an obstacle-free territory. Techniques like NLP, ML, DL, and probabilistic models can bring about improvement in the management of PTSD. However, data quality issues, concerns pertaining to privacy, and model explainability might hamper the effectiveness of such techniques. Therefore, the integration of AI applications requires careful assessment and planning in order to be effectively realized. Articles under review indicated a different level of influence that NLP had on the detection and analysis of PTSD. Some common methods followed in general involve text cleaning, tokenization, lemmatization, and many other types of classification algorithms. The most common algorithms adopted include SVM and LR. Other research also went deep to conduct more advanced DNN and CNN techniques. Various strengths can be found in the high-performance models. Most of the articles use a high-performance model for the detection of PTSD. In particular, methods such as DNN and CNN have been demonstrated to be effective in understanding complex patterns and relationships. For instance, [29] attained favorable outcomes through the utilization of DL techniques. The utilization of extensive data sets is a further strength. The utilization of extensive data sets enhances the model's capacity for generalization. The findings of [30], which were obtained using large-scale health data, serve to emphasize the importance of large data sets. A very critical cleaning and preprocessing of data must be performed in order for the quality and reliability of a data set to be present. Effective cleaning and preprocessing techniques employed in articles enhanced the performance of models. Among those, especially, text preprocessing techniques like cleaning, tokenization, and removal of stop words proved very effective to enhance the accuracy of results.

As summarized in Table 10, classical ML models such as SVM and LR are effective for small, structured datasets, while DL models (CNN, LSTM, and DNN) achieve higher accuracy in complex or sequential data but require extensive resources. Transformer-based models (e.g., MentalBERT) currently demonstrate the best performance in EMR-based studies, though they are dependent on large annotated corpora. Thus, model selection in PTSD detection should be guided by dataset size, structure, and computational resources. The aspects below also need more emphasis. Another source of worry is the quality and diversity of data. Quite a good number of studies have reported constraints regarding the quality and diversity of data. In particular, the limited size or scope of the data sets may affect the model's ability to generalize. For example, Church [20] obtained limited results using a small data set. The deployment of DL methodologies necessitates the availability of substantial computational resources and data processing capabilities. This may be a limitation in small-scale studies or projects with limited resources [26]. While the benefits of using NLP techniques in PTSD analysis are apparent, a host of challenges includes data quality issues, generalization ability, and computational requirements. Future performance enhancement to result in higher accuracy may only be realized once larger data sets and more sources of data have been utilized. Moreover, new computational power enables the methods to be applied on a wider array of data and enhances the NLP techniques themselves.

The impact of preprocessing steps on PTSD detection performance varies across data types. For example, entity recognition plays a crucial role in extracting trauma-specific concepts (e.g., “combat” and “assault”), thereby improving the sensitivity of affective feature extraction. Lemmatization and normalization reduce linguistic variability and are particularly beneficial in morphologically rich languages or noisy social media data. Conversely, aggressive stop-word removal may inadvertently eliminate emotionally charged words (e.g., “never” and “alone”), thus reducing classification sensitivity. This suggests that preprocessing pipelines should be carefully tailored. While general cleaning improves robustness, certain steps such as entity recognition and normalization are critical for effective feature capture in PTSD detection.

Although NLP technologies show promise in supporting personalized PTSD treatment, their clinical applicability remains limited. Most current models are at the research stage and have not undergone prospective clinical validation. In practice, NLP can complement existing diagnostic tools such as PCL-5 and CAPS by automatically screening EMR notes or therapy transcripts for symptom patterns, thereby reducing clinician burden. However, integration into clinical workflows requires addressing key barriers, including physician acceptance, regulatory approval, and trust issues arising from inadequate model interpretability. Pilot projects, such as NLP-assisted EMR screening initiatives in VA hospitals, illustrate potential pathways, yet broader deployment will depend on ensuring transparency, explainability, and secure integration into electronic health record systems.

6. Future Work

Results obtained from this study serve as a very good insight into the state of analyzing PTSD with NLP techniques. Nevertheless, the following recommendations could further develop the research of the subject in an area of its limitation to explore future studies.

$\bullet$ Diversity of data and its coverage: Larger and more diverse data should be used in the future. Studies have focused their attention on data sources such as social media and medical records. Data from diverse cultural and geographical regions can enable models to provide wider generalization, and therefore model validity assessments can be realized in a much larger population.

$\bullet$ Advanced NLP methods: The technique is ever-evolving in the field of NLP. With the introduction of DL methodologies and the rise of large language models, such as GPT-4 and BERT, the possibility for more advanced forms of analysis becomes possible. It is recommended that future studies investigate the potential of these advanced NLP techniques in the context of PTSD detection and further explore how such methods can be operationalized in practical applications.

$\bullet$ Data quality and ethics: While improving data quality, ethical aspects also require stronger standards in collecting and treating data. Most importantly, this involves ensuring that ethical legislation and privacy standards are guaranteed during the processing of personal and sensitive information. Moreover, standardized cleaning and preprocessing methods of data can sometimes help in enhancing the performance of the models as well.

$\bullet$ Multimodal data usage: Future research can make use of multimodal datasets that include audio, images, and other forms of data in addition to text data. Available data in this regard can help gain deep insights into the psychological state of subjects and perhaps will be more useful for the analytics involved.

Future work should focus on the integration of multimodal data (e.g., text, voice, and physiological signals) to improve the robustness of PTSD detection. However, multimodal integration faces specific challenges. Heterogeneity across modalities requires synchronization and representation learning that can bridge linguistic, acoustic, and physiological features. Moreover, labeling multimodal datasets is resource-intensive, as expert annotation is needed for both clinical and affective cues. Possible technical pathways include early, late, and hybrid fusion strategies, as well as the use of self-supervised multimodal models that reduce annotation costs. Pilot projects could involve collecting text and voice data from therapy sessions or crisis hotlines, supplemented with wearable sensor data, to test the feasibility of multimodal PTSD detection in real-world settings.

Author Contributions

Conceptualization, E.S. and E.Y.; Methodology, E.S. and E.Y.; Software, E.S.; Validation, E.Y.; Formal Analysis, E.S.; Investigation, E.S. and E.Y.; Data Curation, E.S.; Writing—Original Draft Preparation, E.S.; Writing—Review and Editing: E.S. and E.Y.; Visualization, E.S.; Supervision, E.Y.; Project Administration, E.S.; Funding Acquisition, E.S. All authors have read and agreed to the published version of the manuscript and consented to its submission to ATAIML (Advances in Technology and Artificial Intelligence in Machine Learning).

Conflicts of Interest

The authors declare no conflict of interest.

References
@article@book{1,title={World mental health report: {T}ransforming mental health for all},author={{World Health Organization}},year={2022}}.
@article{2,title={Global prevalence of past-year violence against children: {A} systematic review and minimum estimates},author={Hillis, S. and Mercy, J. and Amobi, A. and Kress, H.},journal={Pediatrics},volume={137},number={3},pages={e20154079},year={2016},doi={10.1542/peds.2015-4079},url={}}. [Crossref]
@article{3,title={Childhood adversities and adult psychiatric disorders in the national comorbidity survey replication {II}: {A}ssociations with persistence of {DSM-IV} disorders},author={McLaughlin, K. A. and Green, J. G. and Gruber, M. J. and Sampson, N. A. and Zaslavsky, A. M. and Kessler, R. C.},journal={Arch. Gen. Psychiatry.},volume={67},number={2},pages={124-132},year={2010},doi={10.1001/archgenpsychiatry.2009.187},url={}}. [Crossref]
@article{4,title={The consequences of the {COVID}-19 pandemic on mental health and implications for clinical practice},author={Fiorillo, A. and Gorwood, P.},journal={Eur. Psychiatry},volume={63},number={1},pages={e32},year={2020},doi={10.1192/j.eurpsy.2020.35},url={}}. [Crossref]
@article{5,title={Barriers to treatment for mental disorders in six countries of the {A}mericas: {A} regional report from the {World Mental Health Surveys}},author={Orozco, R. and Vigo, D. and Benjet, C. and Borges, G. and Aguilar-Gaxiola, S. and Andrade, L. H. and Cia, A. and Hwang, I. and Kessler, R. C. and Piazza, M. and others},journal={J. Affect. Disord.},volume={303},pages={273-285},year={2022},doi={10.1016/j.jad.2022.02.031},url={}}. [Crossref]
@article{6,title={A meta-analysis of mentalizing in anxiety disorders, obsessive-compulsive and related disorders, and trauma and stressor related disorders},author={Sloover, M. and van Est, L. A. C. and Janssen, P. G. J. and Hilbink, M. and van Ee, E.},journal={J. Anxiety Disord.},volume={92},pages={102641},year={2022},doi={10.1016/j.janxdis.2022.102641},url={}}. [Crossref]
@article{7,title={The epidemiology of {DSM-5} posttraumatic stress disorder in the {U}nited {S}tates: {R}esults from the National Epidemiologic Survey on Alcohol and Related Conditions-III},author={Goldstein, R. B. and Smith, S. M. and Chou, S. P. and Saha, T. D. and Jung, J. and Zhang, H. T. and Pickering, R. P. and Huang, B. J. and Grant, B. F.},journal={Soc. Psychiatry Psychiatr. Epidemiol.},volume={51},number={8},pages={1137-1148},year={2016},doi={10.1007/s00127-016-1208-5},url={}}. [Crossref]
@article{8,title={{ELIZA}—{A} computer program for the study of natural language communication between man and machine},author={Weizenbaum, J.},journal={Commun. ACM},volume={9},number={1},pages={36-45},year={1966},doi={10.1145/365153.365168},url={}}. [Crossref]
@article{9,title={The {PRISMA} statement for reporting systematic reviews and meta-analyses of studies that evaluate health care interventions: {E}xplanation and elaboration},author={Liberati, A. and Altman, D. G. and Tetzlaff, J. and Mulrow, C. and Gøtzsche, P. C. and Ioannidis, J. P. and Clarke, M. and Devereaux, P. J. and Kleijnen, J. and Moher, D.},journal={Ann. Intern. Med.},volume={151},number={4},pages={W65-W94},year={2009},doi={10.7326/0003-4819-151-4-200908180-00136},url={}}. [Crossref]
@article{10,title={Software survey: {VOS}viewer, a computer program for bibliometric mapping},author={van Eck, N. J. and Waltman, L.},journal={Scientometrics},volume={84},pages={523-538},year={2009},doi={10.1007/s11192-009-0146-3},url={}}. [Crossref]
@article{11,title={The {PRISMA} 2020 statement: {A}n updated guideline for reporting systematic reviews},author={Page, M. J. and McKenzie, J. E. and Bossuyt, P. M. and Boutron, I. and Hoffmann, T. C. and Mulrow, C. D. and Shamseer, L. and Tetzlaff, J. M. and Akl, E. A. and Brennan, S. E. and others},journal={BMJ},volume={372},year={2021},doi={10.1136/bmj.n71},url={}}. [Crossref]
@article{12,title={Preliminary guideline for reporting bibliometric reviews of the biomedical literature ({BIBLIO}): {A} minimum requirements},author={Montazeri, A. and Mohammadi, S. and Hesari, P. M. and Ghaemi, M. and Riazi, H. and Sheikhi-Mobarakeh, Z.},journal={Syst. Rev.},volume={12},number={1},pages={239},year={2023},doi={10.1186/s13643-023-02410-2},url={}}. [Crossref]
@article{13,title={Coauthorship networks and patterns of scientific collaboration},author={Newman, M. E. J.},journal={Proceedings of the National Academy of Sciences},volume={101},pages={5200-5205},year={2004},doi={10.1073/PNAS.0307545100},url={}}. [Crossref]
@article{14,title={Guidelines from the heritage field for the integration of landscape and heritage planning: {A} systematic literature review},author={Sánchez, M. L. and Cabrera, A. T. and Del Pulgar, M. L. G.},journal={Landsc. Urban. Plan.},volume={204},pages={103931},year={2021},doi={10.1016/j.landurbplan.2020.103931},url={}}@inproceedings{15,title={Distributed Representations of Words and Phrases and their Compositionality},author={Mikolov, T. and Sutskever, I. and Chen, K. and Corrado, G. S. and Dean, J.},journal={Advances in Neural Information Processing Systems(NIPS 2013)},volume={26},year={2013},url={https://proceedings.neurips.cc/paper_files/paper/2013/file/9aa42b31882ec039965f3c4923ce901b-Paper.pdf}}. [Crossref]
@article{16,title={From frequency to meaning: {V}ector space models of semantics},author={Turney, P. D. and Pantel, P.},journal={J. Artif. Intell. Res.},volume={37},pages={141-188},year={2010},doi={10.1613/jair.2934},url={}}. [Crossref]
@article{17,title={A survey of outlier detection methodologies},author={Hodge, V. J. and Austin, J.},journal={Artif. Intell. Rev.},volume={22},pages={85-126},year={2004},doi={10.1023/b:aire.0000045502.10941.a9},url={}}. [Crossref]
@article{18,title={Term-weighting approaches in automatic text retrieval},author={Salton, G. and Buckley, C.},journal={Inf. Process. Manag.},volume={24},number={5},pages={513-523},year={1988},doi={10.1016/0306-4573(88)90021-0},url={}}. [Crossref]
@article{19,title={N-gram-based text categorization},author={Cavnar, W. B. and Trenkle, J. M.},journal={Proceedings of SDAIR-94, 3rd annual symposium on document analysis and information retrieval},volume={161175},pages={14},year={1994}}.
@article{20,title={Word2{V}ec},author={Church, K. W.},journal={Nat. Lang. Eng.},volume={23},number={1},pages={155-162},year={2017},doi={10.1017/S1351324916000334},url={}}@inproceedings{21,title={Glo{V}e: {G}lobal Vectors for Word Representation},author={Pennington, J. and Socher, R. and Manning, C. D.},journal={Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP)},pages={1532-1543},year={2014},url={https://aclanthology.org/D14-1162.pdf}}@inproceedings{22,title={Text Classification Model Based on fast{T}ext},author={Yao, T. J. and Zhai, Z. G. and Gao, B. T.},journal={2020 IEEE International conference on artificial intelligence and information systems (ICAIIS)},pages={154-157},year={2020},doi={10.1109/ICAIIS49377.2020.9194939},url={https://doi.org/10.1109/ICAIIS49377.2020.9194939}}. [Crossref]
@article{23,title={A neural probabilistic language model},author={Bengio, Y. and Ducharme, R. and Vincent, P. and Jauvin, C.},journal={J. Mach. Learn. Res.},volume={3},pages={1137-1155},year={2003}}.
@article{24,title={Information Retrieval Based upon Latent Class Analysis},author={Baker, F. B.},journal={J. ACM},volume={9},number={4},pages={512-521},year={1962},doi={10.1145/321138.321148},url={}}. [Crossref]
@article{25,title={Latent Dirichlet allocation: {E}xtracting topics from software engineering data},author={Campbell, J. C. and Hindle, A. and Stroulia, E.},journal={The Art and Science of Analyzing Software Data},pages={139-159},year={2015},doi={10.1016/B978-0-12-411519-4.00006-9},url={}}. [Crossref]
@article{26,title={Text Representation for Sentiment Analysis: {F}rom Static to Dynamic},author={Gavali, P. M. and Shiragave, S. K.},journal={2023 3rd International Conference on Smart Data Intelligence (ICSMDI)},pages={99-105},year={2023},doi={10.1109/ICSMDI57622.2023.00025},url={}}. [Crossref]
@article{27,title={Context2{V}ec: {L}earning generic context embedding with bidirectional {LSTM}},author={Melamud, O. and Goldberger, J. and Dagan, I.},journal={Proceedings of the 20th SIGNLL conference on computational natural language learning},pages={51-61},year={2016},doi={10.18653/v1/k16-1006},url={}}@inproceedings{28,title={Contextualized context2{V}ec},author={Ashihara, K. and Kajiwara, T. and Arase, Y. and Uchida, S.},journal={Proceedings of the 5th Workshop on Noisy User-generated Text (W-NUT 2019)},pages={397-406},year={2019},doi={10.18653/V1/D19-5552},url={https://doi.org/10.18653/V1/D19-5552}}. [Crossref]
@article{29,title={Learned in translation: {C}ontextualized word vectors},author={McCann, B. and Bradbury, J. and Xiong, C. and Socher, R.},journal={Advances in Neural Information Processing Systems 30 (NIPS 2017)},year={2017},url={https://proceedings.neurips.cc/paper_files/paper/2017/file/20c86a628232a67e7bd46f76fba7ce12-Paper.pdf}}@incollection{30,title={Long Short-Term Memory},author={Graves, A.},booktitle={Supervised Sequence Labelling with Recurrent Neural Networks},publisher={Springer},pages={37-45},year={2012},doi={10.1007/978-3-642-24797-2_4},url={}}. [Crossref]
@article{31,title={Bidirectional recurrent neural networks},author={Schuster, M. and Paliwal, K. K.},journal={IEEE Trans. Signal Process.},volume={45},number={11},pages={2673-2681},year={1997}}@inproceedings{32,title={Attention is all you need},author={Vaswani, A. and Shazeer, N. and Parmar, N. and Uszkoreit, J. and Jones, L. and Gomez, A. N. and Kaiser, L. and Polosukhin, I.},booktitle={Advances in Neural Information Processing Systems (NIPS 2017)},volume={30},year={2017}}@inproceedings{33,title={Bert: {P}re-training of deep bidirectional transformers for language understanding},author={Devlin, J. and Chang, M. W. and Lee, K. and Toutanova, K.},booktitle={Proceedings of the 2019 conference of the North American chapter of the association for computational linguistics: human language technologies},pages={4171-4186},year={2019},doi={10.18653/v1/n19-1423},url={}}. [Crossref]
@article{34,title={Language models are unsupervised multitask learners},author={Radford, A. and Wu, J. and Child, R. and Luan, D. and Amodei, D. and Sutskever, I.},journal={OpenAI Blog},volume={1},number={8},pages={9},year={2019},url={https://storage.prod.researchhub.com/uploads/papers/2020/06/01/language-models.pdf}}.
@article{35,title={Screening for posttraumatic stress disorder using verbal features in self narratives: {A} text mining approach},author={He, Q. and Veldkamp, B. P. and de Vries, T.},journal={Psychiatry Res.},volume={198},number={3},pages={441-447},year={2012},doi={10.1016/j.psychres.2012.01.032},url={}}. [Crossref]
@article{36,title={Automated classification of psychotherapy note text: {I}mplications for quality assessment in {PTSD} care},author={Shiner, B. and D’Avolio, L. W. and Nguyen, T. M. and Zayed, M. H. and Watts, B. V. and Fiore, L.},journal={J. Eval. Clin. Pract.},volume={18},number={3},pages={698},year={2012},doi={10.1111/j.1365-2753.2011.01634.x},url={}}. [Crossref]
@article{37,title={{MedCat}: {A} framework for high level conceptualization of medical notes},author={Fodeh, S. J. and Zirkle, M. and Finch, R. and Reeves, J. and Erdos, C. and Brandt, C.},journal={2013 IEEE 13th International Conference on Data Mining Workshops},pages={274-280},year={2013},doi={10.1109/ICDMW.2013.89},url={}}. [Crossref]
@article{38,title={Measuring use of evidence based psychotherapy for posttraumatic stress disorder},author={Shiner, B. and D’Avolio, L. W. and Nguyen, T. M. and Zayed, M. H. and Young-Xu, Y. and Desai, R. A. and Schnurr, P. P. and Fiore, B. V. and Watts, B. V.},journal={Adm. Policy Ment. Health},volume={40},number={4},pages={311-318},year={2013},doi={10.1007/s10488-012-0421-0},url={}}. [Crossref]
@article{39,title={Automatic detection of psychological distress indicators and severity assessment in crisis hotline conversations},author={Pacula, M. and Meltzer, T. and Crystal, M. and Srivastava, A. and Marx, B.},journal={2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},pages={4863-4867},year={2014},doi={10.1109/ICASSP.2014.6854526},url={}}. [Crossref]
@article{40,title={Implementation of evidence-based psychotherapies for posttraumatic stress disorder in {VA} specialty clinics},author={Watts, B. V. and Shiner, B. and Zubkoff, L. and Carpenter-Song, E. and Ronconi, J. M. and Coldwell, C. M.},journal={Psychiatr. Serv.},volume={65},number={5},pages={648-653},year={2014},doi={10.1176/appi.ps.201300176},url={}}. [Crossref]
@article{41,title={Towards a differential diagnostic of {PTSD} using cognitive computing methods},author={Howard, N. and Jehel, L. and Arnal, R.},journal={2014 IEEE 13th International Conference on Cognitive Informatics and Cognitive Computing},pages={9-20},year={2014},doi={10.1109/ICCI-CC.2014.6921435},url={}}. [Crossref]
@article{42,title={Automated assessment of patients’ self-narratives for posttraumatic stress disorder screening using natural language processing and text mining},author={He, Q. and Veldkamp, B. P. and Glas, C. A. W. and de Vries, T.},journal={Assessment},volume={24},number={2},pages={157-172},year={2015},doi={10.1177/1073191115602551},url={}}. [Crossref]
@article{43,title={A pilot study of a heuristic algorithm for novel template identification from {VA} electronic medical record text},author={Redd, A. M. and Gundlapalli, A. V. and Divita, G. and Carter, M. E. and Tran, L. T. and Samore, M. H.},journal={J. Biomed. Inform.},volume={71},pages={S68-S76},year={2017},doi={10.1016/j.jbi.2016.07.019},url={}}. [Crossref]
@article{44,title={Predicting mental conditions based on “history of present illness” in psychiatric notes with deep neural networks},author={Tran, T. and Kavuluru, R.},journal={J. Biomed. Inform.},volume={75},pages={S138-S148},year={2017},doi={10.1016/j.jbi.2017.06.010},url={}}. [Crossref]
@article{45,title={Measuring use of evidence based psychotherapy for posttraumatic stress disorder in a large national healthcare system},author={Maguen, S. and Madden, E. and Patterson, O. V. and DuVall, S. L. and Goldstein, L. A. and Burkman, K. and Shiner, B.},journal={Adm. Policy Ment. Health},volume={45},number={4},pages={519-529},year={2018},doi={10.1007/S10488-018-0850-5},url={}}. [Crossref]
@article{46,title={Natural language processing tools for assessing progress and outcome of two veteran populations: {C}ohort study from a novel online intervention for posttraumatic growth},author={Norman, K. P. and Govindjee, A. and Norman, S. R. and Godoy, M. and Cerrone, D. W. and Kieschnick, W. and Kassler, W.},journal={JMIR Form. Res.},volume={4},number={e17424},year={2020},doi={10.2196/17424},url={}}. [Crossref]
@article{47,title={{LAXARY}: {A} trustworthy explainable {T}witter analysis model for post-traumatic stress disorder assessment},author={Alam, M. A. and Kapadia, D.},journal={2020 IEEE International Conference on Smart Computing (SMARTCOMP)},pages={308-313},year={2020},doi={10.1109/SMARTCOMP50058.2020.00069},url={}}. [Crossref]
@article{48,title={Evidence-based psychotherapy trends among posttraumatic stress disorder patients in a national healthcare system, 2001–2014},author={Maguen, S. and Holder, N. and Madden, E. and Li, Y. and Seal, K. H. and Neylan, T. C. and Lujan, O. V. and Patterson, S. L. and DuVall, B. and Shiner, B.},journal={Depress. Anxiety},volume={37},number={4},pages={356-364},year={2020},doi={10.1002/da.22983},url={}}. [Crossref]
@article{49,title={Multi-aspect transfer learning for detecting low resource mental disorders on social media},author={Uban, A. S. and Chulvi, B. and Rosso, P.},journal={Proceedings of the Thirteenth Language Resources and Evaluation Conference},pages={3202-3219},year={2022}}.
@article{50,title={Artificial intelligence language predictors of two-year trauma-related outcomes},author={Oltmanns, J. R. and Schwartz, H. A. and Ruggero, C. and Son, J. and Miao, M. and Waszczuk, S. A. P. and Clouston, E. J. and Bromet, B. J. and Luft, R. and Kotov, R.},journal={J. Psychiatr. Res.},volume={143},pages={239-245},year={2021},doi={10.1016/j.jpsychires.2021.09.015},url={}}. [Crossref]
@article{51,title={Improvements to {PTSD} quality metrics with natural language processing},author={Shiner, B. and Levis, M. and V. M. Dufort, O. V. and Patterson, B. V. and Watts, S. L. and DuVall, C. J. and Russ, S. and Maguen, B.},journal={J Eval. Clin. Pract.},volume={28},number={4},pages={520-530},year={2022},doi={10.1111/jep.13587},url={}}@inproceedings{52,title={Detecting and inoculating against {PTSD} in online forums and platforms},author={Shurafa, C.},booktitle={2021 8th International Conference on Behavioral and Social Computing (BESC)},pages={1-3},year={2021},doi={10.1109/BESC53957.2021.9635325},url={https://doi.org/10.1109/BESC53957.2021.9635325}}. [Crossref]
@article{53,title={Diagnosing post-traumatic stress disorder using electronic medical record data},author={Zafari, H. and Kosowan, L. and Zulkernine, F. and Signer, A.},journal={Health Inform. J.},volume={27},number={4},year={2021},doi={10.1177/14604582211053259},url={}}@inproceedings{54,title={Child abuse mental symptom prediction model using machine learning techniques},author={Elankeerthana, R. and Hanshiya, D. and Pranavajothi, A. and Shanmugapriya, S.},booktitle={2022 6th International Conference on Trends in Electronics and Informatics (ICOEI)},pages={1459-1465},year={2022},doi={10.1109/ICOEI53556.2022.9777138},url={https://doi.org/10.1109/ICOEI53556.2022.9777138}}. [Crossref]
@article{55,title={Detecting presence of {PTSD} using sentiment analysis from text data},author={Sawalha, J. and Yousefnezhad, M. and Shah, Z. and Brown, M. R. G. and Greenshaw, A. J. and Greiner, R.},journal={Front. Psychiatry},volume={12},pages={811392},year={2022},doi={10.3389/fpsyt.2021.811392},url={}}. [Crossref]
@article{56,title={Pan-Canadian electronic medical record diagnostic and unstructured text data for capturing {PTSD}: {R}etrospective observational study},author={Kosowan, L. and Singer, A. and Zulkernine, F. and Zafari, H. and Nesca, M. and Muthumuni, D.},journal={JMIR Med. Inform.},volume={10},number={12},pages={e41312},year={2022},doi={10.2196/41312},url={}}. [Crossref]
@article{57,title={Identifying women with postdelivery posttraumatic stress disorder using natural language processing of personal childbirth narratives},author={Bartal, A. and Jagodnik, K. M. and Chan, S. J. and Babu, M. S. and Dekel, S.},journal={Am. J. Obstet. Gynecol. MFM},volume={5},number={3},pages={100834},year={2023},doi={10.1016/j.ajogmf.2022.100834},url={}}. [Crossref]
@article{58,title={Dynamic suicide topic modelling: {D}eriving population-specific, psychosocial and time-sensitive suicide risk variables from electronic health record psychotherapy notes},author={Levis, M. and Levy, J. and Dufort, V. and Russ, C. J. and Shiner, B.},journal={Clin. Psychol. Psychother.},volume={30},number={4},pages={795-810},year={2023},doi={10.1002/cpp.2842},url={}}. [Crossref]

Cite this:
APA Style
IEEE Style
BibTex Style
MLA Style
Chicago Style
GB-T-7714-2015
Seven, E. & Yucel, E. (2025). Natural Language Processing for PTSD Detection: A Systematic Review and Bibliometric Analysis. Acadlore Trans. Mach. Learn., 4(4), 263-290. https://doi.org/10.56578/ataiml040404
E. Seven and E. Yucel, "Natural Language Processing for PTSD Detection: A Systematic Review and Bibliometric Analysis," Acadlore Trans. Mach. Learn., vol. 4, no. 4, pp. 263-290, 2025. https://doi.org/10.56578/ataiml040404
@review-article{Seven2025NaturalLP,
title={Natural Language Processing for PTSD Detection: A Systematic Review and Bibliometric Analysis},
author={Engin Seven and Eylem Yucel},
journal={Acadlore Transactions on AI and Machine Learning},
year={2025},
page={263-290},
doi={https://doi.org/10.56578/ataiml040404}
}
Engin Seven, et al. "Natural Language Processing for PTSD Detection: A Systematic Review and Bibliometric Analysis." Acadlore Transactions on AI and Machine Learning, v 4, pp 263-290. doi: https://doi.org/10.56578/ataiml040404
Engin Seven and Eylem Yucel. "Natural Language Processing for PTSD Detection: A Systematic Review and Bibliometric Analysis." Acadlore Transactions on AI and Machine Learning, 4, (2025): 263-290. doi: https://doi.org/10.56578/ataiml040404
SEVEN E, YUCEL E. Natural Language Processing for PTSD Detection: A Systematic Review and Bibliometric Analysis[J]. Acadlore Transactions on AI and Machine Learning, 2025, 4(4): 263-290. https://doi.org/10.56578/ataiml040404
cc
©2025 by the author(s). Published by Acadlore Publishing Services Limited, Hong Kong. This article is available for free download and can be reused and cited, provided that the original published version is credited, under the CC BY 4.0 license.