Identifying Suicide-Related Language in Smartphone Keyboard Entries Among High-Risk Adolescents. Bloom, P., Treves, I., Pagliaccio, D., Nadel, I., Wool, E., Quinones, H., Greenblatt, J., Parjane, N., Durham, K., Salem, S., Trivedi, E., Galfalvy, H., Allen, N., Barch, D., Blanchard, A., Brent, D., Chernick, L., Dayan, P., Hoyniak, C., Joyce, K., Kirshenbaum, J., Li, L. Y., Luby, J., Porta, G., Saha, K., Shankman, S., Schwartz, A., Shimgekar, S., Zelazny, J., & Auerbach, R. September, 2025.
Paper doi abstract bibtex Adolescent suicide rates have risen over the past two decades, underscoring the need for improved strategies to detect risk. This study leverages passively collected smartphone data to identify suicide-related language in adolescents’ keyboard usage using natural language processing. We developed a youth suicide lexicon for adolescent language and validated it with labeled data (N=121,515 entries), demonstrating higher sensitivity and precision than lexicons not designed for youth. Across two independent cohorts at elevated suicide risk (Ns=208 and 211; >6 million text entries), both lifetime suicidal thoughts and behaviors and current suicidal ideation were associated with increased frequency of smartphone suicide-related language. Human coding indicated varied language—e.g., serious expressions of active suicidal ideation, jokes, hyperbole, and expressing support for others. Most suicide-related entries did not express serious current first-person suicidal ideation, underscoring the need for improved approaches to distinguish intent. Findings highlight both the promise and limitations of NLP approaches for suicide prevention.
@misc{bloom_identifying_2025,
title = {Identifying {Suicide}-{Related} {Language} in {Smartphone} {Keyboard} {Entries} {Among} {High}-{Risk} {Adolescents}},
url = {https://osf.io/gfa7h_v1},
doi = {10.31234/osf.io/gfa7h_v1},
abstract = {Adolescent suicide rates have risen over the past two decades, underscoring the need for improved strategies to detect risk. This study leverages passively collected smartphone data to identify suicide-related language in adolescents’ keyboard usage using natural language processing. We developed a youth suicide lexicon for adolescent language and validated it with labeled data (N=121,515 entries), demonstrating higher sensitivity and precision than lexicons not designed for youth. Across two independent cohorts at elevated suicide risk (Ns=208 and 211; \>6 million text entries), both lifetime suicidal thoughts and behaviors and current suicidal ideation were associated with increased frequency of smartphone suicide-related language. Human coding indicated varied language—e.g., serious expressions of active suicidal ideation, jokes, hyperbole, and expressing support for others. Most suicide-related entries did not express serious current first-person suicidal ideation, underscoring the need for improved approaches to distinguish intent. Findings highlight both the promise and limitations of NLP approaches for suicide prevention.},
language = {en-us},
urldate = {2025-09-18},
publisher = {OSF},
author = {Bloom, Paul and Treves, Isaac and Pagliaccio, David and Nadel, Isabella and Wool, Emma and Quinones, Hayley and Greenblatt, Julia and Parjane, Natalia and Durham, Katherine and Salem, Samantha and Trivedi, Esha and Galfalvy, Hanga and Allen, Nicholas and Barch, Deanna and Blanchard, Ashley and Brent, David and Chernick, Lauren and Dayan, Peter and Hoyniak, Caroline and Joyce, Karla and Kirshenbaum, Jaclyn and Li, Lilian Y. and Luby, Joan and Porta, Giovanna and Saha, Koustuv and Shankman, Stewart and Schwartz, Adela and Shimgekar, Soorya and Zelazny, Jamie and Auerbach, Randy},
month = sep,
year = {2025},
keywords = {smartphone, adolescent, language, suicide, mobile sensing, passive, lexicon, nlp, STB},
}
Downloads: 0
{"_id":"aWaE4ioZ7vB5kwd3G","bibbaseid":"bloom-treves-pagliaccio-nadel-wool-quinones-greenblatt-parjane-etal-identifyingsuiciderelatedlanguageinsmartphonekeyboardentriesamonghighriskadolescents-2025","author_short":["Bloom, P.","Treves, I.","Pagliaccio, D.","Nadel, I.","Wool, E.","Quinones, H.","Greenblatt, J.","Parjane, N.","Durham, K.","Salem, S.","Trivedi, E.","Galfalvy, H.","Allen, N.","Barch, D.","Blanchard, A.","Brent, D.","Chernick, L.","Dayan, P.","Hoyniak, C.","Joyce, K.","Kirshenbaum, J.","Li, L. Y.","Luby, J.","Porta, G.","Saha, K.","Shankman, S.","Schwartz, A.","Shimgekar, S.","Zelazny, J.","Auerbach, R."],"bibdata":{"bibtype":"misc","type":"misc","title":"Identifying Suicide-Related Language in Smartphone Keyboard Entries Among High-Risk Adolescents","url":"https://osf.io/gfa7h_v1","doi":"10.31234/osf.io/gfa7h_v1","abstract":"Adolescent suicide rates have risen over the past two decades, underscoring the need for improved strategies to detect risk. This study leverages passively collected smartphone data to identify suicide-related language in adolescents’ keyboard usage using natural language processing. We developed a youth suicide lexicon for adolescent language and validated it with labeled data (N=121,515 entries), demonstrating higher sensitivity and precision than lexicons not designed for youth. Across two independent cohorts at elevated suicide risk (Ns=208 and 211; >6 million text entries), both lifetime suicidal thoughts and behaviors and current suicidal ideation were associated with increased frequency of smartphone suicide-related language. Human coding indicated varied language—e.g., serious expressions of active suicidal ideation, jokes, hyperbole, and expressing support for others. Most suicide-related entries did not express serious current first-person suicidal ideation, underscoring the need for improved approaches to distinguish intent. Findings highlight both the promise and limitations of NLP approaches for suicide prevention.","language":"en-us","urldate":"2025-09-18","publisher":"OSF","author":[{"propositions":[],"lastnames":["Bloom"],"firstnames":["Paul"],"suffixes":[]},{"propositions":[],"lastnames":["Treves"],"firstnames":["Isaac"],"suffixes":[]},{"propositions":[],"lastnames":["Pagliaccio"],"firstnames":["David"],"suffixes":[]},{"propositions":[],"lastnames":["Nadel"],"firstnames":["Isabella"],"suffixes":[]},{"propositions":[],"lastnames":["Wool"],"firstnames":["Emma"],"suffixes":[]},{"propositions":[],"lastnames":["Quinones"],"firstnames":["Hayley"],"suffixes":[]},{"propositions":[],"lastnames":["Greenblatt"],"firstnames":["Julia"],"suffixes":[]},{"propositions":[],"lastnames":["Parjane"],"firstnames":["Natalia"],"suffixes":[]},{"propositions":[],"lastnames":["Durham"],"firstnames":["Katherine"],"suffixes":[]},{"propositions":[],"lastnames":["Salem"],"firstnames":["Samantha"],"suffixes":[]},{"propositions":[],"lastnames":["Trivedi"],"firstnames":["Esha"],"suffixes":[]},{"propositions":[],"lastnames":["Galfalvy"],"firstnames":["Hanga"],"suffixes":[]},{"propositions":[],"lastnames":["Allen"],"firstnames":["Nicholas"],"suffixes":[]},{"propositions":[],"lastnames":["Barch"],"firstnames":["Deanna"],"suffixes":[]},{"propositions":[],"lastnames":["Blanchard"],"firstnames":["Ashley"],"suffixes":[]},{"propositions":[],"lastnames":["Brent"],"firstnames":["David"],"suffixes":[]},{"propositions":[],"lastnames":["Chernick"],"firstnames":["Lauren"],"suffixes":[]},{"propositions":[],"lastnames":["Dayan"],"firstnames":["Peter"],"suffixes":[]},{"propositions":[],"lastnames":["Hoyniak"],"firstnames":["Caroline"],"suffixes":[]},{"propositions":[],"lastnames":["Joyce"],"firstnames":["Karla"],"suffixes":[]},{"propositions":[],"lastnames":["Kirshenbaum"],"firstnames":["Jaclyn"],"suffixes":[]},{"propositions":[],"lastnames":["Li"],"firstnames":["Lilian","Y."],"suffixes":[]},{"propositions":[],"lastnames":["Luby"],"firstnames":["Joan"],"suffixes":[]},{"propositions":[],"lastnames":["Porta"],"firstnames":["Giovanna"],"suffixes":[]},{"propositions":[],"lastnames":["Saha"],"firstnames":["Koustuv"],"suffixes":[]},{"propositions":[],"lastnames":["Shankman"],"firstnames":["Stewart"],"suffixes":[]},{"propositions":[],"lastnames":["Schwartz"],"firstnames":["Adela"],"suffixes":[]},{"propositions":[],"lastnames":["Shimgekar"],"firstnames":["Soorya"],"suffixes":[]},{"propositions":[],"lastnames":["Zelazny"],"firstnames":["Jamie"],"suffixes":[]},{"propositions":[],"lastnames":["Auerbach"],"firstnames":["Randy"],"suffixes":[]}],"month":"September","year":"2025","keywords":"smartphone, adolescent, language, suicide, mobile sensing, passive, lexicon, nlp, STB","bibtex":"@misc{bloom_identifying_2025,\n\ttitle = {Identifying {Suicide}-{Related} {Language} in {Smartphone} {Keyboard} {Entries} {Among} {High}-{Risk} {Adolescents}},\n\turl = {https://osf.io/gfa7h_v1},\n\tdoi = {10.31234/osf.io/gfa7h_v1},\n\tabstract = {Adolescent suicide rates have risen over the past two decades, underscoring the need for improved strategies to detect risk. This study leverages passively collected smartphone data to identify suicide-related language in adolescents’ keyboard usage using natural language processing. We developed a youth suicide lexicon for adolescent language and validated it with labeled data (N=121,515 entries), demonstrating higher sensitivity and precision than lexicons not designed for youth. Across two independent cohorts at elevated suicide risk (Ns=208 and 211; \\>6 million text entries), both lifetime suicidal thoughts and behaviors and current suicidal ideation were associated with increased frequency of smartphone suicide-related language. Human coding indicated varied language—e.g., serious expressions of active suicidal ideation, jokes, hyperbole, and expressing support for others. Most suicide-related entries did not express serious current first-person suicidal ideation, underscoring the need for improved approaches to distinguish intent. Findings highlight both the promise and limitations of NLP approaches for suicide prevention.},\n\tlanguage = {en-us},\n\turldate = {2025-09-18},\n\tpublisher = {OSF},\n\tauthor = {Bloom, Paul and Treves, Isaac and Pagliaccio, David and Nadel, Isabella and Wool, Emma and Quinones, Hayley and Greenblatt, Julia and Parjane, Natalia and Durham, Katherine and Salem, Samantha and Trivedi, Esha and Galfalvy, Hanga and Allen, Nicholas and Barch, Deanna and Blanchard, Ashley and Brent, David and Chernick, Lauren and Dayan, Peter and Hoyniak, Caroline and Joyce, Karla and Kirshenbaum, Jaclyn and Li, Lilian Y. and Luby, Joan and Porta, Giovanna and Saha, Koustuv and Shankman, Stewart and Schwartz, Adela and Shimgekar, Soorya and Zelazny, Jamie and Auerbach, Randy},\n\tmonth = sep,\n\tyear = {2025},\n\tkeywords = {smartphone, adolescent, language, suicide, mobile sensing, passive, lexicon, nlp, STB},\n}\n\n","author_short":["Bloom, P.","Treves, I.","Pagliaccio, D.","Nadel, I.","Wool, E.","Quinones, H.","Greenblatt, J.","Parjane, N.","Durham, K.","Salem, S.","Trivedi, E.","Galfalvy, H.","Allen, N.","Barch, D.","Blanchard, A.","Brent, D.","Chernick, L.","Dayan, P.","Hoyniak, C.","Joyce, K.","Kirshenbaum, J.","Li, L. Y.","Luby, J.","Porta, G.","Saha, K.","Shankman, S.","Schwartz, A.","Shimgekar, S.","Zelazny, J.","Auerbach, R."],"key":"bloom_identifying_2025","id":"bloom_identifying_2025","bibbaseid":"bloom-treves-pagliaccio-nadel-wool-quinones-greenblatt-parjane-etal-identifyingsuiciderelatedlanguageinsmartphonekeyboardentriesamonghighriskadolescents-2025","role":"author","urls":{"Paper":"https://osf.io/gfa7h_v1"},"keyword":["smartphone","adolescent","language","suicide","mobile sensing","passive","lexicon","nlp","STB"],"metadata":{"authorlinks":{}}},"bibtype":"misc","biburl":"https://bibbase.org/f/ZRjsQ58xmRS385CAj/mypubs.bib","dataSources":["qg54cFyjST4rE4gZr","fB4GuzdCZcPR6LeBn","hKTEXvGKSBsqbXw2D"],"keywords":["smartphone","adolescent","language","suicide","mobile sensing","passive","lexicon","nlp","stb"],"search_terms":["identifying","suicide","related","language","smartphone","keyboard","entries","high","risk","adolescents","bloom","treves","pagliaccio","nadel","wool","quinones","greenblatt","parjane","durham","salem","trivedi","galfalvy","allen","barch","blanchard","brent","chernick","dayan","hoyniak","joyce","kirshenbaum","li","luby","porta","saha","shankman","schwartz","shimgekar","zelazny","auerbach"],"title":"Identifying Suicide-Related Language in Smartphone Keyboard Entries Among High-Risk Adolescents","year":2025}