
% Journal article: Skaik and Inkpen (2021), J. Adv. Inf. Technol. 12(4).
% Cleaned from an automated export: page range uses an en dash (--), the
% proper adjective in the title is brace-protected against style recasing,
% and stray HTML markup was stripped from the end of the abstract.
@article{ref1,
  author   = {Skaik, R. and Inkpen, D.},
  title    = {Suicide Ideation Estimators within {Canadian} Provinces Using Machine Learning Tools on Social Media Text},
  journal  = {Journal of Advances in Information Technology},
  year     = {2021},
  volume   = {12},
  number   = {4},
  pages    = {357--362},
  language = {en},
  issn     = {1798-2340},
  doi      = {10.12720/jait.12.4.357-362},
  url      = {https://doi.org/10.12720/jait.12.4.357-362},
  abstract = {Suicide has become one of the leading causes of death worldwide. It is a serious public health problem, and the right prompt response can mitigate it. Therefore, identifying individuals with suicide risk and offering immediate counseling to everyone that might need it is a crucial step. In this research, we utilize personal narratives collected through the popular social media website (Reddit) to build a model suitable for predicting suicide ideation in a sample of Twitter users that is representative for the Canadian population. The labeled dataset contains only 621 users, and with that limited number of training instances we extracted features for classical machine learning and achieved an F1-score of 0.922 using linguistic and emotion features. In addition, we fine-tuned a Sentence Pair Classification BERT model and achieved 92.6 F1-score. The classical machine learning trained model was applied on Canadian population representative dataset. The geographic and demographic patterns of suicide ideation correlate with the suicide statistics reported by Statistics Canada for 2015. © 2021 J. Adv. Inf. Technol.},
}