
% Journal article on SVD-based classification of injury narratives.
% The citation key is left unchanged so existing citations keep resolving.
@article{ref1,
  author   = {Noorinaeini, Amirali and Lehto, Mark R.},
  title    = {Hybrid singular value decomposition; a model of human text classification},
  journal  = {International Journal of Human Factors Modelling and Simulation},
  year     = {2006},
  volume   = {1},
  number   = {1},
  pages    = {95--118},
  issn     = {1742-5549},
  doi      = {10.1504/IJHFMS.2006.011684},
  url      = {https://doi.org/10.1504/IJHFMS.2006.011684},
  abstract = {The objective of this study was to investigate and compare the accuracy of three Singular Value Decomposition (SVD) based models in classifying injury narratives into external-cause-of-injury and poisoning (E-codes) categories. Two SVD-Bayesian models and one SVD-Regression model were developed for free text classification purposes. This study used injury narratives and corresponding E-codes assigned by human experts from the 1997 and 1998 US National Health Interview Survey (NHIS). Sensitivity, specificity and positive predictive value were measured by comparing all the three models' results with E-code categories assigned by experts. The performance of the equidistant Bayes model and regression model improved as more SVD vectors were used for the input. The regression model was compared to the fuzzy Bayes model as well. It was concluded that all three models are capable of learning from human experts to accurately categorise cause-of-injury codes from injury narratives, with the regression-based model being the strongest.},
}