
% ref1: journal article, Int. J. of Computational Intelligence and Applications 11(2), 2012.
% `pages` holds the article number (the same number is embedded in the DOI suffix);
% the source record gave it as a degenerate range, so presumably the journal uses
% article IDs rather than page spans -- confirm against the publisher record.
% `url` is the resolver form of `doi`, kept for styles that print only `url`.
@article{ref1,
  author   = {Li, Lei},
  title    = {A novel violent videos classification scheme based on the bag of audio words features},
  journal  = {International Journal of Computational Intelligence and Applications},
  year     = {2012},
  volume   = {11},
  number   = {2},
  pages    = {1250010},
  issn     = {1469-0268},
  doi      = {10.1142/S1469026812500101},
  url      = {https://doi.org/10.1142/S1469026812500101},
  abstract = {A novel method to identify the violent videos only with audio features is introduced. Most previous content-based image or video classification schemes apply the bag of words (BOW) or bag of visual words (BOVW), which employ multiple visual features to characterize image or video content. In our method, the bag of audio words (BOAW) is suggested to be built by effective audio features. Two reasons are considered here. First, audio features should have very special significance for violent videos. Second, the computational complexity of dealing with audio features is much lower than that of visual features. The MPEG-7 low level features such as AudioSpectrum-Centroid and AudioSpectrum-Spread, and the high level feature such as AudioSignature, are combined into one 44-dimensions vector in the BOAW model. The audio words are built from the vector by the clustering strategy, and support vector machine (SVM) with revised soft-weighting scheme is used to group the audio words features into two classes, i.e., the violent and nonviolent. Experiments demonstrate that the proposed method can achieve good recall accuracy and precision accuracy on detecting violent videos. The method also can be applied to classify other types of videos. Copyright 2012 Imperial College Press.},
}