% Record 5626 on cogprints.org: Goutte (2007), "Fast & Confident Probabilistic Categorization".
@misc{cogprints5626,
  author   = {Cyril Goutte},
  title    = {Fast \& Confident Probabilistic Categorization},
  year     = {2007},
  url      = {http://cogprints.org/5626/},
  keywords = {Text categorization, probabilistic model, confidence estimation, multi-label categorization, category description},
  abstract = {We describe NRC's submission to the Anomaly Detection/Text Mining competition organised at the Text Mining Workshop 2007. This submission relies on a straightforward implementation of the probabilistic categoriser described in (Gaussier et al., ECIR'02). This categoriser is adapted to handle multiple labelling and a piecewise-linear confidence estimation layer is added to provide an estimate of the labelling confidence. This technique achieves a score of 1.689 on the test data. },
}