Excellence in Research and Innovation for Humanity
@article{(International Science Index):http://waset.org/publications/11975,
  title    = {A Content Vector Model for Text Classification},
  author    = {Eric Jiang},
  country   = {},
  abstract  = {As a popular rank-reduced vector space approach,
Latent Semantic Indexing (LSI) has been used in information
retrieval and other applications. In this paper, an LSI-based content
vector model for text classification is presented, which constructs
multiple augmented category LSI spaces and classifies text by their
content. The model integrates the class discriminative information
from the training data and is equipped with several pertinent feature
selection and text classification algorithms. The proposed classifier
has been applied to email classification and its experiments on a
benchmark spam testing corpus (PU1) have shown that the approach
represents a competitive alternative to other email classifiers based
on the well-known SVM and naïve Bayes algorithms.},
  journal   = {International Journal of Computer, Electrical, Automation, Control and Information Engineering},
  volume    = {2},
  number    = {1},
  year      = {2008},
  pages     = {222--226},
  ee        = {http://waset.org/publications/11975},
  url       = {http://waset.org/Publications?p=13},
  bibsource = {http://waset.org/Publications},
  issn      = {1307-6892},
  publisher = {World Academy of Science, Engineering and Technology},
  index     = {International Science Index 13, 2008},