[{"title":"( 11 个子文件 98KB ) TextClassification:基于scikit-learn实现对新浪新闻的文本分类,数据集为100w篇文档,总计10类,测试集与训练集1:1划分。分类算法采用SVM和Bayes,其中Bayes作为基线-源码","children":[{"title":"TextClassification-master","children":[{"title":"svm.py <span style='color:#111;'> 2.60KB </span>","children":null,"spread":false},{"title":"spider.py <span style='color:#111;'> 1.82KB </span>","children":null,"spread":false},{"title":"img","children":[{"title":"Figure_2.png <span style='color:#111;'> 58.67KB </span>","children":null,"spread":false},{"title":"Figure_1.png <span style='color:#111;'> 44.20KB </span>","children":null,"spread":false}],"spread":true},{"title":"text2term.py <span style='color:#111;'> 2.62KB </span>","children":null,"spread":false},{"title":"readme.md <span style='color:#111;'> 2.64KB </span>","children":null,"spread":false},{"title":"stopwords.py <span style='color:#111;'> 786B </span>","children":null,"spread":false},{"title":"viewer.py <span style='color:#111;'> 3.08KB </span>","children":null,"spread":false},{"title":"vectorizer.py <span style='color:#111;'> 2.21KB </span>","children":null,"spread":false},{"title":".gitignore <span style='color:#111;'> 55B </span>","children":null,"spread":false},{"title":"baseline.py <span style='color:#111;'> 3.31KB </span>","children":null,"spread":false}],"spread":true}],"spread":true}]