Další formáty:
BibTeX
LaTeX
RIS
% Conference paper "Fragments and Text Categorization" (2004, Association for
% Computational Linguistics companion volume).
% Notes: keywords are comma-separated; the page range uses an en-dash (--);
% the place is given once via `address` (the biblatex alias `location` held
% the identical value and was redundant).
@inproceedings{556650,
  author    = {Blaťák, Jan and Popelínský, Lubomír and Mráková, Eva},
  title     = {Fragments and Text Categorization},
  booktitle = {The Companion Volume to the Proceedings of the 42nd Annual Meeting of the Association for Computational Linguistics},
  publisher = {Association for Computational Linguistics},
  address   = {Barcelona (Spain)},
  year      = {2004},
  pages     = {226--229},
  isbn      = {1-932432-33-7},
  keywords  = {text classification, fragments},
  language  = {english},
}
TY  - CONF
ID  - 556650
AU  - Blaťák, Jan
AU  - Popelínský, Lubomír
AU  - Mráková, Eva
PY  - 2004
TI  - Fragments and Text Categorization
PB  - Association for Computational Linguistics
CY  - Barcelona (Spain)
SN  - 1932432337
KW  - text classification
KW  - fragments
N2  - We introduce two novel methods of text categorization in which documents are split into fragments. We conducted experiments on English, French and Czech. In all cases, the problems referred to a binary document classification. We find that both methods increase the accuracy of text categorization. For the Naive Bayes classifier this increase is significant.
ER  -
BLAŤÁK, Jan, Lubomír POPELÍNSKÝ a Eva MRÁKOVÁ. Fragments and Text Categorization. In \textit{The Companion Volume to the Proceedings of the 42nd Annual Meeting of the Association for Computational Linguistics}. Barcelona (Spain): Association for Computational Linguistics, 2004, s.~226--229. ISBN~1-932432-33-7.
|