Další formáty:
BibTeX
LaTeX
RIS
% Paper in the RASLAN 2010 proceedings. The two editors are joined with "and" so BibTeX parses them as separate names.
@inproceedings{1181475,
  author       = {Rychlý, Pavel},
  title        = {Frequency of Low-Frequency Words in Text Corpora},
  booktitle    = {Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2010},
  editor       = {Sojka, Petr and Horák, Aleš},
  pages        = {53--57},
  publisher    = {Tribun EU},
  address      = {Brno},
  location     = {Brno},
  year         = {2010},
  isbn         = {978-80-7399-246-0},
  url          = {https://nlp.fi.muni.cz/raslan/2010/paper15.pdf},
  language     = {eng},
  keywords     = {Computational linguistics Language model; Low-frequency; Text analysis; Text corpora},
  howpublished = {tištěná verze "print"},
}
TY  - JOUR
ID  - 1181475
AU  - Rychlý, Pavel
PY  - 2010
TI  - Frequency of Low-Frequency Words in Text Corpora
PB  - Tribun EU
CY  - Brno
SN  - 9788073992460
KW  - Computational linguistics Language model
KW  - Low-frequency
KW  - Text analysis
KW  - Text corpora
UR  - https://nlp.fi.muni.cz/raslan/2010/paper15.pdf
N2  - Low-frequency words, esp. words occurring only once in a text corpus, are very popular in text analysis. Also many lexicographers draw attention to such words. This paper lists a detailed statistical analysis of low-frequency words. The results provide important information for many practical applications, including lexicography and language modeling.
ER  - 
RYCHLÝ, Pavel. Frequency of Low-Frequency Words in Text Corpora. In Petr Sojka, Aleš Horák. \textit{Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2010}. Brno: Tribun EU, 2010, s.~53--57. ISBN~978-80-7399-246-0.
|