Other formats:
BibTeX
LaTeX
RIS
% Conference paper published in the RASLAN 2009 workshop proceedings.
% Petr Sojka is the sole author of the paper; the two editors of the
% proceedings volume are recorded under editor, not repeated in author.
@inproceedings{864035,
  author       = {Sojka, Petr},
  editor       = {Sojka, Petr and Hor{\'a}k, Ale{\v{s}}},
  title        = {Languages of Mathematics -- Random Walking in the Mathematics of Languages},
  booktitle    = {Third Workshop on Recent Advances in {Slavonic} Natural Languages Processing, {RASLAN} 2009},
  edition      = {First},
  publisher    = {Masaryk University},
  address      = {Brno},
  year         = {2009},
  pages        = {127--133},
  isbn         = {978-80-210-5048-8},
  url          = {http://www.fi.muni.cz/usr/sojka/presentations/sojka-raslan-pres2009.pdf},
  language     = {eng},
  keywords     = {language of mathematics;mathematics of language;random walking;plagiarity;similarity;topicality;conarrativity;DML-CZ;EuDML},
  howpublished = {ti{\v{s}}t{\v{e}}n{\'a} verze ``print''},
}
TY - CONF ID - 864035 AU - Sojka, Petr A2 - Sojka, Petr A2 - Horák, Aleš PY - 2009 TI - Languages of Mathematics -- Random Walking in the Mathematics of Languages PB - Masaryk University CY - Brno SN - 9788021050488 KW - language of mathematics;mathematics of language;random walking;plagiarity;similarity;topicality;conarrativity;DML-CZ;EuDML UR - http://www.fi.muni.cz/usr/sojka/presentations/sojka-raslan-pres2009.pdf L2 - http://www.fi.muni.cz/usr/sojka/papers/raslan-2009-sojka.pdf N2 - An essay about mathematics being a sublanguage of other natural languages: how it may be represented, stored, searched and handled in several projects of (European) Digital Mathematics Libraries as DML-CZ or EuDML. A framework for solving problem of computing of similar papers in a digital library is proposed, allowing several types of similarity type definitions: \emph{plagiarity} counting on common word $n$-grams, \emph{topicality} counting on common topics, or \emph{conarrativity} counting on the same narrative. The vector of the most similar documents for a given similarity type is suggested to be computed using the algorithm by Page for web page ranking, often explained as `random walking'. ER -
SOJKA, Petr. Languages of Mathematics -- Random Walking in the Mathematics of Languages. In SOJKA, Petr and Aleš HORÁK. \textit{Third Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2009}. prvni. Brno: Masaryk University, 2009, p.~127--133. ISBN~978-80-210-5048-8.
|