Další formáty:
BibTeX
LaTeX
RIS
% Conference paper in the RASLAN 2016 proceedings. Editor names are joined
% with " and " and the page range uses "--", as BibTeX expects.
@inproceedings{1363110,
  author       = {Rambousek, Adam},
  title        = {Pre-processing Large Resources for Family Names Research},
  booktitle    = {RASLAN 2016 Recent Advances in Slavonic Natural Language Processing},
  editor       = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam},
  pages        = {105--109},
  publisher    = {Tribun EU},
  address      = {Brno},
  location     = {Brno},
  year         = {2016},
  isbn         = {978-80-263-1095-2},
  url          = {https://nlp.fi.muni.cz/raslan/2016/paper11-Rambousek.pdf},
  language     = {eng},
  keywords     = {DEB platform; lexicography; big data; family names; data conversion},
  howpublished = {tištěná verze "print"},
}
TY  - CONF
ID  - 1363110
AU  - Rambousek, Adam
PY  - 2016
TI  - Pre-processing Large Resources for Family Names Research
PB  - Tribun EU
CY  - Brno
SN  - 9788026310952
KW  - DEB platform
KW  - lexicography
KW  - big data
KW  - family names
KW  - data conversion
UR  - https://nlp.fi.muni.cz/raslan/2016/paper11-Rambousek.pdf
N2  - This paper describes methodology and tools used to pre-process historical archive documents in various formats and their conversion to unified format. Resources were used to investigate the origins and geographical distribution of surnames in the United Kingdom, as part of the Family Names in Britain and Ireland research project. Data extracted from the documents and their connection proved to be valuable research resource which helped to speed up the lexicographic work.
ER  -
RAMBOUSEK, Adam. Pre-processing Large Resources for Family Names Research. In Aleš Horák, Pavel Rychlý, Adam Rambousek. \textit{RASLAN 2016 Recent Advances in Slavonic Natural Language Processing}. Brno: Tribun EU, 2016, s.~105--109. ISBN~978-80-263-1095-2.
|