Další formáty:
BibTeX
LaTeX
RIS
@article{2301611, author = {Slanináková, Terézia and Antol, Matej and Oľha, Jaroslav and Dohnal, Vlastislav and Ladra, Susana and MartínezandPrieto, Miguel A.}, article_number = {1}, doi = {http://dx.doi.org/10.1016/j.is.2023.102255}, keywords = {Reproducible paper;Index structures;Learned index;Unstructured data;Content-based search;Metric space}, language = {eng}, issn = {0306-4379}, journal = {Information systems}, title = {Reproducible experiments with Learned Metric Index Framework}, url = {https://www.sciencedirect.com/science/article/pii/S0306437923000911}, volume = {118}, year = {2023} }
TY - JOUR ID - 2301611 AU - Slanináková, Terézia - Antol, Matej - Oľha, Jaroslav - Dohnal, Vlastislav - Ladra, Susana - Martínez-Prieto, Miguel A. PY - 2023 TI - Reproducible experiments with Learned Metric Index Framework JF - Information systems VL - 118 IS - 1 SP - 102255 EP - 102255 PB - Elsevier SN - 03064379 KW - Reproducible paper;Index structures;Learned index;Unstructured data;Content-based search;Metric space UR - https://www.sciencedirect.com/science/article/pii/S0306437923000911 N2 - This work is a companion reproducible paper of a previous paper (Antol et al., 2021) in which we presented an alternative to the traditional paradigm of similarity searching in metric spaces called the Learned Metric Index. Inspired by the advance in learned indexing of structured data, we used machine learning models to replace index pivots, thus posing similarity search as a classification problem. This implementation proved to be more than competitive with the conventional methods in terms of speed and recall, proving the concept as viable. The aim of this publication is to make our source code, datasets, and experiments publicly available. For this purpose, we create a collection of Python3 software libraries, YAML reproducible experiment files, and JSON ground-truth files, all bundled in a Docker image – the Learned Metric Index Framework (LMIF) – which can be run using any Docker-compatible operating system on a CPU with Advanced vector extensions (AVX). We introduce a reproducibility protocol for our experiments using LMIF and provide a closer look at the experimental process. We introduce new experimental results by running the reproducibility protocol introduced herein and discussing the differences with the results reported in our primary work (Antol et al., 2021). Finally, we make an argument that these results can be considered weakly reproducible (in both of the performance metrics), since they point to the same conclusions derived in the primary paper. ER -
SLANINÁKOVÁ, Terézia, Matej ANTOL, Jaroslav OĽHA, Vlastislav DOHNAL, Susana LADRA a Miguel A. MARTÍNEZ-PRIETO. Reproducible experiments with Learned Metric Index Framework. \textit{Information systems}. Elsevier, 2023, roč.~118, č.~1, s.~102255-102270. ISSN~0306-4379. Dostupné z: https://dx.doi.org/10.1016/j.is.2023.102255.
|