% Conference paper by Zhang and Kosar on the SMURF metadata access system,
% published in the IEEE EDGE 2019 proceedings.
% The cite key is an opaque hexadecimal identifier; it is kept unchanged so
% existing citations of this entry still resolve.
% The dates inside the note field are written day-month-year (8 to 13 July 2019,
% consistent with month = jul).
% NOTE(review): the address field holds a country, not the publisher's city --
% confirm the city before relying on it in styles that print the address.
@inproceedings{6e91b40d18ab485aacc7a8d78fd9bddd,
  author    = {Zhang, Bing and Kosar, Tevfik},
  title     = {{SMURF}: Efficient and Scalable Metadata Access for Distributed Applications from Edge to the Cloud},
  booktitle = {Proceedings - 2019 {IEEE} International Conference on Edge Computing, {EDGE} 2019 - Part of the 2019 {IEEE} World Congress on Services},
  editor    = {Bertino, Elisa and Chang, Carl K. and Chen, Peter and Damiani, Ernesto and Goul, Michael and Oyama, Katsunori},
  pages     = {102--106},
  year      = {2019},
  month     = jul,
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  doi       = {10.1109/EDGE.2019.00031},
  note      = {Publisher Copyright: {\textcopyright} 2019 IEEE; 3rd IEEE International Conference on Edge Computing, EDGE 2019; Conference date: 08-07-2019 through 13-07-2019},
  language  = {English (US)},
  keywords  = {Metadata access, continuum caching, efficiency, prefetching, scalability, semantic locality},
  abstract  = {In parallel with big data processing and analysis dominating the usage of distributed and cloud infrastructures, the demand for distributed metadata access and transfer has increased. In many application domains, the volume of data generated exceeds petabytes, while the corresponding metadata amounts to terabytes or even more. In this paper, we propose a novel solution for efficient and scalable metadata access for distributed applications across wide-area networks, dubbed SMURF. Our solution combines novel pipelining and concurrent transfer mechanisms with reliability, provides distributed continuum caching and prefetching strategies to sidestep fetching latency, and achieves scalable and high-performance metadata fetch/prefetch services in the cloud. We also study the phenomenon of semantic locality in real trace logs which is not well utilized in metadata access prediction. We implement our predictor based on this observation and compare it with three existing state-of-the-art prefetch schemes on Yahoo! Hadoop audit traces. By effectively caching and prefetching metadata based on the access patterns, our continuum caching and prefetching mechanism greatly improves local cache hit rate and reduces the average fetching latency. We replayed approximately 20 Million metadata access operations from real audit traces, in which our system achieved 80\% accuracy during prefetch prediction and reduced the average fetch latency 50\% compared to the state-of-the-art mechanisms.},
}