@inproceedings{9684574ba03e40b4ad50b22414ad6596,
title = "EMLIO: Minimizing I/O Latency and Energy Consumption for Large-Scale AI Training",
abstract = "Large-scale deep learning workloads increasingly suffer from I/O bottlenecks as datasets grow beyond local storage capacities and GPU compute outpaces network and disk latencies. While recent systems optimize data-loading time, they overlook the energy cost of I/O-a critical factor at large scale. We introduce EMLIO, an Efficient Machine Learning I/O service that jointly minimizes end-to-end data-loading latency (T) and I/O energy consumption (E) across variable-latency networked storage. EMLIO deploys a lightweight data-serving daemon on storage nodes that serializes and batches raw samples, streams them over TCP with out-of-order prefetching, and integrates seamlessly with GPU-accelerated (NVIDIA DALI) preprocessing on the client side. In exhaustive evaluations over local disk, LAN (0.05 ms \& 10 ms round trip time (RTT)), and WAN (30 ms RTT) environments, EMLIO delivers on average up to 8.6× faster I/O and 10.9× lower energy use compared to state-of-the-art loaders, while maintaining constant performance and energy profiles irrespective of network distance. EMLIO{\textquoteright}s service-based architecture offers a scalable blueprint for energy-aware I/O in next-generation AI clouds.",
keywords = "GPU-accelerated preprocessing, I/O latency, data-loading, deep learning, distributed storage, energy-efficency",
author = "Jamil, \{Md Hasibul\} and Nine, \{Md S.Q.Zulkar\} and Tevfik Kosar",
note = "Publisher Copyright: {\textcopyright} 2025 Copyright held by the owner/author(s).; 2025 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis, SC 2025 Workshops ; Conference date: 16-11-2025 Through 21-11-2025",
year = "2025",
month = nov,
day = "15",
doi = "10.1145/3731599.3767566",
language = "English",
series = "Proceedings of 2025 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis, SC 2025 Workshops",
publisher = "Association for Computing Machinery, Inc",
pages = "2022--2031",
booktitle = "Proceedings of 2025 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis, SC 2025 Workshops",
}