@article{li2025scaling, author = {Li, Yinan and Ding, Bailu and Wei, Ziyun and Maas, Lukas M. and Al-Ghosien, Momin and Blanas, Spyros and Bruno, Nicolas and Curino, Carlo and Interlandi, Matteo and Peeper, Craig and Rajan, Kaushik and Chaudhuri, Surajit and Gehrke, Johannes}, title = {Scaling GPU-Accelerated Databases Beyond GPU Memory Size}, year = {2025}, month = {June}, abstract = {There has been considerable interest in leveraging GPUs' computational power and high memory bandwidth for analytical database workloads. However, their limited memory capacity remains a fundamental limitation for databases whose sizes far exceed the GPU memory size. This challenge is exacerbated by the slow PCIe data transfer speed, that creates a bottleneck in overall system performance. In this work, we introduce a hybrid CPU-GPU query processing strategy that leverages the distinct strengths of CPU and GPU to alleviate the data transfer bottleneck. Our approach performs highly efficient data filtering on the CPU, which substantially reduces the volume of data transferred to the GPU via PCIe, and offloads compute-intensive operators such as joins to the GPU for further processing. Our evaluation on the TPC-H benchmark at scale factors up to 1000 (1TB), using a single A100 GPU with 80GB memory, demonstrates that our approach can effectively handle datasets significantly larger than the GPU memory size. Moreover, it substantially outperforms a state-of-the-art CPU-only database system in both performance and cost-effectiveness.}, url = {http://approjects.co.za/?big=en-us/research/publication/scaling-gpu-accelerated-databases-beyond-gpu-memory-size/}, pages = {4518-4531}, journal = {Proc. VLDB Endow.}, volume = {18}, }