@inproceedings{liu2026lipschitz,
author = {Liu, Zhongxuan and Kang, Yue and Lee, Thomas C. M.},
title = {Lipschitz Bandits with Stochastic Delayed Feedback},
booktitle = {ICLR 2026},
year = {2026},
month = {April},
abstract = {The Lipschitz bandit problem extends stochastic bandits to a continuous action set defined over a metric space, where the expected reward function satisfies a Lipschitz condition. In this work, we introduce a new problem of Lipschitz bandit in the presence of stochastic delayed feedback, where the rewards are not observed immediately but after a random delay. We consider both bounded and unbounded stochastic delays, and design algorithms that attain sublinear regret guarantees in each setting. For bounded delays, we propose a delay-aware zooming algorithm that retains the optimal performance of the delay-free setting up to an additional term that scales with the maximum delay . For unbounded delays, we propose a novel phased learning strategy that accumulates reliable feedback over carefully scheduled intervals, and establish a regret lower bound showing that our method is nearly optimal up to logarithmic factors. Finally, we present experimental results to demonstrate the efficiency of our algorithms under various delay scenarios.},
url = {http://approjects.co.za/?big=en-us/research/publication/lipschitz-bandits-with-stochastic-delayed-feedback/},
}