% KDD 2022 conference paper by Han, Lee and Martin on Online Supply Values (OSV).
% The citation key looks machine-generated; it is kept unchanged so that existing
% \cite commands continue to resolve.
% In the abstract, percent signs are escaped and plus-minus signs are written in
% math mode, so the field is safe to typeset under styles that print abstracts.
@inproceedings{95e76042b3ce481591ccd1554b6985ef,
  author    = {Han, Benjamin and Lee, Hyungjun and Martin, S{\'e}bastien},
  title     = {Real-Time Rideshare Driver Supply Values Using Online Reinforcement Learning},
  booktitle = {{KDD} 2022 - Proceedings of the 28th {ACM} {SIGKDD} Conference on Knowledge Discovery and Data Mining},
  series    = {Proceedings of the {ACM} {SIGKDD} International Conference on Knowledge Discovery and Data Mining},
  publisher = {Association for Computing Machinery},
  pages     = {2968--2976},
  year      = {2022},
  month     = aug,
  day       = {14},
  doi       = {10.1145/3534678.3539141},
  language  = {English (US)},
  keywords  = {adaptive, dispatch, matching, multi-agent reinforcement learning, on-policy control, online learning, real-time, rideshare, streaming, temporal difference, transportation},
  abstract  = {In this paper, we present Online Supply Values (OSV), a system for estimating the return of available rideshare drivers to match drivers to ride requests at Lyft. Because a future driver state can be accurately predicted from a request destination, it is possible to estimate the expected action value of assigning a ride request to an available driver as a Markov Decision Process using the Bellman Equation. These estimates are updated using temporal difference and are shown to adapt to changing marketplace conditions in real-time. While reinforcement learning has been studied for rideshare dispatch, fully-online approaches without offline priors or other guardrails had never been evaluated in the real world. This work presents the algorithmic changes needed to bridge this gap. OSV is now deployed globally as a core component of Lyft's dispatch matching system. Our A/B user experiments in major US cities measure a +(0.96$\pm$0.53)\% increase in the request fulfillment rate and a +(0.73$\pm$0.22)\% increase to profit per passenger session over the previous algorithm.},
  note      = {Publisher Copyright: {\textcopyright} 2022 Owner/Author.; 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, KDD 2022 ; Conference date: 14-08-2022 Through 18-08-2022},
}