From 85a4ad52cdc975dbcda4d682552ae8657043f569 Mon Sep 17 00:00:00 2001 From: Christian Theune Date: Sun, 18 Aug 2024 16:53:54 +0200 Subject: [PATCH] Reduce the maximum delay waiting to get the migration lock. During the network rollout week we evacuated a lot of hosts and saw very high delays in the long tail even with randomization and decided to reduce it noticably. We're now down to 20s max delay instead of 80s originally. --- src/fc/qemu/outgoing.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/fc/qemu/outgoing.py b/src/fc/qemu/outgoing.py index 3963dce..a448ba1 100644 --- a/src/fc/qemu/outgoing.py +++ b/src/fc/qemu/outgoing.py @@ -208,9 +208,9 @@ def acquire_migration_locks(self): # In case that there are multiple processes waiting, randomize to # avoid steplock retries. We us CSMA/CD-based exponential backoff, # timeslot 10ms but with a max of 13 instead of 16. - # This means we'll wait up to 80s, 40s on average if everything + # This means we'll wait up to 20s, 10s on average if everything # becomes really busy and we may experience lock contention. - tries = min([tries + 1, 13]) + tries = min([tries + 1, 11]) timeout.interval = random.randint(1, 2**tries) * 0.01 if self.agent.has_new_config(): self.target.cancel(self.cookie)