Skip to content

Commit

Permalink
fix(manager): extend HTTP server waiting timeout for >=6 nodes cluster
Browse files Browse the repository at this point in the history
With more nodes in the cluster, it may take longer for the manager to start.
Existing tests confirm this observation: for a 6-node cluster, the Manager
occasionally fails to start its HTTP server within 3 minutes.
  • Loading branch information
mikliapko authored and fruch committed Nov 7, 2024
1 parent 202ac92 commit 429ef17
Showing 1 changed file with 5 additions and 3 deletions.
8 changes: 5 additions & 3 deletions ccmlib/scylla_cluster.py
Original file line number Diff line number Diff line change
Expand Up @@ -431,9 +431,11 @@ def start(self):
pid_file.write(str(self._process_scylla_manager.pid))

api_interface = common.parse_interface(self._get_api_address(), 5080)
if not common.check_socket_listening(api_interface, timeout=180):
raise Exception("scylla manager interface %s:%s is not listening after 180 seconds, scylla manager may have failed to start."
% (api_interface[0], api_interface[1]))
# With more nodes in cluster it may take longer for the manager to start HTTP server
timeout = 180 if len(self.scylla_cluster.nodes) < 6 else 240
if not common.check_socket_listening(api_interface, timeout=timeout):
raise Exception("scylla manager interface %s:%s is not listening after %s seconds, scylla manager may have failed to start."
% (api_interface[0], api_interface[1], timeout))

return self._process_scylla_manager

Expand Down

0 comments on commit 429ef17

Please sign in to comment.