From 39fc5e675731b0b055e58fa0499394d22971be73 Mon Sep 17 00:00:00 2001 From: Pavan Kumar <66913595+ascender1729@users.noreply.github.com> Date: Thu, 12 Jun 2025 20:38:24 +0530 Subject: [PATCH] refactor: compute workers based on cpu --- swarms/utils/vllm_wrapper.py | 11 +++++------ 1 file changed, 5 insertions(+), 6 deletions(-) diff --git a/swarms/utils/vllm_wrapper.py b/swarms/utils/vllm_wrapper.py index 863bd322..8a114ad1 100644 --- a/swarms/utils/vllm_wrapper.py +++ b/swarms/utils/vllm_wrapper.py @@ -133,12 +133,11 @@ class VLLMWrapper: Returns: List[str]: List of model responses. """ - # Fetch 95% of the available CPU cores - num_cores = os.cpu_count() - num_workers = int(num_cores * 0.95) - with concurrent.futures.ThreadPoolExecutor( - max_workers=num_workers - ) as executor: + # Calculate the worker count based on 95% of available CPU cores + num_workers = max(1, int((os.cpu_count() or 1) * 0.95)) + with concurrent.futures.ThreadPoolExecutor( + max_workers=num_workers + ) as executor: futures = [ executor.submit(self.run, task) for task in tasks ]