no quantization

pull/53/head
Kye 1 year ago
parent 4469164e1e
commit 692a4557b1

@@ -4,7 +4,6 @@ from swarms.orchestrator.autoscaler import AutoScaler
 # worker
 # from swarms.workers.worker_node import WorkerNode
 from swarms.workers.worker import Worker
-from swarms.workers.autobot import AutoBot
 #boss
 from swarms.boss.boss_node import BossNode

@@ -5,7 +5,13 @@ import logging
 from transformers import AutoModelForCausalLM, AutoTokenizer

 class HuggingFaceLLM:
-    def __init__(self, model_id: str, device: str = None, max_length: int = 20, quantize: bool = False, quantization_config: dict = None):
+    def __init__(self,
+                 model_id: str,
+                 device: str = None,
+                 max_length: int = 20,
+                 quantize: bool = False,
+                 quantization_config: dict = None
+                 ):
         self.logger = logging.getLogger(__name__)
         self.device = device if device else ('cuda' if torch.cuda.is_available() else 'cpu')
         self.model_id = model_id
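
For reference, a minimal usage sketch of the reformatted constructor. The import path and model id below are assumptions for illustration, not part of this commit; only the parameter names and defaults come from the diff.

    from swarms.hf import HuggingFaceLLM  # import path assumed, not shown in this diff

    llm = HuggingFaceLLM(
        model_id="gpt2",   # hypothetical model id
        device=None,       # resolves to 'cuda' if available, else 'cpu'
        max_length=20,
        quantize=False,    # quantization stays off, matching the commit title
    )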
