diff --git a/swarms/agents/multi_modal_visual_agent.py b/swarms/agents/multi_modal_visual_agent.py index 3571f91d..454ee8fb 100644 --- a/swarms/agents/multi_modal_visual_agent.py +++ b/swarms/agents/multi_modal_visual_agent.py @@ -1636,10 +1636,10 @@ class MultiModalAgent: self.temperature = temperature self.langigage = language - if load_dict is None: - load_dict = { - "ImageCaptioning": "default_device" - } + # if load_dict is None: + load_dict = { + "ImageCaptioning": "default_device" + } self.agent = MultiModalVisualAgent( load_dict,