"""Example: query the Qwen-VL chat model with a text prompt and an image.

Builds a ``QwenVLMultiModal`` wrapper from ``swarms``, calls it once with a
text prompt and an image URL, and prints whatever the call returns.
"""

from swarms import QwenVLMultiModal

# Instantiate the QwenVLMultiModal model.
# NOTE(review): device="cuda" is hard-coded, so this presumably requires a
# CUDA-capable GPU; confirm whether a CPU fallback is wanted.
model = QwenVLMultiModal(
    model_name="Qwen/Qwen-VL-Chat",
    device="cuda",
    # NOTE(review): presumably enables quantized weight loading; confirm
    # against the swarms documentation.
    quantize=True,
)

# Run the model: first argument is the text prompt, second is the image
# location. The example.com URL is a placeholder; substitute a real image.
response = model("Hello, how are you?", "https://example.com/image.jpg")

# Print the response
print(response)