|
|
|
@ -1636,10 +1636,10 @@ class MultiModalAgent:
|
|
|
|
|
self.temperature = temperature
|
|
|
|
|
self.langigage = language
|
|
|
|
|
|
|
|
|
|
if load_dict is None:
|
|
|
|
|
load_dict = {
|
|
|
|
|
"ImageCaptioning": "default_device"
|
|
|
|
|
}
|
|
|
|
|
# if load_dict is None:
|
|
|
|
|
load_dict = {
|
|
|
|
|
"ImageCaptioning": "default_device"
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
self.agent = MultiModalVisualAgent(
|
|
|
|
|
load_dict,
|
|
|
|
|