Spaces:

OctoTools
/

octotools

Running on A10G

bowenchen118 committed 13 days ago

Commit

a181016

1 Parent(s): ae05573

Update

Files changed (4) hide show

octotools/models/initializer.py CHANGED Viewed

@@ -113,7 +113,13 @@ class Initializer:
                 tool_class = getattr(module, tool_name)
                 # Instantiate the tool
-                tool_instance = tool_class()
                 # FIXME This is a temporary workaround to avoid running demo commands
                 self.available_tools.append(tool_name)

                 tool_class = getattr(module, tool_name)
                 # Instantiate the tool
+                inputs = {}
+                if hasattr(tool_class, 'require_llm_engine') and tool_class.require_llm_engine:
+                    inputs['model_string'] = self.model_string
+                if hasattr(tool_class, 'require_api_key') and tool_class.require_api_key:
+                    inputs['api_key'] = self.api_key
+                tool_instance = tool_class(**inputs)
                 # FIXME This is a temporary workaround to avoid running demo commands
                 self.available_tools.append(tool_name)

octotools/tools/image_captioner/tool.py CHANGED Viewed

@@ -4,8 +4,9 @@ from octotools.engine.openai import ChatOpenAI
 class Image_Captioner_Tool(BaseTool):
     require_llm_engine = True
-    def __init__(self, model_string="gpt-4o-mini"):
         super().__init__(
             tool_name="Image_Captioner_Tool",
             tool_description="A tool that generates captions for images using OpenAI's multimodal model.",
@@ -30,7 +31,7 @@ class Image_Captioner_Tool(BaseTool):
             },
         )
         print(f"\nInitializing Image Captioner Tool with model: {model_string}")
-        self.llm_engine = ChatOpenAI(model_string=model_string, is_multimodal=True) if model_string else None
     def execute(self, image, prompt="Describe this image in detail."):
         try:

 class Image_Captioner_Tool(BaseTool):
     require_llm_engine = True
+    require_api_key = True
+    def __init__(self, model_string="gpt-4o-mini", api_key=None):
         super().__init__(
             tool_name="Image_Captioner_Tool",
             tool_description="A tool that generates captions for images using OpenAI's multimodal model.",
             },
         )
         print(f"\nInitializing Image Captioner Tool with model: {model_string}")
+        self.llm_engine = ChatOpenAI(model_string=model_string, is_multimodal=True, api_key=api_key) if model_string else None
     def execute(self, image, prompt="Describe this image in detail."):
         try:

octotools/tools/python_code_generator/tool.py CHANGED Viewed

@@ -37,8 +37,9 @@ def timeout(seconds):
 class Python_Code_Generator_Tool(BaseTool):
     require_llm_engine = True
-    def __init__(self, model_string="gpt-4o-mini"):
         super().__init__(
             tool_name="Python_Code_Generator_Tool",
             tool_description="A tool that generates and executes simple Python code snippets for basic arithmetical calculations and math-related problems. The generated code runs in a highly restricted environment with only basic mathematical operations available.",
@@ -83,7 +84,7 @@ class Python_Code_Generator_Tool(BaseTool):
             }
         )
         print(f"\nInitializing Python_Code_Generator_Tool with model_string: {model_string}")
-        self.llm_engine = ChatOpenAI(model_string=model_string, is_multimodal=False) if model_string else None
     @staticmethod
     def preprocess_code(code):

 class Python_Code_Generator_Tool(BaseTool):
     require_llm_engine = True
+    require_api_key = True
+    def __init__(self, model_string="gpt-4o-mini", api_key=None):
         super().__init__(
             tool_name="Python_Code_Generator_Tool",
             tool_description="A tool that generates and executes simple Python code snippets for basic arithmetical calculations and math-related problems. The generated code runs in a highly restricted environment with only basic mathematical operations available.",
             }
         )
         print(f"\nInitializing Python_Code_Generator_Tool with model_string: {model_string}")
+        self.llm_engine = ChatOpenAI(model_string=model_string, is_multimodal=False, api_key=api_key) if model_string else None
     @staticmethod
     def preprocess_code(code):

octotools/tools/relevant_patch_zoomer/tool.py CHANGED Viewed

@@ -10,8 +10,9 @@ class PatchZoomerResponse(BaseModel):
 class Relevant_Patch_Zoomer_Tool(BaseTool):
     require_llm_engine = True
-    def __init__(self, model_string="gpt-4o"):
         super().__init__(
             tool_name="Relevant_Patch_Zoomer_Tool",
             tool_description="A tool that analyzes an image, divides it into 5 regions (4 quarters + center), and identifies the most relevant patches based on a question. The returned patches are zoomed in by a factor of 2.",
@@ -44,7 +45,7 @@ class Relevant_Patch_Zoomer_Tool(BaseTool):
         }
         print(f"\nInitializing Patch Zoomer Tool with model: {model_string}")
-        self.llm_engine = ChatOpenAI(model_string=model_string, is_multimodal=True) if model_string else None
     def _save_patch(self, image_path, patch, save_path, zoom_factor=2):
         """Extract and save a specific patch from the image with 10% margins."""

 class Relevant_Patch_Zoomer_Tool(BaseTool):
     require_llm_engine = True
+    require_api_key = True
+    def __init__(self, model_string="gpt-4o", api_key=None):
         super().__init__(
             tool_name="Relevant_Patch_Zoomer_Tool",
             tool_description="A tool that analyzes an image, divides it into 5 regions (4 quarters + center), and identifies the most relevant patches based on a question. The returned patches are zoomed in by a factor of 2.",
         }
         print(f"\nInitializing Patch Zoomer Tool with model: {model_string}")
+        self.llm_engine = ChatOpenAI(model_string=model_string, is_multimodal=True, api_key=api_key) if model_string else None
     def _save_patch(self, image_path, patch, save_path, zoom_factor=2):
         """Extract and save a specific patch from the image with 10% margins."""