Added max_tokens support for localai provider
valentinfrlch committed May 20, 2024
1 parent 9aacb3a commit ffdab1b
Showing 2 changed files with 11 additions and 12 deletions.
21 changes: 10 additions & 11 deletions custom_components/gpt4vision/__init__.py
@@ -36,7 +36,8 @@ async def async_setup_entry(hass, entry):

return True

- def validate(mode, api_key, ip_address, port):

+ def validate(mode, api_key, ip_address, port, image_path):
"""Validate the configuration for the component
Args:
@@ -55,6 +56,9 @@ def validate(mode, api_key, ip_address, port):
elif mode == "LocalAI":
if not ip_address or not port:
raise ServiceValidationError("localai_not_configured")
+ # Check if image file exists
+ if not os.path.exists(image_path):
+     raise ServiceValidationError("invalid_image_path")


def setup(hass, config):
@@ -78,9 +82,9 @@ async def image_analyzer(data_call):
image_path = data_call.data.get(CONF_IMAGE_FILE)
# Resolution (width only) of the image. Example: 1280 for 720p etc.
target_width = data_call.data.get(CONF_TARGET_WIDTH, 1280)

# Validate configuration
- validate(mode, api_key, ip_address, port)
+ validate(mode, api_key, ip_address, port, image_path)

if mode == "OpenAI":
# Maximum number of tokens used by model. Default is 100.
@@ -91,11 +95,6 @@
# GPT model: Default model is gpt-4-vision-preview for LocalAI
model = str(data_call.data.get(CONF_MODEL, "gpt-4-vision-preview"))

- # Check if image file exists
- if not os.path.exists(image_path):
-     raise ServiceValidationError(
-         f"Image does not exist: {image_path}")

def encode_image(image_path):
"""Encode image as base64
@@ -133,16 +132,16 @@ def encode_image(image_path):
session = async_get_clientsession(hass)

if mode == "LocalAI":
- response_text = await handle_localai_request(session, model, message, base64_image, ip_address, port)
+ response_text = await handle_localai_request(session, model, message, base64_image, ip_address, port, max_tokens)

elif mode == "OpenAI":
response_text = await handle_openai_request(session, model, message, base64_image, api_key, max_tokens)

return {"response_text": response_text}

- async def handle_localai_request(session, model, message, base64_image, ip_address, port):
+ async def handle_localai_request(session, model, message, base64_image, ip_address, port, max_tokens):
data = {"model": model, "messages": [{"role": "user", "content": [{"type": "text", "text": message},
{"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{base64_image}"}}]}]}
{"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{base64_image}"}}]}], "max_tokens": max_tokens}
try:
response = await session.post(
f"http://{ip_address}:{port}/v1/chat/completions", json=data)
2 changes: 1 addition & 1 deletion custom_components/gpt4vision/translations/en.json
@@ -27,7 +27,7 @@
"error": {
"openai_not_configured": "OpenAI provider is not configured",
"localai_not_configured": "LocalAI provider is not configured",
"handshake_failed": "Failed to connect to LocalAI server. Please check the IP address and port and try again."
"invalid_image_path": "Image not found. Check the path and try again."
}
}
}
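
For reference, a standalone sketch of the request that handle_localai_request now sends, with max_tokens included in the payload. The host, port, model, image path and the response parsing are illustrative assumptions, not values taken from the integration's configuration:

import asyncio
import base64

import aiohttp

async def ask_localai(image_path, message, max_tokens=100):
    with open(image_path, "rb") as img:
        base64_image = base64.b64encode(img.read()).decode("utf-8")
    payload = {
        "model": "gpt-4-vision-preview",
        "messages": [{
            "role": "user",
            "content": [
                {"type": "text", "text": message},
                {"type": "image_url",
                 "image_url": {"url": f"data:image/jpeg;base64,{base64_image}"}},
            ],
        }],
        # The field added by this commit:
        "max_tokens": max_tokens,
    }
    async with aiohttp.ClientSession() as session:
        async with session.post(
                "http://localhost:8080/v1/chat/completions", json=payload) as response:
            response.raise_for_status()
            body = await response.json()
            # LocalAI mirrors the OpenAI chat-completions response shape.
            return body["choices"][0]["message"]["content"]

if __name__ == "__main__":
    print(asyncio.run(ask_localai("snapshot.jpg", "Describe this image")))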
