feat: add some file parsers #25

Merged (6 commits) on Oct 20, 2024
3 changes: 2 additions & 1 deletion llmpa/app.py
@@ -11,7 +11,8 @@
 import plotly.express as px
 
 project_root = os.path.abspath(os.path.dirname(__file__))
-sys.path.insert(0, project_root)
+if project_root not in sys.path:
+    sys.path.insert(0, project_root)
 
 
 logging.basicConfig(level=logging.DEBUG)
18 changes: 11 additions & 7 deletions llmpa/backends/base.py
@@ -1,22 +1,26 @@
 import requests
 from requests.exceptions import HTTPError, Timeout, RequestException
 from typing import Optional, List
 
 
-class ClientBase:
-    def __init__(self, base_url: str, timeout: Optional[int] = 10):
-        self.base_url = base_url
-        self.timeout = timeout
+class BaseBackend:
+    def get_model_info(self, model: str) -> Optional[dict]:
+        raise NotImplementedError
+
+    def list_available_models(self) -> Optional[list]:
+        raise NotImplementedError
 
     def generate(
         self,
-        model: str,
         prompt: str,
+        model: Optional[str] = None,
         max_tokens: Optional[int] = 150,
         temperature: Optional[float] = 1.0,
     ) -> Optional[str]:
         raise NotImplementedError
 
-    def embedding_text(self, model: str, text: str) -> Optional[List[float]]:
+    def embedding_text(self, text: str, model: str) -> Optional[List[float]]:
         raise NotImplementedError
 
-    def embedding_image(self, model: str, filepath: str) -> Optional[List[float]]:
+    def embedding_file(self, filepath: str, model: str) -> Optional[List[float]]:
         raise NotImplementedError
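
For orientation (an illustration, not part of the diff): a concrete backend now subclasses BaseBackend and overrides the hooks it supports. A minimal sketch, with a hypothetical EchoBackend and assuming llmpa/ is on sys.path:

# Hypothetical example, not in this PR: the smallest useful BaseBackend subclass.
from typing import List, Optional

from backends.base import BaseBackend


class EchoBackend(BaseBackend):
    def list_available_models(self) -> Optional[list]:
        return ["echo"]

    def generate(
        self,
        prompt: str,
        model: Optional[str] = None,
        max_tokens: Optional[int] = 150,
        temperature: Optional[float] = 1.0,
    ) -> Optional[str]:
        # Echo the prompt back, truncated to max_tokens characters.
        return prompt[:max_tokens]

    def embedding_text(self, text: str, model: str) -> Optional[List[float]]:
        # Degenerate one-dimensional "embedding", for demonstration only.
        return [float(len(text))]

Hooks left unimplemented (get_model_info, embedding_file) keep the base-class behavior and raise NotImplementedError.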
124 changes: 40 additions & 84 deletions llmpa/backends/localai.py
@@ -1,72 +1,42 @@
-import requests
 import os
 import sys
 
 import json
 from requests.exceptions import HTTPError, Timeout, RequestException
 from typing import Optional, List
 
-from .base import ClientBase
-
-project_root = os.path.abspath(os.path.join(os.path.dirname(__file__), ".."))
-if project_root not in sys.path:
-    sys.path.insert(0, project_root)
-
-class LocalAIClient(ClientBase):
-    def __init__(self, base_url: str, timeout: Optional[int] = 10):
-        """
-        Initializes the LocalAI client with the specified server base URL.
-
-        Args:
-            base_url (str): The base URL of the LocalAI server (e.g., "http://localhost:8080").
-            timeout (int, optional): Timeout for the HTTP requests. Default is 10 seconds.
-        """
-        super(LocalAIClient, self).__init__(base_url, timeout)
-
-    def get_model_info(self, model: str) -> Optional[dict]:
-        """
-        Retrieves model information from the LocalAI server.
-
-        Returns:
-            dict: Model information as a dictionary, or None if the request fails.
-        """
-        try:
-            response = requests.get(
-                f"{self.base_url}/v1/models/{model}", timeout=self.timeout
-            )
-            response.raise_for_status()
-            return response.json()
-        except requests.exceptions.RequestException as e:
-            print(f"Error retrieving model information: {e}")
-            return None
+from clients.http import HttpClient
+from .base import BaseBackend
+
+
+class Backend(BaseBackend, HttpClient):
+    def __init__(self, base_url: str, api_key=None, verify_ssl=True, timeout=10):
+        super(Backend, self).__init__(base_url, api_key, verify_ssl, timeout)
+        self.client = HttpClient(base_url, api_key, verify_ssl, timeout)
 
     def list_available_models(self) -> Optional[list]:
-        """
-        Retrieves a list of available models from the LocalAI server.
-
-        Returns:
-            list: List of available models, or None if the request fails.
-        """
         try:
-            response = requests.get(f"{self.base_url}/v1/models", timeout=self.timeout)
+            response = self.client.get("/v1/models", timeout=self.timeout)
+            print(response.json())
+            if not response:
+                return None
             response.raise_for_status()
-            return response.json().get("models", [])
-        except requests.exceptions.RequestException as e:
+            return response.json().get("data", [])
+        except RequestException as e:
             print(f"Error retrieving list of models: {e}")
             return None
 
     def generate(
         self,
-        model: str,
         prompt: str,
+        model: Optional[str] = None,
         max_tokens: Optional[int] = 150,
         temperature: Optional[float] = 1.0,
     ) -> Optional[str]:
-        """
-        Sends a request to the LocalAI server to generate text based on the input prompt.
-
-        Args:
-            model (str): The name of the model to be used for inference and embeddings.
-            prompt (str): The prompt or question to send to the LocalAI model.
-            max_tokens (int, optional): The maximum number of tokens to generate. Default is 150.
-            temperature (float, optional): The sampling temperature to control the randomness of output. Default is 1.0.
-
-        Returns:
-            str: The generated text or None if the request fails.
-        """
         headers = {"Content-Type": "application/json"}
 
         payload = {
@@ -77,12 +47,13 @@ def generate(
         }
 
         try:
-            response = requests.post(
-                f"{self.base_url}/v1/generate",
-                headers=headers,
-                data=json.dumps(payload),
+            response = self.client.post(
+                "/v1/chat/completions",
+                json=payload,
                 timeout=self.timeout,
             )
+            if not response:
+                return None
             response.raise_for_status()
 
             # Extract and return the generated text from the response
@@ -93,32 +64,24 @@ def generate(
                 print("No valid response received from the model.")
                 return None
 
-        except requests.exceptions.RequestException as e:
+        except RequestException as e:
             print(f"Error during the request to LocalAI: {e}")
             return None
 
-    def embedding(self, model: str, text: str) -> Optional[List[float]]:
-        """
-        Sends a request to the LocalAI server to generate embeddings from the input text.
-
-        Args:
-            model (str): The name of the model to be used for inference and embeddings.
-            text (str): The input text for which to generate embeddings.
-
-        Returns:
-            list: A list of floats representing the embedding vector, or None if the request fails.
-        """
+    def embedding(self, text: str, model: str) -> Optional[List[float]]:
         headers = {"Content-Type": "application/json"}
 
         payload = {"model": model, "input": text}
 
         try:
-            response = requests.post(
-                f"{self.base_url}/v1/embeddings",
-                headers=headers,
-                data=json.dumps(payload),
+            response = self.client.post(
+                "/embeddings",
+                extra_headers=headers,
+                json=payload,
                 timeout=self.timeout,
             )
+            if not response:
+                return None
             response.raise_for_status()
 
             result = response.json()
@@ -128,37 +91,30 @@ def embedding(self, model: str, text: str) -> Optional[List[float]]:
             print("No valid embedding received from the model.")
             return None
 
-        except requests.exceptions.RequestException as e:
+        except RequestException as e:
             print(f"Error during the request to LocalAI for embedding: {e}")
             return None
 
 
 # Example usage:
 if __name__ == "__main__":
-    # Initialize the client
-    client = LocalAIClient(base_url="http://localhost:8080", model="your-model-name")
+    backend = Backend(base_url="http://localhost:58080")
 
     # Example 1: Generating text
     prompt = "Tell me a story about a brave knight."
-    generated_text = client.generate(prompt, max_tokens=100, temperature=0.7)
+    generated_text = backend.generate(
+        prompt, max_tokens=100, temperature=0.7, model="text-embedding-ada-002"
+    )
     if generated_text:
         print(f"Generated Text: {generated_text}")
 
-    # Example 2: Get model information
-    model_info = client.get_model_info()
-    if model_info:
-        print(f"Model Information: {json.dumps(model_info, indent=2)}")
-
     # Example 3: List available models
-    models = client.list_available_models()
+    models = backend.list_available_models()
    if models:
         print(f"Available Models: {models}")
 
     # Example 4: Get embeddings for input text
     input_text = "Artificial intelligence is transforming industries."
-    embedding = client.embedding(input_text)
+    embedding = backend.embedding(input_text, "text-embedding-ada-002")
     if embedding:
         print(f"Embedding: {embedding}")
-
-    # Example 5: Update the model used by the client
-    client.update_model("another-model-name")
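
A side note on the collapsed span above (around old line 93): with the endpoint moved from /v1/generate to /v1/chat/completions, the generated text presumably sits in the OpenAI-style choices[0].message.content field that LocalAI serves. A sketch of that parsing, offered as an assumption rather than the PR's hidden lines:

# Hypothetical helper, not in this PR: pull the text out of a parsed
# /v1/chat/completions response body (OpenAI-compatible shape assumed).
from typing import Optional


def extract_chat_text(result: dict) -> Optional[str]:
    choices = result.get("choices", [])
    if not choices:
        return None
    return choices[0].get("message", {}).get("content")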
Empty file added llmpa/clients/__init__.py
Empty file.
124 changes: 124 additions & 0 deletions llmpa/clients/http.py
@@ -0,0 +1,124 @@
import requests
from requests.exceptions import HTTPError, Timeout, RequestException
from typing import Optional, List


class HttpClient:
    def __init__(
        self,
        base_url: str,
        api_key: Optional[str] = None,
        verify_ssl: Optional[bool] = True,
        timeout: Optional[int] = 10,
    ):
        self.base_url = base_url
        if self.base_url.endswith("/"):
            self.base_url = self.base_url[:-1]
        self.api_key = api_key
        self.verify_ssl = verify_ssl
        self.timeout = timeout
        self.headers = {
            "Authorization": f"Bearer {self.api_key}" if self.api_key else None,
            "Content-Type": "application/json",
        }

    def _make_request(
        self,
        method,
        endpoint,
        data=None,
        json=None,
        params=None,
        extra_headers=None,
        timeout: Optional[int] = None,
    ):
        """
        Make an HTTP request to the target server.

        :param method: HTTP method (GET, POST, PUT, DELETE).
        :param endpoint: The API endpoint to hit.
        :param data: Form-encoded or raw request body for POST/PUT requests.
        :param json: JSON request body for POST/PUT requests.
        :param params: Query parameters for GET/DELETE requests.
        :param extra_headers: Additional headers for the request.
        :param timeout: Per-request timeout; falls back to the client default.
        :return: The requests.Response object, or None if an error occurred.
        """
        url = f"{self.base_url}{endpoint}"
        headers = {**self.headers, **(extra_headers or {})}

        print(
            f"data={data}, json={json}, params={params}, extra_headers={extra_headers}"
        )
        try:
            response = requests.request(
                method=method.upper(),
                url=url,
                data=data,
                json=json,
                params=params,
                headers=headers,
                verify=self.verify_ssl,
                timeout=timeout or self.timeout,
            )
            response.raise_for_status()  # Raise HTTPError for bad responses
            return response
        except HTTPError as http_err:
            print(f"HTTP error occurred: {http_err}")
        except Timeout as timeout_err:
            print(f"Timeout error: {timeout_err}")
        except RequestException as req_err:
            print(f"Request error: {req_err}")
        except Exception as err:
            print(f"An error occurred: {err}")
        return None

    def get(
        self, endpoint, params=None, extra_headers=None, timeout: Optional[int] = None
    ):
        return self._make_request(
            "GET", endpoint, params=params, extra_headers=extra_headers, timeout=timeout
        )

    def post(
        self,
        endpoint,
        data=None,
        json=None,
        extra_headers=None,
        timeout: Optional[int] = None,
    ):
        return self._make_request(
            "POST",
            endpoint,
            data=data,
            json=json,
            extra_headers=extra_headers,
            timeout=timeout,
        )

    def put(
        self,
        endpoint,
        data=None,
        json=None,
        extra_headers=None,
        timeout: Optional[int] = None,
    ):
        return self._make_request(
            "PUT",
            endpoint,
            data=data,
            json=json,
            extra_headers=extra_headers,
            timeout=timeout,
        )

    def delete(
        self, endpoint, params=None, extra_headers=None, timeout: Optional[int] = None
    ):
        return self._make_request(
            "DELETE",
            endpoint,
            params=params,
            extra_headers=extra_headers,
            timeout=timeout,
        )
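
A quick usage sketch of the new client (illustrative, not part of the diff; assumes llmpa/ is on sys.path and a server is listening locally):

# Hypothetical example, not in this PR: exercising HttpClient directly.
from clients.http import HttpClient

client = HttpClient("http://localhost:8080", api_key=None, timeout=5)

# Every verb returns the raw requests.Response, or None after a logged
# error, so callers must check for None before touching the body.
response = client.get("/v1/models")
if response is not None:
    print(response.json())

Returning the Response rather than parsed JSON is what lets localai.py call response.json() and raise_for_status() on its side.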