BeastByteAI
diff --git a/‎skllm/__init__.py‎
Lines changed: 0 additions & 7 deletions b/‎skllm/__init__.py‎
Lines changed: 0 additions & 7 deletions
diff --git a/‎skllm/google/completions.py‎
Lines changed: 0 additions & 41 deletions b/‎skllm/google/completions.py‎
Lines changed: 0 additions & 41 deletions
diff --git a/‎skllm/llm/base.py‎
Lines changed: 29 additions & 0 deletions b/‎skllm/llm/base.py‎
Lines changed: 29 additions & 0 deletions
diff --git a/‎skllm/gpt4all_client.py‎ ‎…lm/llm/gpt/clients/gpt4all/completion.py‎skllm/gpt4all_client.py renamed to skllm/llm/gpt/clients/gpt4all/completion.py b/‎skllm/gpt4all_client.py‎ ‎…lm/llm/gpt/clients/gpt4all/completion.py‎skllm/gpt4all_client.py renamed to skllm/llm/gpt/clients/gpt4all/completion.py
diff --git a/‎skllm/llm/gpt/clients/openai/completion.py‎
Lines changed: 50 additions & 0 deletions b/‎skllm/llm/gpt/clients/openai/completion.py‎
Lines changed: 50 additions & 0 deletions
diff --git a/‎skllm/openai/chatgpt.py‎ ‎…lm/llm/gpt/clients/openai/credentials.py‎skllm/openai/chatgpt.py renamed to skllm/llm/gpt/clients/openai/credentials.py
Lines changed: 37 additions & 23 deletions b/‎skllm/openai/chatgpt.py‎ ‎…lm/llm/gpt/clients/openai/credentials.py‎skllm/openai/chatgpt.py renamed to skllm/llm/gpt/clients/openai/credentials.py
Lines changed: 37 additions & 23 deletions
diff --git a/‎skllm/llm/gpt/clients/openai/embedding.py‎
Lines changed: 45 additions & 0 deletions b/‎skllm/llm/gpt/clients/openai/embedding.py‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎skllm/openai/tuning.py‎ ‎skllm/llm/gpt/clients/openai/tuning.py‎skllm/openai/tuning.py renamed to skllm/llm/gpt/clients/openai/tuning.py b/‎skllm/openai/tuning.py‎ ‎skllm/llm/gpt/clients/openai/tuning.py‎skllm/openai/tuning.py renamed to skllm/llm/gpt/clients/openai/tuning.py
diff --git a/‎skllm/completions.py‎ ‎skllm/llm/gpt/completion.py‎skllm/completions.py renamed to skllm/llm/gpt/completion.py
Lines changed: 8 additions & 5 deletions b/‎skllm/completions.py‎ ‎skllm/llm/gpt/completion.py‎skllm/completions.py renamed to skllm/llm/gpt/completion.py
Lines changed: 8 additions & 5 deletions
diff --git a/‎skllm/llm/gpt/embedding.py‎
Lines changed: 33 additions & 0 deletions b/‎skllm/llm/gpt/embedding.py‎
Lines changed: 33 additions & 0 deletions
@@ -1,7 +0,0 @@
-# ordering is important here to prevent circular imports
-from skllm.models.gpt.gpt_zero_shot_clf import (
-    MultiLabelZeroShotGPTClassifier,
-    ZeroShotGPTClassifier,
-)
-from skllm.models.gpt.gpt_few_shot_clf import FewShotGPTClassifier
-from skllm.models.gpt.gpt_dyn_few_shot_clf import DynamicFewShotGPTClassifier
@@ -0,0 +1,29 @@
+from abc import ABC, abstractmethod
+from typing import Any
+
+
+class BaseTextCompletionMixin(ABC):
+    """Abstract mixin for classes that obtain chat completions from an LLM.
+
+    Subclasses must implement ``_get_chat_completion``.
+    """
+
+    @abstractmethod
+    def _get_chat_completion(self, **kwargs):
+        """Return a chat completion from the LLM.
+
+        The accepted keyword arguments and the return value are defined by
+        the implementing class.
+        """
+
+
+class BaseClassifierMixin(BaseTextCompletionMixin):
+    """Abstract mixin for completion-based classifiers.
+
+    On top of the chat-completion hook inherited from
+    ``BaseTextCompletionMixin``, subclasses must implement
+    ``_extract_out_label``.
+    """
+
+    @abstractmethod
+    def _extract_out_label(self, completion: Any, **kwargs):
+        """Return the label contained in ``completion``.
+
+        The structure of ``completion`` and of the returned label is defined
+        by the implementing class.
+        """
+
+
+class BaseEmbeddingMixin(ABC):
+    """Abstract mixin for classes that obtain embeddings from an LLM.
+
+    Subclasses must implement ``_get_embeddings``.
+    """
+
+    @abstractmethod
+    def _get_embeddings(self, **kwargs):
+        """Return embeddings from the LLM.
+
+        The accepted keyword arguments and the return value are defined by
+        the implementing class.
+        """
+
+
+class BaseTunableMixin(ABC):
+    """Abstract mixin for classes that expose a ``_tune`` hook.
+
+    Subclasses must implement ``_tune``.
+    """
+
+    @abstractmethod
+    def _tune(self, X: Any, y: Any):
+        """Tuning hook taking ``X`` and ``y``.
+
+        NOTE(review): presumably ``X`` holds the training inputs and ``y``
+        the targets -- confirm against the implementing classes.
+        """
@@ -0,0 +1,50 @@
+import openai
+from skllm.llm.gpt.clients.openai.credentials import (
+    set_azure_credentials,
+    set_credentials,
+)
+from skllm.utils import retry
+
+
+@retry(max_retries=3)
+def get_chat_completion(
+    messages: dict,
+    key: str,
+    org: str,
+    model: str = "gpt-3.5-turbo",
+    api: str = "openai",
+):
+    """Gets a chat completion from the OpenAI API.
+
+    Retrying is configured by the ``@retry(max_retries=3)`` decorator; it is
+    not a parameter of this function.
+
+    Parameters
+    ----------
+    messages : dict
+        Input messages, forwarded unchanged as ``messages`` to
+        ``openai.ChatCompletion.create``.
+    key : str
+        The OpenAI key to use.
+    org : str
+        The OpenAI organization ID to use.
+    model : str, optional
+        The model to use. Sent as ``model`` for the "openai" API and as
+        ``engine`` for the "azure" API. Defaults to "gpt-3.5-turbo".
+    api : str, optional
+        The API to use. Must be one of "openai" or "azure". Defaults to "openai".
+
+    Returns
+    -------
+    completion
+        The object returned by ``openai.ChatCompletion.create``.
+
+    Raises
+    ------
+    ValueError
+        If ``api`` is neither "openai" nor "azure". The error is raised inside
+        the decorated body; how ``retry`` surfaces it is not visible here.
+    """
+    if api == "openai":
+        set_credentials(key, org)
+        model_dict = {"model": model}
+    elif api == "azure":
+        set_azure_credentials(key, org)
+        # The Azure branch passes the model name under the ``engine`` keyword.
+        model_dict = {"engine": model}
+    else:
+        raise ValueError("Invalid API")
+
+    # The sampling temperature is pinned to 0.0 for every request.
+    return openai.ChatCompletion.create(
+        temperature=0.0, messages=messages, **model_dict
+    )
@@ -1,27 +1,6 @@
-from time import sleep
-
 import openai
-
-from skllm.openai.credentials import set_azure_credentials, set_credentials
-
-
-def construct_message(role: str, content: str) -> dict:
-    """Constructs a message for the OpenAI API.
-
-    Parameters
-    ----------
-    role : str
-        The role of the message. Must be one of "system", "user", or "assistant".
-    content : str
-        The content of the message.
-
-    Returns
-    -------
-    message : dict
-    """
-    if role not in ("system", "user", "assistant"):
-        raise ValueError("Invalid role")
-    return {"role": role, "content": content}
+from skllm.config import SKLLMConfig as _Config
+from time import sleep
 
 
 def get_chat_completion(
@@ -77,3 +56,38 @@ def get_chat_completion(
         f"Could not obtain the completion after {max_retries} retries: `{error_type} ::"
         f" {error_msg}`"
     )
+
+
+def set_credentials(key: str, org: str) -> None:
+    """Configure the global ``openai`` module for the public OpenAI endpoint.
+
+    Parameters
+    ----------
+    key : str
+        API key assigned to ``openai.api_key``.
+    org : str
+        Organization ID assigned to ``openai.organization``.
+    """
+    # Endpoint settings: these three attributes are also written by
+    # set_azure_credentials, so they are always overwritten here.
+    openai.api_type = "open_ai"
+    openai.api_base = "https://api.openai.com/v1"
+    openai.api_version = None
+    # Caller-supplied credentials.
+    openai.api_key = key
+    openai.organization = org
+
+
+def set_azure_credentials(key: str, org: str) -> None:
+    """Configure the global ``openai`` module for an Azure endpoint.
+
+    ``openai.api_type`` is only set to "azure" when it is currently empty or
+    does not start with "azure"; a value that already starts with "azure" is
+    left untouched. The API base and version are read from ``SKLLMConfig``.
+
+    Parameters
+    ----------
+    key : str
+        API key assigned to ``openai.api_key``.
+    org : str
+        Organization ID assigned to ``openai.organization``.
+    """
+    current_type = openai.api_type
+    already_azure = current_type and current_type.startswith("azure")
+    if not already_azure:
+        openai.api_type = "azure"
+    openai.api_key = key
+    openai.organization = org
+    openai.api_base = _Config.get_azure_api_base()
+    openai.api_version = _Config.get_azure_api_version()
@@ -0,0 +1,45 @@
+from skllm.llm.gpt.clients.openai.credentials import set_credentials
+from skllm.utils import retry
+import openai
+
+
+@retry(max_retries=3)
+def get_embedding(
+    text: str,
+    key: str,
+    org: str,
+    model: str = "text-embedding-ada-002",
+):
+    """
+    Encodes one or more strings and returns their embeddings.
+
+    Retrying is configured by the ``@retry(max_retries=3)`` decorator; it is
+    not a parameter of this function.
+
+    Parameters
+    ----------
+    text : str or iterable of str
+        The text(s) to encode. Although the parameter is annotated as ``str``,
+        the body iterates over it, so an iterable of strings is the expected
+        input. A single string is wrapped into a one-element list instead of
+        being split into characters. Newlines are replaced by spaces.
+    key : str
+        The OpenAI key to use.
+    org : str
+        The OpenAI organization ID to use.
+    model : str, optional
+        The model to use. Defaults to "text-embedding-ada-002".
+
+    Returns
+    -------
+    embeddings : list
+        One embedding (itself a list) per entry of the response's ``data``.
+
+    Raises
+    ------
+    ValueError
+        If an embedding in the response is not a list. The error is raised
+        inside the decorated body; how ``retry`` surfaces it is not visible
+        here.
+    """
+    set_credentials(key, org)
+    if isinstance(text, str):
+        # Iterating a bare string would request one embedding per character.
+        text = [text]
+    cleaned = [str(t).replace("\n", " ") for t in text]
+    response = openai.Embedding.create(input=cleaned, model=model)
+    embeddings = []
+    for item in response["data"]:
+        e = item["embedding"]
+        if not isinstance(e, list):
+            # Report the type of the offending embedding, not of the response.
+            raise ValueError(
+                f"Encountered unknown embedding format. Expected list, got {type(e)}"
+            )
+        embeddings.append(e)
+    return embeddings
@@ -1,21 +1,24 @@
-from skllm.gpt4all_client import get_chat_completion as _g4a_get_chat_completion
-from skllm.openai.chatgpt import get_chat_completion as _oai_get_chat_completion
+from skllm.llm.gpt.clients.openai.completion import (
+    get_chat_completion as _oai_get_chat_completion,
+)
+from skllm.llm.gpt.clients.gpt4all.completion import (
+    get_chat_completion as _g4a_get_chat_completion,
+)
 
 
 def get_chat_completion(
     messages: dict,
     openai_key: str = None,
     openai_org: str = None,
     model: str = "gpt-3.5-turbo",
-    max_retries: int = 3,
 ):
-    """Gets a chat completion from the OpenAI API."""
+    """Gets a chat completion from the OpenAI compatible API.
+
+    The backend is chosen from the prefix of ``model``:
+
+    * ``"gpt4all::<name>"`` -- the GPT4All client is called with ``messages``
+      and ``<name>``; ``openai_key`` and ``openai_org`` are not used.
+    * ``"azure::<name>"`` -- the OpenAI client is called with ``api="azure"``
+      and ``<name>``.
+    * anything else -- the OpenAI client is called with ``api="openai"`` and
+      ``model`` unchanged.
+
+    Returns whatever the selected client returns.
+    """
     if model.startswith("gpt4all::"):
+        # "gpt4all::" is 9 characters long; pass only the bare model name on.
         return _g4a_get_chat_completion(messages, model[9:])
     else:
         api = "azure" if model.startswith("azure::") else "openai"
         if api == "azure":
+            # Drop the 7-character "azure::" prefix.
             model = model[7:]
         return _oai_get_chat_completion(
-            messages, openai_key, openai_org, model, max_retries, api=api
+            messages, openai_key, openai_org, model, api=api
         )
@@ -0,0 +1,33 @@
+from skllm.llm.gpt.clients.openai.embedding import get_embedding as _oai_get_embedding
+
+
+def get_embedding(
+    text: str,
+    key: str,
+    org: str,
+    model: str = "text-embedding-ada-002",
+):
+    """
+    Returns the embedding for ``text`` via the OpenAI embedding client.
+
+    Model names prefixed with "gpt4all::" or "azure::" are rejected, because
+    only the OpenAI backend is wired up for embeddings here.
+
+    Parameters
+    ----------
+    text : str
+        The text to encode; forwarded unchanged to the OpenAI client.
+    key : str
+        The OpenAI key to use.
+    org : str
+        The OpenAI organization ID to use.
+    model : str, optional
+        The model to use. Defaults to "text-embedding-ada-002".
+
+    Returns
+    -------
+    emb : list
+        Whatever the OpenAI embedding client returns for ``text``.
+
+    Raises
+    ------
+    ValueError
+        If ``model`` starts with "gpt4all::" or "azure::".
+    """
+    # Checked in this order: unsupported prefix -> error message.
+    unsupported = (
+        ("gpt4all::", "GPT4All is not supported for embeddings"),
+        ("azure::", "Azure is not supported for embeddings"),
+    )
+    for prefix, message in unsupported:
+        if model.startswith(prefix):
+            raise ValueError(message)
+    return _oai_get_embedding(text, key, org, model)