add generic openai-compatible API, add credential template for that
(cherry picked from commit 0e1e0d3)
davidschlangen authored and Gnurro committed Jan 26, 2024
1 parent c6c7b43 commit ae2d728
Showing 3 changed files with 73 additions and 77 deletions.
75 changes: 0 additions & 75 deletions backends/fastchat_api.py

This file was deleted.

71 changes: 71 additions & 0 deletions backends/openai_compatible_api.py
@@ -0,0 +1,71 @@
from typing import List, Dict, Tuple, Any
from retry import retry

import json
import openai
import backends

logger = backends.get_logger(__name__)

MAX_TOKENS = 100

# For this backend, it makes less sense to talk about "supported models" than for others,
# because what is supported depends very much on where this is pointed to.
# E.g., if I run FastChat on my local machine, I may have very different models available
# than if this is pointed to FastChat running on our cluster.
# Also, what is supported depends on what the server that this is pointed to happens to be
# serving at that moment.
# But anyway, hopefully we'll soon have a different method for selecting backends. 2024-01-10
SUPPORTED_MODELS = ["fsc-vicuna-13b-v1.5", "fsc-vicuna-33b-v1.3", "fsc-vicuna-7b-v1.5",
                    "lcp-openchat_openchat-3.5-1210"]

NAME = "generic_openai_compatible"


class GenericOpenAI(backends.Backend):

    def __init__(self):
        creds = backends.load_credentials(NAME)
        self.client = openai.OpenAI(
            base_url=creds[NAME]["base_url"],
            # the client library requires some api_key string, even though a
            # local OpenAI-compatible server will typically not check it
            api_key="sk-no-key-required"
        )
        self.temperature: float = -1.

    def list_models(self):
        models = self.client.models.list()
        names = [item.id for item in models.data]
        names = sorted(names)
        return names

    @retry(tries=3, delay=0, logger=logger)
    def generate_response(self, messages: List[Dict], model: str) -> Tuple[str, Any, str]:
        """
        :param messages: for example
            [
                {"role": "system", "content": "You are a helpful assistant."},
                {"role": "user", "content": "Who won the world series in 2020?"},
                {"role": "assistant", "content": "The Los Angeles Dodgers won the World Series in 2020."},
                {"role": "user", "content": "Where was it played?"}
            ]
        :param model: the name of the model to request from the server; a local
            routing prefix ('fsc-', 'lcp-') is stripped before the request is sent
        :return: the prompt, the full API response, and the continuation text
        """
        assert 0.0 <= self.temperature <= 1.0, "Temperature must be in [0.,1.]"

        # strip the prefix that only serves to select this backend locally;
        # the server knows the model under its bare name
        if model.startswith('fsc-') or model.startswith('lcp-'):
            model = model[4:]

        prompt = messages
        api_response = self.client.chat.completions.create(model=model, messages=prompt,
                                                           temperature=self.temperature,
                                                           max_tokens=MAX_TOKENS)
        message = api_response.choices[0].message
        if message.role != "assistant":  # safety check
            raise AttributeError("Response message role is " + message.role + " but should be 'assistant'")
        response_text = message.content.strip()
        response = json.loads(api_response.json())

        return prompt, response, response_text

    def supports(self, model_name: str):
        return model_name in SUPPORTED_MODELS
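
For orientation, a minimal sketch of how this backend might be exercised, assuming a key.json with the "generic_openai_compatible" entry from the template below, that the module is importable as backends.openai_compatible_api, and that the named model is actually being served; the temperature value is an arbitrary example:

# hypothetical driver, not part of this commit
from backends.openai_compatible_api import GenericOpenAI

backend = GenericOpenAI()
backend.temperature = 0.0  # must be set first, see the assert in generate_response

print(backend.list_models())  # whatever the server happens to be serving right now

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "Who won the world series in 2020?"}
]
prompt, response, response_text = backend.generate_response(
    messages, "fsc-vicuna-13b-v1.5")
print(response_text)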
4 changes: 2 additions & 2 deletions key.json.template
@@ -15,8 +15,8 @@
"cohere": {
"api_key": ""
},
"fastchat_openai": {
"generic_openai_compatible": {
"api_key": "",
"fastchat_ip": ""
"base_url": "http://127.0.0.1:8000/v1"
}
}
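
To point the backend at a server that is not running locally, only base_url needs to change; for instance (host and port are made-up placeholders):

"generic_openai_compatible": {
    "api_key": "",
    "base_url": "http://gpu-server.example.org:8000/v1"
}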
