Spaces:

NeuronSolutions
/

target-poc

Sleeping

App Files Files Community

gerglitzen committed on Dec 4, 2023

Commit

0ab9543

1 Parent(s): 47c7f9e

stable

Browse files

Files changed (1) hide show

call_openai.py +231 -0

call_openai.py ADDED Viewed

	@@ -0,0 +1,231 @@

+import openai
+import json
+from typing import List, Dict
+from .callback_handler import BaseCallbackHandler
+import tiktoken
+def call_openai(
+    messages: List[Dict[str, str]],
+    functions: List[str] = None,
+    stream: str = "no",
+    model: str = "gpt-3.5-turbo",
+    temperature: float = 0,
+    callback: BaseCallbackHandler = None
+  ) -> str:
+  """
+    Call openai with list of messages and optional list of functions. See description at openai website.
+    Args:
+        messages: messages passed to openai. list of dictionaries with keys: role=[system, user, assitant, function] + content= message
+        functions: function list passed to openai
+        stream: ["no", "sentence", "token"]
+        model: name of openai model
+        temperature: of openai model
+        callback: callback handler class. If streaming, it is mandatory
+    Returns:
+        final message
+  """
+  current_state = None
+  prompt_tokens = token_count(
+    messages=messages,
+    functions=functions
+    )
+  if functions == None:
+    completion_tokens = -2
+    response = openai.ChatCompletion.create(
+      model = model,
+      temperature=temperature,
+      stream=True,
+      messages=messages,
+    )
+  else:
+    completion_tokens = -1
+    response = openai.ChatCompletion.create(
+      model = model,
+      temperature=temperature,
+      stream=True,
+      messages=messages,
+      functions=functions
+    )
+  for chunk in response:
+    completion_tokens += 1
+    data = json.loads(str(chunk["choices"][0]))
+    delta = data["delta"]
+    finish_reason = data["finish_reason"]
+    if finish_reason is not None:
+      if finish_reason == "function_call":
+         completion_tokens += 6
+      final_response = {
+        "usage": {
+          "completion_tokens": completion_tokens,
+          "prompt_tokens": prompt_tokens,
+        },
+        "choices": []
+      }
+      if current_state == "function":
+        d = {
+          "finish_reason": "function_call",
+          "message": {
+            "content": None,
+            "function_call": {
+              "arguments": function_arg,
+              "name": function_name
+            },
+            "role": "assistant"
+          }
+        }
+        final_response["choices"].append(d)
+      if current_state == "user":
+        d = {
+          "finish_reason": "stop",
+          "message": {
+            "content": message_all,
+            "role": "assistant"
+          }
+        }
+        final_response["choices"].append(d)
+      if callback:
+        callback.on_llm_end(response=final_response)
+      return final_response
+    else:
+      if current_state == None:
+        if 'function_call' in delta:
+          current_state = "function"
+          function_name = delta["function_call"]["name"]
+          function_arg = ""
+          # if stream != "no":
+          #   s = f" - {function_name}"
+          #   callback.on_llm_new_token(token=s)
+        else:
+          current_state = "user"
+          message_stream = ""
+          message_all = ""
+      elif current_state == "function":
+        function_arg += delta['function_call']['arguments']
+      elif current_state == "user":
+        token = delta["content"]
+        message_all += token
+        if stream == "token":
+          callback.on_llm_new_token(token=token)
+        if stream == "sentence":
+          message_stream += token
+          if "." in token or "!" in token or "?" in token or "\n" in token:
+            if message_stream[-1] == "\n":
+              callback.on_llm_new_token(token=message_stream[:-1])
+            else:
+              callback.on_llm_new_token(token=message_stream)
+            message_stream = ""
+def num_tokens_from_messages(messages, model="gpt-3.5-turbo-0613"):
+    """Return the number of tokens used by a list of messages."""
+    try:
+        encoding = tiktoken.encoding_for_model(model)
+    except KeyError:
+#        print("Warning: model not found. Using cl100k_base encoding.")
+        encoding = tiktoken.get_encoding("cl100k_base")
+    if model in {
+        "gpt-3.5-turbo-0613",
+        "gpt-3.5-turbo-16k-0613",
+        "gpt-4-0314",
+        "gpt-4-32k-0314",
+        "gpt-4-0613",
+        "gpt-4-32k-0613",
+        }:
+        tokens_per_message = 3
+        tokens_per_name = 1
+    elif model == "gpt-3.5-turbo-0301":
+        tokens_per_message = 4  # every message follows <|start|>{role/name}\n{content}<|end|>\n
+        tokens_per_name = -1  # if there's a name, the role is omitted
+    elif "gpt-3.5-turbo" in model:
+#        print("Warning: gpt-3.5-turbo may update over time. Returning num tokens assuming gpt-3.5-turbo-0613.")
+        return num_tokens_from_messages(messages, model="gpt-3.5-turbo-0613")
+    elif "gpt-4" in model:
+#        print("Warning: gpt-4 may update over time. Returning num tokens assuming gpt-4-0613.")
+        return num_tokens_from_messages(messages, model="gpt-4-0613")
+    else:
+        raise NotImplementedError(
+            f"""num_tokens_from_messages() is not implemented for model {model}. See https://github.com/openai/openai-python/blob/main/chatml.md for information on how messages are converted to tokens."""
+        )
+    num_tokens = 0
+#    print(messages)
+    for message in messages:
+        num_tokens += tokens_per_message
+        for key, value in message.items():
+            if key == "function_call":
+                num_tokens += tokens_per_name
+                for k, v in value.items():
+#                    print(k,v)
+                    num_tokens += len(encoding.encode(v))
+            if value != None and key != "function_call":
+                num_tokens += len(encoding.encode(value))
+            if key == "name":
+                num_tokens += tokens_per_name
+    num_tokens += 3  # every reply is primed with <|start|>assistant<|message|>
+    return num_tokens
+def num_tokens_from_functions(functions, model="gpt-3.5-turbo-0613"):
+    """Return the number of tokens used by a list of functions."""
+    try:
+        encoding = tiktoken.encoding_for_model(model)
+    except KeyError:
+#        print("Warning: model not found. Using cl100k_base encoding.")
+        encoding = tiktoken.get_encoding("cl100k_base")
+    num_tokens = 0
+    for function in functions:
+        function_tokens = len(encoding.encode(function['name']))
+        function_tokens += len(encoding.encode(function['description']))
+        if 'parameters' in function:
+            parameters = function['parameters']
+            if 'properties' in parameters:
+                for propertiesKey in parameters['properties']:
+                    function_tokens += len(encoding.encode(propertiesKey))
+                    v = parameters['properties'][propertiesKey]
+                    for field in v:
+                        if field == 'type':
+                            function_tokens += 2
+                            function_tokens += len(encoding.encode(v['type']))
+                        elif field == 'description':
+                            function_tokens += 2
+                            function_tokens += len(encoding.encode(v['description']))
+                        elif field == 'enum':
+                            function_tokens -= 3
+                            for o in v['enum']:
+                                function_tokens += 3
+                                function_tokens += len(encoding.encode(o))
+                        else:
+                            dummy = 0
+#                            print(f"Warning: not supported field: {field}")
+                function_tokens += 16
+        num_tokens += function_tokens
+    num_tokens += 16
+    return num_tokens
+def token_count(
+    messages: List[Dict[str, str]],
+    functions: List[str] = None,
+    model = "gpt-3.5-turbo-0613"
+    ) -> int:
+    msgs_tokens = num_tokens_from_messages(messages=messages, model=model)
+    tokens_used = msgs_tokens
+    if functions is not None:
+        function_tokens = num_tokens_from_functions(functions=functions, model=model)
+        tokens_used += function_tokens
+    return tokens_used