Merge pull request #53 from ttt246/feature/falcon_8
Browse files- .github/workflows/ci.yml +1 -0
- src/common/assembler.py +2 -1
- src/common/brain_exception.py +14 -0
- src/common/http_response_codes.py +52 -0
- src/common/utils.py +3 -1
- src/model/requests/request_model.py +3 -0
- src/rising_plugin/guardrails-config/actions/actions.py +24 -6
- src/rising_plugin/guardrails-config/actions/phone.csv +10 -10
- src/rising_plugin/guardrails-config/actions/phone.json +0 -0
- src/rising_plugin/guardrails-config/general.co +1 -1
- src/rising_plugin/llm/__init__.py +0 -0
- src/rising_plugin/llm/falcon_llm.py +35 -0
- src/rising_plugin/llm/gpt_llm.py +26 -0
- src/rising_plugin/llm/llms.py +57 -0
- src/rising_plugin/risingplugin.py +5 -4
- src/router/api.py +10 -5
- src/service/llm/chat_service.py +2 -2
.github/workflows/ci.yml
CHANGED
|
@@ -11,6 +11,7 @@ env:
|
|
| 11 |
REPLICATE_API_TOKEN: ${{ secrets.REPLICATE_API_TOKEN }}
|
| 12 |
PINECONE_ENV: ${{ secrets.PINECONE_ENV }}
|
| 13 |
PINECONE_KEY: ${{ secrets.PINECONE_KEY }}
|
|
|
|
| 14 |
GITHUB_TOKEN: ${{ github.token }}
|
| 15 |
|
| 16 |
jobs:
|
|
|
|
| 11 |
REPLICATE_API_TOKEN: ${{ secrets.REPLICATE_API_TOKEN }}
|
| 12 |
PINECONE_ENV: ${{ secrets.PINECONE_ENV }}
|
| 13 |
PINECONE_KEY: ${{ secrets.PINECONE_KEY }}
|
| 14 |
+
HUGGINGFACEHUB_API_TOKEN: ${{ secrets.HUGGINGFACEHUB_API_TOKEN }}
|
| 15 |
GITHUB_TOKEN: ${{ github.token }}
|
| 16 |
|
| 17 |
jobs:
|
src/common/assembler.py
CHANGED
|
@@ -1,6 +1,7 @@
|
|
| 1 |
# assembler to mapping data into another data type.
|
| 2 |
from typing import Any, List
|
| 3 |
|
|
|
|
| 4 |
from src.model.basic_model import BasicModel
|
| 5 |
from src.model.contact_model import ContactModel
|
| 6 |
from src.model.message_model import MessageModel
|
|
@@ -18,7 +19,7 @@ class Assembler:
|
|
| 18 |
"""mapping to http response"""
|
| 19 |
|
| 20 |
def to_response(self, code, message, result) -> Any:
|
| 21 |
-
response = {"message":
|
| 22 |
return response
|
| 23 |
|
| 24 |
"""mapping data to a collection of MessageModel"""
|
|
|
|
| 1 |
# assembler to mapping data into another data type.
|
| 2 |
from typing import Any, List
|
| 3 |
|
| 4 |
+
from src.common.http_response_codes import responses
|
| 5 |
from src.model.basic_model import BasicModel
|
| 6 |
from src.model.contact_model import ContactModel
|
| 7 |
from src.model.message_model import MessageModel
|
|
|
|
| 19 |
"""mapping to http response"""
|
| 20 |
|
| 21 |
def to_response(self, code, message, result) -> Any:
|
| 22 |
+
response = {"message": responses[code], "result": result, "status_code": code}
|
| 23 |
return response
|
| 24 |
|
| 25 |
"""mapping data to a collection of MessageModel"""
|
src/common/brain_exception.py
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""Basic Exception in Brain"""
|
| 2 |
+
from typing import Any
|
| 3 |
+
|
| 4 |
+
from src.common.http_response_codes import responses
|
| 5 |
+
|
| 6 |
+
|
| 7 |
+
class BrainException(Exception):
    """Base exception for errors raised inside Brain.

    Carries a human-readable message and can render itself as the standard
    API response payload under Brain's custom status code 506.
    """

    def __init__(self, message: str = "Exception occurred in brain"):
        self.message = message
        super().__init__(self.message)

    def get_response_exp(self) -> Any:
        """Return this exception as a response dict (status_code 506).

        The payload is built inline so the shared ``responses`` table is not
        mutated as a side effect of rendering an exception.
        """
        return {
            "message": ("Brain Exception", self.message),
            "result": "",
            "status_code": 506,
        }
|
src/common/http_response_codes.py
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# HTTP status code -> (title, message) pairs used to build API responses.
# Every value is a 2-tuple; consumers index [0] for the short title and
# [1] for the longer explanation.
responses = {
    100: ("Continue", "Request received, please continue"),
    101: ("Switching Protocols", "Switching to new protocol; obey Upgrade header"),
    200: ("OK", "Request fulfilled, document follows"),
    201: ("Created", "Document created, URL follows"),
    202: ("Accepted", "Request accepted, processing continues off-line"),
    203: ("Non-Authoritative Information", "Request fulfilled from cache"),
    204: ("No Content", "Request fulfilled, nothing follows"),
    205: ("Reset Content", "Clear input form for further input."),
    206: ("Partial Content", "Partial content follows."),
    300: ("Multiple Choices", "Object has several resources -- see URI list"),
    301: ("Moved Permanently", "Object moved permanently -- see URI list"),
    302: ("Found", "Object moved temporarily -- see URI list"),
    303: ("See Other", "Object moved -- see Method and URL list"),
    304: ("Not Modified", "Document has not changed since given time"),
    305: (
        "Use Proxy",
        "You must use proxy specified in Location to access this " "resource.",
    ),
    307: ("Temporary Redirect", "Object moved temporarily -- see URI list"),
    400: ("Bad Request", "Bad request syntax or unsupported method"),
    401: ("Unauthorized", "No permission -- see authorization schemes"),
    402: ("Payment Required", "No payment -- see charging schemes"),
    403: ("Forbidden", "Request forbidden -- authorization will not help"),
    404: ("Not Found", "Nothing matches the given URI"),
    405: ("Method Not Allowed", "Specified method is invalid for this server."),
    406: ("Not Acceptable", "URI not available in preferred format."),
    407: (
        "Proxy Authentication Required",
        "You must authenticate with " "this proxy before proceeding.",
    ),
    408: ("Request Timeout", "Request timed out; try again later."),
    409: ("Conflict", "Request conflict."),
    410: ("Gone", "URI no longer exists and has been permanently removed."),
    411: ("Length Required", "Client must specify Content-Length."),
    412: ("Precondition Failed", "Precondition in headers is false."),
    413: ("Request Entity Too Large", "Entity is too large."),
    414: ("Request-URI Too Long", "URI is too long."),
    415: ("Unsupported Media Type", "Entity body in unsupported format."),
    416: ("Requested Range Not Satisfiable", "Cannot satisfy request range."),
    417: ("Expectation Failed", "Expect condition could not be satisfied."),
    500: ("Internal Server Error", "Server got itself in trouble"),
    501: ("Not Implemented", "Server does not support this operation"),
    502: ("Bad Gateway", "Invalid responses from another server/proxy."),
    503: (
        "Service Unavailable",
        "The server cannot process the request due to a high load",
    ),
    504: ("Gateway Timeout", "The gateway server did not receive a timely response"),
    505: ("HTTP Version Not Supported", "Cannot fulfill request."),
    # Brain's custom code. The original `("Brain Exception")` was a bare
    # parenthesized string, not a tuple — made it a (title, message) pair
    # consistent with every other entry. BrainException.get_response_exp
    # supplies the concrete message at raise time.
    506: ("Brain Exception", "Exception occurred in brain"),
}
|
src/common/utils.py
CHANGED
|
@@ -23,7 +23,7 @@ PINECONE_NAMESPACE = "risinglangchain-namespace"
|
|
| 23 |
PINECONE_INDEX_NAME = "risinglangchain-index"
|
| 24 |
|
| 25 |
# open ai
|
| 26 |
-
|
| 27 |
|
| 28 |
# AI Agent name
|
| 29 |
AGENT_NAME = "RisingBrain Assistant"
|
|
@@ -35,6 +35,8 @@ COMMAND_BROWSER_OPEN = [10]
|
|
| 35 |
# Twilio
|
| 36 |
ACCOUNT_SID = os.getenv("TWILIO_ACCOUNT_SID")
|
| 37 |
AUTH_TOKEN = os.getenv("TWILIO_AUTH_TOKEN")
|
|
|
|
|
|
|
| 38 |
|
| 39 |
|
| 40 |
def get_firebase_cred():
|
|
|
|
| 23 |
PINECONE_INDEX_NAME = "risinglangchain-index"
|
| 24 |
|
| 25 |
# open ai
|
| 26 |
+
DEFAULT_GPT_MODEL = "gpt-4"
|
| 27 |
|
| 28 |
# AI Agent name
|
| 29 |
AGENT_NAME = "RisingBrain Assistant"
|
|
|
|
| 35 |
# Twilio
|
| 36 |
ACCOUNT_SID = os.getenv("TWILIO_ACCOUNT_SID")
|
| 37 |
AUTH_TOKEN = os.getenv("TWILIO_AUTH_TOKEN")
|
| 38 |
+
# HuggingFace
|
| 39 |
+
HUGGINGFACEHUB_API_TOKEN = os.getenv("HUGGINGFACEHUB_API_TOKEN")
|
| 40 |
|
| 41 |
|
| 42 |
def get_firebase_cred():
|
src/model/requests/request_model.py
CHANGED
|
@@ -4,6 +4,8 @@ from pydantic import BaseModel
|
|
| 4 |
from fastapi import Depends, Request, HTTPException
|
| 5 |
from user_agents import parse
|
| 6 |
|
|
|
|
|
|
|
| 7 |
|
| 8 |
class ClientInfo:
|
| 9 |
def __init__(self, browser, os, device_type):
|
|
@@ -51,6 +53,7 @@ def get_client_info(request: Request):
|
|
| 51 |
class BasicReq(BaseModel):
|
| 52 |
token: str
|
| 53 |
uuid: str
|
|
|
|
| 54 |
|
| 55 |
|
| 56 |
"""endpoint: /sendNotification"""
|
|
|
|
| 4 |
from fastapi import Depends, Request, HTTPException
|
| 5 |
from user_agents import parse
|
| 6 |
|
| 7 |
+
"""user-agent management"""
|
| 8 |
+
|
| 9 |
|
| 10 |
class ClientInfo:
|
| 11 |
def __init__(self, browser, os, device_type):
|
|
|
|
| 53 |
class BasicReq(BaseModel):
|
| 54 |
token: str
|
| 55 |
uuid: str
|
| 56 |
+
model: str = "gpt-3.5-turbo"
|
| 57 |
|
| 58 |
|
| 59 |
"""endpoint: /sendNotification"""
|
src/rising_plugin/guardrails-config/actions/actions.py
CHANGED
|
@@ -17,11 +17,9 @@ import os
|
|
| 17 |
import json
|
| 18 |
import numpy as np
|
| 19 |
|
| 20 |
-
from langchain.chat_models import ChatOpenAI
|
| 21 |
from langchain.embeddings.openai import OpenAIEmbeddings
|
| 22 |
from langchain.vectorstores import utils
|
| 23 |
from langchain.document_loaders.csv_loader import CSVLoader
|
| 24 |
-
from langchain.chains.question_answering import load_qa_chain
|
| 25 |
from langchain.docstore.document import Document
|
| 26 |
|
| 27 |
from src.common.utils import (
|
|
@@ -35,11 +33,20 @@ from src.rising_plugin.image_embedding import (
|
|
| 35 |
|
| 36 |
from nemoguardrails.actions import action
|
| 37 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 38 |
|
| 39 |
@action()
|
| 40 |
async def general_question(query, model, uuid, image_search):
|
| 41 |
-
|
| 42 |
-
chain = load_qa_chain(llm, chain_type="stuff")
|
| 43 |
file_path = os.path.dirname(os.path.abspath(__file__))
|
| 44 |
|
| 45 |
with open(f"{file_path}/phone.json", "r") as infile:
|
|
@@ -60,7 +67,15 @@ async def general_question(query, model, uuid, image_search):
|
|
| 60 |
)
|
| 61 |
)
|
| 62 |
|
| 63 |
-
chain_data =
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
try:
|
| 65 |
result = json.loads(chain_data)
|
| 66 |
# check image query with only its text
|
|
@@ -72,6 +87,9 @@ async def general_question(query, model, uuid, image_search):
|
|
| 72 |
|
| 73 |
# else:
|
| 74 |
# return result
|
|
|
|
|
|
|
|
|
|
| 75 |
return str(result)
|
| 76 |
except ValueError as e:
|
| 77 |
# Check sms and browser query
|
|
@@ -79,4 +97,4 @@ async def general_question(query, model, uuid, image_search):
|
|
| 79 |
return str({"program": "sms", "content": chain_data})
|
| 80 |
elif doc_list[0] in COMMAND_BROWSER_OPEN:
|
| 81 |
return str({"program": "browser", "content": "https://google.com"})
|
| 82 |
-
return str({"program": "message", "content":
|
|
|
|
| 17 |
import json
|
| 18 |
import numpy as np
|
| 19 |
|
|
|
|
| 20 |
from langchain.embeddings.openai import OpenAIEmbeddings
|
| 21 |
from langchain.vectorstores import utils
|
| 22 |
from langchain.document_loaders.csv_loader import CSVLoader
|
|
|
|
| 23 |
from langchain.docstore.document import Document
|
| 24 |
|
| 25 |
from src.common.utils import (
|
|
|
|
| 33 |
|
| 34 |
from nemoguardrails.actions import action
|
| 35 |
|
| 36 |
+
from src.rising_plugin.llm.falcon_llm import FalconLLM
|
| 37 |
+
from src.rising_plugin.llm.gpt_llm import GptLLM
|
| 38 |
+
from src.rising_plugin.llm.llms import (
|
| 39 |
+
get_llm_chain,
|
| 40 |
+
GPT_3_5_TURBO,
|
| 41 |
+
GPT_4_32K,
|
| 42 |
+
GPT_4,
|
| 43 |
+
FALCON_7B,
|
| 44 |
+
)
|
| 45 |
+
|
| 46 |
|
| 47 |
@action()
|
| 48 |
async def general_question(query, model, uuid, image_search):
|
| 49 |
+
"""step1: handle with gpt-4"""
|
|
|
|
| 50 |
file_path = os.path.dirname(os.path.abspath(__file__))
|
| 51 |
|
| 52 |
with open(f"{file_path}/phone.json", "r") as infile:
|
|
|
|
| 67 |
)
|
| 68 |
)
|
| 69 |
|
| 70 |
+
chain_data = get_llm_chain(model=model).run(input_documents=docs, question=query)
|
| 71 |
+
# test
|
| 72 |
+
# if model == GPT_3_5_TURBO or model == GPT_4 or model == GPT_4_32K:
|
| 73 |
+
# gpt_llm = GptLLM(model=model)
|
| 74 |
+
# chain_data = gpt_llm.get_chain().run(input_documents=docs, question=query)
|
| 75 |
+
# elif model == FALCON_7B:
|
| 76 |
+
# falcon_llm = FalconLLM()
|
| 77 |
+
# chain_data = falcon_llm.get_chain().run(question=query)
|
| 78 |
+
falcon_llm = FalconLLM()
|
| 79 |
try:
|
| 80 |
result = json.loads(chain_data)
|
| 81 |
# check image query with only its text
|
|
|
|
| 87 |
|
| 88 |
# else:
|
| 89 |
# return result
|
| 90 |
+
"""check program is message to handle it with falcon llm"""
|
| 91 |
+
if result["program"] == "message":
|
| 92 |
+
result["content"] = falcon_llm.query(question=query)
|
| 93 |
return str(result)
|
| 94 |
except ValueError as e:
|
| 95 |
# Check sms and browser query
|
|
|
|
| 97 |
return str({"program": "sms", "content": chain_data})
|
| 98 |
elif doc_list[0] in COMMAND_BROWSER_OPEN:
|
| 99 |
return str({"program": "browser", "content": "https://google.com"})
|
| 100 |
+
return str({"program": "message", "content": falcon_llm.query(question=query)})
|
src/rising_plugin/guardrails-config/actions/phone.csv
CHANGED
|
@@ -6,15 +6,15 @@
|
|
| 6 |
"If user said that send sms or text, please answer belowing json format. {""program"": ""sms"", ""content"": ""ask who""}"
|
| 7 |
"If user said that compose, write, or create an sms message, please answer belowing json format. {""program"": ""sms"", ""content"": ""ask who""}"
|
| 8 |
"If user said that search contact with its description such as display name or phone number, please answer belowing json format. {""program"": ""contact"", ""content"": ""description of the contact that user is going to search""}"
|
| 9 |
-
"If user said that open a
|
| 10 |
-
"If user said that open a
|
| 11 |
-
"If user said that close a tab, please answer belowing json format
|
| 12 |
-
"If user said that launch a browser or open a browser
|
| 13 |
-
"If user said that go to a previous page, or open a previous page
|
| 14 |
-
"If user said that go to a next page, or open a next page
|
| 15 |
-
"If user said that scroll up, scroll up page, or page scroll up
|
| 16 |
-
"If user said that scroll down, scroll down page, page scroll down
|
| 17 |
-
"If user said that scroll top, scroll top page, or scroll top of page
|
| 18 |
-
"If user said that scroll bottom, scroll bottom page, or scroll bottom of page
|
| 19 |
"If user is going to select an item, an article or a website with its description in a web browser, please answer belowing json format. {""program"": ""select_item_detail_info"", ""content"": ""the description of an item, an article or a website in a browser""}"
|
| 20 |
"If all of above is not correct, please give the most appropriate answer to the user's question. Please answer belowing json format. {""program"":""message"", ""content"":""your answer""}"
|
|
|
|
| 6 |
"If user said that send sms or text, please answer belowing json format. {""program"": ""sms"", ""content"": ""ask who""}"
|
| 7 |
"If user said that compose, write, or create an sms message, please answer belowing json format. {""program"": ""sms"", ""content"": ""ask who""}"
|
| 8 |
"If user said that search contact with its description such as display name or phone number, please answer belowing json format. {""program"": ""contact"", ""content"": ""description of the contact that user is going to search""}"
|
| 9 |
+
"If user said that open a tab, go to a tab, or open a page, please answer belowing json format. {""program"": ""open_tab"", ""content"": """"}"
|
| 10 |
+
"If user said that open a tab and search, go to a tab and search, or open a page and search, please answer belowing json format. {""program"": ""open_tab_search"", ""content"": ""keyword that user is going to search""}"
|
| 11 |
+
"If user said that close a tab, please answer belowing json format. {""program"": ""close_tab"", ""content"": """"}"
|
| 12 |
+
"If user said that launch a browser or open a browser, please answer belowing json format. {""program"": ""browser"", ""content"": ""https://google.com""}"
|
| 13 |
+
"If user said that go to a previous page, or open a previous page, please answer belowing json format. {""program"": ""previous_page"", ""content"": """"}"
|
| 14 |
+
"If user said that go to a next page, or open a next page, please answer belowing json format. {""program"": ""next_page"", ""content"": """"}"
|
| 15 |
+
"If user said that scroll up, scroll up page, or page scroll up, please answer belowing json format. {""program"": ""scroll_up"", ""content"": """"}"
|
| 16 |
+
"If user said that scroll down, scroll down page, page scroll down, please answer belowing json format. {""program"": ""scroll_down"", ""content"": """"}"
|
| 17 |
+
"If user said that scroll top, scroll top page, or scroll top of page, please answer belowing json format. {""program"": ""scroll_top"", ""content"": """"}"
|
| 18 |
+
"If user said that scroll bottom, scroll bottom page, or scroll bottom of page, please answer belowing json format. {""program"": ""scroll_bottom"", ""content"": """"}"
|
| 19 |
"If user is going to select an item, an article or a website with its description in a web browser, please answer belowing json format. {""program"": ""select_item_detail_info"", ""content"": ""the description of an item, an article or a website in a browser""}"
|
| 20 |
"If all of above is not correct, please give the most appropriate answer to the user's question. Please answer belowing json format. {""program"":""message"", ""content"":""your answer""}"
|
src/rising_plugin/guardrails-config/actions/phone.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
src/rising_plugin/guardrails-config/general.co
CHANGED
|
@@ -15,5 +15,5 @@ define bot inform capabilities
|
|
| 15 |
define flow
|
| 16 |
priority 0.9
|
| 17 |
user ...
|
| 18 |
-
$result = execute general_question(query=$last_user_message, model="gpt-
|
| 19 |
bot $result
|
|
|
|
| 15 |
define flow
|
| 16 |
priority 0.9
|
| 17 |
user ...
|
| 18 |
+
$result = execute general_question(query=$last_user_message, model="gpt-4", uuid="", image_search=True)
|
| 19 |
bot $result
|
src/rising_plugin/llm/__init__.py
ADDED
|
File without changes
|
src/rising_plugin/llm/falcon_llm.py
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""falcon llm"""
|
| 2 |
+
from langchain import HuggingFaceHub, PromptTemplate, LLMChain
|
| 3 |
+
|
| 4 |
+
from src.common.utils import HUGGINGFACEHUB_API_TOKEN
|
| 5 |
+
|
| 6 |
+
repo_id = "tiiuae/falcon-7b-instruct"
|
| 7 |
+
template = """
|
| 8 |
+
You are an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user's questions.
|
| 9 |
+
|
| 10 |
+
{question}
|
| 11 |
+
|
| 12 |
+
"""
|
| 13 |
+
|
| 14 |
+
|
| 15 |
+
class FalconLLM:
|
| 16 |
+
def __init__(self, temperature: float = 0.6, max_new_tokens: int = 2000):
|
| 17 |
+
self.llm = HuggingFaceHub(
|
| 18 |
+
huggingfacehub_api_token=HUGGINGFACEHUB_API_TOKEN,
|
| 19 |
+
repo_id=repo_id,
|
| 20 |
+
model_kwargs={"temperature": temperature, "max_new_tokens": max_new_tokens},
|
| 21 |
+
)
|
| 22 |
+
|
| 23 |
+
def get_llm(self):
|
| 24 |
+
return self.llm
|
| 25 |
+
|
| 26 |
+
def get_chain(self):
|
| 27 |
+
prompt = PromptTemplate(template=template, input_variables=["question"])
|
| 28 |
+
llm_chain = LLMChain(prompt=prompt, llm=self.llm, verbose=True)
|
| 29 |
+
return llm_chain
|
| 30 |
+
|
| 31 |
+
"""getting the output in query with falcon llm"""
|
| 32 |
+
|
| 33 |
+
def query(self, question: str) -> str:
|
| 34 |
+
chain = self.get_chain()
|
| 35 |
+
return chain.run(question=question)
|
src/rising_plugin/llm/gpt_llm.py
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""gpt-open ai llm"""
|
| 2 |
+
from typing import Any
|
| 3 |
+
|
| 4 |
+
from langchain.chat_models import ChatOpenAI
|
| 5 |
+
from langchain.chains.question_answering import load_qa_chain
|
| 6 |
+
from src.common.utils import (
|
| 7 |
+
OPENAI_API_KEY,
|
| 8 |
+
)
|
| 9 |
+
|
| 10 |
+
|
| 11 |
+
class GptLLM:
|
| 12 |
+
def __init__(self, model: str = "gpt-3.5-turbo", temperature: float = 0.6):
|
| 13 |
+
self.llm = self.init_llm(model=model, temperature=temperature)
|
| 14 |
+
|
| 15 |
+
def init_llm(self, model: str = "gpt-3.5-turbo", temperature: float = 0.6) -> Any:
|
| 16 |
+
self.llm = ChatOpenAI(
|
| 17 |
+
model_name=model, temperature=temperature, openai_api_key=OPENAI_API_KEY
|
| 18 |
+
)
|
| 19 |
+
return self.llm
|
| 20 |
+
|
| 21 |
+
def get_llm(self):
|
| 22 |
+
return self.llm
|
| 23 |
+
|
| 24 |
+
def get_chain(self):
|
| 25 |
+
chain = load_qa_chain(self.llm, chain_type="stuff")
|
| 26 |
+
return chain
|
src/rising_plugin/llm/llms.py
ADDED
|
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""lLMs which we offer"""
|
| 2 |
+
from typing import Any
|
| 3 |
+
|
| 4 |
+
from src.common.brain_exception import BrainException
|
| 5 |
+
from src.rising_plugin.llm.falcon_llm import FalconLLM
|
| 6 |
+
from src.rising_plugin.llm.gpt_llm import GptLLM
|
| 7 |
+
|
| 8 |
+
# Canonical model identifiers accepted by this module.
GPT_3_5_TURBO = "gpt-3.5-turbo"
GPT_4 = "gpt-4"
GPT_4_32K = "gpt-4-32k"
FALCON_7B = "falcon-7b"

"""list of available model we offer you"""
LLM_MODELS = [GPT_3_5_TURBO, GPT_4, GPT_4_32K, FALCON_7B]


"""exception message"""
EXCEPTION_MSG = f"The model is not correct. It should be in {LLM_MODELS}"


def validate_model(model: str) -> bool:
    """Return True when *model* is one of the supported LLM names."""
    # Membership test directly — the original `if ...: return True / return
    # False` ladder is the non-idiomatic spelling of the same thing.
    return model in LLM_MODELS
|
| 27 |
+
|
| 28 |
+
|
| 29 |
+
"""
|
| 30 |
+
Args
|
| 31 |
+
model: model name of LLM such as 'gpt-3.5-turbo' | 'falcon-7b'
|
| 32 |
+
Returns
|
| 33 |
+
datatype: LLmChain
|
| 34 |
+
"""
|
| 35 |
+
|
| 36 |
+
|
| 37 |
+
def get_llm_chain(
|
| 38 |
+
model: str, temperature: float = 0.6, max_new_tokens: int = 2000
|
| 39 |
+
) -> Any:
|
| 40 |
+
if not validate_model(model):
|
| 41 |
+
raise BrainException(EXCEPTION_MSG)
|
| 42 |
+
"""check model"""
|
| 43 |
+
llm = get_llm(model=model, temperature=temperature, max_new_tokens=max_new_tokens)
|
| 44 |
+
|
| 45 |
+
return llm.get_chain()
|
| 46 |
+
|
| 47 |
+
|
| 48 |
+
def get_llm(model: str, temperature: float = 0.6, max_new_tokens: int = 2000) -> Any:
    """Return the LLM wrapper (GptLLM or FalconLLM) for *model*.

    Args:
        model: model name such as 'gpt-3.5-turbo' | 'falcon-7b'.
        temperature: sampling temperature (used by the Falcon wrapper).
        max_new_tokens: generation cap (used by the Falcon wrapper).

    Raises:
        BrainException: when *model* is not in LLM_MODELS.
    """
    if not validate_model(model):
        raise BrainException(EXCEPTION_MSG)
    # After validation the branches below are exhaustive over LLM_MODELS.
    # The original pre-built a throwaway default GptLLM() (a real ChatOpenAI
    # client) before overwriting it — wasted construction, now removed.
    if model in (GPT_3_5_TURBO, GPT_4, GPT_4_32K):
        return GptLLM(model=model)
    return FalconLLM(temperature=temperature, max_new_tokens=max_new_tokens)
|
src/rising_plugin/risingplugin.py
CHANGED
|
@@ -14,9 +14,11 @@ from langchain.chat_models import ChatOpenAI
|
|
| 14 |
|
| 15 |
from firebase_admin import storage
|
| 16 |
|
|
|
|
| 17 |
from ..common.utils import (
|
| 18 |
OPENAI_API_KEY,
|
| 19 |
FIREBASE_STORAGE_ROOT,
|
|
|
|
| 20 |
parseJsonFromCompletion,
|
| 21 |
)
|
| 22 |
from .image_embedding import (
|
|
@@ -49,7 +51,6 @@ def processLargeText(app: any, chunks: any):
|
|
| 49 |
]
|
| 50 |
)
|
| 51 |
result = json.dumps(message["content"])
|
| 52 |
-
|
| 53 |
return parseJsonFromCompletion(result)
|
| 54 |
else:
|
| 55 |
first_query = "The total length of the content that I want to send you is too large to send in only one piece.\nFor sending you that content, I will follow this rule:\n[START PART 1/10]\nThis is the content of the part 1 out of 10 in total\n[END PART 1/10]\nThen you just answer: 'Received part 1/10'\nAnd when I tell you 'ALL PART SENT', then you can continue processing the data and answering my requests."
|
|
@@ -108,16 +109,16 @@ def processLargeText(app: any, chunks: any):
|
|
| 108 |
|
| 109 |
def getCompletion(
|
| 110 |
query,
|
| 111 |
-
model=
|
| 112 |
uuid="",
|
| 113 |
image_search=True,
|
| 114 |
):
|
| 115 |
-
llm =
|
| 116 |
-
|
| 117 |
# Break input text into chunks
|
| 118 |
chunks = getChunks(query)
|
| 119 |
|
| 120 |
app = LLMRails(config, llm)
|
|
|
|
| 121 |
return processLargeText(app, chunks)
|
| 122 |
|
| 123 |
|
|
|
|
| 14 |
|
| 15 |
from firebase_admin import storage
|
| 16 |
|
| 17 |
+
from .llm.llms import get_llm, GPT_4, FALCON_7B
|
| 18 |
from ..common.utils import (
|
| 19 |
OPENAI_API_KEY,
|
| 20 |
FIREBASE_STORAGE_ROOT,
|
| 21 |
+
DEFAULT_GPT_MODEL,
|
| 22 |
parseJsonFromCompletion,
|
| 23 |
)
|
| 24 |
from .image_embedding import (
|
|
|
|
| 51 |
]
|
| 52 |
)
|
| 53 |
result = json.dumps(message["content"])
|
|
|
|
| 54 |
return parseJsonFromCompletion(result)
|
| 55 |
else:
|
| 56 |
first_query = "The total length of the content that I want to send you is too large to send in only one piece.\nFor sending you that content, I will follow this rule:\n[START PART 1/10]\nThis is the content of the part 1 out of 10 in total\n[END PART 1/10]\nThen you just answer: 'Received part 1/10'\nAnd when I tell you 'ALL PART SENT', then you can continue processing the data and answering my requests."
|
|
|
|
| 109 |
|
| 110 |
def getCompletion(
    query,
    model=DEFAULT_GPT_MODEL,
    uuid="",
    image_search=True,
):
    """Run *query* through the guardrails app and return the processed result.

    NOTE(review): the *model* parameter is accepted but never used — the
    rails LLM below is always built from DEFAULT_GPT_MODEL. Confirm whether
    per-request model selection was intended here.
    """
    rails_llm = get_llm(model=DEFAULT_GPT_MODEL).get_llm()
    # Break input text into chunks
    text_chunks = getChunks(query)

    rails_app = LLMRails(config, rails_llm)

    return processLargeText(rails_app, text_chunks)
|
| 123 |
|
| 124 |
|
src/router/api.py
CHANGED
|
@@ -2,6 +2,7 @@ import json
|
|
| 2 |
import os
|
| 3 |
|
| 4 |
from src.common.assembler import Assembler
|
|
|
|
| 5 |
from src.common.utils import ProgramType
|
| 6 |
from src.model.image_model import ImageModel
|
| 7 |
from src.model.requests.request_model import (
|
|
@@ -77,13 +78,17 @@ def construct_blueprint_api() -> APIRouter:
|
|
| 77 |
uuid=uuid, search=result["content"]
|
| 78 |
)
|
| 79 |
result["content"] = str(contacts_results)
|
| 80 |
-
except Exception as e:
|
| 81 |
-
logger.error(title="sendNotification", message=json.dumps(result))
|
| 82 |
|
| 83 |
-
|
| 84 |
|
| 85 |
-
|
| 86 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 87 |
|
| 88 |
"""@generator.response(
|
| 89 |
status_code=200, schema={"message": "message", "result": "test_result"}
|
|
|
|
| 2 |
import os
|
| 3 |
|
| 4 |
from src.common.assembler import Assembler
|
| 5 |
+
from src.common.brain_exception import BrainException
|
| 6 |
from src.common.utils import ProgramType
|
| 7 |
from src.model.image_model import ImageModel
|
| 8 |
from src.model.requests.request_model import (
|
|
|
|
| 78 |
uuid=uuid, search=result["content"]
|
| 79 |
)
|
| 80 |
result["content"] = str(contacts_results)
|
|
|
|
|
|
|
| 81 |
|
| 82 |
+
notification = {"title": "alert", "content": json.dumps(result)}
|
| 83 |
|
| 84 |
+
state, value = send_message(notification, [token])
|
| 85 |
+
return assembler.to_response(200, value, result)
|
| 86 |
+
except Exception as e:
|
| 87 |
+
logger.error(
|
| 88 |
+
title="sendNotification", message="json parsing or get completion error"
|
| 89 |
+
)
|
| 90 |
+
if isinstance(e, BrainException):
|
| 91 |
+
return e.get_response_exp()
|
| 92 |
|
| 93 |
"""@generator.response(
|
| 94 |
status_code=200, schema={"message": "message", "result": "test_result"}
|
src/service/llm/chat_service.py
CHANGED
|
@@ -3,7 +3,7 @@ import time
|
|
| 3 |
|
| 4 |
from openai.error import RateLimitError
|
| 5 |
|
| 6 |
-
from src.common.utils import AGENT_NAME,
|
| 7 |
from src.rising_plugin.risingplugin import handle_chat_completion
|
| 8 |
from src.logs import logger
|
| 9 |
from src.model.chat_response_model import ChatResponseModel
|
|
@@ -11,7 +11,7 @@ from src.model.message_model import MessageModel
|
|
| 11 |
|
| 12 |
|
| 13 |
class ChatService:
|
| 14 |
-
def __init__(self, ai_name=AGENT_NAME, llm_model=
|
| 15 |
self.ai_name = ai_name
|
| 16 |
self.llm_model = llm_model
|
| 17 |
|
|
|
|
| 3 |
|
| 4 |
from openai.error import RateLimitError
|
| 5 |
|
| 6 |
+
from src.common.utils import AGENT_NAME, DEFAULT_GPT_MODEL
|
| 7 |
from src.rising_plugin.risingplugin import handle_chat_completion
|
| 8 |
from src.logs import logger
|
| 9 |
from src.model.chat_response_model import ChatResponseModel
|
|
|
|
| 11 |
|
| 12 |
|
| 13 |
class ChatService:
|
| 14 |
+
def __init__(self, ai_name=AGENT_NAME, llm_model=DEFAULT_GPT_MODEL):
|
| 15 |
self.ai_name = ai_name
|
| 16 |
self.llm_model = llm_model
|
| 17 |
|