Aryan Jain committed on
Commit
609858e
·
1 Parent(s): c2ebaa7

migrate to groq

Browse files
Files changed (4) hide show
  1. .env.example +2 -2
  2. poetry.lock +77 -1
  3. pyproject.toml +1 -0
  4. src/utils/_chat_client.py +28 -14
.env.example CHANGED
@@ -1,4 +1,4 @@
1
  LOG_FILE=
2
- HF_TOKEN=
3
  PINECONE_API_KEY=
4
- PINECONE_INDEX_NAME=
 
 
1
  LOG_FILE=
 
2
  PINECONE_API_KEY=
3
+ PINECONE_INDEX_NAME=
4
+ GROQ_API_KEY=
poetry.lock CHANGED
@@ -264,6 +264,17 @@ files = [
264
  {file = "colorama-0.4.6.tar.gz", hash = "sha256:08695f5cb7ed6e0531a20572697297273c47b8cae5a63ffc6d6ed5c201be6e44"},
265
  ]
266
 
 
 
 
 
 
 
 
 
 
 
 
267
  [[package]]
268
  name = "fastapi"
269
  version = "0.112.2"
@@ -427,6 +438,25 @@ files = [
427
  docs = ["Sphinx", "furo"]
428
  test = ["objgraph", "psutil"]
429
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
430
  [[package]]
431
  name = "grpcio"
432
  version = "1.66.1"
@@ -496,6 +526,27 @@ files = [
496
  {file = "h11-0.14.0.tar.gz", hash = "sha256:8f19fbbe99e72420ff35c00b27a34cb9937e902a8b810e2c88300c6f0a3b699d"},
497
  ]
498
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
499
  [[package]]
500
  name = "httptools"
501
  version = "0.6.1"
@@ -544,6 +595,31 @@ files = [
544
  [package.extras]
545
  test = ["Cython (>=0.29.24,<0.30.0)"]
546
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
547
  [[package]]
548
  name = "huggingface-hub"
549
  version = "0.24.6"
@@ -1623,4 +1699,4 @@ dev = ["black (>=19.3b0)", "pytest (>=4.6.2)"]
1623
  [metadata]
1624
  lock-version = "2.0"
1625
  python-versions = "3.11.*"
1626
- content-hash = "5fdd4c6613f0bfe9744a9ad2d35e8a225ab8eb6da52724717996dbc79c6f6062"
 
264
  {file = "colorama-0.4.6.tar.gz", hash = "sha256:08695f5cb7ed6e0531a20572697297273c47b8cae5a63ffc6d6ed5c201be6e44"},
265
  ]
266
 
267
+ [[package]]
268
+ name = "distro"
269
+ version = "1.9.0"
270
+ description = "Distro - an OS platform information API"
271
+ optional = false
272
+ python-versions = ">=3.6"
273
+ files = [
274
+ {file = "distro-1.9.0-py3-none-any.whl", hash = "sha256:7bffd925d65168f85027d8da9af6bddab658135b840670a223589bc0c8ef02b2"},
275
+ {file = "distro-1.9.0.tar.gz", hash = "sha256:2fa77c6fd8940f116ee1d6b94a2f90b13b5ea8d019b98bc8bafdcabcdd9bdbed"},
276
+ ]
277
+
278
  [[package]]
279
  name = "fastapi"
280
  version = "0.112.2"
 
438
  docs = ["Sphinx", "furo"]
439
  test = ["objgraph", "psutil"]
440
 
441
+ [[package]]
442
+ name = "groq"
443
+ version = "0.11.0"
444
+ description = "The official Python library for the groq API"
445
+ optional = false
446
+ python-versions = ">=3.7"
447
+ files = [
448
+ {file = "groq-0.11.0-py3-none-any.whl", hash = "sha256:e328531c979542e563668c62260aec13b43a6ee0ca9e2fb22dff1d26f8c8ce54"},
449
+ {file = "groq-0.11.0.tar.gz", hash = "sha256:dbb9aefedf388ddd4801ec7bf3eba7f5edb67948fec0cd2829d97244059f42a7"},
450
+ ]
451
+
452
+ [package.dependencies]
453
+ anyio = ">=3.5.0,<5"
454
+ distro = ">=1.7.0,<2"
455
+ httpx = ">=0.23.0,<1"
456
+ pydantic = ">=1.9.0,<3"
457
+ sniffio = "*"
458
+ typing-extensions = ">=4.7,<5"
459
+
460
  [[package]]
461
  name = "grpcio"
462
  version = "1.66.1"
 
526
  {file = "h11-0.14.0.tar.gz", hash = "sha256:8f19fbbe99e72420ff35c00b27a34cb9937e902a8b810e2c88300c6f0a3b699d"},
527
  ]
528
 
529
+ [[package]]
530
+ name = "httpcore"
531
+ version = "1.0.6"
532
+ description = "A minimal low-level HTTP client."
533
+ optional = false
534
+ python-versions = ">=3.8"
535
+ files = [
536
+ {file = "httpcore-1.0.6-py3-none-any.whl", hash = "sha256:27b59625743b85577a8c0e10e55b50b5368a4f2cfe8cc7bcfa9cf00829c2682f"},
537
+ {file = "httpcore-1.0.6.tar.gz", hash = "sha256:73f6dbd6eb8c21bbf7ef8efad555481853f5f6acdeaff1edb0694289269ee17f"},
538
+ ]
539
+
540
+ [package.dependencies]
541
+ certifi = "*"
542
+ h11 = ">=0.13,<0.15"
543
+
544
+ [package.extras]
545
+ asyncio = ["anyio (>=4.0,<5.0)"]
546
+ http2 = ["h2 (>=3,<5)"]
547
+ socks = ["socksio (==1.*)"]
548
+ trio = ["trio (>=0.22.0,<1.0)"]
549
+
550
  [[package]]
551
  name = "httptools"
552
  version = "0.6.1"
 
595
  [package.extras]
596
  test = ["Cython (>=0.29.24,<0.30.0)"]
597
 
598
+ [[package]]
599
+ name = "httpx"
600
+ version = "0.27.2"
601
+ description = "The next generation HTTP client."
602
+ optional = false
603
+ python-versions = ">=3.8"
604
+ files = [
605
+ {file = "httpx-0.27.2-py3-none-any.whl", hash = "sha256:7bb2708e112d8fdd7829cd4243970f0c223274051cb35ee80c03301ee29a3df0"},
606
+ {file = "httpx-0.27.2.tar.gz", hash = "sha256:f7c2be1d2f3c3c3160d441802406b206c2b76f5947b11115e6df10c6c65e66c2"},
607
+ ]
608
+
609
+ [package.dependencies]
610
+ anyio = "*"
611
+ certifi = "*"
612
+ httpcore = "==1.*"
613
+ idna = "*"
614
+ sniffio = "*"
615
+
616
+ [package.extras]
617
+ brotli = ["brotli", "brotlicffi"]
618
+ cli = ["click (==8.*)", "pygments (==2.*)", "rich (>=10,<14)"]
619
+ http2 = ["h2 (>=3,<5)"]
620
+ socks = ["socksio (==1.*)"]
621
+ zstd = ["zstandard (>=0.18.0)"]
622
+
623
  [[package]]
624
  name = "huggingface-hub"
625
  version = "0.24.6"
 
1699
  [metadata]
1700
  lock-version = "2.0"
1701
  python-versions = "3.11.*"
1702
+ content-hash = "0f525b306edcca87bf7610ba62d87494081bf667f74bceb87cb2be1fb5b539a4"
pyproject.toml CHANGED
@@ -17,6 +17,7 @@ nltk = "^3.9.1"
17
  pinecone = {extras = ["grpc"], version = "^5.1.0"}
18
  uvicorn = {extras = ["standard"], version = "^0.30.6"}
19
  aiofiles = "^24.1.0"
 
20
 
21
 
22
  [build-system]
 
17
  pinecone = {extras = ["grpc"], version = "^5.1.0"}
18
  uvicorn = {extras = ["standard"], version = "^0.30.6"}
19
  aiofiles = "^24.1.0"
20
+ groq = "^0.11.0"
21
 
22
 
23
  [build-system]
src/utils/_chat_client.py CHANGED
@@ -1,37 +1,49 @@
1
  import os
2
- from huggingface_hub import InferenceClient
3
 
4
  INSTRUCTIONS="""
5
  You are an AI assistant designed by Sifars, a web development company, who gives answers to queries regarding Sifars, to the best of your ability.
6
  You will be provided a context along with each user query which you will use to answer the queries.
7
  Match the question with the context and according to that answer the user query.
 
 
 
 
 
 
 
 
8
  <RULES>
 
 
 
 
9
  - Keep your responses as short and to the point as possible. They should be concise, engaging, and easy to read.
10
  - Avoid including extra information not asked for in the user query.
11
  - Use plural first person pronouns when talking about sifars.
12
  - Try to answer the query from the context provided. Even if the context does not directly answer the question, try to relate it to the question and formulate an answer.
13
- - Do not mention the context provided, or the contents of the context, for any reason in your message.
14
- - If someone asks about sifars, give them only the necessary details and then ask them to visit our about page at [this link](https://www.sifars.com/en/about/).
15
- - If someone asks about the services we provide, give them a bit of idea according to the interest of their query and then direct them to our services page at [this link](https://www.sifars.com/en/services/).
16
- - If someone asks about our projects or portfolio, provide them details of any three projects with minimal overview of those projects, according to the interest of their query and then direct them to our portfolio page at [this link](https://www.sifars.com/en/portfolio/).
17
- - If someone asks about our technology or tech stack that we use, give them a bit of idea according to the interest of their query and then direct them to our technology page at [this link](https://www.sifars.com/en/technology/).
18
- - If someone asks about career opportunities, direct them to our career page at [this link](https://www.sifars.com/en/career/).
 
19
  </RULES>
20
  """
21
 
22
  class ChatClient:
23
  def __init__(
24
  self,
25
- model: str="meta-llama/Llama-3.2-11B-Vision-Instruct",
26
  max_tokens: int=4096,
27
  stream: bool=True,
28
  system_message: str=INSTRUCTIONS
29
  ):
30
- self.client = InferenceClient(
31
- model=model,
32
- token=os.getenv("HF_TOKEN")
33
  )
34
-
35
  self.max_tokens = max_tokens
36
  self.stream = stream
37
  self.system_message = system_message
@@ -46,13 +58,15 @@ class ChatClient:
46
  self,
47
  messages: list,
48
  ):
49
- for message in self.client.chat_completion(
50
  messages=[
51
  {"role": "system", "content": self.system_message},
52
  *messages
53
  ],
 
54
  max_tokens=self.max_tokens,
55
  stream=self.stream,
56
  temperature=0.7
57
  ):
58
- yield message.choices[0].delta.content
 
 
1
  import os
2
+ from groq import Groq
3
 
4
  INSTRUCTIONS="""
5
  You are an AI assistant designed by Sifars, a web development company, who gives answers to queries regarding Sifars, to the best of your ability.
6
  You will be provided a context along with each user query which you will use to answer the queries.
7
  Match the question with the context and according to that answer the user query.
8
+
9
+ # Here is a bit of information about Sifars:
10
+ Sifars, a pioneering web service provider, emerged onto the tech landscape in 2018 with a vision to revolutionize the digital sphere. Founded by visionary entrepreneurs Jatin Sethi, Munish Kumar, and Sukhwinder Singh, Sifars set its sights on empowering businesses worldwide with cutting-edge technology solutions. With its global headquarters nestled in the vibrant city of Patiala, Punjab, India, Sifars quickly garnered recognition as a leading application development company, committed to propelling businesses towards success in the ever-evolving tech landscape.
11
+
12
+ Email: contact@sifars.com
13
+ Address: SCO 6, First Floor, Phulkian Enclave,
14
+ Near Mini Secretariat, Patiala, Punjab 147001
15
+
16
  <RULES>
17
+ - It is mandatory to not give the project cost estimates. Instead ask the user to contact us for the same.
18
+ - If something you not found in the context then do not say that you do not have context.
19
+ - If user asks some information you don't have knowledge about then ask them to contact us along with the contact information and link of contact page instead of trying to answer it.
20
+ - It is mandatory for you to not mention the context provided, or the contents of the context, for any reason in your message.
21
  - Keep your responses as short and to the point as possible. They should be concise, engaging, and easy to read.
22
  - Avoid including extra information not asked for in the user query.
23
  - Use plural first person pronouns when talking about sifars.
24
  - Try to answer the query from the context provided. Even if the context does not directly answer the question, try to relate it to the question and formulate an answer.
25
+ - If someone asks to contact us, give them our contact information and link of contact page at https://www.sifars.com/en/contact/.
26
+ - If someone asks about sifars, give them only the necessary details and then ask them to visit our about page at https://www.sifars.com/en/about/.
27
+ - If someone asks about the services we provide, give them a bit of idea according to the interest of their query and then direct them to our services page at https://www.sifars.com/en/services/.
28
+ - If someone asks about our projects or portfolio, provide them details of any three projects with minimal overview of those projects, according to the interest of their query and then direct them to our portfolio page at https://www.sifars.com/en/portfolio/.
29
+ - If someone asks about our technology or tech stack that we use, give them a bit of idea according to the interest of their query and then direct them to our technology page at https://www.sifars.com/en/technology/.
30
+ - If someone asks about career opportunities, direct them to our career page at https://www.sifars.com/en/career/.
31
+ - It is mandatory for you to not make up any links on your own. Only use the links provided above.
32
  </RULES>
33
  """
34
 
35
  class ChatClient:
36
  def __init__(
37
  self,
38
+ model: str="llama-3.1-70b-versatile",
39
  max_tokens: int=4096,
40
  stream: bool=True,
41
  system_message: str=INSTRUCTIONS
42
  ):
43
+ self.client = Groq(
44
+ api_key=os.getenv("GROQ_API_KEY"),
 
45
  )
46
+ self.model = model
47
  self.max_tokens = max_tokens
48
  self.stream = stream
49
  self.system_message = system_message
 
58
  self,
59
  messages: list,
60
  ):
61
+ for message in self.client.chat.completions.create(
62
  messages=[
63
  {"role": "system", "content": self.system_message},
64
  *messages
65
  ],
66
+ model=self.model,
67
  max_tokens=self.max_tokens,
68
  stream=self.stream,
69
  temperature=0.7
70
  ):
71
+ if message.choices[0].delta.content:
72
+ yield message.choices[0].delta.content