kaburia commited on
Commit
4a2e120
·
1 Parent(s): 87fb7eb

utils path

Browse files
utils/coherence_bbscore.py CHANGED
@@ -3,8 +3,6 @@ import math, re, unicodedata
3
  from typing import List, Dict, Any, Optional, Tuple
4
  import numpy as np
5
  import os, re, unicodedata, numpy as np
6
- # get the reranked results with no scores
7
- from retrieve_n_rerank import retrieve_and_rerank
8
 
9
  try:
10
  from sentence_transformers import SentenceTransformer
@@ -244,12 +242,14 @@ def coherence_assessment_std(
244
  }
245
 
246
  # Get the coherence report
247
- def coherence_report(embedder="MoritzLaurer/deberta-v3-base-zeroshot-v2.0",
248
  input_text=None,
249
  reranked_results=None,
250
  run_zero_shot=True):
251
  embedder = Embedder(embedder) if isinstance(embedder, str) else embedder
252
  if reranked_results is None:
 
 
253
  reranked_results = retrieve_and_rerank(input_text)
254
  if not reranked_results:
255
  return []
 
3
  from typing import List, Dict, Any, Optional, Tuple
4
  import numpy as np
5
  import os, re, unicodedata, numpy as np
 
 
6
 
7
  try:
8
  from sentence_transformers import SentenceTransformer
 
242
  }
243
 
244
  # Get the coherence report
245
+ def coherence_report(embedder="BAAI/bge-m3",
246
  input_text=None,
247
  reranked_results=None,
248
  run_zero_shot=True):
249
  embedder = Embedder(embedder) if isinstance(embedder, str) else embedder
250
  if reranked_results is None:
251
+ # Import here to avoid circular imports
252
+ from utils.retrieve_n_rerank import retrieve_and_rerank
253
  reranked_results = retrieve_and_rerank(input_text)
254
  if not reranked_results:
255
  return []
utils/generation_streaming.py CHANGED
@@ -6,28 +6,30 @@ import time
6
  import json
7
 
8
  # encode the text
9
- from encoding_input import encode_text
10
 
11
  # rertrieve and rerank the documents
12
- from retrieve_n_rerank import retrieve_and_rerank
13
 
14
  # sentiment analysis on reranked documents
15
- from sentiment_analysis import get_sentiment
16
 
17
  # coherence assessment reports
18
- from coherence_bbscore import coherence_report
19
 
20
  # Get the vectorstore
21
- from loading_embeddings import get_vectorstore
22
- vectorstore = get_vectorstore()
23
 
24
  # build message from model generation
25
- from model_generation import build_messages
 
26
 
27
- API_KEY = "sk-do-8Hjf0liuGQCoPwglilL49xiqrthMECwjGP_kAjPM53OTOFQczPyfPK8xJc"
28
  MODEL = "llama3.3-70b-instruct"
29
 
30
  def generate_response_stream(query: str, enable_sentiment: bool, enable_coherence: bool):
 
 
31
 
32
 
33
 
 
6
  import json
7
 
8
  # encode the text
9
+ from utils.encoding_input import encode_text
10
 
11
  # rertrieve and rerank the documents
12
+ from utils.retrieve_n_rerank import retrieve_and_rerank
13
 
14
  # sentiment analysis on reranked documents
15
+ from utils.sentiment_analysis import get_sentiment
16
 
17
  # coherence assessment reports
18
+ from utils.coherence_bbscore import coherence_report
19
 
20
  # Get the vectorstore
21
+ from utils.loading_embeddings import get_vectorstore
 
22
 
23
  # build message from model generation
24
+ from utils.model_generation import build_messages
25
+ import os
26
 
27
+ API_KEY = os.getenv("API_KEY", "sk-do-8Hjf0liuGQCoPwglilL49xiqrthMECwjGP_kAjPM53OTOFQczPyfPK8xJc")
28
  MODEL = "llama3.3-70b-instruct"
29
 
30
  def generate_response_stream(query: str, enable_sentiment: bool, enable_coherence: bool):
31
+ # Initialize vectorstore when needed
32
+ vectorstore = get_vectorstore()
33
 
34
 
35
 
utils/retrieve_n_rerank.py CHANGED
@@ -1,6 +1,6 @@
1
  # load the encoded text and vectorstore
2
- from encoding_input import encode_text
3
- from loading_embeddings import get_vectorstore
4
  from sentence_transformers import CrossEncoder
5
  import numpy as np
6
  import faiss
 
1
  # load the encoded text and vectorstore
2
+ from utils.encoding_input import encode_text
3
+ from utils.loading_embeddings import get_vectorstore
4
  from sentence_transformers import CrossEncoder
5
  import numpy as np
6
  import faiss