|
|
|
|
|
import os |
|
|
|
|
|
|
|
|
HF_TOKEN = os.getenv("HF_TOKEN") |
|
|
|
|
|
|
|
|
HF_DS_REPO_ID = os.getenv("HF_REPO_ID", "m97j/pls-datasets") |
|
|
HF_INDEX_FILE = os.getenv("HF_INDEX_FILE", "faiss/faiss_index_flat.faiss") |
|
|
HF_IDS_FILE = os.getenv("HF_IDS_FILE", "faiss/vector_ids.npy") |
|
|
|
|
|
|
|
|
HF_CORPUS_REPO = os.getenv("HF_CORPUS_REPO", "HuggingFaceFW/finewiki") |
|
|
HF_CORPUS_SUBSET = os.getenv("HF_CORPUS_SUBSET", "ko") |
|
|
HF_CORPUS_SPLIT = os.getenv("HF_CORPUS_SPLIT", "train") |
|
|
|
|
|
|
|
|
MARKER_DIR = os.getenv("MARKER_DIR", "rag/state") |
|
|
CORPUS_READY_MARK = os.path.join(MARKER_DIR, ".corpus_ready") |
|
|
|
|
|
|
|
|
HF_MODEL_REPO_ID = os.getenv("HF_MODEL_REPO_ID", "m97j/pragmatic-search") |
|
|
EMBED_MODEL = os.getenv("EMBED_MODEL", "model_quantized.onnx") |
|
|
EMBED_DIR = os.getenv("EMBED_DIR", "embedder") |
|
|
|
|
|
|
|
|
RERANK_MODEL = os.getenv("RERANK_MODEL", "model_quantized.onnx") |
|
|
RERANK_DIR = os.getenv("RERANK_DIR", "reranker") |
|
|
|
|
|
|
|
|
TOP_K = int(os.getenv("TOP_K", "5")) |
|
|
|
|
|
|
|
|
|