JacobLinCool committed on
Commit
8cd6de3
·
verified ·
1 Parent(s): 99bcb68

fix: reduce embedding context

Browse files

Sync GitHub commit 663bcb5; use n_ctx=768 for dashboard retrieval embeddings.

README.md CHANGED
@@ -223,6 +223,7 @@ ADVISOR_CACHE_DIR=/data/advisor-cache
223
  ADVISOR_REFRESH_EMBEDDING_TIMEOUT_SECONDS=1800
224
  ADVISOR_EMBEDDING_MODEL_REPO=ggml-org/embeddinggemma-300m-qat-q8_0-GGUF
225
  ADVISOR_EMBEDDING_MODEL_FILE=embeddinggemma-300m-qat-Q8_0.gguf
 
226
  ADVISOR_ASR_MODEL_ID=nvidia/nemotron-speech-streaming-en-0.6b
227
  ```
228
 
 
223
  ADVISOR_REFRESH_EMBEDDING_TIMEOUT_SECONDS=1800
224
  ADVISOR_EMBEDDING_MODEL_REPO=ggml-org/embeddinggemma-300m-qat-q8_0-GGUF
225
  ADVISOR_EMBEDDING_MODEL_FILE=embeddinggemma-300m-qat-Q8_0.gguf
226
+ ADVISOR_EMBEDDING_N_CTX=768
227
  ADVISOR_ASR_MODEL_ID=nvidia/nemotron-speech-streaming-en-0.6b
228
  ```
229
 
data/project_index.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "schema_version": 3,
3
  "algorithm": "llama-cpp-embedding-v1",
4
- "generated_at": "2026-06-08T00:34:45+00:00",
5
  "snapshot_generated_at": "2026-06-07T11:51:09+00:00",
6
  "snapshot_source": "https://huggingface.co/api/spaces?author=build-small-hackathon",
7
  "snapshot_digest": "a442d8146fa01965567a27e43d42587de7048b93352e016151a524d2ecbf2034",
@@ -15,7 +15,7 @@
15
  "build_source": "local",
16
  "builder": "scripts/build_project_index.py",
17
  "llama_cpp_python_version": "0.3.27",
18
- "n_ctx": 2048
19
  },
20
  "documents": [
21
  {
 
1
  {
2
  "schema_version": 3,
3
  "algorithm": "llama-cpp-embedding-v1",
4
+ "generated_at": "2026-06-08T00:39:11+00:00",
5
  "snapshot_generated_at": "2026-06-07T11:51:09+00:00",
6
  "snapshot_source": "https://huggingface.co/api/spaces?author=build-small-hackathon",
7
  "snapshot_digest": "a442d8146fa01965567a27e43d42587de7048b93352e016151a524d2ecbf2034",
 
15
  "build_source": "local",
16
  "builder": "scripts/build_project_index.py",
17
  "llama_cpp_python_version": "0.3.27",
18
+ "n_ctx": 768
19
  },
20
  "documents": [
21
  {
hackathon_advisor/llama_embedding.py CHANGED
@@ -19,7 +19,7 @@ from hackathon_advisor.data import (
19
 
20
  TRUE_VALUES = {"1", "true", "yes", "on"}
21
  FALSE_VALUES = {"0", "false", "no", "off"}
22
- DEFAULT_N_CTX = 2048
23
 
24
 
25
  class LlamaCppEmbedder:
 
19
 
20
  TRUE_VALUES = {"1", "true", "yes", "on"}
21
  FALSE_VALUES = {"0", "false", "no", "off"}
22
+ DEFAULT_N_CTX = 768
23
 
24
 
25
  class LlamaCppEmbedder: