kenlkehl committed on
Commit
07330d2
·
verified ·
1 Parent(s): a096c3f

Update config.py

Browse files
Files changed (1) hide show
  1. config.py +6 -6
config.py CHANGED
@@ -10,19 +10,19 @@
10
  # Set to None to skip auto-loading, or provide model path/HuggingFace ID
11
  MODEL_CONFIG = {
12
  # TinyBERT tagger for extracting relevant excerpts
13
- "tagger": "/ksg/kehl_mm_data/meta/2024/v17/v17_models/auto-tiny-bert-tagger", # e.g., "prajjwal1/bert-tiny" or "./auto-tiny-bert-tagger"
14
 
15
  # Sentence transformer for embedding patient summaries and trials
16
- "embedder": "/ksg/kehl_mm_data/meta/2024/v17/v17_models/reranker_round2.model", # e.g., "Qwen/Qwen3-Embedding-0.6B" or "./reranker_round2.model"
17
 
18
  # Large language model for patient history summarization
19
- "llm": "meta-llama/Llama-3.2-3B-Instruct", # e.g., "microsoft/Phi-3-mini-4k-instruct" or "openai/gpt-oss-120b"
20
 
21
  # ModernBERT classifier for eligibility prediction
22
- "trial_checker": "/ksg/kehl_mm_data/meta/2024/v17/v17_models/modernbert-trial-checker", # e.g., "answerdotai/ModernBERT-large" or "./modernbert-trial-checker"
23
 
24
  # ModernBERT classifier for boilerplate exclusion prediction
25
- "boilerplate_checker": "/ksg/kehl_mm_data/meta/2024/v17/v17_models/modernbert-boilerplate-checker", # e.g., "answerdotai/ModernBERT-large" or "./modernbert-boilerplate-checker"
26
  }
27
 
28
  # Example configuration with base models:
@@ -50,7 +50,7 @@ MODEL_CONFIG = {
50
  # Path to default trial database CSV/Excel file
51
  # Will auto-load and embed when embedder model is ready
52
  # Set to None to disable auto-loading
53
- DEFAULT_TRIAL_DB = "/data1/ken/meta/2024/v17b/trial_space_lineitems.csv" # e.g., "./my_trials.csv" or "./sample_trials.csv"
54
 
55
  PREEMBEDDED_TRIALS = "trial_embeddings"
56
 
 
10
  # Set to None to skip auto-loading, or provide model path/HuggingFace ID
11
  MODEL_CONFIG = {
12
  # TinyBERT tagger for extracting relevant excerpts
13
+ "tagger": "kenlkehl/mmai-tiny-bert-tagger", # e.g., "prajjwal1/bert-tiny" or "./auto-tiny-bert-tagger"
14
 
15
  # Sentence transformer for embedding patient summaries and trials
16
+ "embedder": "kenlkehl/mmai-trialspace", # e.g., "Qwen/Qwen3-Embedding-0.6B" or "./reranker_round2.model"
17
 
18
  # Large language model for patient history summarization
19
+ "llm": "kenlkehl/mmai-oncoreasoning-3b", # e.g., "microsoft/Phi-3-mini-4k-instruct" or "openai/gpt-oss-120b"
20
 
21
  # ModernBERT classifier for eligibility prediction
22
+ "trial_checker": "kenlkehl/mmai-trial-checker", # e.g., "answerdotai/ModernBERT-large" or "./modernbert-trial-checker"
23
 
24
  # ModernBERT classifier for boilerplate exclusion prediction
25
+ "boilerplate_checker": "kenlkehl/mmai-boilerplate-checker", # e.g., "answerdotai/ModernBERT-large" or "./modernbert-boilerplate-checker"
26
  }
27
 
28
  # Example configuration with base models:
 
50
  # Path to default trial database CSV/Excel file
51
  # Will auto-load and embed when embedder model is ready
52
  # Set to None to disable auto-loading
53
+ DEFAULT_TRIAL_DB = "trial_space_lineitems.csv" # e.g., "./my_trials.csv" or "./sample_trials.csv"
54
 
55
  PREEMBEDDED_TRIALS = "trial_embeddings"
56