kenlkehl committed on
Commit
71d568a
·
verified ·
1 Parent(s): 1f198e6

Update config.py

Browse files
Files changed (1) hide show
  1. config.py +6 -6
config.py CHANGED
@@ -10,20 +10,20 @@
10
  # Set to None to skip auto-loading, or provide model path/HuggingFace ID
11
  MODEL_CONFIG = {
12
  # TinyBERT tagger for extracting relevant excerpts
13
- "tagger": "/ksg/kehl_mm_data/meta/2024/v20/v20_models/tagger", # e.g., "prajjwal1/bert-tiny" or "./auto-tiny-bert-tagger"
14
 
15
  # Sentence transformer for embedding patient summaries and trials
16
- "embedder": "/ksg/kehl_mm_data/meta/2024/v20/v20_models/trialspace", # e.g., "Qwen/Qwen3-Embedding-0.6B" or "./reranker_round2.model"
17
 
18
  # Large language model for patient history summarization
19
- "llm": "/ksg/kehl_mm_data/meta/2024/v20/v20_oncoreasoning_training/gcp_export/checkpoint-60000-for-export/",
20
  #"llm": "openai/gpt-oss-120b",
21
 
22
  # ModernBERT classifier for eligibility prediction
23
- "trial_checker": "/ksg/kehl_mm_data/meta/2024/v20/v20_models/trialchecker", # e.g., "answerdotai/ModernBERT-large" or "./modernbert-trial-checker"
24
 
25
  # ModernBERT classifier for boilerplate exclusion prediction
26
- "boilerplate_checker": "/ksg/kehl_mm_data/meta/2024/v20/v20_models/boilerplatechecker", # e.g., "answerdotai/ModernBERT-large" or "./modernbert-boilerplate-checker"
27
  }
28
 
29
  # Example configuration with base models:
@@ -51,7 +51,7 @@ MODEL_CONFIG = {
51
  # Path to default trial database CSV/Excel file
52
  # Will auto-load and embed when embedder model is ready
53
  # Set to None to disable auto-loading
54
- DEFAULT_TRIAL_DB = "./trial_space_lineitems.csv" # e.g., "./my_trials.csv" or "./sample_trials.csv"
55
 
56
  # ============================================================================
57
  # PRE-EMBEDDED TRIALS (Recommended for faster startup)
 
10
  # Set to None to skip auto-loading, or provide model path/HuggingFace ID
11
  MODEL_CONFIG = {
12
  # TinyBERT tagger for extracting relevant excerpts
13
+ "tagger": "ksg-dfci/TinyOncoBertTagger-1225", # e.g., "prajjwal1/bert-tiny" or "./auto-tiny-bert-tagger"
14
 
15
  # Sentence transformer for embedding patient summaries and trials
16
+ "embedder": "ksg-dfci/TrialSpace-1225", # e.g., "Qwen/Qwen3-Embedding-0.6B" or "./reranker_round2.model"
17
 
18
  # Large language model for patient history summarization
19
+ "llm": "ksg-dfci/OncoReasoning-3B-1225",
20
  #"llm": "openai/gpt-oss-120b",
21
 
22
  # ModernBERT classifier for eligibility prediction
23
+ "trial_checker": "ksg-dfci/TrialChecker-3B-1225", # e.g., "answerdotai/ModernBERT-large" or "./modernbert-trial-checker"
24
 
25
  # ModernBERT classifier for boilerplate exclusion prediction
26
+ "boilerplate_checker": "ksg-dfci/BoilerplateChecker-3B-1225", # e.g., "answerdotai/ModernBERT-large" or "./modernbert-boilerplate-checker"
27
  }
28
 
29
  # Example configuration with base models:
 
51
  # Path to default trial database CSV/Excel file
52
  # Will auto-load and embed when embedder model is ready
53
  # Set to None to disable auto-loading
54
+ #DEFAULT_TRIAL_DB = "./trial_space_lineitems.csv" # e.g., "./my_trials.csv" or "./sample_trials.csv"
55
 
56
  # ============================================================================
57
  # PRE-EMBEDDED TRIALS (Recommended for faster startup)