oktoscript / examples /qa-embeddings.okt
OktoSeek's picture
Upload 48 files
5fc8c9d verified
PROJECT "QAEmbeddings"
DESCRIPTION "Question-Answering system with embeddings and similarity search"
VERSION "1.0"
AUTHOR "OktoSeek"
DATASET {
train: "dataset/qa_train.jsonl"
validation: "dataset/qa_val.jsonl"
format: "qa"
type: "qa"
language: "en"
}
MODEL {
base: "oktoseek/qa-encoder"
architecture: "bert"
parameters: 110M
context_window: 512
precision: "fp16"
}
TRAIN {
epochs: 10
batch_size: 16
learning_rate: 0.00005
optimizer: "adamw"
scheduler: "linear"
loss: "cross_entropy"
device: "cuda"
gpu: true
mixed_precision: true
early_stopping: true
checkpoint_steps: 200
weight_decay: 0.01
gradient_clip: 1.0
warmup_steps: 500
}
METRICS {
accuracy
f1
f1_macro
cosine_similarity
custom "retrieval_accuracy"
}
VALIDATE {
on_validation: true
frequency: 1
save_best_model: true
metric_to_monitor: "f1"
}
INFERENCE {
max_tokens: 256
temperature: 0.3
top_p: 0.95
top_k: 20
}
EXPORT {
format: ["onnx", "okm", "safetensors"]
path: "export/"
quantization: "int8"
optimize_for: "accuracy"
}
DEPLOY {
target: "api"
endpoint: "http://localhost:9000/qa"
requires_auth: true
port: 9000
max_concurrent_requests: 200
}
LOGGING {
save_logs: true
metrics_file: "runs/qa-embeddings/metrics.json"
training_file: "runs/qa-embeddings/training_logs.json"
log_level: "info"
log_every: 20
}