# okto_version: "1.1"
PROJECT "LoRAChatbot"
DESCRIPTION "Fine-tuning a chatbot using LoRA adapters for efficient training"
VERSION "1.0"
AUTHOR "OktoSeek"

DATASET {

    mix_datasets: [
        { path: "dataset/base_conversations.jsonl", weight: 60 },
        { path: "dataset/specialized_qa.jsonl", weight: 30 },
        { path: "dataset/domain_specific.jsonl", weight: 10 }
    ]

    dataset_percent: 75

    sampling: "weighted"

    shuffle: true

    format: "jsonl"

    type: "chat"

    language: "en"
}

MODEL {

    base: "oktoseek/base-llm-7b"

    architecture: "transformer"

    parameters: 7B

    context_window: 4096

    precision: "fp16"
}

FT_LORA {

    base_model: "oktoseek/base-llm-7b"

    train_dataset: "dataset/main.jsonl"

    lora_rank: 8

    lora_alpha: 32

    dataset_percent: 75

    mix_datasets: [
        { path: "dataset/base_conversations.jsonl", weight: 60 },
        { path: "dataset/specialized_qa.jsonl", weight: 30 },
        { path: "dataset/domain_specific.jsonl", weight: 10 }
    ]

    epochs: 5

    batch_size: 4

    learning_rate: 0.00003

    device: "cuda"

    target_modules: ["q_proj", "v_proj", "k_proj", "o_proj"]
}

METRICS {
    loss
    perplexity
    accuracy
    f1
    rouge_l
}

VALIDATE {

    on_validation: true

    frequency: 1

    save_best_model: true

    metric_to_monitor: "loss"
}

MONITOR {

    level: "full"

    log_metrics: [
        "loss",
        "val_loss",
        "accuracy",
        "perplexity"
    ]

    log_system: [
        "gpu_memory_used",
        "gpu_memory_free",
        "cpu_usage",
        "ram_used",
        "temperature"
    ]

    log_speed: [
        "tokens_per_second",
        "samples_per_second"
    ]

    refresh_interval: 2s

    export_to: "runs/lora-chatbot/system.json"

    dashboard: true
}

EXPORT {

    format: ["gguf", "okm", "safetensors"]

    path: "export/"

    quantization: "int8"
}

LOGGING {

    save_logs: true

    metrics_file: "runs/lora-chatbot/metrics.json"

    training_file: "runs/lora-chatbot/training_logs.json"

    log_level: "info"

    log_every: 10
}