File size: 1,391 Bytes
5fc8c9d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
# Project header: identifying metadata (name, description, version, tags,
# author) for this configuration.
PROJECT "PizzaBot"
DESCRIPTION "AI specialized in pizza restaurant service"
VERSION "1.0"
TAGS ["food", "restaurant", "chatbot"]
AUTHOR "OktoSeek"

# Execution environment: GPU accelerator, a minimum of 8GB memory, fp16
# precision, and the "oktoseek" backend.
# NOTE(review): install_missing: true and network: "online" presumably allow
# missing dependencies to be fetched at run time — confirm against the
# toolchain documentation before using this on a restricted machine.
ENV {
  accelerator: "gpu"
  min_memory: "8GB"
  precision: "fp16"
  backend: "oktoseek"
  install_missing: true
  platform: "any"
  network: "online"
}

# Dataset locations: separate train / validation / test files under
# dataset/, all declared as JSONL with type "chat" and language "en".
# Paths are relative; the base directory they resolve against is not
# visible here — presumably the project root (confirm).
DATASET {
  train: "dataset/train.jsonl"
  validation: "dataset/val.jsonl"
  test: "dataset/test.jsonl"
  format: "jsonl"
  type: "chat"
  language: "en"
}

# Model definition: starts from the base "oktoseek/pizza-small", declared as
# a transformer with 120M parameters and a 2048 context window.
# precision is also set in ENV (both are "fp16"); keep the two values in
# sync when changing either, since which one takes priority is not visible
# here.
MODEL {
  base: "oktoseek/pizza-small"
  architecture: "transformer"
  parameters: 120M
  context_window: 2048
  precision: "fp16"
}

# Training hyperparameters: 5 epochs, batch size 32, learning rate 0.0001,
# AdamW optimizer with a cosine scheduler, early stopping enabled.
# NOTE(review): with gradient_accumulation: 2 the effective batch size is
# presumably 64 (32 x 2) — confirm how the backend interprets this key.
# NOTE(review): checkpoint_steps: 100 presumably means "every 100 optimizer
# steps"; the early-stopping criterion is not configured in this block.
TRAIN {
  epochs: 5
  batch_size: 32
  learning_rate: 0.0001
  optimizer: "adamw"
  scheduler: "cosine"
  device: "auto"
  gradient_accumulation: 2
  checkpoint_steps: 100
  early_stopping: true
}

# Metrics to report. Unlike the other blocks, entries here are bare
# identifiers, one per line, with no "key: value" form.
METRICS {
  accuracy
  perplexity
  f1
  rouge
  cosine_similarity
}

# Validation schedule: enabled for both the training and validation splits.
# NOTE(review): the unit of frequency: 1 is not visible here — presumably
# "every 1 epoch"; confirm against the language reference.
VALIDATE {
  on_train: true
  on_validation: true
  frequency: 1
}

# Generation settings used at inference time: output capped at 200 tokens,
# sampling with temperature 0.7, top_p 0.9 and top_k 40.
INFERENCE {
  max_tokens: 200
  temperature: 0.7
  top_p: 0.9
  top_k: 40
}

# Export targets: the model is written to export/ in four formats
# (gguf, onnx, okm, safetensors).
# NOTE(review): quantization: "int8" is declared once for the whole block;
# whether it applies to every listed format is not visible here — confirm.
EXPORT {
  format: ["gguf", "onnx", "okm", "safetensors"]
  path: "export/"
  quantization: "int8"
}

# Deployment: serves the model as an API at a local endpoint on port 9000,
# with authentication required.
# NOTE(review): the endpoint uses plain http://. That is fine while it stays
# on localhost, but with requires_auth: true any credentials would travel
# unencrypted if this is pointed at a non-local host — switch to https there.
DEPLOY {
  target: "api"
  endpoint: "http://localhost:9000/pizzabot"
  requires_auth: true
}

# Security switches: model encryption and watermarking are both enabled.
# The mechanisms (keys, algorithm, watermark type) are not configured in
# this block.
SECURITY {
  encrypt_model: true
  watermark: true
}

# Logging: log saving is enabled; metrics and training logs are written as
# JSON files under runs/pizzabot-v1/. The run directory name is hard-coded,
# so update both paths together when starting a new run/version.
LOGGING {
  save_logs: true
  metrics_file: "runs/pizzabot-v1/metrics.json"
  training_file: "runs/pizzabot-v1/training_logs.json"
}