File size: 894 Bytes
2072181
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
{
  "model_name": "url-classifier",
  "architecture": "autoresearch",
  "version": "1.0.0",
  "training_dataset": "iowacat",
  "accuracy": 0.9962,
  "final_loss": 0.002,
  "training_seconds": 300.3,
  "gpu": "RTX 4060 Laptop",

  "model": {
    "depth": 4,
    "aspect_ratio": 96,
    "head_dim": 128,
    "model_dim": 384,
    "n_head": 3,
    "n_kv_head": 3,
    "n_embd": 384,
    "vocab_size": 100277,
    "max_seq_len": 64,
    "window_pattern": "SSSL",
    "estimated_params": 161000000
  },

  "tokenizer": {
    "name": "cl100k_base",
    "library": "tiktoken",
    "vocab_size": 100277,
    "bos_id": 1,
    "pad_id": 0
  },

  "training": {
    "batch_size": 16,
    "total_batch_size": 8192,
    "grad_accum_steps": 512,
    "time_budget_seconds": 300,
    "lr": 1.0,
    "optimizer": "muon + adamw"
  },

  "class_labels": {
    "0": "A (列表页)",
    "1": "B (详情页)"
  }
}