File size: 2,815 Bytes
034fd6a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
{
  "config": {
    "seed": 42,
    "device": "cuda",
    "dtype": "bfloat16",
    "benchmark": {
      "repeats": 3,
      "batch_sizes": [
        1,
        2,
        4,
        8,
        16
      ],
      "max_new_tokens": [
        64,
        128
      ],
      "stop_on_eos": true,
      "measure_memory": true,
      "collect_traces": true,
      "continue_on_error": true,
      "warmup": {
        "enabled": true
      }
    },
    "workloads": {
      "synthetic": {
        "enabled": false,
        "prompt_byte_buckets": [
          256,
          1024
        ],
        "samples_per_bucket": 128
      },
      "code": {
        "enabled": true,
        "data_path": "code_completion_exp/datasets/data_V4_full",
        "split": "validation",
        "prompt_byte_buckets": [
          256,
          1024
        ],
        "samples_per_bucket": 128,
        "max_samples_to_scan": 5000
      }
    },
    "models": {
      "enabled": [
        "hnet",
        "hnet_serial",
        "bolmo",
        "pythia"
      ],
      "hnet": {
        "config_path": "hnet_project/configs/hnet_2stage_XL_code.json",
        "checkpoint_path": "hnet_project/checkpoints/hnet_2stage_XL_code.pt"
      },
      "hnet_serial": {
        "config_path": "hnet_project/configs/hnet_2stage_XL_code.json",
        "checkpoint_path": "hnet_project/checkpoints/hnet_2stage_XL_code.pt"
      },
      "bolmo": {
        "model_name": "allenai/Bolmo-1B",
        "cache_dir": "cache/bolmo",
        "local_files_only": false
      },
      "pythia": {
        "model_name": "EleutherAI/pythia-1b",
        "cache_dir": "cache/hf",
        "local_files_only": false,
        "max_context_len": 4096
      }
    },
    "paths": {
      "output_root": "generation_speed_exp/outputs"
    }
  },
  "repo_root": "/workspace/byte-llms-code",
  "workloads": {
    "code/256B": 128,
    "code/1024B": 128
  },
  "environment": {
    "timestamp": "2026-05-10T23:04:30",
    "hostname": "e41665783a40",
    "platform": "Linux-6.8.0-110-generic-x86_64-with-glibc2.39",
    "python": "3.12.0 | packaged by Anaconda, Inc. | (main, Oct  2 2023, 17:29:18) [GCC 11.2.0]",
    "git_commit": "21e26deacf90f77563e3834cfb46e6dc64f52d6e",
    "git_branch": "feature/generation-bench",
    "git_dirty": false,
    "torch": "2.6.0+cu124",
    "torch_cuda": "12.4",
    "cuda_available": true,
    "transformers": "4.57.6",
    "cuda_devices": [
      {
        "index": 0,
        "name": "NVIDIA A100X",
        "total_memory_mb": 81341.8125,
        "major": 8,
        "minor": 0
      },
      {
        "index": 1,
        "name": "NVIDIA A100X",
        "total_memory_mb": 81341.8125,
        "major": 8,
        "minor": 0
      }
    ],
    "nvidia_smi": "NVIDIA A100X, 81920 MiB, 570.86.10\nNVIDIA A100X, 81920 MiB, 570.86.10"
  }
}