andrew-healey commited on
Commit
545172d
·
1 Parent(s): b76b950

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/run-crz42i9y.wandb filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/run-crz42i9y.wandb filter=lfs diff=lfs merge=lfs -text
37
+ unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/run-bd672vnz.wandb filter=lfs diff=lfs merge=lfs -text
unselective_run_1_restarted/args.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"hellaswag": true, "attention_kind": "self", "log_dir": "unselective_run_1_restarted", "resume_checkpoint": "hf://andrew-healey/context-compression/unselective_run_0/model_07500.pt", "resume_optimizer": false, "add_a_head": false, "add_head_to_start": false, "new_head_init": "normal", "max_steps": 2500, "group": "selective_surgery_2", "use_wandb": true, "kill_self_after_run": true}
unselective_run_1_restarted/dataloader_02499.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cefbc0ab907c6a30382d71f16b47450e3533ee64ae273fcfa46862dc62ec8a7
3
+ size 964
unselective_run_1_restarted/log2.txt ADDED
The diff for this file is too large to render. See raw diff
 
unselective_run_1_restarted/model_02499.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53e3fd5b54ad3d24fb0ce0a797130e359e57442c5bafb9c60b737ead39678ae2
3
+ size 497958122
unselective_run_1_restarted/optimizer_02499.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f220f18967e0a13640ce130d00bdbcd7c084a5cd990f673b6e7bb0d5cbf9c4
3
+ size 995941510
unselective_run_1_restarted/wandb/debug-internal.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2025-02-13T07:37:21.6809945Z","level":"INFO","msg":"stream: starting","core version":"0.19.6","symlink path":"unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug-core.log"}
2
+ {"time":"2025-02-13T07:37:21.801528338Z","level":"INFO","msg":"created new stream","id":"bd672vnz"}
3
+ {"time":"2025-02-13T07:37:21.801610934Z","level":"INFO","msg":"stream: started","id":"bd672vnz"}
4
+ {"time":"2025-02-13T07:37:21.801639326Z","level":"INFO","msg":"writer: Do: started","stream_id":"bd672vnz"}
5
+ {"time":"2025-02-13T07:37:21.801654455Z","level":"INFO","msg":"handler: started","stream_id":"bd672vnz"}
6
+ {"time":"2025-02-13T07:37:21.801694022Z","level":"INFO","msg":"sender: started","stream_id":"bd672vnz"}
7
+ {"time":"2025-02-13T07:37:22.108255632Z","level":"INFO","msg":"Starting system monitor"}
unselective_run_1_restarted/wandb/debug.log ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Current SDK version is 0.19.6
2
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Configure stats pid to 2137
3
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Loading settings from /root/.config/wandb/settings
4
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Loading settings from /workspace/context-compression/wandb/settings
5
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Loading settings from environment variables
6
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:setup_run_log_directory():637] Logging user logs to unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug.log
7
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:setup_run_log_directory():638] Logging internal logs to unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug-internal.log
8
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:init():756] calling init triggers
9
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:init():761] wandb.init called with sweep_config: {}
10
+ config: {'hellaswag': True, 'attention_kind': <AttentionKind.SELF: 'self'>, 'log_dir': 'unselective_run_1_restarted', 'resume_checkpoint': 'hf://andrew-healey/context-compression/unselective_run_0/model_07500.pt', 'resume_optimizer': False, 'add_a_head': False, 'add_head_to_start': False, 'new_head_init': <NewHeadInit.NORMAL: 'normal'>, 'max_steps': 2500, 'group': 'selective_surgery_2', 'use_wandb': True, 'kill_self_after_run': True, '_wandb': {}}
11
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:init():789] starting backend
12
+ 2025-02-13 07:37:21,667 INFO MainThread:2137 [wandb_init.py:init():793] sending inform_init request
13
+ 2025-02-13 07:37:21,675 INFO MainThread:2137 [backend.py:_multiprocessing_setup():97] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
14
+ 2025-02-13 07:37:21,676 INFO MainThread:2137 [wandb_init.py:init():808] backend started and connected
15
+ 2025-02-13 07:37:21,679 INFO MainThread:2137 [wandb_init.py:init():901] updated telemetry
16
+ 2025-02-13 07:37:21,688 INFO MainThread:2137 [wandb_init.py:init():936] communicating run to backend with 90.0 second timeout
17
+ 2025-02-13 07:37:22,103 INFO MainThread:2137 [wandb_init.py:init():994] starting run threads in backend
18
+ 2025-02-13 07:37:22,259 INFO MainThread:2137 [wandb_run.py:_console_start():2385] atexit reg
19
+ 2025-02-13 07:37:22,259 INFO MainThread:2137 [wandb_run.py:_redirect():2235] redirect: wrap_raw
20
+ 2025-02-13 07:37:22,259 INFO MainThread:2137 [wandb_run.py:_redirect():2300] Wrapping output streams.
21
+ 2025-02-13 07:37:22,259 INFO MainThread:2137 [wandb_run.py:_redirect():2325] Redirects installed.
22
+ 2025-02-13 07:37:22,261 INFO MainThread:2137 [wandb_init.py:init():1036] run started, returning control to user process
unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/files/requirements.txt ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Brotli==1.1.0
2
+ MarkupSafe==3.0.2
3
+ PySocks==1.7.1
4
+ PyYAML==6.0.2
5
+ archspec==0.2.3
6
+ asttokens==2.4.1
7
+ astunparse==1.6.3
8
+ attrs==24.2.0
9
+ beautifulsoup4==4.12.3
10
+ boltons==24.0.0
11
+ certifi==2024.8.30
12
+ cffi==1.17.1
13
+ chardet==5.2.0
14
+ charset-normalizer==3.4.0
15
+ click==8.1.7
16
+ colorama==0.4.6
17
+ conda==24.9.2
18
+ conda-build==24.9.0
19
+ conda_index==0.5.0
20
+ conda-libmamba-solver==24.9.0
21
+ conda-package-handling==2.4.0
22
+ conda_package_streaming==0.11.0
23
+ decorator==5.1.1
24
+ distro==1.9.0
25
+ dnspython==2.7.0
26
+ exceptiongroup==1.2.2
27
+ executing==2.1.0
28
+ expecttest==0.2.1
29
+ filelock==3.16.1
30
+ frozendict==2.4.6
31
+ h2==4.1.0
32
+ hpack==4.0.0
33
+ hyperframe==6.0.1
34
+ hypothesis==6.115.5
35
+ idna==3.10
36
+ importlib_resources==6.4.5
37
+ ipython==8.29.0
38
+ jedi==0.19.1
39
+ Jinja2==3.1.4
40
+ jsonpatch==1.33
41
+ jsonpointer==3.0.0
42
+ jsonschema==4.23.0
43
+ jsonschema-specifications==2024.10.1
44
+ libarchive-c==5.1
45
+ libmambapy==1.5.10
46
+ lief==0.14.1
47
+ lintrunner==0.12.5
48
+ mamba==1.5.10
49
+ matplotlib-inline==0.1.7
50
+ menuinst==2.1.2
51
+ more-itertools==10.5.0
52
+ mpmath==1.3.0
53
+ networkx==3.4.2
54
+ ninja==1.11.1.1
55
+ numpy==2.1.2
56
+ nvidia-cublas-cu12==12.4.5.8
57
+ nvidia-cuda-cupti-cu12==12.4.127
58
+ nvidia-cuda-nvrtc-cu12==12.4.127
59
+ nvidia-cuda-runtime-cu12==12.4.127
60
+ nvidia-cudnn-cu12==9.1.0.70
61
+ nvidia-cufft-cu12==11.2.1.3
62
+ nvidia-curand-cu12==10.3.5.147
63
+ nvidia-cusolver-cu12==11.6.1.9
64
+ nvidia-cusparse-cu12==12.3.1.170
65
+ nvidia-nccl-cu12==2.21.5
66
+ nvidia-nvjitlink-cu12==12.4.127
67
+ nvidia-nvtx-cu12==12.4.127
68
+ optree==0.13.0
69
+ packaging==24.1
70
+ parso==0.8.4
71
+ pexpect==4.9.0
72
+ pickleshare==0.7.5
73
+ pillow==10.2.0
74
+ pip==24.2
75
+ pkginfo==1.11.2
76
+ pkgutil_resolve_name==1.3.10
77
+ platformdirs==4.3.6
78
+ pluggy==1.5.0
79
+ prompt_toolkit==3.0.48
80
+ psutil==6.1.0
81
+ ptyprocess==0.7.0
82
+ pure_eval==0.2.3
83
+ pycosat==0.6.6
84
+ pycparser==2.22
85
+ Pygments==2.18.0
86
+ python-etcd==0.4.5
87
+ pytz==2024.2
88
+ referencing==0.35.1
89
+ requests==2.32.3
90
+ rpds-py==0.20.0
91
+ ruamel.yaml==0.18.6
92
+ ruamel.yaml.clib==0.2.8
93
+ setuptools==72.1.0
94
+ six==1.16.0
95
+ sortedcontainers==2.4.0
96
+ soupsieve==2.5
97
+ stack-data==0.6.2
98
+ sympy==1.13.1
99
+ torch==2.5.1+cu124
100
+ torchaudio==2.5.1+cu124
101
+ torchelastic==0.2.2
102
+ torchvision==0.20.1+cu124
103
+ tqdm==4.66.5
104
+ traitlets==5.14.3
105
+ triton==3.1.0
106
+ truststore==0.9.2
107
+ types-dataclasses==0.6.6
108
+ typing_extensions==4.12.2
109
+ urllib3==2.2.3
110
+ wcwidth==0.2.13
111
+ wheel==0.44.0
112
+ zipp==3.20.2
113
+ zstandard==0.23.0
114
+ smmap==5.0.2
115
+ setproctitle==1.3.4
116
+ sentry-sdk==2.21.0
117
+ pydantic_core==2.27.2
118
+ protobuf==5.29.3
119
+ docker-pycreds==0.4.0
120
+ annotated-types==0.7.0
121
+ pydantic==2.10.6
122
+ gitdb==4.0.12
123
+ GitPython==3.1.44
124
+ wandb==0.19.6
125
+ iniconfig==2.0.0
126
+ pytest==8.3.4
127
+ jupyter-archive==3.4.0
128
+ nbzip==0.1.0
129
+ webencodings==0.5.1
130
+ filetype==1.2.0
131
+ fastjsonschema==2.21.1
132
+ widgetsnbextension==4.0.13
133
+ websocket-client==1.8.0
134
+ webcolors==24.11.1
135
+ uri-template==1.3.0
136
+ types-python-dateutil==2.9.0.20241206
137
+ tornado==6.4.2
138
+ tinycss2==1.4.0
139
+ sniffio==1.3.1
140
+ Send2Trash==1.8.3
141
+ rfc3986-validator==0.1.1
142
+ rfc3339-validator==0.1.4
143
+ pyzmq==26.2.1
144
+ python-json-logger==3.2.1
145
+ prometheus_client==0.21.1
146
+ pandocfilters==1.5.1
147
+ overrides==7.7.0
148
+ nest-asyncio==1.6.0
149
+ mistune==3.1.1
150
+ jupyterlab_widgets==3.0.13
151
+ jupyterlab_pygments==0.3.0
152
+ jupyter_core==5.7.2
153
+ json5==0.10.0
154
+ h11==0.14.0
155
+ fqdn==1.5.1
156
+ defusedxml==0.7.1
157
+ debugpy==1.8.12
158
+ comm==0.2.2
159
+ bleach==6.2.0
160
+ babel==2.17.0
161
+ async-lru==2.0.4
162
+ terminado==0.18.1
163
+ jupyter_client==8.6.3
164
+ httpcore==1.0.7
165
+ arrow==1.3.0
166
+ argon2-cffi-bindings==21.2.0
167
+ anyio==4.8.0
168
+ jupyter_server_terminals==0.5.3
169
+ isoduration==20.11.0
170
+ httpx==0.28.1
171
+ argon2-cffi==23.1.0
172
+ nbformat==5.10.4
173
+ ipywidgets==8.1.5
174
+ ipykernel==6.29.5
175
+ nbclient==0.10.2
176
+ jupyter-events==0.12.0
177
+ jupyter-console==6.6.3
178
+ bash_kernel==0.10.0
179
+ nbconvert==7.16.6
180
+ jupyter_server==2.15.0
181
+ notebook_shim==0.2.4
182
+ jupyterlab_server==2.27.3
183
+ jupyter-lsp==2.2.5
184
+ jupyterlab==4.3.5
185
+ notebook==7.3.2
186
+ jupyter-http-over-ws==0.0.8
187
+ jupyter==1.1.1
188
+ aiohappyeyeballs==2.4.6
189
+ aiohttp==3.11.12
190
+ aiosignal==1.3.2
191
+ contourpy==1.3.1
192
+ cycler==0.12.1
193
+ datasets==3.2.0
194
+ dill==0.3.8
195
+ fonttools==4.56.0
196
+ frozenlist==1.5.0
197
+ fsspec==2024.9.0
198
+ huggingface-hub==0.28.1
199
+ kiwisolver==1.4.8
200
+ matplotlib==3.10.0
201
+ multidict==6.1.0
202
+ multiprocess==0.70.16
203
+ pandas==2.2.3
204
+ propcache==0.2.1
205
+ pyarrow==19.0.0
206
+ pyparsing==3.2.1
207
+ python-dateutil==2.9.0.post0
208
+ regex==2024.11.6
209
+ safetensors==0.5.2
210
+ sentencepiece==0.2.0
211
+ tiktoken==0.8.0
212
+ tokenizers==0.21.0
213
+ transformers==4.48.3
214
+ tzdata==2025.1
215
+ vastai==0.2.8
216
+ xxhash==3.5.0
217
+ yarl==1.18.3
unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/files/wandb-metadata.json ADDED
@@ -0,0 +1,95 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.4.0-182-generic-x86_64-with-glibc2.35",
3
+ "python": "CPython 3.11.10",
4
+ "startedAt": "2025-02-13T07:37:21.676558Z",
5
+ "args": [
6
+ "--group",
7
+ "selective_surgery_2",
8
+ "--resume_checkpoint",
9
+ "hf://andrew-healey/context-compression/unselective_run_0/model_07500.pt",
10
+ "--max_steps",
11
+ "2500",
12
+ "--attention_kind",
13
+ "self",
14
+ "--log_dir",
15
+ "unselective_run_1_restarted",
16
+ "--kill_self_after_run"
17
+ ],
18
+ "program": "-m context_compression.train",
19
+ "git": {
20
+ "remote": "https://github.com/andrew-healey/context-compression",
21
+ "commit": "303eb3f2a5dab5fe30125c9ccc545fc206daf467"
22
+ },
23
+ "email": "doolie.healey@gmail.com",
24
+ "root": "unselective_run_1_restarted",
25
+ "host": "8f64ce62cfdf",
26
+ "executable": "/opt/conda/bin/python3.11",
27
+ "cpu_count": 72,
28
+ "cpu_count_logical": 144,
29
+ "gpu": "NVIDIA GeForce RTX 4090",
30
+ "gpu_count": 8,
31
+ "disk": {
32
+ "/": {
33
+ "total": "222264557568",
34
+ "used": "965890048"
35
+ }
36
+ },
37
+ "memory": {
38
+ "total": "540657020928"
39
+ },
40
+ "cpu": {
41
+ "count": 72,
42
+ "countLogical": 144
43
+ },
44
+ "gpu_nvidia": [
45
+ {
46
+ "name": "NVIDIA GeForce RTX 4090",
47
+ "memoryTotal": "25757220864",
48
+ "cudaCores": 16384,
49
+ "architecture": "Ada"
50
+ },
51
+ {
52
+ "name": "NVIDIA GeForce RTX 4090",
53
+ "memoryTotal": "25757220864",
54
+ "cudaCores": 16384,
55
+ "architecture": "Ada"
56
+ },
57
+ {
58
+ "name": "NVIDIA GeForce RTX 4090",
59
+ "memoryTotal": "25757220864",
60
+ "cudaCores": 16384,
61
+ "architecture": "Ada"
62
+ },
63
+ {
64
+ "name": "NVIDIA GeForce RTX 4090",
65
+ "memoryTotal": "25757220864",
66
+ "cudaCores": 16384,
67
+ "architecture": "Ada"
68
+ },
69
+ {
70
+ "name": "NVIDIA GeForce RTX 4090",
71
+ "memoryTotal": "25757220864",
72
+ "cudaCores": 16384,
73
+ "architecture": "Ada"
74
+ },
75
+ {
76
+ "name": "NVIDIA GeForce RTX 4090",
77
+ "memoryTotal": "25757220864",
78
+ "cudaCores": 16384,
79
+ "architecture": "Ada"
80
+ },
81
+ {
82
+ "name": "NVIDIA GeForce RTX 4090",
83
+ "memoryTotal": "25757220864",
84
+ "cudaCores": 16384,
85
+ "architecture": "Ada"
86
+ },
87
+ {
88
+ "name": "NVIDIA GeForce RTX 4090",
89
+ "memoryTotal": "25757220864",
90
+ "cudaCores": 16384,
91
+ "architecture": "Ada"
92
+ }
93
+ ],
94
+ "cudaVersion": "12.4"
95
+ }
unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug-core.log ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {"time":"2025-02-13T07:37:21.497263081Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpjgduezs0/port-2137.txt","pid":2137,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false}
2
+ {"time":"2025-02-13T07:37:21.502043586Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":2137}
3
+ {"time":"2025-02-13T07:37:21.502031788Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":46589,"Zone":""}}
4
+ {"time":"2025-02-13T07:37:21.667201404Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:59608"}
5
+ {"time":"2025-02-13T07:37:21.680618976Z","level":"INFO","msg":"handleInformInit: received","streamId":"bd672vnz","id":"127.0.0.1:59608"}
6
+ {"time":"2025-02-13T07:37:21.80162681Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"bd672vnz","id":"127.0.0.1:59608"}
unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug-internal.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2025-02-13T07:37:21.6809945Z","level":"INFO","msg":"stream: starting","core version":"0.19.6","symlink path":"unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug-core.log"}
2
+ {"time":"2025-02-13T07:37:21.801528338Z","level":"INFO","msg":"created new stream","id":"bd672vnz"}
3
+ {"time":"2025-02-13T07:37:21.801610934Z","level":"INFO","msg":"stream: started","id":"bd672vnz"}
4
+ {"time":"2025-02-13T07:37:21.801639326Z","level":"INFO","msg":"writer: Do: started","stream_id":"bd672vnz"}
5
+ {"time":"2025-02-13T07:37:21.801654455Z","level":"INFO","msg":"handler: started","stream_id":"bd672vnz"}
6
+ {"time":"2025-02-13T07:37:21.801694022Z","level":"INFO","msg":"sender: started","stream_id":"bd672vnz"}
7
+ {"time":"2025-02-13T07:37:22.108255632Z","level":"INFO","msg":"Starting system monitor"}
unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug.log ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Current SDK version is 0.19.6
2
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Configure stats pid to 2137
3
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Loading settings from /root/.config/wandb/settings
4
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Loading settings from /workspace/context-compression/wandb/settings
5
+ 2025-02-13 07:37:21,451 INFO MainThread:2137 [wandb_setup.py:_flush():68] Loading settings from environment variables
6
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:setup_run_log_directory():637] Logging user logs to unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug.log
7
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:setup_run_log_directory():638] Logging internal logs to unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/logs/debug-internal.log
8
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:init():756] calling init triggers
9
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:init():761] wandb.init called with sweep_config: {}
10
+ config: {'hellaswag': True, 'attention_kind': <AttentionKind.SELF: 'self'>, 'log_dir': 'unselective_run_1_restarted', 'resume_checkpoint': 'hf://andrew-healey/context-compression/unselective_run_0/model_07500.pt', 'resume_optimizer': False, 'add_a_head': False, 'add_head_to_start': False, 'new_head_init': <NewHeadInit.NORMAL: 'normal'>, 'max_steps': 2500, 'group': 'selective_surgery_2', 'use_wandb': True, 'kill_self_after_run': True, '_wandb': {}}
11
+ 2025-02-13 07:37:21,452 INFO MainThread:2137 [wandb_init.py:init():789] starting backend
12
+ 2025-02-13 07:37:21,667 INFO MainThread:2137 [wandb_init.py:init():793] sending inform_init request
13
+ 2025-02-13 07:37:21,675 INFO MainThread:2137 [backend.py:_multiprocessing_setup():97] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
14
+ 2025-02-13 07:37:21,676 INFO MainThread:2137 [wandb_init.py:init():808] backend started and connected
15
+ 2025-02-13 07:37:21,679 INFO MainThread:2137 [wandb_init.py:init():901] updated telemetry
16
+ 2025-02-13 07:37:21,688 INFO MainThread:2137 [wandb_init.py:init():936] communicating run to backend with 90.0 second timeout
17
+ 2025-02-13 07:37:22,103 INFO MainThread:2137 [wandb_init.py:init():994] starting run threads in backend
18
+ 2025-02-13 07:37:22,259 INFO MainThread:2137 [wandb_run.py:_console_start():2385] atexit reg
19
+ 2025-02-13 07:37:22,259 INFO MainThread:2137 [wandb_run.py:_redirect():2235] redirect: wrap_raw
20
+ 2025-02-13 07:37:22,259 INFO MainThread:2137 [wandb_run.py:_redirect():2300] Wrapping output streams.
21
+ 2025-02-13 07:37:22,259 INFO MainThread:2137 [wandb_run.py:_redirect():2325] Redirects installed.
22
+ 2025-02-13 07:37:22,261 INFO MainThread:2137 [wandb_init.py:init():1036] run started, returning control to user process
unselective_run_1_restarted/wandb/run-20250213_073721-bd672vnz/run-bd672vnz.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69c113da980b88b9b452e990fc424443862db67d27fd812b53fc43f7d8b96947
3
+ size 3014656