andrew-healey commited on
Commit
b76b950
·
1 Parent(s): 4904367

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/run-crz42i9y.wandb filter=lfs diff=lfs merge=lfs -text
unselective_run_1_restarted_with_ko_zero/args.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"hellaswag": true, "attention_kind": "self", "log_dir": "unselective_run_1_restarted_with_ko_zero", "resume_checkpoint": "hf://andrew-healey/context-compression/unselective_run_0/model_07500.pt", "resume_optimizer": false, "add_a_head": true, "add_head_to_start": true, "new_head_init": "ko_zero", "max_steps": 2500, "group": "selective_surgery_2", "use_wandb": true, "kill_self_after_run": false}
unselective_run_1_restarted_with_ko_zero/dataloader_02499.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cefbc0ab907c6a30382d71f16b47450e3533ee64ae273fcfa46862dc62ec8a7
3
+ size 964
unselective_run_1_restarted_with_ko_zero/log2.txt ADDED
The diff for this file is too large to render. See raw diff
 
unselective_run_1_restarted_with_ko_zero/model_02499.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ab62d84e814520e6b58561d2d6c2e2c546bcf6b618befccc9be83c77f0ddaaa
3
+ size 507404522
unselective_run_1_restarted_with_ko_zero/optimizer_02499.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dacaba4dc5cebbd0985473fef564806ebe1d73c8125c413162c5605dc1dd18e1
3
+ size 1014834310
unselective_run_1_restarted_with_ko_zero/wandb/debug-internal.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2025-02-13T07:28:02.205250343Z","level":"INFO","msg":"stream: starting","core version":"0.19.6","symlink path":"unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug-core.log"}
2
+ {"time":"2025-02-13T07:28:02.41832014Z","level":"INFO","msg":"created new stream","id":"crz42i9y"}
3
+ {"time":"2025-02-13T07:28:02.418401779Z","level":"INFO","msg":"stream: started","id":"crz42i9y"}
4
+ {"time":"2025-02-13T07:28:02.418464308Z","level":"INFO","msg":"writer: Do: started","stream_id":"crz42i9y"}
5
+ {"time":"2025-02-13T07:28:02.418522298Z","level":"INFO","msg":"handler: started","stream_id":"crz42i9y"}
6
+ {"time":"2025-02-13T07:28:02.418620407Z","level":"INFO","msg":"sender: started","stream_id":"crz42i9y"}
7
+ {"time":"2025-02-13T07:28:02.624460514Z","level":"INFO","msg":"Starting system monitor"}
unselective_run_1_restarted_with_ko_zero/wandb/debug.log ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Current SDK version is 0.19.6
2
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Configure stats pid to 1269
3
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Loading settings from /root/.config/wandb/settings
4
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Loading settings from /workspace/context-compression/wandb/settings
5
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Loading settings from environment variables
6
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:setup_run_log_directory():637] Logging user logs to unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug.log
7
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:setup_run_log_directory():638] Logging internal logs to unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug-internal.log
8
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:init():756] calling init triggers
9
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:init():761] wandb.init called with sweep_config: {}
10
+ config: {'hellaswag': True, 'attention_kind': <AttentionKind.SELF: 'self'>, 'log_dir': 'unselective_run_1_restarted_with_ko_zero', 'resume_checkpoint': 'hf://andrew-healey/context-compression/unselective_run_0/model_07500.pt', 'resume_optimizer': False, 'add_a_head': True, 'add_head_to_start': True, 'new_head_init': <NewHeadInit.KO_ZERO: 'ko_zero'>, 'max_steps': 2500, 'group': 'selective_surgery_2', 'use_wandb': True, 'kill_self_after_run': False, '_wandb': {}}
11
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:init():789] starting backend
12
+ 2025-02-13 07:28:02,194 INFO MainThread:1269 [wandb_init.py:init():793] sending inform_init request
13
+ 2025-02-13 07:28:02,201 INFO MainThread:1269 [backend.py:_multiprocessing_setup():97] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
14
+ 2025-02-13 07:28:02,201 INFO MainThread:1269 [wandb_init.py:init():808] backend started and connected
15
+ 2025-02-13 07:28:02,203 INFO MainThread:1269 [wandb_init.py:init():901] updated telemetry
16
+ 2025-02-13 07:28:02,211 INFO MainThread:1269 [wandb_init.py:init():936] communicating run to backend with 90.0 second timeout
17
+ 2025-02-13 07:28:02,621 INFO MainThread:1269 [wandb_init.py:init():994] starting run threads in backend
18
+ 2025-02-13 07:28:02,743 INFO MainThread:1269 [wandb_run.py:_console_start():2385] atexit reg
19
+ 2025-02-13 07:28:02,743 INFO MainThread:1269 [wandb_run.py:_redirect():2235] redirect: wrap_raw
20
+ 2025-02-13 07:28:02,743 INFO MainThread:1269 [wandb_run.py:_redirect():2300] Wrapping output streams.
21
+ 2025-02-13 07:28:02,743 INFO MainThread:1269 [wandb_run.py:_redirect():2325] Redirects installed.
22
+ 2025-02-13 07:28:02,745 INFO MainThread:1269 [wandb_init.py:init():1036] run started, returning control to user process
unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/files/requirements.txt ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Brotli==1.1.0
2
+ MarkupSafe==3.0.2
3
+ PySocks==1.7.1
4
+ PyYAML==6.0.2
5
+ archspec==0.2.3
6
+ asttokens==2.4.1
7
+ astunparse==1.6.3
8
+ attrs==24.2.0
9
+ beautifulsoup4==4.12.3
10
+ boltons==24.0.0
11
+ certifi==2024.8.30
12
+ cffi==1.17.1
13
+ chardet==5.2.0
14
+ charset-normalizer==3.4.0
15
+ click==8.1.7
16
+ colorama==0.4.6
17
+ conda==24.9.2
18
+ conda-build==24.9.0
19
+ conda_index==0.5.0
20
+ conda-libmamba-solver==24.9.0
21
+ conda-package-handling==2.4.0
22
+ conda_package_streaming==0.11.0
23
+ decorator==5.1.1
24
+ distro==1.9.0
25
+ dnspython==2.7.0
26
+ exceptiongroup==1.2.2
27
+ executing==2.1.0
28
+ expecttest==0.2.1
29
+ filelock==3.16.1
30
+ frozendict==2.4.6
31
+ h2==4.1.0
32
+ hpack==4.0.0
33
+ hyperframe==6.0.1
34
+ hypothesis==6.115.5
35
+ idna==3.10
36
+ importlib_resources==6.4.5
37
+ ipython==8.29.0
38
+ jedi==0.19.1
39
+ Jinja2==3.1.4
40
+ jsonpatch==1.33
41
+ jsonpointer==3.0.0
42
+ jsonschema==4.23.0
43
+ jsonschema-specifications==2024.10.1
44
+ libarchive-c==5.1
45
+ libmambapy==1.5.10
46
+ lief==0.14.1
47
+ lintrunner==0.12.5
48
+ mamba==1.5.10
49
+ matplotlib-inline==0.1.7
50
+ menuinst==2.1.2
51
+ more-itertools==10.5.0
52
+ mpmath==1.3.0
53
+ networkx==3.4.2
54
+ ninja==1.11.1.1
55
+ numpy==2.1.2
56
+ nvidia-cublas-cu12==12.4.5.8
57
+ nvidia-cuda-cupti-cu12==12.4.127
58
+ nvidia-cuda-nvrtc-cu12==12.4.127
59
+ nvidia-cuda-runtime-cu12==12.4.127
60
+ nvidia-cudnn-cu12==9.1.0.70
61
+ nvidia-cufft-cu12==11.2.1.3
62
+ nvidia-curand-cu12==10.3.5.147
63
+ nvidia-cusolver-cu12==11.6.1.9
64
+ nvidia-cusparse-cu12==12.3.1.170
65
+ nvidia-nccl-cu12==2.21.5
66
+ nvidia-nvjitlink-cu12==12.4.127
67
+ nvidia-nvtx-cu12==12.4.127
68
+ optree==0.13.0
69
+ packaging==24.1
70
+ parso==0.8.4
71
+ pexpect==4.9.0
72
+ pickleshare==0.7.5
73
+ pillow==10.2.0
74
+ pip==24.2
75
+ pkginfo==1.11.2
76
+ pkgutil_resolve_name==1.3.10
77
+ platformdirs==4.3.6
78
+ pluggy==1.5.0
79
+ prompt_toolkit==3.0.48
80
+ psutil==6.1.0
81
+ ptyprocess==0.7.0
82
+ pure_eval==0.2.3
83
+ pycosat==0.6.6
84
+ pycparser==2.22
85
+ Pygments==2.18.0
86
+ python-etcd==0.4.5
87
+ pytz==2024.2
88
+ referencing==0.35.1
89
+ requests==2.32.3
90
+ rpds-py==0.20.0
91
+ ruamel.yaml==0.18.6
92
+ ruamel.yaml.clib==0.2.8
93
+ setuptools==72.1.0
94
+ six==1.16.0
95
+ sortedcontainers==2.4.0
96
+ soupsieve==2.5
97
+ stack-data==0.6.2
98
+ sympy==1.13.1
99
+ torch==2.5.1+cu124
100
+ torchaudio==2.5.1+cu124
101
+ torchelastic==0.2.2
102
+ torchvision==0.20.1+cu124
103
+ tqdm==4.66.5
104
+ traitlets==5.14.3
105
+ triton==3.1.0
106
+ truststore==0.9.2
107
+ types-dataclasses==0.6.6
108
+ typing_extensions==4.12.2
109
+ urllib3==2.2.3
110
+ wcwidth==0.2.13
111
+ wheel==0.44.0
112
+ zipp==3.20.2
113
+ zstandard==0.23.0
114
+ smmap==5.0.2
115
+ setproctitle==1.3.4
116
+ sentry-sdk==2.21.0
117
+ pydantic_core==2.27.2
118
+ protobuf==5.29.3
119
+ docker-pycreds==0.4.0
120
+ annotated-types==0.7.0
121
+ pydantic==2.10.6
122
+ gitdb==4.0.12
123
+ GitPython==3.1.44
124
+ wandb==0.19.6
125
+ iniconfig==2.0.0
126
+ pytest==8.3.4
127
+ jupyter-archive==3.4.0
128
+ nbzip==0.1.0
129
+ webencodings==0.5.1
130
+ filetype==1.2.0
131
+ fastjsonschema==2.21.1
132
+ widgetsnbextension==4.0.13
133
+ websocket-client==1.8.0
134
+ webcolors==24.11.1
135
+ uri-template==1.3.0
136
+ types-python-dateutil==2.9.0.20241206
137
+ tornado==6.4.2
138
+ tinycss2==1.4.0
139
+ sniffio==1.3.1
140
+ Send2Trash==1.8.3
141
+ rfc3986-validator==0.1.1
142
+ rfc3339-validator==0.1.4
143
+ pyzmq==26.2.1
144
+ python-json-logger==3.2.1
145
+ prometheus_client==0.21.1
146
+ pandocfilters==1.5.1
147
+ overrides==7.7.0
148
+ nest-asyncio==1.6.0
149
+ mistune==3.1.1
150
+ jupyterlab_widgets==3.0.13
151
+ jupyterlab_pygments==0.3.0
152
+ jupyter_core==5.7.2
153
+ json5==0.10.0
154
+ h11==0.14.0
155
+ fqdn==1.5.1
156
+ defusedxml==0.7.1
157
+ debugpy==1.8.12
158
+ comm==0.2.2
159
+ bleach==6.2.0
160
+ babel==2.17.0
161
+ async-lru==2.0.4
162
+ terminado==0.18.1
163
+ jupyter_client==8.6.3
164
+ httpcore==1.0.7
165
+ arrow==1.3.0
166
+ argon2-cffi-bindings==21.2.0
167
+ anyio==4.8.0
168
+ jupyter_server_terminals==0.5.3
169
+ isoduration==20.11.0
170
+ httpx==0.28.1
171
+ argon2-cffi==23.1.0
172
+ nbformat==5.10.4
173
+ ipywidgets==8.1.5
174
+ ipykernel==6.29.5
175
+ nbclient==0.10.2
176
+ jupyter-events==0.12.0
177
+ jupyter-console==6.6.3
178
+ bash_kernel==0.10.0
179
+ nbconvert==7.16.6
180
+ jupyter_server==2.15.0
181
+ notebook_shim==0.2.4
182
+ jupyterlab_server==2.27.3
183
+ jupyter-lsp==2.2.5
184
+ jupyterlab==4.3.5
185
+ notebook==7.3.2
186
+ jupyter-http-over-ws==0.0.8
187
+ jupyter==1.1.1
188
+ aiohappyeyeballs==2.4.6
189
+ aiohttp==3.11.12
190
+ aiosignal==1.3.2
191
+ contourpy==1.3.1
192
+ cycler==0.12.1
193
+ datasets==3.2.0
194
+ dill==0.3.8
195
+ fonttools==4.56.0
196
+ frozenlist==1.5.0
197
+ fsspec==2024.9.0
198
+ huggingface-hub==0.28.1
199
+ kiwisolver==1.4.8
200
+ matplotlib==3.10.0
201
+ multidict==6.1.0
202
+ multiprocess==0.70.16
203
+ pandas==2.2.3
204
+ propcache==0.2.1
205
+ pyarrow==19.0.0
206
+ pyparsing==3.2.1
207
+ python-dateutil==2.9.0.post0
208
+ regex==2024.11.6
209
+ safetensors==0.5.2
210
+ sentencepiece==0.2.0
211
+ tiktoken==0.8.0
212
+ tokenizers==0.21.0
213
+ transformers==4.48.3
214
+ tzdata==2025.1
215
+ vastai==0.2.8
216
+ xxhash==3.5.0
217
+ yarl==1.18.3
unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/files/wandb-metadata.json ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-130-generic-x86_64-with-glibc2.35",
3
+ "python": "CPython 3.11.10",
4
+ "startedAt": "2025-02-13T07:28:02.202054Z",
5
+ "args": [
6
+ "--group",
7
+ "selective_surgery_2",
8
+ "--resume_checkpoint",
9
+ "hf://andrew-healey/context-compression/unselective_run_0/model_07500.pt",
10
+ "--max_steps",
11
+ "2500",
12
+ "--attention_kind",
13
+ "self",
14
+ "--log_dir",
15
+ "unselective_run_1_restarted_with_ko_zero",
16
+ "--add_a_head",
17
+ "--add_head_to_start",
18
+ "--new_head_init",
19
+ "ko_zero"
20
+ ],
21
+ "program": "-m context_compression.train",
22
+ "git": {
23
+ "remote": "https://github.com/andrew-healey/context-compression",
24
+ "commit": "303eb3f2a5dab5fe30125c9ccc545fc206daf467"
25
+ },
26
+ "email": "doolie.healey@gmail.com",
27
+ "root": "unselective_run_1_restarted_with_ko_zero",
28
+ "host": "2ed8c74725ed",
29
+ "executable": "/opt/conda/bin/python3.11",
30
+ "cpu_count": 64,
31
+ "cpu_count_logical": 128,
32
+ "gpu": "NVIDIA GeForce RTX 4090",
33
+ "gpu_count": 8,
34
+ "disk": {
35
+ "/": {
36
+ "total": "222264557568",
37
+ "used": "513650688"
38
+ }
39
+ },
40
+ "memory": {
41
+ "total": "540670349312"
42
+ },
43
+ "cpu": {
44
+ "count": 64,
45
+ "countLogical": 128
46
+ },
47
+ "gpu_nvidia": [
48
+ {
49
+ "name": "NVIDIA GeForce RTX 4090",
50
+ "memoryTotal": "25757220864",
51
+ "cudaCores": 16384,
52
+ "architecture": "Ada"
53
+ },
54
+ {
55
+ "name": "NVIDIA GeForce RTX 4090",
56
+ "memoryTotal": "25757220864",
57
+ "cudaCores": 16384,
58
+ "architecture": "Ada"
59
+ },
60
+ {
61
+ "name": "NVIDIA GeForce RTX 4090",
62
+ "memoryTotal": "25757220864",
63
+ "cudaCores": 16384,
64
+ "architecture": "Ada"
65
+ },
66
+ {
67
+ "name": "NVIDIA GeForce RTX 4090",
68
+ "memoryTotal": "25757220864",
69
+ "cudaCores": 16384,
70
+ "architecture": "Ada"
71
+ },
72
+ {
73
+ "name": "NVIDIA GeForce RTX 4090",
74
+ "memoryTotal": "25757220864",
75
+ "cudaCores": 16384,
76
+ "architecture": "Ada"
77
+ },
78
+ {
79
+ "name": "NVIDIA GeForce RTX 4090",
80
+ "memoryTotal": "25757220864",
81
+ "cudaCores": 16384,
82
+ "architecture": "Ada"
83
+ },
84
+ {
85
+ "name": "NVIDIA GeForce RTX 4090",
86
+ "memoryTotal": "25757220864",
87
+ "cudaCores": 16384,
88
+ "architecture": "Ada"
89
+ },
90
+ {
91
+ "name": "NVIDIA GeForce RTX 4090",
92
+ "memoryTotal": "25757220864",
93
+ "cudaCores": 16384,
94
+ "architecture": "Ada"
95
+ }
96
+ ],
97
+ "cudaVersion": "12.6"
98
+ }
unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug-core.log ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {"time":"2025-02-13T07:28:02.017943707Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp49lluslg/port-1269.txt","pid":1269,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false}
2
+ {"time":"2025-02-13T07:28:02.020992573Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":1269}
3
+ {"time":"2025-02-13T07:28:02.020929433Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":37837,"Zone":""}}
4
+ {"time":"2025-02-13T07:28:02.194223977Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:48712"}
5
+ {"time":"2025-02-13T07:28:02.204781528Z","level":"INFO","msg":"handleInformInit: received","streamId":"crz42i9y","id":"127.0.0.1:48712"}
6
+ {"time":"2025-02-13T07:28:02.418413459Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"crz42i9y","id":"127.0.0.1:48712"}
unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug-internal.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2025-02-13T07:28:02.205250343Z","level":"INFO","msg":"stream: starting","core version":"0.19.6","symlink path":"unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug-core.log"}
2
+ {"time":"2025-02-13T07:28:02.41832014Z","level":"INFO","msg":"created new stream","id":"crz42i9y"}
3
+ {"time":"2025-02-13T07:28:02.418401779Z","level":"INFO","msg":"stream: started","id":"crz42i9y"}
4
+ {"time":"2025-02-13T07:28:02.418464308Z","level":"INFO","msg":"writer: Do: started","stream_id":"crz42i9y"}
5
+ {"time":"2025-02-13T07:28:02.418522298Z","level":"INFO","msg":"handler: started","stream_id":"crz42i9y"}
6
+ {"time":"2025-02-13T07:28:02.418620407Z","level":"INFO","msg":"sender: started","stream_id":"crz42i9y"}
7
+ {"time":"2025-02-13T07:28:02.624460514Z","level":"INFO","msg":"Starting system monitor"}
unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug.log ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Current SDK version is 0.19.6
2
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Configure stats pid to 1269
3
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Loading settings from /root/.config/wandb/settings
4
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Loading settings from /workspace/context-compression/wandb/settings
5
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_setup.py:_flush():68] Loading settings from environment variables
6
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:setup_run_log_directory():637] Logging user logs to unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug.log
7
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:setup_run_log_directory():638] Logging internal logs to unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/logs/debug-internal.log
8
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:init():756] calling init triggers
9
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:init():761] wandb.init called with sweep_config: {}
10
+ config: {'hellaswag': True, 'attention_kind': <AttentionKind.SELF: 'self'>, 'log_dir': 'unselective_run_1_restarted_with_ko_zero', 'resume_checkpoint': 'hf://andrew-healey/context-compression/unselective_run_0/model_07500.pt', 'resume_optimizer': False, 'add_a_head': True, 'add_head_to_start': True, 'new_head_init': <NewHeadInit.KO_ZERO: 'ko_zero'>, 'max_steps': 2500, 'group': 'selective_surgery_2', 'use_wandb': True, 'kill_self_after_run': False, '_wandb': {}}
11
+ 2025-02-13 07:28:01,984 INFO MainThread:1269 [wandb_init.py:init():789] starting backend
12
+ 2025-02-13 07:28:02,194 INFO MainThread:1269 [wandb_init.py:init():793] sending inform_init request
13
+ 2025-02-13 07:28:02,201 INFO MainThread:1269 [backend.py:_multiprocessing_setup():97] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
14
+ 2025-02-13 07:28:02,201 INFO MainThread:1269 [wandb_init.py:init():808] backend started and connected
15
+ 2025-02-13 07:28:02,203 INFO MainThread:1269 [wandb_init.py:init():901] updated telemetry
16
+ 2025-02-13 07:28:02,211 INFO MainThread:1269 [wandb_init.py:init():936] communicating run to backend with 90.0 second timeout
17
+ 2025-02-13 07:28:02,621 INFO MainThread:1269 [wandb_init.py:init():994] starting run threads in backend
18
+ 2025-02-13 07:28:02,743 INFO MainThread:1269 [wandb_run.py:_console_start():2385] atexit reg
19
+ 2025-02-13 07:28:02,743 INFO MainThread:1269 [wandb_run.py:_redirect():2235] redirect: wrap_raw
20
+ 2025-02-13 07:28:02,743 INFO MainThread:1269 [wandb_run.py:_redirect():2300] Wrapping output streams.
21
+ 2025-02-13 07:28:02,743 INFO MainThread:1269 [wandb_run.py:_redirect():2325] Redirects installed.
22
+ 2025-02-13 07:28:02,745 INFO MainThread:1269 [wandb_init.py:init():1036] run started, returning control to user process
unselective_run_1_restarted_with_ko_zero/wandb/run-20250213_072801-crz42i9y/run-crz42i9y.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f96cb2e64c52cd56973ee403da39d5f9bfdcbac27c366cd47b87dfe63cd3d064
3
+ size 3145728