nie10 committed on
Commit
9069b10
·
verified ·
1 Parent(s): cc0e10f

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +13 -0
  2. added_tokens.json +24 -0
  3. chat_template.json +3 -0
  4. config.json +67 -0
  5. generation_config.json +16 -0
  6. logs/20250611_143916/process_pids.txt +2 -0
  7. logs/20250611_143916/remote_rm_qa.log +3 -0
  8. logs/20250611_143916/train.log +0 -0
  9. logs/20250611_172722/process_pids.txt +2 -0
  10. logs/20250611_172722/remote_rm_qa.log +3 -0
  11. logs/20250611_172722/train.log +3 -0
  12. logs/20250612_103654/process_pids.txt +2 -0
  13. logs/20250612_103654/remote_rm_qa.log +3 -0
  14. logs/20250612_103654/train.log +0 -0
  15. logs/20250612_121011/process_pids.txt +2 -0
  16. logs/20250612_121011/remote_rm_qa.log +3 -0
  17. logs/20250612_121011/train.log +0 -0
  18. logs/20250612_134052/process_pids.txt +2 -0
  19. logs/20250612_134052/remote_rm_qa.log +3 -0
  20. logs/20250612_134052/train.log +0 -0
  21. logs/20250612_154155/process_pids.txt +2 -0
  22. logs/20250612_154155/remote_rm_qa.log +9 -0
  23. logs/20250612_154155/train.log +2 -0
  24. logs/20250612_154757/process_pids.txt +2 -0
  25. logs/20250612_154757/remote_rm_qa.log +0 -0
  26. logs/20250612_154757/train.log +0 -0
  27. logs/20250612_160431/process_pids.txt +2 -0
  28. logs/20250612_160431/remote_rm_qa.log +9 -0
  29. logs/20250612_160431/train.log +0 -0
  30. logs/20250612_161405/process_pids.txt +2 -0
  31. logs/20250612_161405/remote_rm_qa.log +0 -0
  32. logs/20250612_161405/train.log +0 -0
  33. logs/20250612_170355/process_pids.txt +2 -0
  34. logs/20250612_170355/remote_rm_qa.log +0 -0
  35. logs/20250612_170355/train.log +2 -0
  36. logs/20250612_170651/process_pids.txt +2 -0
  37. logs/20250612_170651/remote_rm_qa.log +9 -0
  38. logs/20250612_170651/train.log +0 -0
  39. logs/20250612_174005/process_pids.txt +2 -0
  40. logs/20250612_174005/remote_rm_qa.log +3 -0
  41. logs/20250612_174005/train.log +0 -0
  42. logs/20250612_195753/process_pids.txt +2 -0
  43. logs/20250612_195753/remote_rm_qa.log +0 -0
  44. logs/20250612_195753/train.log +2 -0
  45. logs/20250612_213203/process_pids.txt +2 -0
  46. logs/20250612_213203/remote_rm_qa.log +0 -0
  47. logs/20250612_213203/train.log +2 -0
  48. logs/20250612_230441/process_pids.txt +2 -0
  49. logs/20250612_230441/remote_rm_qa.log +0 -0
  50. logs/20250612_230441/train.log +92 -0
.gitattributes CHANGED
@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ logs/20250611_143916/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
37
+ logs/20250611_172722/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
38
+ logs/20250611_172722/train.log filter=lfs diff=lfs merge=lfs -text
39
+ logs/20250612_103654/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
40
+ logs/20250612_121011/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
41
+ logs/20250612_134052/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
42
+ logs/20250612_174005/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
43
+ logs/20250612_235704/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
44
+ logs/20250613_145402/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
45
+ logs/20250613_164550/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
46
+ logs/20250613_193604/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
47
+ logs/20250613_231703/remote_rm_qa.log filter=lfs diff=lfs merge=lfs -text
48
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</tool_call>": 151658,
3
+ "<tool_call>": 151657,
4
+ "<|box_end|>": 151649,
5
+ "<|box_start|>": 151648,
6
+ "<|endoftext|>": 151643,
7
+ "<|file_sep|>": 151664,
8
+ "<|fim_middle|>": 151660,
9
+ "<|fim_pad|>": 151662,
10
+ "<|fim_prefix|>": 151659,
11
+ "<|fim_suffix|>": 151661,
12
+ "<|im_end|>": 151645,
13
+ "<|im_start|>": 151644,
14
+ "<|image_pad|>": 151655,
15
+ "<|object_ref_end|>": 151647,
16
+ "<|object_ref_start|>": 151646,
17
+ "<|quad_end|>": 151651,
18
+ "<|quad_start|>": 151650,
19
+ "<|repo_name|>": 151663,
20
+ "<|video_pad|>": 151656,
21
+ "<|vision_end|>": 151653,
22
+ "<|vision_pad|>": 151654,
23
+ "<|vision_start|>": 151652
24
+ }
chat_template.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}"
3
+ }
config.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen2_5_VLForConditionalGeneration"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 151643,
7
+ "eos_token_id": 151645,
8
+ "hidden_act": "silu",
9
+ "hidden_size": 3584,
10
+ "image_token_id": 151655,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 18944,
13
+ "max_position_embeddings": 128000,
14
+ "max_window_layers": 28,
15
+ "model_type": "qwen2_5_vl",
16
+ "num_attention_heads": 28,
17
+ "num_hidden_layers": 28,
18
+ "num_key_value_heads": 4,
19
+ "rms_norm_eps": 1e-06,
20
+ "rope_scaling": {
21
+ "mrope_section": [
22
+ 16,
23
+ 24,
24
+ 24
25
+ ],
26
+ "rope_type": "default",
27
+ "type": "default"
28
+ },
29
+ "rope_theta": 1000000.0,
30
+ "sliding_window": 32768,
31
+ "tie_word_embeddings": false,
32
+ "tokenizer_padding_side": "right",
33
+ "torch_dtype": "bfloat16",
34
+ "transformers_version": "4.51.0.dev0",
35
+ "use_cache": false,
36
+ "use_sliding_window": false,
37
+ "video_token_id": 151656,
38
+ "vision_config": {
39
+ "depth": 32,
40
+ "fullatt_block_indexes": [
41
+ 7,
42
+ 15,
43
+ 23,
44
+ 31
45
+ ],
46
+ "hidden_act": "silu",
47
+ "hidden_size": 1280,
48
+ "in_channels": 3,
49
+ "in_chans": 3,
50
+ "intermediate_size": 3420,
51
+ "model_type": "qwen2_5_vl",
52
+ "num_heads": 16,
53
+ "out_hidden_size": 3584,
54
+ "patch_size": 14,
55
+ "spatial_merge_size": 2,
56
+ "spatial_patch_size": 14,
57
+ "temporal_patch_size": 2,
58
+ "tokens_per_second": 2,
59
+ "torch_dtype": "bfloat16",
60
+ "window_size": 112
61
+ },
62
+ "vision_end_token_id": 151653,
63
+ "vision_lr": 2e-06,
64
+ "vision_start_token_id": 151652,
65
+ "vision_token_id": 151654,
66
+ "vocab_size": 152064
67
+ }
generation_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_attn_implementation": "flash_attention_2",
3
+ "attn_implementation": "flash_attention_2",
4
+ "bos_token_id": 151643,
5
+ "do_sample": true,
6
+ "eos_token_id": [
7
+ 151645,
8
+ 151643
9
+ ],
10
+ "pad_token_id": 151643,
11
+ "repetition_penalty": 1.05,
12
+ "temperature": 0.7,
13
+ "top_k": 20,
14
+ "top_p": 0.8,
15
+ "transformers_version": "4.51.0.dev0"
16
+ }
logs/20250611_143916/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 180844
2
+ Train PID: 180845
logs/20250611_143916/remote_rm_qa.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b0f35b5d56de91c70b36e2471046c68ee32067b6bc495138178881614fc5269
3
+ size 22014229
logs/20250611_143916/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250611_172722/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 299278
2
+ Train PID: 299279
logs/20250611_172722/remote_rm_qa.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18b04c4fa78e8047ae16b1f1096e4f03db3c2a721901124364a1bbbd38959b76
3
+ size 119952587
logs/20250611_172722/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b538c3ff9789562759cbad5ad7e57d191b00088d854544215679fb7fff1b9f37
3
+ size 11578606
logs/20250612_103654/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 491486
2
+ Train PID: 491487
logs/20250612_103654/remote_rm_qa.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c2a4927f59546ad3294b810acd989d420a2f25b36c82dc86cd47f1a92e8efa2
3
+ size 13530701
logs/20250612_103654/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_121011/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 286806
2
+ Train PID: 286807
logs/20250612_121011/remote_rm_qa.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d023f87ca54002ba93b5641833ed466e64f6d39c2a264d7204b5f89a99c1e879
3
+ size 13368904
logs/20250612_121011/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_134052/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 332530
2
+ Train PID: 332531
logs/20250612_134052/remote_rm_qa.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b15ffc8a70356386f2f8140b2a876129d3d0a22892ac129db95e2dea0124ad61
3
+ size 13111244
logs/20250612_134052/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_154155/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 266447
2
+ Train PID: 266448
logs/20250612_154155/remote_rm_qa.log ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ [2025-06-12 15:42:37,930] [INFO] [real_accelerator.py:222:get_accelerator] Setting ds_accelerator to cuda (auto detect)
2
+ load dataset success
3
+ * Serving Flask app 'math_verifier_wolatex'
4
+ * Debug mode: off
5
+ WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
6
+ * Running on all addresses (0.0.0.0)
7
+ * Running on http://127.0.0.1:2323
8
+ * Running on http://10.140.1.128:2323
9
+ Press CTRL+C to quit
logs/20250612_154155/train.log ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ 2025-06-12 15:42:22,174 INFO dashboard_sdk.py:338 -- Uploading package gcs://_ray_pkg_62b42fe85ef00416.zip.
2
+ 2025-06-12 15:42:22,175 INFO packaging.py:575 -- Creating a file package for local module '/mnt/petrelfs/luyiting/MultiAgentEval/lmm-r1'.
logs/20250612_154757/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 304140
2
+ Train PID: 304141
logs/20250612_154757/remote_rm_qa.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_154757/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_160431/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 381242
2
+ Train PID: 381243
logs/20250612_160431/remote_rm_qa.log ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ [2025-06-12 16:05:12,677] [INFO] [real_accelerator.py:222:get_accelerator] Setting ds_accelerator to cuda (auto detect)
2
+ load dataset success
3
+ * Serving Flask app 'math_verifier_wolatex'
4
+ * Debug mode: off
5
+ WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
6
+ * Running on all addresses (0.0.0.0)
7
+ * Running on http://127.0.0.1:2323
8
+ * Running on http://10.140.1.140:2323
9
+ Press CTRL+C to quit
logs/20250612_160431/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_161405/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 320735
2
+ Train PID: 320736
logs/20250612_161405/remote_rm_qa.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_161405/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_170355/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 248821
2
+ Train PID: 248822
logs/20250612_170355/remote_rm_qa.log ADDED
File without changes
logs/20250612_170355/train.log ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ 2025-06-12 17:04:18,788 INFO dashboard_sdk.py:338 -- Uploading package gcs://_ray_pkg_62b42fe85ef00416.zip.
2
+ 2025-06-12 17:04:18,788 INFO packaging.py:575 -- Creating a file package for local module '/mnt/petrelfs/luyiting/MultiAgentEval/lmm-r1'.
logs/20250612_170651/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 172289
2
+ Train PID: 172290
logs/20250612_170651/remote_rm_qa.log ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ [2025-06-12 17:07:34,666] [INFO] [real_accelerator.py:222:get_accelerator] Setting ds_accelerator to cuda (auto detect)
2
+ load dataset success
3
+ * Serving Flask app 'math_verifier_wolatex'
4
+ * Debug mode: off
5
+ WARNING: This is a development server. Do not use it in a production deployment. Use a production WSGI server instead.
6
+ * Running on all addresses (0.0.0.0)
7
+ * Running on http://127.0.0.1:2323
8
+ * Running on http://10.140.1.80:2323
9
+ Press CTRL+C to quit
logs/20250612_170651/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_174005/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 288885
2
+ Train PID: 288886
logs/20250612_174005/remote_rm_qa.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a04dbe13bd42f7c9cb1651b827dca300d970b572a09b2e7843ee19e539e88966
3
+ size 18985266
logs/20250612_174005/train.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/20250612_195753/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 21232
2
+ Train PID: 21233
logs/20250612_195753/remote_rm_qa.log ADDED
File without changes
logs/20250612_195753/train.log ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ 2025-06-12 19:58:21,564 INFO dashboard_sdk.py:338 -- Uploading package gcs://_ray_pkg_62b42fe85ef00416.zip.
2
+ 2025-06-12 19:58:21,564 INFO packaging.py:575 -- Creating a file package for local module '/mnt/petrelfs/luyiting/MultiAgentEval/lmm-r1'.
logs/20250612_213203/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 158429
2
+ Train PID: 158430
logs/20250612_213203/remote_rm_qa.log ADDED
File without changes
logs/20250612_213203/train.log ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ 2025-06-12 21:32:24,467 INFO dashboard_sdk.py:338 -- Uploading package gcs://_ray_pkg_62b42fe85ef00416.zip.
2
+ 2025-06-12 21:32:24,468 INFO packaging.py:575 -- Creating a file package for local module '/mnt/petrelfs/luyiting/MultiAgentEval/lmm-r1'.
logs/20250612_230441/process_pids.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Remote RM PID: 57294
2
+ Train PID: 57295
logs/20250612_230441/remote_rm_qa.log ADDED
File without changes
logs/20250612_230441/train.log ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Traceback (most recent call last):
2
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/connection.py", line 198, in _new_conn
3
+ sock = connection.create_connection(
4
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/util/connection.py", line 85, in create_connection
5
+ raise err
6
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/util/connection.py", line 73, in create_connection
7
+ sock.connect(sa)
8
+ ConnectionRefusedError: [Errno 111] Connection refused
9
+
10
+ The above exception was the direct cause of the following exception:
11
+
12
+ Traceback (most recent call last):
13
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/connectionpool.py", line 787, in urlopen
14
+ response = self._make_request(
15
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/connectionpool.py", line 493, in _make_request
16
+ conn.request(
17
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/connection.py", line 445, in request
18
+ self.endheaders()
19
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/http/client.py", line 1278, in endheaders
20
+ self._send_output(message_body, encode_chunked=encode_chunked)
21
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/http/client.py", line 1038, in _send_output
22
+ self.send(msg)
23
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/http/client.py", line 976, in send
24
+ self.connect()
25
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/connection.py", line 276, in connect
26
+ self.sock = self._new_conn()
27
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/connection.py", line 213, in _new_conn
28
+ raise NewConnectionError(
29
+ urllib3.exceptions.NewConnectionError: <urllib3.connection.HTTPConnection object at 0x7f2d87219cc0>: Failed to establish a new connection: [Errno 111] Connection refused
30
+
31
+ The above exception was the direct cause of the following exception:
32
+
33
+ Traceback (most recent call last):
34
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/requests/adapters.py", line 667, in send
35
+ resp = conn.urlopen(
36
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/connectionpool.py", line 841, in urlopen
37
+ retries = retries.increment(
38
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/urllib3/util/retry.py", line 519, in increment
39
+ raise MaxRetryError(_pool, url, reason) from reason # type: ignore[arg-type]
40
+ urllib3.exceptions.MaxRetryError: HTTPConnectionPool(host='127.0.0.1', port=2970): Max retries exceeded with url: /api/version (Caused by NewConnectionError('<urllib3.connection.HTTPConnection object at 0x7f2d87219cc0>: Failed to establish a new connection: [Errno 111] Connection refused'))
41
+
42
+ During handling of the above exception, another exception occurred:
43
+
44
+ Traceback (most recent call last):
45
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/dashboard/modules/dashboard_sdk.py", line 262, in _check_connection_and_version_with_url
46
+ r = self._do_request("GET", url)
47
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/dashboard/modules/dashboard_sdk.py", line 303, in _do_request
48
+ return requests.request(
49
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/requests/api.py", line 59, in request
50
+ return session.request(method=method, url=url, **kwargs)
51
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/requests/sessions.py", line 589, in request
52
+ resp = self.send(prep, **send_kwargs)
53
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/requests/sessions.py", line 703, in send
54
+ r = adapter.send(request, **kwargs)
55
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/requests/adapters.py", line 700, in send
56
+ raise ConnectionError(e, request=request)
57
+ requests.exceptions.ConnectionError: HTTPConnectionPool(host='127.0.0.1', port=2970): Max retries exceeded with url: /api/version (Caused by NewConnectionError('<urllib3.connection.HTTPConnection object at 0x7f2d87219cc0>: Failed to establish a new connection: [Errno 111] Connection refused'))
58
+
59
+ During handling of the above exception, another exception occurred:
60
+
61
+ Traceback (most recent call last):
62
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/bin/ray", line 8, in <module>
63
+ sys.exit(main())
64
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/scripts/scripts.py", line 2690, in main
65
+ return cli()
66
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/click/core.py", line 1161, in __call__
67
+ return self.main(*args, **kwargs)
68
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/click/core.py", line 1082, in main
69
+ rv = self.invoke(ctx)
70
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/click/core.py", line 1697, in invoke
71
+ return _process_result(sub_ctx.command.invoke(sub_ctx))
72
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/click/core.py", line 1697, in invoke
73
+ return _process_result(sub_ctx.command.invoke(sub_ctx))
74
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/click/core.py", line 1443, in invoke
75
+ return ctx.invoke(self.callback, **ctx.params)
76
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/click/core.py", line 788, in invoke
77
+ return __callback(*args, **kwargs)
78
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/dashboard/modules/job/cli_utils.py", line 54, in wrapper
79
+ return func(*args, **kwargs)
80
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/autoscaler/_private/cli_logger.py", line 823, in wrapper
81
+ return f(*args, **kwargs)
82
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/dashboard/modules/job/cli.py", line 267, in submit
83
+ client = _get_sdk_client(
84
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/dashboard/modules/job/cli.py", line 32, in _get_sdk_client
85
+ client = JobSubmissionClient(
86
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/dashboard/modules/job/sdk.py", line 105, in __init__
87
+ self._check_connection_and_version(
88
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/dashboard/modules/dashboard_sdk.py", line 248, in _check_connection_and_version
89
+ self._check_connection_and_version_with_url(min_version, version_error_message)
90
+ File "/mnt/petrelfs/luyiting/anaconda3/envs/lmmr1/lib/python3.10/site-packages/ray/dashboard/modules/dashboard_sdk.py", line 278, in _check_connection_and_version_with_url
91
+ raise ConnectionError(
92
+ ConnectionError: Failed to connect to Ray at address: http://127.0.0.1:2970.