QwenQKing committed on Nov 30, 2025

Commit

e9444ea

verified ·

1 Parent(s): 29698b8

Upload 34 files

Browse files

Files changed (35) hide show

.gitattributes +1 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_0.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_1.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_2.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_3.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_4.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_5.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_6.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_7.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/added_tokens.json +28 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/chat_template.jinja +54 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/config.json +68 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/merges.txt +0 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/special_tokens_map.json +31 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/tokenizer.json +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/tokenizer_config.json +239 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/vocab.json +0 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_0.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_1.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_2.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_3.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_4.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_5.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_6.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_7.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_0.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_1.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_2.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_3.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_4.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_5.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_6.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_7.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/global_step_320/data.pt +3 -0
grpo-qwen3-4b-gpt-4o-mini/latest_checkpointed_iteration.txt +1 -0

.gitattributes CHANGED Viewed

@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 Prompt-R1-gpt-oss/grpo-qwen3-4b-gpt-oss-20b/global_step_320/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_0.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:72b51bf1b0d4b0128df5dee5bee1c15833e4860694eb76b49eb6eb0926daf3d5
+size 14632

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_1.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aff608a732eab60c3366f023a7d4420aa340473fef199653ac6e6f3b2f8b856a
+size 14632

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_2.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:28cd19a699e313878fe80d3763bb8e0d829812e32cdd4a2f153b09af90537c8e
+size 14632

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_3.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a260a1d92ac1ff26bd749b3c31a5a2a42e553e1bcb94c0dd18ec8350bdcc9944
+size 14632

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_4.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:19b60d94742a405087a6228635181850e1f562ccfce273a27f1869c49198a716
+size 14632

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_5.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:532d4dd4db32406de8567628f3da6b28ac9182dd8cc55ca5d42cd490dec47b8d
+size 14632

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_6.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dcddadcd27b294f2b43c593caa6a7bcc2e2aa8e9fc2213772e8c897dd4d722a9
+size 14632

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/extra_state_world_size_8_rank_7.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3fe1510c1aa9a10a55f15d0e2bd28e6f306f8a8b0a9472b0fe34020a149fd636
+size 14632

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/added_tokens.json ADDED Viewed

	@@ -0,0 +1,28 @@

+{
+  "</think>": 151668,
+  "</tool_call>": 151658,
+  "</tool_response>": 151666,
+  "<think>": 151667,
+  "<tool_call>": 151657,
+  "<tool_response>": 151665,
+  "<|box_end|>": 151649,
+  "<|box_start|>": 151648,
+  "<|endoftext|>": 151643,
+  "<|file_sep|>": 151664,
+  "<|fim_middle|>": 151660,
+  "<|fim_pad|>": 151662,
+  "<|fim_prefix|>": 151659,
+  "<|fim_suffix|>": 151661,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644,
+  "<|image_pad|>": 151655,
+  "<|object_ref_end|>": 151647,
+  "<|object_ref_start|>": 151646,
+  "<|quad_end|>": 151651,
+  "<|quad_start|>": 151650,
+  "<|repo_name|>": 151663,
+  "<|video_pad|>": 151656,
+  "<|vision_end|>": 151653,
+  "<|vision_pad|>": 151654,
+  "<|vision_start|>": 151652
+}

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/chat_template.jinja ADDED Viewed

	@@ -0,0 +1,54 @@

+{%- if tools %}
+    {{- '<|im_start|>system\n' }}
+    {%- if messages[0]['role'] == 'system' %}
+        {{- messages[0]['content'] }}
+    {%- else %}
+        {{- 'You are Qwen, created by Alibaba Cloud. You are a great assistant. ' }}
+    {%- endif %}
+    {{- "\n\n# Tools\n\nYou can call one or more powerful Large Language Models to answer the user's questions. But you MUST provide the tool with an explanation and analysis of the problem, as well as your thought process.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
+    {%- for tool in tools %}
+        {{- "\n" }}
+        {{- tool | tojson }}
+    {%- endfor %}
+    {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <interaction_prompt></interaction_prompt> XML tags:\n<interaction_prompt>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</interaction_prompt><|im_end|>\n" }}
+{%- else %}
+    {%- if messages[0]['role'] == 'system' %}
+        {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}
+    {%- else %}
+        {{- '<|im_start|>system\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\n' }}
+    {%- endif %}
+{%- endif %}
+{%- for message in messages %}
+    {%- if (message.role == "user") or (message.role == "system" and not loop.first) or (message.role == "assistant" and not message.tool_calls) %}
+        {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}
+    {%- elif message.role == "assistant" %}
+        {{- '<|im_start|>' + message.role }}
+        {%- if message.content %}
+            {{- '\n' + message.content }}
+        {%- endif %}
+        {%- for tool_call in message.tool_calls %}
+            {%- if tool_call.function is defined %}
+                {%- set tool_call = tool_call.function %}
+            {%- endif %}
+            {{- '\n<interaction_prompt>\n{"name": "' }}
+            {{- tool_call.name }}
+            {{- '", "arguments": ' }}
+            {{- tool_call.arguments | tojson }}
+            {{- '}\n</interaction_prompt>' }}
+        {%- endfor %}
+        {{- '<|im_end|>\n' }}
+    {%- elif message.role == "tool" %}
+        {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != "tool") %}
+            {{- '<|im_start|>user' }}
+        {%- endif %}
+        {{- '\n<interaction_response>\n' }}
+        {{- message.content }}
+        {{- '\n</interaction_response>' }}
+        {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
+            {{- '<|im_end|>\n' }}
+        {%- endif %}
+    {%- endif %}
+{%- endfor %}
+{%- if add_generation_prompt %}
+    {{- '<|im_start|>assistant\n' }}
+{%- endif %}

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "architectures": [
+    "Qwen3ForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "dtype": "float32",
+  "eos_token_id": 151645,
+  "head_dim": 128,
+  "hidden_act": "silu",
+  "hidden_size": 2560,
+  "initializer_range": 0.02,
+  "intermediate_size": 9728,
+  "layer_types": [
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention"
+  ],
+  "max_position_embeddings": 40960,
+  "max_window_layers": 36,
+  "model_type": "qwen3",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 36,
+  "num_key_value_heads": 8,
+  "pad_token_id": 151643,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": null,
+  "rope_theta": 1000000,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "transformers_version": "4.56.2",
+  "use_cache": true,
+  "use_sliding_window": false,
+  "vocab_size": 151936
+}

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<|object_ref_start|>",
+    "<|object_ref_end|>",
+    "<|box_start|>",
+    "<|box_end|>",
+    "<|quad_start|>",
+    "<|quad_end|>",
+    "<|vision_start|>",
+    "<|vision_end|>",
+    "<|vision_pad|>",
+    "<|image_pad|>",
+    "<|video_pad|>"
+  ],
+  "eos_token": {
+    "content": "<|im_end|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
+size 11422654

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,239 @@

+{
+  "add_bos_token": false,
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151646": {
+      "content": "<|object_ref_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151647": {
+      "content": "<|object_ref_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151648": {
+      "content": "<|box_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151649": {
+      "content": "<|box_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151650": {
+      "content": "<|quad_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151651": {
+      "content": "<|quad_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151652": {
+      "content": "<|vision_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151653": {
+      "content": "<|vision_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151654": {
+      "content": "<|vision_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151655": {
+      "content": "<|image_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151656": {
+      "content": "<|video_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151657": {
+      "content": "<tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151658": {
+      "content": "</tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151659": {
+      "content": "<|fim_prefix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151660": {
+      "content": "<|fim_middle|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151661": {
+      "content": "<|fim_suffix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151662": {
+      "content": "<|fim_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151663": {
+      "content": "<|repo_name|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151664": {
+      "content": "<|file_sep|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151665": {
+      "content": "<tool_response>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151666": {
+      "content": "</tool_response>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151667": {
+      "content": "<think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151668": {
+      "content": "</think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<|object_ref_start|>",
+    "<|object_ref_end|>",
+    "<|box_start|>",
+    "<|box_end|>",
+    "<|quad_start|>",
+    "<|quad_end|>",
+    "<|vision_start|>",
+    "<|vision_end|>",
+    "<|vision_pad|>",
+    "<|image_pad|>",
+    "<|video_pad|>"
+  ],
+  "bos_token": null,
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "extra_special_tokens": {},
+  "model_max_length": 131072,
+  "pad_token": "<|endoftext|>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null
+}

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/huggingface/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_0.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:28173c76762f9f40cac47fa0836e903e43d66f639f1955737aaf2ba9f1fc634e
+size 2205943162

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_1.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf52b3e17fe0a20ff62f225961b777ffb8bc7d1c3c9a544417e34a1a8b60f1ff
+size 2205943162

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_2.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dcfb039dfcf48c1f9616ece434be7066b81e4ed6a3e394784fc3d5b243a66621
+size 2205943162

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_3.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2854913d7dac2ed424ae703abc2e4523dbd1eeb3df6b47ea46271c199942086e
+size 2205943162

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_4.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fcff8e8dca569acdf60f5c3f8aeeb69cb43762d3de282d06a80633f412a939f
+size 2205943162

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_5.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c8c41e83d72ccd834c18569a4afb58b0cfc25b89f410f87298e162b4605d4884
+size 2205943162

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_6.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:82983b780fd8adde91f5cabd402207efccfd5fe87ef390790604de6bffbc26e4
+size 2205943162

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/model_world_size_8_rank_7.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca25f42d3dd9ae9b312a108734b2f2021c91c2488bf630c026710545bd6786b2
+size 2205943162

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_0.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3760dfbf4c1ac88ac3239e1665c5a972f6b4a3a80338227d773474a12d0601d4
+size 4022501290

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_1.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:670600914f093c38f0640b2a50967920a7d87805aa61c2c2359bd3c49d6301bf
+size 4022501290

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_2.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d831645b9233de05dbf8ecf9083527507fa1a3df1e7ed027af360955e6c2c797
+size 4022501290

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_3.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:530cc0a45af3054e8dc14d05b6694cca391e6aac414eb552502e140b89673b84
+size 4022501290

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_4.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:69b2fb27540df94fc1ab2dea44f8c019ac317022b93a3cbaef193079351d23f2
+size 4022501290

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_5.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9211a7abf8020003f414420b41ce27a45d10e74b24a034b1700dcc5dce007312
+size 4022501290

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_6.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e7dabdaba41600b92416662d47a85d249ea2fea7efc538f53595a9e2f4f5cb82
+size 4022501290

grpo-qwen3-4b-gpt-4o-mini/global_step_320/actor/optim_world_size_8_rank_7.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35490e63dda35b9145d1746d9cd1fe83a396926f3d9372d45d931bc71bb83dce
+size 4022501290

grpo-qwen3-4b-gpt-4o-mini/global_step_320/data.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3a51225c1ab27330c7d330a8210191d5b14c9270684562d704182bcfc5312d2
+size 1492

grpo-qwen3-4b-gpt-4o-mini/latest_checkpointed_iteration.txt ADDED Viewed

	@@ -0,0 +1 @@


+320