Final adapter for shaer_grpo_20260411_223409
Browse files- generations_export_summary.json +6 -6
- plots/chain_metrics.jsonl +2 -0
- plots/meter_by_meter_run.png +2 -2
- plots/reward_panels_eval_chain.png +2 -2
- plots/reward_panels_eval_run.png +2 -2
- plotter.log +10 -0
- run_summary.json +25 -25
- train.log +1 -0
- train_stdout.log +1278 -0
generations_export_summary.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
| 2 |
"enabled": true,
|
| 3 |
"repo_id": "Shaer-AI/Shaer-adapters-grpo-generations",
|
| 4 |
-
"run_export_dir": "/root/workspace/Shaer/grpo/outputs/hf_generations_exports/
|
| 5 |
-
"chain_export_dir": "/root/workspace/Shaer/grpo/outputs/hf_generations_exports/
|
| 6 |
-
"chain_run_count":
|
| 7 |
-
"run_generation_rows":
|
| 8 |
-
"run_metric_rows":
|
| 9 |
-
"chain_metric_rows":
|
| 10 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"enabled": true,
|
| 3 |
"repo_id": "Shaer-AI/Shaer-adapters-grpo-generations",
|
| 4 |
+
"run_export_dir": "/root/workspace/Shaer/grpo/outputs/hf_generations_exports/shaer_grpo_20260411_223409/runs/shaer_grpo_20260411_223409",
|
| 5 |
+
"chain_export_dir": "/root/workspace/Shaer/grpo/outputs/hf_generations_exports/shaer_grpo_20260411_223409/chains/shaer_grpo_20260411_192107",
|
| 6 |
+
"chain_run_count": 2,
|
| 7 |
+
"run_generation_rows": 26712,
|
| 8 |
+
"run_metric_rows": 2704,
|
| 9 |
+
"chain_metric_rows": 4216
|
| 10 |
}
|
plots/chain_metrics.jsonl
CHANGED
|
@@ -4212,3 +4212,5 @@
|
|
| 4212 |
{"timestamp_utc": "2026-04-12T03:43:26Z", "mode": "train", "global_step": 3298, "epoch": 0.13246575892677834, "loss": 0.0017, "grad_norm": 2.183478593826294, "learning_rate": 9.090909090909092e-09, "num_tokens": 7518824.0, "completions/mean_length": 65.375, "completions/min_length": 65.0, "completions/max_length": 66.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 65.375, "completions/min_terminated_length": 65.0, "completions/max_terminated_length": 66.0, "rewards/meter/mean": 0.9922501444816589, "rewards/meter/std": 0.004244488663971424, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9922501444816589, "rewards/total_composite/std": 0.004244488663971424, "reward": 0.9922501444816589, "reward_std": 0.0042444937862455845, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.013568882830440998, "sampling/sampling_logp_difference/max": 0.7026901245117188, "sampling/importance_sampling_ratio/min": 0.49525120854377747, "sampling/importance_sampling_ratio/mean": 1.0067819356918335, "sampling/importance_sampling_ratio/max": 1.4506497383117676, "entropy": 0.11512181628495455, "clip_ratio/low_mean": 0.0037878789007663727, "clip_ratio/low_min": 0.0037878789007663727, "clip_ratio/high_mean": 0.005710955825634301, "clip_ratio/high_max": 0.005710955825634301, "clip_ratio/region_mean": 0.009498834726400673, "reward_total_mean": 0.9922501444816589, "reward_meter_mean": 0.9922501444816589, "reward_meter_std": 0.004244488663971424, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9922501444816589, "reward_total_composite_std": 0.004244488663971424, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4131.0}
|
| 4213 |
{"timestamp_utc": "2026-04-12T03:43:32Z", "mode": "train", "global_step": 3299, "epoch": 0.1325059244085633, "loss": 0.0057, "grad_norm": 3.7170727252960205, "learning_rate": 6.060606060606061e-09, "num_tokens": 7521612.0, "completions/mean_length": 166.5, "completions/min_length": 159.0, "completions/max_length": 170.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 166.5, "completions/min_terminated_length": 159.0, "completions/max_terminated_length": 170.0, "rewards/meter/mean": 0.9987373352050781, "rewards/meter/std": 0.000354176911059767, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9987373352050781, "rewards/total_composite/std": 0.000354176911059767, "reward": 0.9987373352050781, "reward_std": 0.00035417175968177617, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.03916100785136223, "sampling/sampling_logp_difference/max": 1.9973111152648926, "sampling/importance_sampling_ratio/min": 0.13569968938827515, "sampling/importance_sampling_ratio/mean": 1.001840591430664, "sampling/importance_sampling_ratio/max": 2.0, "entropy": 0.3029062431305647, "clip_ratio/low_mean": 0.01500677247531712, "clip_ratio/low_min": 0.01500677247531712, "clip_ratio/high_mean": 0.015017259865999222, "clip_ratio/high_max": 0.015017259865999222, "clip_ratio/region_mean": 0.030024032341316342, "reward_total_mean": 0.9987373352050781, "reward_meter_mean": 0.9987373352050781, "reward_meter_std": 0.000354176911059767, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9987373352050781, "reward_total_composite_std": 0.000354176911059767, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4132.0}
|
| 4214 |
{"timestamp_utc": "2026-04-12T03:43:36Z", "mode": "train", "global_step": 3300, "epoch": 0.13254608989034825, "loss": 0.0153, "grad_norm": 6.677674293518066, "learning_rate": 3.0303030303030304e-09, "num_tokens": 7523188.0, "completions/mean_length": 46.0, "completions/min_length": 46.0, "completions/max_length": 46.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 46.0, "completions/min_terminated_length": 46.0, "completions/max_terminated_length": 46.0, "rewards/meter/mean": 0.9442145824432373, "rewards/meter/std": 0.003297017654404044, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9442145824432373, "rewards/total_composite/std": 0.003297017654404044, "reward": 0.9442145824432373, "reward_std": 0.0032970213796943426, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.021698685362935066, "sampling/sampling_logp_difference/max": 2.1988744735717773, "sampling/importance_sampling_ratio/min": 0.11092793941497803, "sampling/importance_sampling_ratio/mean": 1.0027215480804443, "sampling/importance_sampling_ratio/max": 1.663463830947876, "entropy": 0.09115941543132067, "clip_ratio/low_mean": 0.00815217406488955, "clip_ratio/low_min": 0.00815217406488955, "clip_ratio/high_mean": 0.0027173913549631834, "clip_ratio/high_max": 0.0027173913549631834, "clip_ratio/region_mean": 0.010869565419852734, "reward_total_mean": 0.9442145824432373, "reward_meter_mean": 0.9442145824432373, "reward_meter_std": 0.003297017654404044, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9442145824432373, "reward_total_composite_std": 0.003297017654404044, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4133.0}
|
|
|
|
|
|
|
|
|
| 4212 |
{"timestamp_utc": "2026-04-12T03:43:26Z", "mode": "train", "global_step": 3298, "epoch": 0.13246575892677834, "loss": 0.0017, "grad_norm": 2.183478593826294, "learning_rate": 9.090909090909092e-09, "num_tokens": 7518824.0, "completions/mean_length": 65.375, "completions/min_length": 65.0, "completions/max_length": 66.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 65.375, "completions/min_terminated_length": 65.0, "completions/max_terminated_length": 66.0, "rewards/meter/mean": 0.9922501444816589, "rewards/meter/std": 0.004244488663971424, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9922501444816589, "rewards/total_composite/std": 0.004244488663971424, "reward": 0.9922501444816589, "reward_std": 0.0042444937862455845, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.013568882830440998, "sampling/sampling_logp_difference/max": 0.7026901245117188, "sampling/importance_sampling_ratio/min": 0.49525120854377747, "sampling/importance_sampling_ratio/mean": 1.0067819356918335, "sampling/importance_sampling_ratio/max": 1.4506497383117676, "entropy": 0.11512181628495455, "clip_ratio/low_mean": 0.0037878789007663727, "clip_ratio/low_min": 0.0037878789007663727, "clip_ratio/high_mean": 0.005710955825634301, "clip_ratio/high_max": 0.005710955825634301, "clip_ratio/region_mean": 0.009498834726400673, "reward_total_mean": 0.9922501444816589, "reward_meter_mean": 0.9922501444816589, "reward_meter_std": 0.004244488663971424, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9922501444816589, "reward_total_composite_std": 0.004244488663971424, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4131.0}
|
| 4213 |
{"timestamp_utc": "2026-04-12T03:43:32Z", "mode": "train", "global_step": 3299, "epoch": 0.1325059244085633, "loss": 0.0057, "grad_norm": 3.7170727252960205, "learning_rate": 6.060606060606061e-09, "num_tokens": 7521612.0, "completions/mean_length": 166.5, "completions/min_length": 159.0, "completions/max_length": 170.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 166.5, "completions/min_terminated_length": 159.0, "completions/max_terminated_length": 170.0, "rewards/meter/mean": 0.9987373352050781, "rewards/meter/std": 0.000354176911059767, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9987373352050781, "rewards/total_composite/std": 0.000354176911059767, "reward": 0.9987373352050781, "reward_std": 0.00035417175968177617, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.03916100785136223, "sampling/sampling_logp_difference/max": 1.9973111152648926, "sampling/importance_sampling_ratio/min": 0.13569968938827515, "sampling/importance_sampling_ratio/mean": 1.001840591430664, "sampling/importance_sampling_ratio/max": 2.0, "entropy": 0.3029062431305647, "clip_ratio/low_mean": 0.01500677247531712, "clip_ratio/low_min": 0.01500677247531712, "clip_ratio/high_mean": 0.015017259865999222, "clip_ratio/high_max": 0.015017259865999222, "clip_ratio/region_mean": 0.030024032341316342, "reward_total_mean": 0.9987373352050781, "reward_meter_mean": 0.9987373352050781, "reward_meter_std": 0.000354176911059767, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9987373352050781, "reward_total_composite_std": 0.000354176911059767, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4132.0}
|
| 4214 |
{"timestamp_utc": "2026-04-12T03:43:36Z", "mode": "train", "global_step": 3300, "epoch": 0.13254608989034825, "loss": 0.0153, "grad_norm": 6.677674293518066, "learning_rate": 3.0303030303030304e-09, "num_tokens": 7523188.0, "completions/mean_length": 46.0, "completions/min_length": 46.0, "completions/max_length": 46.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 46.0, "completions/min_terminated_length": 46.0, "completions/max_terminated_length": 46.0, "rewards/meter/mean": 0.9442145824432373, "rewards/meter/std": 0.003297017654404044, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9442145824432373, "rewards/total_composite/std": 0.003297017654404044, "reward": 0.9442145824432373, "reward_std": 0.0032970213796943426, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.021698685362935066, "sampling/sampling_logp_difference/max": 2.1988744735717773, "sampling/importance_sampling_ratio/min": 0.11092793941497803, "sampling/importance_sampling_ratio/mean": 1.0027215480804443, "sampling/importance_sampling_ratio/max": 1.663463830947876, "entropy": 0.09115941543132067, "clip_ratio/low_mean": 0.00815217406488955, "clip_ratio/low_min": 0.00815217406488955, "clip_ratio/high_mean": 0.0027173913549631834, "clip_ratio/high_max": 0.0027173913549631834, "clip_ratio/region_mean": 0.010869565419852734, "reward_total_mean": 0.9442145824432373, "reward_meter_mean": 0.9442145824432373, "reward_meter_std": 0.003297017654404044, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9442145824432373, "reward_total_composite_std": 0.003297017654404044, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4133.0}
|
| 4215 |
+
{"timestamp_utc": "2026-04-12T03:45:00Z", "mode": "train", "global_step": 3300, "epoch": 0.13254608989034825, "train_runtime": 18489.879, "train_samples_per_second": 1.428, "train_steps_per_second": 0.178, "total_flos": 0.0, "train_loss": 0.0004697396774788627, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4133.0}
|
| 4216 |
+
{"timestamp_utc": "2026-04-12T03:44:57Z", "mode": "eval", "global_step": 3300, "epoch": 0.13254608989034825, "eval_loss": NaN, "eval_runtime": 80.3156, "eval_samples_per_second": 1.295, "eval_steps_per_second": 0.162, "eval_num_tokens": 7523188.0, "eval_completions/mean_length": 213.14423076923077, "eval_completions/min_length": 61.23076923076923, "eval_completions/max_length": 421.38461538461536, "eval_completions/clipped_ratio": 0.009615384615384616, "eval_completions/mean_terminated_length": 209.98489027756912, "eval_completions/min_terminated_length": 61.23076923076923, "eval_completions/max_terminated_length": 412.2307692307692, "eval_rewards/meter/mean": 0.7804106657321637, "eval_rewards/meter/std": 0.3429693900621854, "eval_rewards/count_adherence/mean": 0.9621203220807589, "eval_rewards/count_adherence/std": 0.06154714152216911, "eval_rewards/arabic_clean/mean": 1.0, "eval_rewards/arabic_clean/std": 0.0, "eval_rewards/repeat_penalty/mean": 0.9574309633328364, "eval_rewards/repeat_penalty/std": 0.07397974411455485, "eval_rewards/total_composite/mean": 0.7239617155148432, "eval_rewards/total_composite/std": 0.3431667788670613, "eval_reward": 0.7239617155148432, "eval_reward_std": NaN, "eval_frac_reward_zero_std": 0.0, "eval_sampling/sampling_logp_difference/mean": 0.03249364231641476, "eval_sampling/sampling_logp_difference/max": 1.2331663278432994, "eval_sampling/importance_sampling_ratio/min": 0.2969068231490942, "eval_sampling/importance_sampling_ratio/mean": 1.0095902956449068, "eval_sampling/importance_sampling_ratio/max": 1.6007587084403405, "eval_entropy": 0.38235602699793303, "eval_clip_ratio/low_mean": 0.0, "eval_clip_ratio/low_min": 0.0, "eval_clip_ratio/high_mean": 0.0, "eval_clip_ratio/high_max": 0.0, "eval_clip_ratio/region_mean": 0.0, "eval_reward_total_mean": 0.7239617155148432, "eval_reward_meter_mean": 0.7804106657321637, "eval_reward_meter_std": 0.3429693900621854, "eval_reward_count_adherence_mean": 0.9621203220807589, "eval_reward_count_adherence_std": 0.06154714152216911, "eval_reward_arabic_clean_mean": 1.0, "eval_reward_arabic_clean_std": 0.0, "eval_reward_repeat_penalty_mean": 0.9574309633328364, "eval_reward_repeat_penalty_std": 0.07397974411455485, "eval_reward_total_composite_mean": 0.7239617155148432, "eval_reward_total_composite_std": 0.3431667788670613, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4133.0}
|
plots/meter_by_meter_run.png
CHANGED
|
Git LFS Details
|
|
Git LFS Details
|
plots/reward_panels_eval_chain.png
CHANGED
|
Git LFS Details
|
|
Git LFS Details
|
plots/reward_panels_eval_run.png
CHANGED
|
Git LFS Details
|
|
Git LFS Details
|
plotter.log
CHANGED
|
@@ -3588,3 +3588,13 @@
|
|
| 3588 |
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/arabic_gate_chain.png
|
| 3589 |
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_run.png
|
| 3590 |
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_chain.png
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3588 |
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/arabic_gate_chain.png
|
| 3589 |
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_run.png
|
| 3590 |
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_chain.png
|
| 3591 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/reward_panels_train_run.png
|
| 3592 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/reward_panels_eval_run.png
|
| 3593 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/reward_panels_train_chain.png
|
| 3594 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/reward_panels_eval_chain.png
|
| 3595 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/kl_run.png
|
| 3596 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/kl_chain.png
|
| 3597 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/arabic_gate_run.png
|
| 3598 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/arabic_gate_chain.png
|
| 3599 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_run.png
|
| 3600 |
+
[plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_chain.png
|
run_summary.json
CHANGED
|
@@ -1,35 +1,35 @@
|
|
| 1 |
{
|
| 2 |
-
"timestamp_utc": "2026-04-
|
| 3 |
-
"mode": "
|
| 4 |
-
"created_at_utc": "2026-04-
|
| 5 |
-
"run_id": "
|
| 6 |
-
"run_dir": "/root/workspace/Shaer/grpo/outputs/
|
| 7 |
-
"chain_id": "
|
| 8 |
-
"root_run_id": "
|
| 9 |
-
"parent_run_id": "",
|
| 10 |
-
"parent_run_dir": "",
|
| 11 |
-
"run_sequence_index":
|
| 12 |
"output_repo": "Shaer-AI/Shaer-adapters-grpo",
|
| 13 |
"resume_decision": {
|
| 14 |
-
"timestamp_utc": "2026-04-
|
| 15 |
-
"resume_mode": "
|
| 16 |
-
"requested_spec": "",
|
| 17 |
-
"result": "
|
| 18 |
-
"reason": "
|
| 19 |
-
"local_resume_path":
|
| 20 |
"remote_repo": null,
|
| 21 |
"remote_prefix": null,
|
| 22 |
-
"compatibility": "
|
| 23 |
-
"config_fingerprint": "
|
| 24 |
},
|
| 25 |
-
"best_model_checkpoint": "/root/workspace/Shaer/grpo/outputs/
|
| 26 |
-
"global_step":
|
| 27 |
"train_metrics": {
|
| 28 |
-
"train_runtime":
|
| 29 |
-
"train_samples_per_second":
|
| 30 |
-
"train_steps_per_second": 0.
|
| 31 |
"total_flos": 0.0,
|
| 32 |
-
"train_loss": 0.
|
| 33 |
},
|
| 34 |
-
"final_adapter_dir": "/root/workspace/Shaer/grpo/outputs/
|
| 35 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"timestamp_utc": "2026-04-12T03:45:42Z",
|
| 3 |
+
"mode": "train",
|
| 4 |
+
"created_at_utc": "2026-04-11T22:36:28Z",
|
| 5 |
+
"run_id": "shaer_grpo_20260411_223409",
|
| 6 |
+
"run_dir": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409",
|
| 7 |
+
"chain_id": "shaer_grpo_20260411_192107",
|
| 8 |
+
"root_run_id": "shaer_grpo_20260411_192107",
|
| 9 |
+
"parent_run_id": "shaer_grpo_20260411_192107",
|
| 10 |
+
"parent_run_dir": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_192107",
|
| 11 |
+
"run_sequence_index": 1,
|
| 12 |
"output_repo": "Shaer-AI/Shaer-adapters-grpo",
|
| 13 |
"resume_decision": {
|
| 14 |
+
"timestamp_utc": "2026-04-11T22:36:28Z",
|
| 15 |
+
"resume_mode": "from_path",
|
| 16 |
+
"requested_spec": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_192107/checkpoint-650",
|
| 17 |
+
"result": "resume",
|
| 18 |
+
"reason": "explicit_local_path",
|
| 19 |
+
"local_resume_path": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_192107/checkpoint-650",
|
| 20 |
"remote_repo": null,
|
| 21 |
"remote_prefix": null,
|
| 22 |
+
"compatibility": "fingerprint_mismatch",
|
| 23 |
+
"config_fingerprint": "dddf85cc86110a84f67b563540177d5e59b5c500695e99fe984dfc39dac36c3f"
|
| 24 |
},
|
| 25 |
+
"best_model_checkpoint": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/checkpoint-3100",
|
| 26 |
+
"global_step": 3300,
|
| 27 |
"train_metrics": {
|
| 28 |
+
"train_runtime": 18489.879,
|
| 29 |
+
"train_samples_per_second": 1.428,
|
| 30 |
+
"train_steps_per_second": 0.178,
|
| 31 |
"total_flos": 0.0,
|
| 32 |
+
"train_loss": 0.0004697396774788627
|
| 33 |
},
|
| 34 |
+
"final_adapter_dir": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/final_adapter"
|
| 35 |
}
|
train.log
CHANGED
|
@@ -2713,3 +2713,4 @@
|
|
| 2713 |
2026-04-12 03:43:36,813 | INFO | train_grpo_train | metrics_logged mode=train step=3300
|
| 2714 |
2026-04-12 03:44:57,274 | INFO | train_grpo_train | metrics_logged mode=eval step=3300
|
| 2715 |
2026-04-12 03:45:00,970 | INFO | train_grpo_train | metrics_logged mode=train step=3300
|
|
|
|
|
|
| 2713 |
2026-04-12 03:43:36,813 | INFO | train_grpo_train | metrics_logged mode=train step=3300
|
| 2714 |
2026-04-12 03:44:57,274 | INFO | train_grpo_train | metrics_logged mode=eval step=3300
|
| 2715 |
2026-04-12 03:45:00,970 | INFO | train_grpo_train | metrics_logged mode=train step=3300
|
| 2716 |
+
2026-04-12 03:46:19,803 | INFO | train_grpo_train | pushing final adapter to hub repo=Shaer-AI/Shaer-adapters-grpo
|
train_stdout.log
CHANGED
|
@@ -10362,3 +10362,1281 @@ The tokenizer has new PAD/BOS/EOS tokens that differ from the model config and g
|
|
| 10362 |
|
| 10363 |
...ots/arabic_gate_chain.png: 100%|ββββββββββ| 98.8kB / 98.8kB
|
| 10364 |
|
| 10365 |
.../meter_by_meter_chain.png: 100%|ββββββββββ| 1.06MB / 1.06MB
|
| 10366 |
|
| 10367 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 756kB / 756kB
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10368 |
..._223409/generations.jsonl: 8%|β | 47.5MB / 614MB [A[A
|
|
|
|
|
|
|
| 10369 |
..._223409/generations.jsonl: 8%|β | 47.5MB / 614MB [A[A
|
|
|
|
|
|
|
| 10370 |
..._223409/generations.jsonl: 15%|ββ | 90.6MB / 614MB [A[A
|
|
|
|
|
|
|
| 10371 |
..._223409/generations.jsonl: 22%|βββ | 136MB / 614MB [A[A
|
|
|
|
|
|
|
| 10372 |
..._223409/generations.jsonl: 29%|βββ | 177MB / 614MB [A[A
|
|
|
|
|
|
|
| 10373 |
..._223409/generations.jsonl: 46%|βββββ | 284MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10374 |
..._223409/generations.jsonl: 52%|ββββββ | 321MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10375 |
..._223409/generations.jsonl: 60%|ββββββ | 366MB / 614MB [A[A
|
|
|
|
|
|
|
| 10376 |
..._223409/generations.jsonl: 67%|βββββββ | 413MB / 614MB [A[A
|
|
|
|
|
|
|
| 10377 |
..._223409/generations.jsonl: 85%|βββββββββ | 519MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10378 |
..._223409/generations.jsonl: 91%|βββββββββ | 560MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10379 |
...23409/generations.parquet: 100%|ββββββββββ| 53.5MB / 53.8MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10380 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 670kB / 673kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10381 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.1kB / 27.2kB [A[A[A[A[A
|
|
|
|
|
|
|
| 10382 |
..._223409/generations.jsonl: 100%|ββββββββββ| 613MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10383 |
...23409/generations.parquet: 100%|ββββββββββ| 53.5MB / 53.8MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10384 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 670kB / 673kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10385 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.1kB / 27.2kB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
| 10386 |
..._223409/generations.jsonl: 100%|ββββββββββ| 613MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10387 |
...23409/generations.parquet: 100%|ββββββββββ| 53.5MB / 53.8MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10388 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 670kB / 673kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10389 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.1kB / 27.2kB [A[A[A[A[A
|
|
|
|
|
|
|
| 10390 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10391 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10392 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10393 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
| 10394 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10395 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10396 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10397 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB [A[A[A[A[A
|
|
|
|
|
|
|
| 10398 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10399 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10400 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10401 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB [A[A[A[A[A
|
|
|
|
|
|
|
| 10402 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10403 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10404 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10405 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB [A[A[A[A[A
|
|
|
|
|
|
|
| 10406 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB
|
|
|
|
| 10407 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB
|
|
|
|
| 10408 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB
|
|
|
|
| 10409 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10410 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB [A[A
|
|
|
|
|
|
|
|
|
|
| 10411 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB [A[A[A
|
|
|
|
|
|
|
| 10412 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB [A[A
|
|
|
|
|
|
|
|
|
|
| 10413 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB [A[A[A
|
|
|
|
|
|
|
|
|
|
| 10414 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB [A[A
|
|
|
|
|
|
|
|
|
|
| 10415 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB [A[A[A
|
|
|
|
|
|
|
| 10416 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB [A[A
|
|
|
|
|
|
|
|
|
|
| 10417 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB [A[A[A
|
|
|
|
|
|
|
| 10418 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB
|
|
|
|
| 10419 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10420 |
..._223409/training_args.bin: 100%|ββββββββββ| 7.50kB / 7.50kB [A[A
|
|
|
|
|
|
|
|
|
|
| 10421 |
...plots/arabic_gate_run.png: 100%|ββββββββββ| 81.1kB / 81.1kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10422 |
...ots/arabic_gate_chain.png: 100%|ββββββββββ| 98.8kB / 98.8kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10423 |
...l_adapter/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10424 |
...adapter/training_args.bin: 100%|ββββββββββ| 7.50kB / 7.50kB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10425 |
...1_223409/plots/kl_run.png: 100%|ββββββββββ| 24.6kB / 24.6kB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10426 |
...223409/plots/kl_chain.png: 100%|ββββββββββ| 33.4kB / 33.4kB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10427 |
.../meter_by_meter_chain.png: 100%|ββββββββββ| 1.06MB / 1.06MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10428 |
...rd_panels_train_chain.png: 100%|ββββββββββ| 350kB / 350kB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10429 |
...adapter_model.safetensors: 10%|β | 64.0MB / 640MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10430 |
..._223409/training_args.bin: 100%|ββββββββββ| 7.50kB / 7.50kB [A[A
|
|
|
|
|
|
|
|
|
|
| 10431 |
...plots/arabic_gate_run.png: 100%|ββββββββββ| 81.1kB / 81.1kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10432 |
...ots/arabic_gate_chain.png: 100%|ββββββββββ| 98.8kB / 98.8kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10433 |
...l_adapter/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10434 |
...adapter/training_args.bin: 100%|ββββββββββ| 7.50kB / 7.50kB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10435 |
...1_223409/plots/kl_run.png: 100%|ββββββββββ| 24.6kB / 24.6kB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10436 |
...223409/plots/kl_chain.png: 100%|ββββββββββ| 33.4kB / 33.4kB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10437 |
.../meter_by_meter_chain.png: 100%|ββββββββββ| 1.06MB / 1.06MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10438 |
...rd_panels_train_chain.png: 100%|ββββββββββ| 350kB / 350kB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10439 |
[+ 8 files] : 18%|ββ | 440MB / 2.42GB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10440 |
...rd_panels_train_chain.png: 100%|ββββββββββ| 350kB / 350kB [A[A
|
|
|
|
|
|
|
|
|
|
| 10441 |
...adapter_model.safetensors: 20%|ββ | 128MB / 640MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10442 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10443 |
...adapter_model.safetensors: 19%|ββ | 120MB / 640MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10444 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10445 |
...409/all_generations.jsonl: 20%|ββ | 120MB / 614MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10446 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10447 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10448 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10449 |
[+ 1 files] : 100%|ββββββββββ| 107MB / 107MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10450 |
...adapter_model.safetensors: 28%|βββ | 176MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10451 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10452 |
...adapter_model.safetensors: 28%|βββ | 176MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10453 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10454 |
...409/all_generations.jsonl: 29%|βββ | 176MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10455 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10456 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10457 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10458 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10459 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10460 |
...adapter_model.safetensors: 38%|ββββ | 240MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10461 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10462 |
...adapter_model.safetensors: 38%|ββββ | 240MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10463 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10464 |
...409/all_generations.jsonl: 38%|ββββ | 232MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10465 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10466 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10467 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10468 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10469 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10470 |
...adapter_model.safetensors: 46%|βββββ | 296MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10471 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10472 |
...adapter_model.safetensors: 46%|βββββ | 296MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10473 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10474 |
...409/all_generations.jsonl: 47%|βββββ | 288MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10475 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10476 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10477 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10478 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10479 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10480 |
...adapter_model.safetensors: 55%|ββββββ | 352MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10481 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10482 |
...adapter_model.safetensors: 55%|ββββββ | 352MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10483 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10484 |
...409/all_generations.jsonl: 56%|ββββββ | 344MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10485 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10486 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10487 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10488 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10489 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10490 |
...adapter_model.safetensors: 64%|βββββββ | 408MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10491 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10492 |
...adapter_model.safetensors: 64%|βββββββ | 408MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10493 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10494 |
...409/all_generations.jsonl: 65%|βββββββ | 400MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10495 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10496 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10497 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10498 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10499 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10500 |
...adapter_model.safetensors: 73%|ββββββββ | 464MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10501 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10502 |
...adapter_model.safetensors: 74%|ββββββββ | 472MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10503 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10504 |
...409/all_generations.jsonl: 74%|ββββββββ | 456MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10505 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10506 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10507 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10508 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10509 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10510 |
...adapter_model.safetensors: 83%|βββββββββ | 528MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10511 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10512 |
...adapter_model.safetensors: 83%|βββββββββ | 528MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10513 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10514 |
...409/all_generations.jsonl: 85%|βββββββββ | 520MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10515 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10516 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10517 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10518 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10519 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10520 |
...adapter_model.safetensors: 91%|ββββββββββ| 584MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10521 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10522 |
...adapter_model.safetensors: 91%|ββββββββββ| 584MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10523 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10524 |
...409/all_generations.jsonl: 94%|ββββββββββ| 576MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10525 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10526 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10527 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10528 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10529 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10530 |
...adapter_model.safetensors: 100%|ββββββββββ| 640MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10531 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10532 |
...adapter_model.safetensors: 100%|ββββββββββ| 640MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10533 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10534 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10535 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10536 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10537 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10538 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10539 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10540 |
...adapter_model.safetensors: 100%|ββββββββββ| 640MB / 640MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10541 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10542 |
...adapter_model.safetensors: 100%|ββββββββββ| 640MB / 640MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10543 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10544 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10545 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10546 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10547 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10548 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10549 |
[+ 3 files] : 100%|ββββββββββ| 2.61MB / 2.61MB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
| 10550 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10551 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10552 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10553 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10554 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10555 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10556 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10557 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10558 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10559 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10560 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10561 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10562 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10563 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10564 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10565 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10566 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10567 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10568 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10569 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10570 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10571 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10572 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10573 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10574 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10575 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10576 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10577 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10578 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10579 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10580 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A
|
|
|
|
|
|
|
|
|
|
| 10581 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10582 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10583 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10584 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10585 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10586 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10587 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB [A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10588 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB [A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10589 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB [A[A[A[A[A[A[A[A[A[A[A
|
|
|
|
|
|
|
| 10590 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
|
|
|
| 10591 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB
|
|
|
|
| 10592 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
|
|
|
| 10593 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
|
|
|
| 10594 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
|
|
|
| 10595 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
|
|
|
| 10596 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB
|
|
|
|
| 10597 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB
|
|
|
|
| 10598 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB
|
|
|
|
| 10599 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB
|
|
|
|
| 10362 |
|
| 10363 |
...ots/arabic_gate_chain.png: 100%|ββββββββββ| 98.8kB / 98.8kB
|
| 10364 |
|
| 10365 |
.../meter_by_meter_chain.png: 100%|ββββββββββ| 1.06MB / 1.06MB
|
| 10366 |
|
| 10367 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 756kB / 756kB
|
| 10368 |
+
No files have been modified since last commit. Skipping to prevent empty commit.
|
| 10369 |
+
|
| 10370 |
+
|
| 10371 |
+
|
| 10372 |
+
|
| 10373 |
..._223409/generations.jsonl: 8%|β | 47.5MB / 614MB [A[A
|
| 10374 |
+
|
| 10375 |
+
|
| 10376 |
..._223409/generations.jsonl: 8%|β | 47.5MB / 614MB [A[A
|
| 10377 |
+
|
| 10378 |
+
|
| 10379 |
..._223409/generations.jsonl: 15%|ββ | 90.6MB / 614MB [A[A
|
| 10380 |
+
|
| 10381 |
+
|
| 10382 |
..._223409/generations.jsonl: 22%|βββ | 136MB / 614MB [A[A
|
| 10383 |
+
|
| 10384 |
+
|
| 10385 |
..._223409/generations.jsonl: 29%|βββ | 177MB / 614MB [A[A
|
| 10386 |
+
|
| 10387 |
+
|
| 10388 |
..._223409/generations.jsonl: 46%|βββββ | 284MB / 614MB [A[A
|
| 10389 |
+
|
| 10390 |
+
|
| 10391 |
+
|
| 10392 |
..._223409/generations.jsonl: 52%|ββββββ | 321MB / 614MB [A[A
|
| 10393 |
+
|
| 10394 |
+
|
| 10395 |
+
|
| 10396 |
..._223409/generations.jsonl: 60%|ββββββ | 366MB / 614MB [A[A
|
| 10397 |
+
|
| 10398 |
+
|
| 10399 |
..._223409/generations.jsonl: 67%|βββββββ | 413MB / 614MB [A[A
|
| 10400 |
+
|
| 10401 |
+
|
| 10402 |
..._223409/generations.jsonl: 85%|βββββββββ | 519MB / 614MB [A[A
|
| 10403 |
+
|
| 10404 |
+
|
| 10405 |
+
|
| 10406 |
..._223409/generations.jsonl: 91%|βββββββββ | 560MB / 614MB [A[A
|
| 10407 |
+
|
| 10408 |
+
|
| 10409 |
+
|
| 10410 |
+
|
| 10411 |
...23409/generations.parquet: 100%|ββββββββββ| 53.5MB / 53.8MB [A[A[A
|
| 10412 |
+
|
| 10413 |
+
|
| 10414 |
+
|
| 10415 |
+
|
| 10416 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 670kB / 673kB [A[A[A[A
|
| 10417 |
+
|
| 10418 |
+
|
| 10419 |
+
|
| 10420 |
+
|
| 10421 |
+
|
| 10422 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.1kB / 27.2kB [A[A[A[A[A
|
| 10423 |
+
|
| 10424 |
+
|
| 10425 |
..._223409/generations.jsonl: 100%|ββββββββββ| 613MB / 614MB [A[A
|
| 10426 |
+
|
| 10427 |
+
|
| 10428 |
+
|
| 10429 |
...23409/generations.parquet: 100%|ββββββββββ| 53.5MB / 53.8MB [A[A[A
|
| 10430 |
+
|
| 10431 |
+
|
| 10432 |
+
|
| 10433 |
+
|
| 10434 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 670kB / 673kB [A[A[A[A
|
| 10435 |
+
|
| 10436 |
+
|
| 10437 |
+
|
| 10438 |
+
|
| 10439 |
+
|
| 10440 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.1kB / 27.2kB [A[A[A[A[A
|
| 10441 |
+
|
| 10442 |
+
|
| 10443 |
+
|
| 10444 |
..._223409/generations.jsonl: 100%|ββββββββββ| 613MB / 614MB [A[A
|
| 10445 |
+
|
| 10446 |
+
|
| 10447 |
+
|
| 10448 |
...23409/generations.parquet: 100%|ββββββββββ| 53.5MB / 53.8MB [A[A[A
|
| 10449 |
+
|
| 10450 |
+
|
| 10451 |
+
|
| 10452 |
+
|
| 10453 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 670kB / 673kB [A[A[A[A
|
| 10454 |
+
|
| 10455 |
+
|
| 10456 |
+
|
| 10457 |
+
|
| 10458 |
+
|
| 10459 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.1kB / 27.2kB [A[A[A[A[A
|
| 10460 |
+
|
| 10461 |
+
|
| 10462 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A
|
| 10463 |
+
|
| 10464 |
+
|
| 10465 |
+
|
| 10466 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB [A[A[A
|
| 10467 |
+
|
| 10468 |
+
|
| 10469 |
+
|
| 10470 |
+
|
| 10471 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB [A[A[A[A
|
| 10472 |
+
|
| 10473 |
+
|
| 10474 |
+
|
| 10475 |
+
|
| 10476 |
+
|
| 10477 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB [A[A[A[A[A
|
| 10478 |
+
|
| 10479 |
+
|
| 10480 |
+
|
| 10481 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A
|
| 10482 |
+
|
| 10483 |
+
|
| 10484 |
+
|
| 10485 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB [A[A[A
|
| 10486 |
+
|
| 10487 |
+
|
| 10488 |
+
|
| 10489 |
+
|
| 10490 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB [A[A[A[A
|
| 10491 |
+
|
| 10492 |
+
|
| 10493 |
+
|
| 10494 |
+
|
| 10495 |
+
|
| 10496 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB [A[A[A[A[A
|
| 10497 |
+
|
| 10498 |
+
|
| 10499 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A
|
| 10500 |
+
|
| 10501 |
+
|
| 10502 |
+
|
| 10503 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB [A[A[A
|
| 10504 |
+
|
| 10505 |
+
|
| 10506 |
+
|
| 10507 |
+
|
| 10508 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB [A[A[A[A
|
| 10509 |
+
|
| 10510 |
+
|
| 10511 |
+
|
| 10512 |
+
|
| 10513 |
+
|
| 10514 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB [A[A[A[A[A
|
| 10515 |
+
|
| 10516 |
+
|
| 10517 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A
|
| 10518 |
+
|
| 10519 |
+
|
| 10520 |
+
|
| 10521 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB [A[A[A
|
| 10522 |
+
|
| 10523 |
+
|
| 10524 |
+
|
| 10525 |
+
|
| 10526 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB [A[A[A[A
|
| 10527 |
+
|
| 10528 |
+
|
| 10529 |
+
|
| 10530 |
+
|
| 10531 |
+
|
| 10532 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB [A[A[A[A[A
|
| 10533 |
+
|
| 10534 |
+
|
| 10535 |
..._223409/generations.jsonl: 100%|ββββββββββ| 614MB / 614MB
|
| 10536 |
+
|
| 10537 |
...23409/generations.parquet: 100%|ββββββββββ| 53.8MB / 53.8MB
|
| 10538 |
+
|
| 10539 |
...11_223409/metrics.parquet: 100%|ββββββββββ| 673kB / 673kB
|
| 10540 |
+
|
| 10541 |
...409/reward_curves_run.png: 100%|ββββββββββ| 27.2kB / 27.2kB
|
| 10542 |
+
|
| 10543 |
+
|
| 10544 |
+
|
| 10545 |
+
|
| 10546 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB [A[A
|
| 10547 |
+
|
| 10548 |
+
|
| 10549 |
+
|
| 10550 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB [A[A[A
|
| 10551 |
+
|
| 10552 |
+
|
| 10553 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB [A[A
|
| 10554 |
+
|
| 10555 |
+
|
| 10556 |
+
|
| 10557 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB [A[A[A
|
| 10558 |
+
|
| 10559 |
+
|
| 10560 |
+
|
| 10561 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB [A[A
|
| 10562 |
+
|
| 10563 |
+
|
| 10564 |
+
|
| 10565 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB [A[A[A
|
| 10566 |
+
|
| 10567 |
+
|
| 10568 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB [A[A
|
| 10569 |
+
|
| 10570 |
+
|
| 10571 |
+
|
| 10572 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB [A[A[A
|
| 10573 |
+
|
| 10574 |
+
|
| 10575 |
...107/chain_metrics.parquet: 100%|ββββββββββ| 982kB / 982kB
|
| 10576 |
+
|
| 10577 |
...7/chain_reward_curves.png: 100%|ββββββββββ| 27.8kB / 27.8kB
|
| 10578 |
+
2026-04-12 03:46:19,803 | INFO | train_grpo_train | pushing final adapter to hub repo=Shaer-AI/Shaer-adapters-grpo
|
| 10579 |
+
|
| 10580 |
+
|
| 10581 |
+
|
| 10582 |
+
|
| 10583 |
..._223409/training_args.bin: 100%|ββββββββββ| 7.50kB / 7.50kB [A[A
|
| 10584 |
+
|
| 10585 |
+
|
| 10586 |
+
|
| 10587 |
...plots/arabic_gate_run.png: 100%|ββββββββββ| 81.1kB / 81.1kB [A[A[A
|
| 10588 |
+
|
| 10589 |
+
|
| 10590 |
+
|
| 10591 |
+
|
| 10592 |
...ots/arabic_gate_chain.png: 100%|ββββββββββ| 98.8kB / 98.8kB [A[A[A[A
|
| 10593 |
+
|
| 10594 |
+
|
| 10595 |
+
|
| 10596 |
+
|
| 10597 |
+
|
| 10598 |
...l_adapter/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A
|
| 10599 |
+
|
| 10600 |
+
|
| 10601 |
+
|
| 10602 |
+
|
| 10603 |
+
|
| 10604 |
+
|
| 10605 |
...adapter/training_args.bin: 100%|ββββββββββ| 7.50kB / 7.50kB [A[A[A[A[A[A
|
| 10606 |
+
|
| 10607 |
+
|
| 10608 |
+
|
| 10609 |
+
|
| 10610 |
+
|
| 10611 |
+
|
| 10612 |
+
|
| 10613 |
...1_223409/plots/kl_run.png: 100%|ββββββββββ| 24.6kB / 24.6kB [A[A[A[A[A[A[A
|
| 10614 |
+
|
| 10615 |
+
|
| 10616 |
+
|
| 10617 |
+
|
| 10618 |
+
|
| 10619 |
+
|
| 10620 |
+
|
| 10621 |
+
|
| 10622 |
...223409/plots/kl_chain.png: 100%|ββββββββββ| 33.4kB / 33.4kB [A[A[A[A[A[A[A[A
|
| 10623 |
+
|
| 10624 |
+
|
| 10625 |
+
|
| 10626 |
+
|
| 10627 |
+
|
| 10628 |
+
|
| 10629 |
+
|
| 10630 |
+
|
| 10631 |
+
|
| 10632 |
.../meter_by_meter_chain.png: 100%|ββββββββββ| 1.06MB / 1.06MB [A[A[A[A[A[A[A[A[A
|
| 10633 |
+
|
| 10634 |
+
|
| 10635 |
+
|
| 10636 |
+
|
| 10637 |
+
|
| 10638 |
+
|
| 10639 |
+
|
| 10640 |
+
|
| 10641 |
+
|
| 10642 |
+
|
| 10643 |
...rd_panels_train_chain.png: 100%|ββββββββββ| 350kB / 350kB [A[A[A[A[A[A[A[A[A[A
|
| 10644 |
+
|
| 10645 |
+
|
| 10646 |
+
|
| 10647 |
+
|
| 10648 |
+
|
| 10649 |
+
|
| 10650 |
+
|
| 10651 |
+
|
| 10652 |
+
|
| 10653 |
+
|
| 10654 |
+
|
| 10655 |
...adapter_model.safetensors: 10%|β | 64.0MB / 640MB [A[A[A[A[A[A[A[A[A[A[A
|
| 10656 |
+
|
| 10657 |
+
|
| 10658 |
..._223409/training_args.bin: 100%|ββββββββββ| 7.50kB / 7.50kB [A[A
|
| 10659 |
+
|
| 10660 |
+
|
| 10661 |
+
|
| 10662 |
...plots/arabic_gate_run.png: 100%|ββββββββββ| 81.1kB / 81.1kB [A[A[A
|
| 10663 |
+
|
| 10664 |
+
|
| 10665 |
+
|
| 10666 |
+
|
| 10667 |
...ots/arabic_gate_chain.png: 100%|ββββββββββ| 98.8kB / 98.8kB [A[A[A[A
|
| 10668 |
+
|
| 10669 |
+
|
| 10670 |
+
|
| 10671 |
+
|
| 10672 |
+
|
| 10673 |
...l_adapter/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A
|
| 10674 |
+
|
| 10675 |
+
|
| 10676 |
+
|
| 10677 |
+
|
| 10678 |
+
|
| 10679 |
+
|
| 10680 |
...adapter/training_args.bin: 100%|ββββββββββ| 7.50kB / 7.50kB [A[A[A[A[A[A
|
| 10681 |
+
|
| 10682 |
+
|
| 10683 |
+
|
| 10684 |
+
|
| 10685 |
+
|
| 10686 |
+
|
| 10687 |
+
|
| 10688 |
...1_223409/plots/kl_run.png: 100%|ββββββββββ| 24.6kB / 24.6kB [A[A[A[A[A[A[A
|
| 10689 |
+
|
| 10690 |
+
|
| 10691 |
+
|
| 10692 |
+
|
| 10693 |
+
|
| 10694 |
+
|
| 10695 |
+
|
| 10696 |
+
|
| 10697 |
...223409/plots/kl_chain.png: 100%|ββββββββββ| 33.4kB / 33.4kB [A[A[A[A[A[A[A[A
|
| 10698 |
+
|
| 10699 |
+
|
| 10700 |
+
|
| 10701 |
+
|
| 10702 |
+
|
| 10703 |
+
|
| 10704 |
+
|
| 10705 |
+
|
| 10706 |
+
|
| 10707 |
.../meter_by_meter_chain.png: 100%|ββββββββββ| 1.06MB / 1.06MB [A[A[A[A[A[A[A[A[A
|
| 10708 |
+
|
| 10709 |
+
|
| 10710 |
+
|
| 10711 |
+
|
| 10712 |
+
|
| 10713 |
+
|
| 10714 |
+
|
| 10715 |
+
|
| 10716 |
+
|
| 10717 |
+
|
| 10718 |
...rd_panels_train_chain.png: 100%|ββββββββββ| 350kB / 350kB [A[A[A[A[A[A[A[A[A[A
|
| 10719 |
+
|
| 10720 |
+
|
| 10721 |
+
|
| 10722 |
+
|
| 10723 |
+
|
| 10724 |
+
|
| 10725 |
+
|
| 10726 |
+
|
| 10727 |
+
|
| 10728 |
+
|
| 10729 |
+
|
| 10730 |
[+ 8 files] : 18%|ββ | 440MB / 2.42GB [A[A[A[A[A[A[A[A[A[A[A
|
| 10731 |
+
|
| 10732 |
+
|
| 10733 |
...rd_panels_train_chain.png: 100%|ββββββββββ| 350kB / 350kB [A[A
|
| 10734 |
+
|
| 10735 |
+
|
| 10736 |
+
|
| 10737 |
...adapter_model.safetensors: 20%|ββ | 128MB / 640MB [A[A[A
|
| 10738 |
+
|
| 10739 |
+
|
| 10740 |
+
|
| 10741 |
+
|
| 10742 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A[A
|
| 10743 |
+
|
| 10744 |
+
|
| 10745 |
+
|
| 10746 |
+
|
| 10747 |
+
|
| 10748 |
...adapter_model.safetensors: 19%|ββ | 120MB / 640MB [A[A[A[A[A
|
| 10749 |
+
|
| 10750 |
+
|
| 10751 |
+
|
| 10752 |
+
|
| 10753 |
+
|
| 10754 |
+
|
| 10755 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
| 10756 |
+
|
| 10757 |
+
|
| 10758 |
+
|
| 10759 |
+
|
| 10760 |
+
|
| 10761 |
+
|
| 10762 |
+
|
| 10763 |
...409/all_generations.jsonl: 20%|ββ | 120MB / 614MB [A[A[A[A[A[A[A
|
| 10764 |
+
|
| 10765 |
+
|
| 10766 |
+
|
| 10767 |
+
|
| 10768 |
+
|
| 10769 |
+
|
| 10770 |
+
|
| 10771 |
+
|
| 10772 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 10773 |
+
|
| 10774 |
+
|
| 10775 |
+
|
| 10776 |
+
|
| 10777 |
+
|
| 10778 |
+
|
| 10779 |
+
|
| 10780 |
+
|
| 10781 |
+
|
| 10782 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 10783 |
+
|
| 10784 |
+
|
| 10785 |
+
|
| 10786 |
+
|
| 10787 |
+
|
| 10788 |
+
|
| 10789 |
+
|
| 10790 |
+
|
| 10791 |
+
|
| 10792 |
+
|
| 10793 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 10794 |
+
|
| 10795 |
+
|
| 10796 |
+
|
| 10797 |
+
|
| 10798 |
+
|
| 10799 |
+
|
| 10800 |
+
|
| 10801 |
+
|
| 10802 |
+
|
| 10803 |
+
|
| 10804 |
+
|
| 10805 |
[+ 1 files] : 100%|ββββββββββ| 107MB / 107MB [A[A[A[A[A[A[A[A[A[A[A
|
| 10806 |
+
|
| 10807 |
+
|
| 10808 |
...adapter_model.safetensors: 28%|βββ | 176MB / 640MB [A[A
|
| 10809 |
+
|
| 10810 |
+
|
| 10811 |
+
|
| 10812 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 10813 |
+
|
| 10814 |
+
|
| 10815 |
+
|
| 10816 |
+
|
| 10817 |
...adapter_model.safetensors: 28%|βββ | 176MB / 640MB [A[A[A[A
|
| 10818 |
+
|
| 10819 |
+
|
| 10820 |
+
|
| 10821 |
+
|
| 10822 |
+
|
| 10823 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 10824 |
+
|
| 10825 |
+
|
| 10826 |
+
|
| 10827 |
+
|
| 10828 |
+
|
| 10829 |
+
|
| 10830 |
...409/all_generations.jsonl: 29%|βββ | 176MB / 614MB [A[A[A[A[A[A
|
| 10831 |
+
|
| 10832 |
+
|
| 10833 |
+
|
| 10834 |
+
|
| 10835 |
+
|
| 10836 |
+
|
| 10837 |
+
|
| 10838 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 10839 |
+
|
| 10840 |
+
|
| 10841 |
+
|
| 10842 |
+
|
| 10843 |
+
|
| 10844 |
+
|
| 10845 |
+
|
| 10846 |
+
|
| 10847 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 10848 |
+
|
| 10849 |
+
|
| 10850 |
+
|
| 10851 |
+
|
| 10852 |
+
|
| 10853 |
+
|
| 10854 |
+
|
| 10855 |
+
|
| 10856 |
+
|
| 10857 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 10858 |
+
|
| 10859 |
+
|
| 10860 |
+
|
| 10861 |
+
|
| 10862 |
+
|
| 10863 |
+
|
| 10864 |
+
|
| 10865 |
+
|
| 10866 |
+
|
| 10867 |
+
|
| 10868 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 10869 |
+
|
| 10870 |
+
|
| 10871 |
+
|
| 10872 |
+
|
| 10873 |
+
|
| 10874 |
+
|
| 10875 |
+
|
| 10876 |
+
|
| 10877 |
+
|
| 10878 |
+
|
| 10879 |
+
|
| 10880 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 10881 |
+
|
| 10882 |
+
|
| 10883 |
...adapter_model.safetensors: 38%|ββββ | 240MB / 640MB [A[A
|
| 10884 |
+
|
| 10885 |
+
|
| 10886 |
+
|
| 10887 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 10888 |
+
|
| 10889 |
+
|
| 10890 |
+
|
| 10891 |
+
|
| 10892 |
...adapter_model.safetensors: 38%|ββββ | 240MB / 640MB [A[A[A[A
|
| 10893 |
+
|
| 10894 |
+
|
| 10895 |
+
|
| 10896 |
+
|
| 10897 |
+
|
| 10898 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 10899 |
+
|
| 10900 |
+
|
| 10901 |
+
|
| 10902 |
+
|
| 10903 |
+
|
| 10904 |
+
|
| 10905 |
...409/all_generations.jsonl: 38%|ββββ | 232MB / 614MB [A[A[A[A[A[A
|
| 10906 |
+
|
| 10907 |
+
|
| 10908 |
+
|
| 10909 |
+
|
| 10910 |
+
|
| 10911 |
+
|
| 10912 |
+
|
| 10913 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 10914 |
+
|
| 10915 |
+
|
| 10916 |
+
|
| 10917 |
+
|
| 10918 |
+
|
| 10919 |
+
|
| 10920 |
+
|
| 10921 |
+
|
| 10922 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 10923 |
+
|
| 10924 |
+
|
| 10925 |
+
|
| 10926 |
+
|
| 10927 |
+
|
| 10928 |
+
|
| 10929 |
+
|
| 10930 |
+
|
| 10931 |
+
|
| 10932 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 10933 |
+
|
| 10934 |
+
|
| 10935 |
+
|
| 10936 |
+
|
| 10937 |
+
|
| 10938 |
+
|
| 10939 |
+
|
| 10940 |
+
|
| 10941 |
+
|
| 10942 |
+
|
| 10943 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 10944 |
+
|
| 10945 |
+
|
| 10946 |
+
|
| 10947 |
+
|
| 10948 |
+
|
| 10949 |
+
|
| 10950 |
+
|
| 10951 |
+
|
| 10952 |
+
|
| 10953 |
+
|
| 10954 |
+
|
| 10955 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 10956 |
+
|
| 10957 |
+
|
| 10958 |
...adapter_model.safetensors: 46%|βββββ | 296MB / 640MB [A[A
|
| 10959 |
+
|
| 10960 |
+
|
| 10961 |
+
|
| 10962 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 10963 |
+
|
| 10964 |
+
|
| 10965 |
+
|
| 10966 |
+
|
| 10967 |
...adapter_model.safetensors: 46%|βββββ | 296MB / 640MB [A[A[A[A
|
| 10968 |
+
|
| 10969 |
+
|
| 10970 |
+
|
| 10971 |
+
|
| 10972 |
+
|
| 10973 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 10974 |
+
|
| 10975 |
+
|
| 10976 |
+
|
| 10977 |
+
|
| 10978 |
+
|
| 10979 |
+
|
| 10980 |
...409/all_generations.jsonl: 47%|βββββ | 288MB / 614MB [A[A[A[A[A[A
|
| 10981 |
+
|
| 10982 |
+
|
| 10983 |
+
|
| 10984 |
+
|
| 10985 |
+
|
| 10986 |
+
|
| 10987 |
+
|
| 10988 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 10989 |
+
|
| 10990 |
+
|
| 10991 |
+
|
| 10992 |
+
|
| 10993 |
+
|
| 10994 |
+
|
| 10995 |
+
|
| 10996 |
+
|
| 10997 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 10998 |
+
|
| 10999 |
+
|
| 11000 |
+
|
| 11001 |
+
|
| 11002 |
+
|
| 11003 |
+
|
| 11004 |
+
|
| 11005 |
+
|
| 11006 |
+
|
| 11007 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 11008 |
+
|
| 11009 |
+
|
| 11010 |
+
|
| 11011 |
+
|
| 11012 |
+
|
| 11013 |
+
|
| 11014 |
+
|
| 11015 |
+
|
| 11016 |
+
|
| 11017 |
+
|
| 11018 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 11019 |
+
|
| 11020 |
+
|
| 11021 |
+
|
| 11022 |
+
|
| 11023 |
+
|
| 11024 |
+
|
| 11025 |
+
|
| 11026 |
+
|
| 11027 |
+
|
| 11028 |
+
|
| 11029 |
+
|
| 11030 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 11031 |
+
|
| 11032 |
+
|
| 11033 |
...adapter_model.safetensors: 55%|ββββββ | 352MB / 640MB [A[A
|
| 11034 |
+
|
| 11035 |
+
|
| 11036 |
+
|
| 11037 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 11038 |
+
|
| 11039 |
+
|
| 11040 |
+
|
| 11041 |
+
|
| 11042 |
...adapter_model.safetensors: 55%|ββββββ | 352MB / 640MB [A[A[A[A
|
| 11043 |
+
|
| 11044 |
+
|
| 11045 |
+
|
| 11046 |
+
|
| 11047 |
+
|
| 11048 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11049 |
+
|
| 11050 |
+
|
| 11051 |
+
|
| 11052 |
+
|
| 11053 |
+
|
| 11054 |
+
|
| 11055 |
...409/all_generations.jsonl: 56%|ββββββ | 344MB / 614MB [A[A[A[A[A[A
|
| 11056 |
+
|
| 11057 |
+
|
| 11058 |
+
|
| 11059 |
+
|
| 11060 |
+
|
| 11061 |
+
|
| 11062 |
+
|
| 11063 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11064 |
+
|
| 11065 |
+
|
| 11066 |
+
|
| 11067 |
+
|
| 11068 |
+
|
| 11069 |
+
|
| 11070 |
+
|
| 11071 |
+
|
| 11072 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 11073 |
+
|
| 11074 |
+
|
| 11075 |
+
|
| 11076 |
+
|
| 11077 |
+
|
| 11078 |
+
|
| 11079 |
+
|
| 11080 |
+
|
| 11081 |
+
|
| 11082 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 11083 |
+
|
| 11084 |
+
|
| 11085 |
+
|
| 11086 |
+
|
| 11087 |
+
|
| 11088 |
+
|
| 11089 |
+
|
| 11090 |
+
|
| 11091 |
+
|
| 11092 |
+
|
| 11093 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 11094 |
+
|
| 11095 |
+
|
| 11096 |
+
|
| 11097 |
+
|
| 11098 |
+
|
| 11099 |
+
|
| 11100 |
+
|
| 11101 |
+
|
| 11102 |
+
|
| 11103 |
+
|
| 11104 |
+
|
| 11105 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 11106 |
+
|
| 11107 |
+
|
| 11108 |
...adapter_model.safetensors: 64%|βββββββ | 408MB / 640MB [A[A
|
| 11109 |
+
|
| 11110 |
+
|
| 11111 |
+
|
| 11112 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 11113 |
+
|
| 11114 |
+
|
| 11115 |
+
|
| 11116 |
+
|
| 11117 |
...adapter_model.safetensors: 64%|βββββββ | 408MB / 640MB [A[A[A[A
|
| 11118 |
+
|
| 11119 |
+
|
| 11120 |
+
|
| 11121 |
+
|
| 11122 |
+
|
| 11123 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11124 |
+
|
| 11125 |
+
|
| 11126 |
+
|
| 11127 |
+
|
| 11128 |
+
|
| 11129 |
+
|
| 11130 |
...409/all_generations.jsonl: 65%|βββββββ | 400MB / 614MB [A[A[A[A[A[A
|
| 11131 |
+
|
| 11132 |
+
|
| 11133 |
+
|
| 11134 |
+
|
| 11135 |
+
|
| 11136 |
+
|
| 11137 |
+
|
| 11138 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11139 |
+
|
| 11140 |
+
|
| 11141 |
+
|
| 11142 |
+
|
| 11143 |
+
|
| 11144 |
+
|
| 11145 |
+
|
| 11146 |
+
|
| 11147 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 11148 |
+
|
| 11149 |
+
|
| 11150 |
+
|
| 11151 |
+
|
| 11152 |
+
|
| 11153 |
+
|
| 11154 |
+
|
| 11155 |
+
|
| 11156 |
+
|
| 11157 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 11158 |
+
|
| 11159 |
+
|
| 11160 |
+
|
| 11161 |
+
|
| 11162 |
+
|
| 11163 |
+
|
| 11164 |
+
|
| 11165 |
+
|
| 11166 |
+
|
| 11167 |
+
|
| 11168 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 11169 |
+
|
| 11170 |
+
|
| 11171 |
+
|
| 11172 |
+
|
| 11173 |
+
|
| 11174 |
+
|
| 11175 |
+
|
| 11176 |
+
|
| 11177 |
+
|
| 11178 |
+
|
| 11179 |
+
|
| 11180 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 11181 |
+
|
| 11182 |
+
|
| 11183 |
...adapter_model.safetensors: 73%|ββββββββ | 464MB / 640MB [A[A
|
| 11184 |
+
|
| 11185 |
+
|
| 11186 |
+
|
| 11187 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 11188 |
+
|
| 11189 |
+
|
| 11190 |
+
|
| 11191 |
+
|
| 11192 |
...adapter_model.safetensors: 74%|ββββββββ | 472MB / 640MB [A[A[A[A
|
| 11193 |
+
|
| 11194 |
+
|
| 11195 |
+
|
| 11196 |
+
|
| 11197 |
+
|
| 11198 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11199 |
+
|
| 11200 |
+
|
| 11201 |
+
|
| 11202 |
+
|
| 11203 |
+
|
| 11204 |
+
|
| 11205 |
...409/all_generations.jsonl: 74%|ββββββββ | 456MB / 614MB [A[A[A[A[A[A
|
| 11206 |
+
|
| 11207 |
+
|
| 11208 |
+
|
| 11209 |
+
|
| 11210 |
+
|
| 11211 |
+
|
| 11212 |
+
|
| 11213 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11214 |
+
|
| 11215 |
+
|
| 11216 |
+
|
| 11217 |
+
|
| 11218 |
+
|
| 11219 |
+
|
| 11220 |
+
|
| 11221 |
+
|
| 11222 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 11223 |
+
|
| 11224 |
+
|
| 11225 |
+
|
| 11226 |
+
|
| 11227 |
+
|
| 11228 |
+
|
| 11229 |
+
|
| 11230 |
+
|
| 11231 |
+
|
| 11232 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 11233 |
+
|
| 11234 |
+
|
| 11235 |
+
|
| 11236 |
+
|
| 11237 |
+
|
| 11238 |
+
|
| 11239 |
+
|
| 11240 |
+
|
| 11241 |
+
|
| 11242 |
+
|
| 11243 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 11244 |
+
|
| 11245 |
+
|
| 11246 |
+
|
| 11247 |
+
|
| 11248 |
+
|
| 11249 |
+
|
| 11250 |
+
|
| 11251 |
+
|
| 11252 |
+
|
| 11253 |
+
|
| 11254 |
+
|
| 11255 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 11256 |
+
|
| 11257 |
+
|
| 11258 |
...adapter_model.safetensors: 83%|βββββββββ | 528MB / 640MB [A[A
|
| 11259 |
+
|
| 11260 |
+
|
| 11261 |
+
|
| 11262 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 11263 |
+
|
| 11264 |
+
|
| 11265 |
+
|
| 11266 |
+
|
| 11267 |
...adapter_model.safetensors: 83%|βββββββββ | 528MB / 640MB [A[A[A[A
|
| 11268 |
+
|
| 11269 |
+
|
| 11270 |
+
|
| 11271 |
+
|
| 11272 |
+
|
| 11273 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11274 |
+
|
| 11275 |
+
|
| 11276 |
+
|
| 11277 |
+
|
| 11278 |
+
|
| 11279 |
+
|
| 11280 |
...409/all_generations.jsonl: 85%|βββββββββ | 520MB / 614MB [A[A[A[A[A[A
|
| 11281 |
+
|
| 11282 |
+
|
| 11283 |
+
|
| 11284 |
+
|
| 11285 |
+
|
| 11286 |
+
|
| 11287 |
+
|
| 11288 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11289 |
+
|
| 11290 |
+
|
| 11291 |
+
|
| 11292 |
+
|
| 11293 |
+
|
| 11294 |
+
|
| 11295 |
+
|
| 11296 |
+
|
| 11297 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 11298 |
+
|
| 11299 |
+
|
| 11300 |
+
|
| 11301 |
+
|
| 11302 |
+
|
| 11303 |
+
|
| 11304 |
+
|
| 11305 |
+
|
| 11306 |
+
|
| 11307 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 11308 |
+
|
| 11309 |
+
|
| 11310 |
+
|
| 11311 |
+
|
| 11312 |
+
|
| 11313 |
+
|
| 11314 |
+
|
| 11315 |
+
|
| 11316 |
+
|
| 11317 |
+
|
| 11318 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 11319 |
+
|
| 11320 |
+
|
| 11321 |
+
|
| 11322 |
+
|
| 11323 |
+
|
| 11324 |
+
|
| 11325 |
+
|
| 11326 |
+
|
| 11327 |
+
|
| 11328 |
+
|
| 11329 |
+
|
| 11330 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 11331 |
+
|
| 11332 |
+
|
| 11333 |
...adapter_model.safetensors: 91%|ββββββββββ| 584MB / 640MB [A[A
|
| 11334 |
+
|
| 11335 |
+
|
| 11336 |
+
|
| 11337 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 11338 |
+
|
| 11339 |
+
|
| 11340 |
+
|
| 11341 |
+
|
| 11342 |
...adapter_model.safetensors: 91%|ββββββββββ| 584MB / 640MB [A[A[A[A
|
| 11343 |
+
|
| 11344 |
+
|
| 11345 |
+
|
| 11346 |
+
|
| 11347 |
+
|
| 11348 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11349 |
+
|
| 11350 |
+
|
| 11351 |
+
|
| 11352 |
+
|
| 11353 |
+
|
| 11354 |
+
|
| 11355 |
...409/all_generations.jsonl: 94%|ββββββββββ| 576MB / 614MB [A[A[A[A[A[A
|
| 11356 |
+
|
| 11357 |
+
|
| 11358 |
+
|
| 11359 |
+
|
| 11360 |
+
|
| 11361 |
+
|
| 11362 |
+
|
| 11363 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11364 |
+
|
| 11365 |
+
|
| 11366 |
+
|
| 11367 |
+
|
| 11368 |
+
|
| 11369 |
+
|
| 11370 |
+
|
| 11371 |
+
|
| 11372 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 11373 |
+
|
| 11374 |
+
|
| 11375 |
+
|
| 11376 |
+
|
| 11377 |
+
|
| 11378 |
+
|
| 11379 |
+
|
| 11380 |
+
|
| 11381 |
+
|
| 11382 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 11383 |
+
|
| 11384 |
+
|
| 11385 |
+
|
| 11386 |
+
|
| 11387 |
+
|
| 11388 |
+
|
| 11389 |
+
|
| 11390 |
+
|
| 11391 |
+
|
| 11392 |
+
|
| 11393 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 11394 |
+
|
| 11395 |
+
|
| 11396 |
+
|
| 11397 |
+
|
| 11398 |
+
|
| 11399 |
+
|
| 11400 |
+
|
| 11401 |
+
|
| 11402 |
+
|
| 11403 |
+
|
| 11404 |
+
|
| 11405 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 11406 |
+
|
| 11407 |
+
|
| 11408 |
...adapter_model.safetensors: 100%|ββββββββββ| 640MB / 640MB [A[A
|
| 11409 |
+
|
| 11410 |
+
|
| 11411 |
+
|
| 11412 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 11413 |
+
|
| 11414 |
+
|
| 11415 |
+
|
| 11416 |
+
|
| 11417 |
...adapter_model.safetensors: 100%|ββββββββββ| 640MB / 640MB [A[A[A[A
|
| 11418 |
+
|
| 11419 |
+
|
| 11420 |
+
|
| 11421 |
+
|
| 11422 |
+
|
| 11423 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11424 |
+
|
| 11425 |
+
|
| 11426 |
+
|
| 11427 |
+
|
| 11428 |
+
|
| 11429 |
+
|
| 11430 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A[A[A[A
|
| 11431 |
+
|
| 11432 |
+
|
| 11433 |
+
|
| 11434 |
+
|
| 11435 |
+
|
| 11436 |
+
|
| 11437 |
+
|
| 11438 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11439 |
+
|
| 11440 |
+
|
| 11441 |
+
|
| 11442 |
+
|
| 11443 |
+
|
| 11444 |
+
|
| 11445 |
+
|
| 11446 |
+
|
| 11447 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 11448 |
+
|
| 11449 |
+
|
| 11450 |
+
|
| 11451 |
+
|
| 11452 |
+
|
| 11453 |
+
|
| 11454 |
+
|
| 11455 |
+
|
| 11456 |
+
|
| 11457 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 11458 |
+
|
| 11459 |
+
|
| 11460 |
+
|
| 11461 |
+
|
| 11462 |
+
|
| 11463 |
+
|
| 11464 |
+
|
| 11465 |
+
|
| 11466 |
+
|
| 11467 |
+
|
| 11468 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 11469 |
+
|
| 11470 |
+
|
| 11471 |
+
|
| 11472 |
+
|
| 11473 |
+
|
| 11474 |
+
|
| 11475 |
+
|
| 11476 |
+
|
| 11477 |
+
|
| 11478 |
+
|
| 11479 |
+
|
| 11480 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A[A[A[A
|
| 11481 |
+
|
| 11482 |
+
|
| 11483 |
...adapter_model.safetensors: 100%|ββββββββββ| 640MB / 640MB [A[A
|
| 11484 |
+
|
| 11485 |
+
|
| 11486 |
+
|
| 11487 |
...ward_panels_train_run.png: 100%|ββββββββββ| 342kB / 342kB [A[A[A
|
| 11488 |
+
|
| 11489 |
+
|
| 11490 |
+
|
| 11491 |
+
|
| 11492 |
...adapter_model.safetensors: 100%|ββββββββββ| 640MB / 640MB [A[A[A[A
|
| 11493 |
+
|
| 11494 |
+
|
| 11495 |
+
|
| 11496 |
+
|
| 11497 |
+
|
| 11498 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11499 |
+
|
| 11500 |
+
|
| 11501 |
+
|
| 11502 |
+
|
| 11503 |
+
|
| 11504 |
+
|
| 11505 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A[A[A[A
|
| 11506 |
+
|
| 11507 |
+
|
| 11508 |
+
|
| 11509 |
+
|
| 11510 |
+
|
| 11511 |
+
|
| 11512 |
+
|
| 11513 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11514 |
+
|
| 11515 |
+
|
| 11516 |
+
|
| 11517 |
+
|
| 11518 |
+
|
| 11519 |
+
|
| 11520 |
+
|
| 11521 |
+
|
| 11522 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A
|
| 11523 |
+
|
| 11524 |
+
|
| 11525 |
+
|
| 11526 |
+
|
| 11527 |
+
|
| 11528 |
+
|
| 11529 |
+
|
| 11530 |
+
|
| 11531 |
+
|
| 11532 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A
|
| 11533 |
+
|
| 11534 |
+
|
| 11535 |
+
|
| 11536 |
+
|
| 11537 |
+
|
| 11538 |
+
|
| 11539 |
+
|
| 11540 |
+
|
| 11541 |
+
|
| 11542 |
+
|
| 11543 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A[A[A[A
|
| 11544 |
+
|
| 11545 |
+
|
| 11546 |
+
|
| 11547 |
+
|
| 11548 |
+
|
| 11549 |
+
|
| 11550 |
+
|
| 11551 |
+
|
| 11552 |
+
|
| 11553 |
+
|
| 11554 |
+
|
| 11555 |
[+ 3 files] : 100%|ββββββββββ| 2.61MB / 2.61MB [A[A[A[A[A[A[A[A[A[A[A
|
| 11556 |
+
|
| 11557 |
+
|
| 11558 |
+
|
| 11559 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A
|
| 11560 |
+
|
| 11561 |
+
|
| 11562 |
+
|
| 11563 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A
|
| 11564 |
+
|
| 11565 |
+
|
| 11566 |
+
|
| 11567 |
+
|
| 11568 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A
|
| 11569 |
+
|
| 11570 |
+
|
| 11571 |
+
|
| 11572 |
+
|
| 11573 |
+
|
| 11574 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11575 |
+
|
| 11576 |
+
|
| 11577 |
+
|
| 11578 |
+
|
| 11579 |
+
|
| 11580 |
+
|
| 11581 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
| 11582 |
+
|
| 11583 |
+
|
| 11584 |
+
|
| 11585 |
+
|
| 11586 |
+
|
| 11587 |
+
|
| 11588 |
+
|
| 11589 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11590 |
+
|
| 11591 |
+
|
| 11592 |
+
|
| 11593 |
+
|
| 11594 |
+
|
| 11595 |
+
|
| 11596 |
+
|
| 11597 |
+
|
| 11598 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A
|
| 11599 |
+
|
| 11600 |
+
|
| 11601 |
+
|
| 11602 |
+
|
| 11603 |
+
|
| 11604 |
+
|
| 11605 |
+
|
| 11606 |
+
|
| 11607 |
+
|
| 11608 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB [A[A[A[A[A[A[A[A[A
|
| 11609 |
+
|
| 11610 |
+
|
| 11611 |
+
|
| 11612 |
+
|
| 11613 |
+
|
| 11614 |
+
|
| 11615 |
+
|
| 11616 |
+
|
| 11617 |
+
|
| 11618 |
+
|
| 11619 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB [A[A[A[A[A[A[A[A[A[A
|
| 11620 |
+
|
| 11621 |
+
|
| 11622 |
+
|
| 11623 |
+
|
| 11624 |
+
|
| 11625 |
+
|
| 11626 |
+
|
| 11627 |
+
|
| 11628 |
+
|
| 11629 |
+
|
| 11630 |
+
|
| 11631 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB [A[A[A[A[A[A[A[A[A[A[A
|
| 11632 |
+
|
| 11633 |
+
|
| 11634 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A
|
| 11635 |
+
|
| 11636 |
+
|
| 11637 |
+
|
| 11638 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A
|
| 11639 |
+
|
| 11640 |
+
|
| 11641 |
+
|
| 11642 |
+
|
| 11643 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A
|
| 11644 |
+
|
| 11645 |
+
|
| 11646 |
+
|
| 11647 |
+
|
| 11648 |
+
|
| 11649 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11650 |
+
|
| 11651 |
+
|
| 11652 |
+
|
| 11653 |
+
|
| 11654 |
+
|
| 11655 |
+
|
| 11656 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
| 11657 |
+
|
| 11658 |
+
|
| 11659 |
+
|
| 11660 |
+
|
| 11661 |
+
|
| 11662 |
+
|
| 11663 |
+
|
| 11664 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11665 |
+
|
| 11666 |
+
|
| 11667 |
+
|
| 11668 |
+
|
| 11669 |
+
|
| 11670 |
+
|
| 11671 |
+
|
| 11672 |
+
|
| 11673 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A
|
| 11674 |
+
|
| 11675 |
+
|
| 11676 |
+
|
| 11677 |
+
|
| 11678 |
+
|
| 11679 |
+
|
| 11680 |
+
|
| 11681 |
+
|
| 11682 |
+
|
| 11683 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB [A[A[A[A[A[A[A[A[A
|
| 11684 |
+
|
| 11685 |
+
|
| 11686 |
+
|
| 11687 |
+
|
| 11688 |
+
|
| 11689 |
+
|
| 11690 |
+
|
| 11691 |
+
|
| 11692 |
+
|
| 11693 |
+
|
| 11694 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB [A[A[A[A[A[A[A[A[A[A
|
| 11695 |
+
|
| 11696 |
+
|
| 11697 |
+
|
| 11698 |
+
|
| 11699 |
+
|
| 11700 |
+
|
| 11701 |
+
|
| 11702 |
+
|
| 11703 |
+
|
| 11704 |
+
|
| 11705 |
+
|
| 11706 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB [A[A[A[A[A[A[A[A[A[A[A
|
| 11707 |
+
|
| 11708 |
+
|
| 11709 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A
|
| 11710 |
+
|
| 11711 |
+
|
| 11712 |
+
|
| 11713 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A
|
| 11714 |
+
|
| 11715 |
+
|
| 11716 |
+
|
| 11717 |
+
|
| 11718 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A
|
| 11719 |
+
|
| 11720 |
+
|
| 11721 |
+
|
| 11722 |
+
|
| 11723 |
+
|
| 11724 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11725 |
+
|
| 11726 |
+
|
| 11727 |
+
|
| 11728 |
+
|
| 11729 |
+
|
| 11730 |
+
|
| 11731 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
| 11732 |
+
|
| 11733 |
+
|
| 11734 |
+
|
| 11735 |
+
|
| 11736 |
+
|
| 11737 |
+
|
| 11738 |
+
|
| 11739 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11740 |
+
|
| 11741 |
+
|
| 11742 |
+
|
| 11743 |
+
|
| 11744 |
+
|
| 11745 |
+
|
| 11746 |
+
|
| 11747 |
+
|
| 11748 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A
|
| 11749 |
+
|
| 11750 |
+
|
| 11751 |
+
|
| 11752 |
+
|
| 11753 |
+
|
| 11754 |
+
|
| 11755 |
+
|
| 11756 |
+
|
| 11757 |
+
|
| 11758 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB [A[A[A[A[A[A[A[A[A
|
| 11759 |
+
|
| 11760 |
+
|
| 11761 |
+
|
| 11762 |
+
|
| 11763 |
+
|
| 11764 |
+
|
| 11765 |
+
|
| 11766 |
+
|
| 11767 |
+
|
| 11768 |
+
|
| 11769 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB [A[A[A[A[A[A[A[A[A[A
|
| 11770 |
+
|
| 11771 |
+
|
| 11772 |
+
|
| 11773 |
+
|
| 11774 |
+
|
| 11775 |
+
|
| 11776 |
+
|
| 11777 |
+
|
| 11778 |
+
|
| 11779 |
+
|
| 11780 |
+
|
| 11781 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB [A[A[A[A[A[A[A[A[A[A[A
|
| 11782 |
+
|
| 11783 |
+
|
| 11784 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A
|
| 11785 |
+
|
| 11786 |
+
|
| 11787 |
+
|
| 11788 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB [A[A[A
|
| 11789 |
+
|
| 11790 |
+
|
| 11791 |
+
|
| 11792 |
+
|
| 11793 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A
|
| 11794 |
+
|
| 11795 |
+
|
| 11796 |
+
|
| 11797 |
+
|
| 11798 |
+
|
| 11799 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A
|
| 11800 |
+
|
| 11801 |
+
|
| 11802 |
+
|
| 11803 |
+
|
| 11804 |
+
|
| 11805 |
+
|
| 11806 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A
|
| 11807 |
+
|
| 11808 |
+
|
| 11809 |
+
|
| 11810 |
+
|
| 11811 |
+
|
| 11812 |
+
|
| 11813 |
+
|
| 11814 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB [A[A[A[A[A[A[A
|
| 11815 |
+
|
| 11816 |
+
|
| 11817 |
+
|
| 11818 |
+
|
| 11819 |
+
|
| 11820 |
+
|
| 11821 |
+
|
| 11822 |
+
|
| 11823 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB [A[A[A[A[A[A[A[A
|
| 11824 |
+
|
| 11825 |
+
|
| 11826 |
+
|
| 11827 |
+
|
| 11828 |
+
|
| 11829 |
+
|
| 11830 |
+
|
| 11831 |
+
|
| 11832 |
+
|
| 11833 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB [A[A[A[A[A[A[A[A[A
|
| 11834 |
+
|
| 11835 |
+
|
| 11836 |
+
|
| 11837 |
+
|
| 11838 |
+
|
| 11839 |
+
|
| 11840 |
+
|
| 11841 |
+
|
| 11842 |
+
|
| 11843 |
+
|
| 11844 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB [A[A[A[A[A[A[A[A[A[A
|
| 11845 |
+
|
| 11846 |
+
|
| 11847 |
+
|
| 11848 |
+
|
| 11849 |
+
|
| 11850 |
+
|
| 11851 |
+
|
| 11852 |
+
|
| 11853 |
+
|
| 11854 |
+
|
| 11855 |
+
|
| 11856 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB [A[A[A[A[A[A[A[A[A[A[A
|
| 11857 |
+
|
| 11858 |
+
|
| 11859 |
...unt_adherence_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
| 11860 |
+
|
| 11861 |
...409/all_generations.jsonl: 100%|ββββββββββ| 614MB / 614MB
|
| 11862 |
+
|
| 11863 |
..._arabic_clean_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
| 11864 |
+
|
| 11865 |
.../reward_meter_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
| 11866 |
+
|
| 11867 |
...tal_composite_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
| 11868 |
+
|
| 11869 |
...epeat_penalty_debug.jsonl: 100%|ββββββββββ| 106MB / 106MB
|
| 11870 |
+
|
| 11871 |
...11_223409/tokenizer.model: 100%|ββββββββββ| 1.23MB / 1.23MB
|
| 11872 |
+
|
| 11873 |
...ts/meter_by_meter_run.png: 100%|ββββββββββ| 754kB / 754kB
|
| 11874 |
+
|
| 11875 |
...ard_panels_eval_chain.png: 100%|ββββββββββ| 318kB / 318kB
|
| 11876 |
+
|
| 11877 |
...eward_panels_eval_run.png: 100%|ββββββββββ| 310kB / 310kB
|