Transformers
Safetensors
trl
grpo
arabic-poetry
classical-arabic
lora
AhmadAbbass committed on
Commit
45def9d
·
verified ·
1 Parent(s): e8c9887

Final adapter for shaer_grpo_20260411_223409

Browse files
generations_export_summary.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "enabled": true,
3
  "repo_id": "Shaer-AI/Shaer-adapters-grpo-generations",
4
- "run_export_dir": "/root/workspace/Shaer/grpo/outputs/hf_generations_exports/sanity_20260411_174336/runs/sanity_20260411_174336",
5
- "chain_export_dir": "/root/workspace/Shaer/grpo/outputs/hf_generations_exports/sanity_20260411_174336/chains/sanity_20260411_174336",
6
- "chain_run_count": 1,
7
- "run_generation_rows": 32,
8
- "run_metric_rows": 5,
9
- "chain_metric_rows": 5
10
  }
 
1
  {
2
  "enabled": true,
3
  "repo_id": "Shaer-AI/Shaer-adapters-grpo-generations",
4
+ "run_export_dir": "/root/workspace/Shaer/grpo/outputs/hf_generations_exports/shaer_grpo_20260411_223409/runs/shaer_grpo_20260411_223409",
5
+ "chain_export_dir": "/root/workspace/Shaer/grpo/outputs/hf_generations_exports/shaer_grpo_20260411_223409/chains/shaer_grpo_20260411_192107",
6
+ "chain_run_count": 2,
7
+ "run_generation_rows": 26712,
8
+ "run_metric_rows": 2704,
9
+ "chain_metric_rows": 4216
10
  }
plots/chain_metrics.jsonl CHANGED
@@ -4212,3 +4212,5 @@
4212
  {"timestamp_utc": "2026-04-12T03:43:26Z", "mode": "train", "global_step": 3298, "epoch": 0.13246575892677834, "loss": 0.0017, "grad_norm": 2.183478593826294, "learning_rate": 9.090909090909092e-09, "num_tokens": 7518824.0, "completions/mean_length": 65.375, "completions/min_length": 65.0, "completions/max_length": 66.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 65.375, "completions/min_terminated_length": 65.0, "completions/max_terminated_length": 66.0, "rewards/meter/mean": 0.9922501444816589, "rewards/meter/std": 0.004244488663971424, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9922501444816589, "rewards/total_composite/std": 0.004244488663971424, "reward": 0.9922501444816589, "reward_std": 0.0042444937862455845, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.013568882830440998, "sampling/sampling_logp_difference/max": 0.7026901245117188, "sampling/importance_sampling_ratio/min": 0.49525120854377747, "sampling/importance_sampling_ratio/mean": 1.0067819356918335, "sampling/importance_sampling_ratio/max": 1.4506497383117676, "entropy": 0.11512181628495455, "clip_ratio/low_mean": 0.0037878789007663727, "clip_ratio/low_min": 0.0037878789007663727, "clip_ratio/high_mean": 0.005710955825634301, "clip_ratio/high_max": 0.005710955825634301, "clip_ratio/region_mean": 0.009498834726400673, "reward_total_mean": 0.9922501444816589, "reward_meter_mean": 0.9922501444816589, "reward_meter_std": 0.004244488663971424, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9922501444816589, "reward_total_composite_std": 0.004244488663971424, 
"run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4131.0}
4213
  {"timestamp_utc": "2026-04-12T03:43:32Z", "mode": "train", "global_step": 3299, "epoch": 0.1325059244085633, "loss": 0.0057, "grad_norm": 3.7170727252960205, "learning_rate": 6.060606060606061e-09, "num_tokens": 7521612.0, "completions/mean_length": 166.5, "completions/min_length": 159.0, "completions/max_length": 170.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 166.5, "completions/min_terminated_length": 159.0, "completions/max_terminated_length": 170.0, "rewards/meter/mean": 0.9987373352050781, "rewards/meter/std": 0.000354176911059767, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9987373352050781, "rewards/total_composite/std": 0.000354176911059767, "reward": 0.9987373352050781, "reward_std": 0.00035417175968177617, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.03916100785136223, "sampling/sampling_logp_difference/max": 1.9973111152648926, "sampling/importance_sampling_ratio/min": 0.13569968938827515, "sampling/importance_sampling_ratio/mean": 1.001840591430664, "sampling/importance_sampling_ratio/max": 2.0, "entropy": 0.3029062431305647, "clip_ratio/low_mean": 0.01500677247531712, "clip_ratio/low_min": 0.01500677247531712, "clip_ratio/high_mean": 0.015017259865999222, "clip_ratio/high_max": 0.015017259865999222, "clip_ratio/region_mean": 0.030024032341316342, "reward_total_mean": 0.9987373352050781, "reward_meter_mean": 0.9987373352050781, "reward_meter_std": 0.000354176911059767, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9987373352050781, "reward_total_composite_std": 0.000354176911059767, "run_id": 
"shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4132.0}
4214
  {"timestamp_utc": "2026-04-12T03:43:36Z", "mode": "train", "global_step": 3300, "epoch": 0.13254608989034825, "loss": 0.0153, "grad_norm": 6.677674293518066, "learning_rate": 3.0303030303030304e-09, "num_tokens": 7523188.0, "completions/mean_length": 46.0, "completions/min_length": 46.0, "completions/max_length": 46.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 46.0, "completions/min_terminated_length": 46.0, "completions/max_terminated_length": 46.0, "rewards/meter/mean": 0.9442145824432373, "rewards/meter/std": 0.003297017654404044, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9442145824432373, "rewards/total_composite/std": 0.003297017654404044, "reward": 0.9442145824432373, "reward_std": 0.0032970213796943426, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.021698685362935066, "sampling/sampling_logp_difference/max": 2.1988744735717773, "sampling/importance_sampling_ratio/min": 0.11092793941497803, "sampling/importance_sampling_ratio/mean": 1.0027215480804443, "sampling/importance_sampling_ratio/max": 1.663463830947876, "entropy": 0.09115941543132067, "clip_ratio/low_mean": 0.00815217406488955, "clip_ratio/low_min": 0.00815217406488955, "clip_ratio/high_mean": 0.0027173913549631834, "clip_ratio/high_max": 0.0027173913549631834, "clip_ratio/region_mean": 0.010869565419852734, "reward_total_mean": 0.9442145824432373, "reward_meter_mean": 0.9442145824432373, "reward_meter_std": 0.003297017654404044, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9442145824432373, "reward_total_composite_std": 0.003297017654404044, "run_id": 
"shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4133.0}
 
 
 
4212
  {"timestamp_utc": "2026-04-12T03:43:26Z", "mode": "train", "global_step": 3298, "epoch": 0.13246575892677834, "loss": 0.0017, "grad_norm": 2.183478593826294, "learning_rate": 9.090909090909092e-09, "num_tokens": 7518824.0, "completions/mean_length": 65.375, "completions/min_length": 65.0, "completions/max_length": 66.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 65.375, "completions/min_terminated_length": 65.0, "completions/max_terminated_length": 66.0, "rewards/meter/mean": 0.9922501444816589, "rewards/meter/std": 0.004244488663971424, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9922501444816589, "rewards/total_composite/std": 0.004244488663971424, "reward": 0.9922501444816589, "reward_std": 0.0042444937862455845, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.013568882830440998, "sampling/sampling_logp_difference/max": 0.7026901245117188, "sampling/importance_sampling_ratio/min": 0.49525120854377747, "sampling/importance_sampling_ratio/mean": 1.0067819356918335, "sampling/importance_sampling_ratio/max": 1.4506497383117676, "entropy": 0.11512181628495455, "clip_ratio/low_mean": 0.0037878789007663727, "clip_ratio/low_min": 0.0037878789007663727, "clip_ratio/high_mean": 0.005710955825634301, "clip_ratio/high_max": 0.005710955825634301, "clip_ratio/region_mean": 0.009498834726400673, "reward_total_mean": 0.9922501444816589, "reward_meter_mean": 0.9922501444816589, "reward_meter_std": 0.004244488663971424, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9922501444816589, "reward_total_composite_std": 0.004244488663971424, 
"run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4131.0}
4213
  {"timestamp_utc": "2026-04-12T03:43:32Z", "mode": "train", "global_step": 3299, "epoch": 0.1325059244085633, "loss": 0.0057, "grad_norm": 3.7170727252960205, "learning_rate": 6.060606060606061e-09, "num_tokens": 7521612.0, "completions/mean_length": 166.5, "completions/min_length": 159.0, "completions/max_length": 170.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 166.5, "completions/min_terminated_length": 159.0, "completions/max_terminated_length": 170.0, "rewards/meter/mean": 0.9987373352050781, "rewards/meter/std": 0.000354176911059767, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9987373352050781, "rewards/total_composite/std": 0.000354176911059767, "reward": 0.9987373352050781, "reward_std": 0.00035417175968177617, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.03916100785136223, "sampling/sampling_logp_difference/max": 1.9973111152648926, "sampling/importance_sampling_ratio/min": 0.13569968938827515, "sampling/importance_sampling_ratio/mean": 1.001840591430664, "sampling/importance_sampling_ratio/max": 2.0, "entropy": 0.3029062431305647, "clip_ratio/low_mean": 0.01500677247531712, "clip_ratio/low_min": 0.01500677247531712, "clip_ratio/high_mean": 0.015017259865999222, "clip_ratio/high_max": 0.015017259865999222, "clip_ratio/region_mean": 0.030024032341316342, "reward_total_mean": 0.9987373352050781, "reward_meter_mean": 0.9987373352050781, "reward_meter_std": 0.000354176911059767, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9987373352050781, "reward_total_composite_std": 0.000354176911059767, "run_id": 
"shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4132.0}
4214
  {"timestamp_utc": "2026-04-12T03:43:36Z", "mode": "train", "global_step": 3300, "epoch": 0.13254608989034825, "loss": 0.0153, "grad_norm": 6.677674293518066, "learning_rate": 3.0303030303030304e-09, "num_tokens": 7523188.0, "completions/mean_length": 46.0, "completions/min_length": 46.0, "completions/max_length": 46.0, "completions/clipped_ratio": 0.0, "completions/mean_terminated_length": 46.0, "completions/min_terminated_length": 46.0, "completions/max_terminated_length": 46.0, "rewards/meter/mean": 0.9442145824432373, "rewards/meter/std": 0.003297017654404044, "rewards/count_adherence/mean": 1.0, "rewards/count_adherence/std": 0.0, "rewards/arabic_clean/mean": 1.0, "rewards/arabic_clean/std": 0.0, "rewards/repeat_penalty/mean": 1.0, "rewards/repeat_penalty/std": 0.0, "rewards/total_composite/mean": 0.9442145824432373, "rewards/total_composite/std": 0.003297017654404044, "reward": 0.9442145824432373, "reward_std": 0.0032970213796943426, "frac_reward_zero_std": 0.0, "sampling/sampling_logp_difference/mean": 0.021698685362935066, "sampling/sampling_logp_difference/max": 2.1988744735717773, "sampling/importance_sampling_ratio/min": 0.11092793941497803, "sampling/importance_sampling_ratio/mean": 1.0027215480804443, "sampling/importance_sampling_ratio/max": 1.663463830947876, "entropy": 0.09115941543132067, "clip_ratio/low_mean": 0.00815217406488955, "clip_ratio/low_min": 0.00815217406488955, "clip_ratio/high_mean": 0.0027173913549631834, "clip_ratio/high_max": 0.0027173913549631834, "clip_ratio/region_mean": 0.010869565419852734, "reward_total_mean": 0.9442145824432373, "reward_meter_mean": 0.9442145824432373, "reward_meter_std": 0.003297017654404044, "reward_count_adherence_mean": 1.0, "reward_count_adherence_std": 0.0, "reward_arabic_clean_mean": 1.0, "reward_arabic_clean_std": 0.0, "reward_repeat_penalty_mean": 1.0, "reward_repeat_penalty_std": 0.0, "reward_total_composite_mean": 0.9442145824432373, "reward_total_composite_std": 0.003297017654404044, "run_id": 
"shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4133.0}
4215
+ {"timestamp_utc": "2026-04-12T03:45:00Z", "mode": "train", "global_step": 3300, "epoch": 0.13254608989034825, "train_runtime": 18489.879, "train_samples_per_second": 1.428, "train_steps_per_second": 0.178, "total_flos": 0.0, "train_loss": 0.0004697396774788627, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4133.0}
4216
+ {"timestamp_utc": "2026-04-12T03:44:57Z", "mode": "eval", "global_step": 3300, "epoch": 0.13254608989034825, "eval_loss": NaN, "eval_runtime": 80.3156, "eval_samples_per_second": 1.295, "eval_steps_per_second": 0.162, "eval_num_tokens": 7523188.0, "eval_completions/mean_length": 213.14423076923077, "eval_completions/min_length": 61.23076923076923, "eval_completions/max_length": 421.38461538461536, "eval_completions/clipped_ratio": 0.009615384615384616, "eval_completions/mean_terminated_length": 209.98489027756912, "eval_completions/min_terminated_length": 61.23076923076923, "eval_completions/max_terminated_length": 412.2307692307692, "eval_rewards/meter/mean": 0.7804106657321637, "eval_rewards/meter/std": 0.3429693900621854, "eval_rewards/count_adherence/mean": 0.9621203220807589, "eval_rewards/count_adherence/std": 0.06154714152216911, "eval_rewards/arabic_clean/mean": 1.0, "eval_rewards/arabic_clean/std": 0.0, "eval_rewards/repeat_penalty/mean": 0.9574309633328364, "eval_rewards/repeat_penalty/std": 0.07397974411455485, "eval_rewards/total_composite/mean": 0.7239617155148432, "eval_rewards/total_composite/std": 0.3431667788670613, "eval_reward": 0.7239617155148432, "eval_reward_std": NaN, "eval_frac_reward_zero_std": 0.0, "eval_sampling/sampling_logp_difference/mean": 0.03249364231641476, "eval_sampling/sampling_logp_difference/max": 1.2331663278432994, "eval_sampling/importance_sampling_ratio/min": 0.2969068231490942, "eval_sampling/importance_sampling_ratio/mean": 1.0095902956449068, "eval_sampling/importance_sampling_ratio/max": 1.6007587084403405, "eval_entropy": 0.38235602699793303, "eval_clip_ratio/low_mean": 0.0, "eval_clip_ratio/low_min": 0.0, "eval_clip_ratio/high_mean": 0.0, "eval_clip_ratio/high_max": 0.0, "eval_clip_ratio/region_mean": 0.0, "eval_reward_total_mean": 0.7239617155148432, "eval_reward_meter_mean": 0.7804106657321637, "eval_reward_meter_std": 0.3429693900621854, "eval_reward_count_adherence_mean": 0.9621203220807589, 
"eval_reward_count_adherence_std": 0.06154714152216911, "eval_reward_arabic_clean_mean": 1.0, "eval_reward_arabic_clean_std": 0.0, "eval_reward_repeat_penalty_mean": 0.9574309633328364, "eval_reward_repeat_penalty_std": 0.07397974411455485, "eval_reward_total_composite_mean": 0.7239617155148432, "eval_reward_total_composite_std": 0.3431667788670613, "run_id": "shaer_grpo_20260411_223409", "run_sequence_index": 1, "_plot_step": 4133.0}
plots/meter_by_meter_run.png CHANGED

Git LFS Details

  • SHA256: d868c70e622fbac3593d013cb6d94b421b8c3ed4f5cfe15da6f3740148f21d3a
  • Pointer size: 131 Bytes
  • Size of remote file: 756 kB

Git LFS Details

  • SHA256: bf06fc506155b47f640c4d4f4a45b12be23930daaa6bbe952978406ec30f7923
  • Pointer size: 131 Bytes
  • Size of remote file: 754 kB
plots/reward_panels_eval_chain.png CHANGED

Git LFS Details

  • SHA256: 5f1431275a4ee379e0ec8996fb82f19d1742c5ba2f808ea4cbe3fd29730efe10
  • Pointer size: 131 Bytes
  • Size of remote file: 319 kB

Git LFS Details

  • SHA256: e71bbad57b559a2ddfb27320070b5e76f4937a0926a81cd7e791340fdb1cd8f6
  • Pointer size: 131 Bytes
  • Size of remote file: 318 kB
plots/reward_panels_eval_run.png CHANGED

Git LFS Details

  • SHA256: a67e09297ee5cb901c1208abb5cba2cf7c0780998ed5869401319b4e74b7999d
  • Pointer size: 131 Bytes
  • Size of remote file: 309 kB

Git LFS Details

  • SHA256: 40d7e8ffe5e4ed533011d71774de85d38a45acd78c319cf6469bb8d3631e8733
  • Pointer size: 131 Bytes
  • Size of remote file: 310 kB
plotter.log CHANGED
@@ -3588,3 +3588,13 @@
3588
  [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/arabic_gate_chain.png
3589
  [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_run.png
3590
  [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_chain.png
 
 
 
 
 
 
 
 
 
 
 
3588
  [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/arabic_gate_chain.png
3589
  [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_run.png
3590
  [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_chain.png
3591
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/reward_panels_train_run.png
3592
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/reward_panels_eval_run.png
3593
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/reward_panels_train_chain.png
3594
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/reward_panels_eval_chain.png
3595
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/kl_run.png
3596
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/kl_chain.png
3597
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/arabic_gate_run.png
3598
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/arabic_gate_chain.png
3599
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_run.png
3600
+ [plot_live_rewards] updated /root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/plots/meter_by_meter_chain.png
run_summary.json CHANGED
@@ -1,35 +1,35 @@
1
  {
2
- "timestamp_utc": "2026-04-11T17:48:47Z",
3
- "mode": "sanity",
4
- "created_at_utc": "2026-04-11T17:46:58Z",
5
- "run_id": "sanity_20260411_174336",
6
- "run_dir": "/root/workspace/Shaer/grpo/outputs/sanity_check/sanity_20260411_174336",
7
- "chain_id": "sanity_20260411_174336",
8
- "root_run_id": "sanity_20260411_174336",
9
- "parent_run_id": "",
10
- "parent_run_dir": "",
11
- "run_sequence_index": 0,
12
  "output_repo": "Shaer-AI/Shaer-adapters-grpo",
13
  "resume_decision": {
14
- "timestamp_utc": "2026-04-11T17:46:58Z",
15
- "resume_mode": "fresh",
16
- "requested_spec": "",
17
- "result": "fresh",
18
- "reason": "explicit_fresh",
19
- "local_resume_path": null,
20
  "remote_repo": null,
21
  "remote_prefix": null,
22
- "compatibility": "unchecked",
23
- "config_fingerprint": "91c7b4340e889a3a285a9b7b3adb2c6025c061c0e14a1dcaa5a2178c5369cf3b"
24
  },
25
- "best_model_checkpoint": "/root/workspace/Shaer/grpo/outputs/sanity_check/sanity_20260411_174336/checkpoint-2",
26
- "global_step": 2,
27
  "train_metrics": {
28
- "train_runtime": 29.2695,
29
- "train_samples_per_second": 0.547,
30
- "train_steps_per_second": 0.068,
31
  "total_flos": 0.0,
32
- "train_loss": 0.12583593279123306
33
  },
34
- "final_adapter_dir": "/root/workspace/Shaer/grpo/outputs/sanity_check/sanity_20260411_174336/final_adapter"
35
  }
 
1
  {
2
+ "timestamp_utc": "2026-04-12T03:45:42Z",
3
+ "mode": "train",
4
+ "created_at_utc": "2026-04-11T22:36:28Z",
5
+ "run_id": "shaer_grpo_20260411_223409",
6
+ "run_dir": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409",
7
+ "chain_id": "shaer_grpo_20260411_192107",
8
+ "root_run_id": "shaer_grpo_20260411_192107",
9
+ "parent_run_id": "shaer_grpo_20260411_192107",
10
+ "parent_run_dir": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_192107",
11
+ "run_sequence_index": 1,
12
  "output_repo": "Shaer-AI/Shaer-adapters-grpo",
13
  "resume_decision": {
14
+ "timestamp_utc": "2026-04-11T22:36:28Z",
15
+ "resume_mode": "from_path",
16
+ "requested_spec": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_192107/checkpoint-650",
17
+ "result": "resume",
18
+ "reason": "explicit_local_path",
19
+ "local_resume_path": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_192107/checkpoint-650",
20
  "remote_repo": null,
21
  "remote_prefix": null,
22
+ "compatibility": "fingerprint_mismatch",
23
+ "config_fingerprint": "dddf85cc86110a84f67b563540177d5e59b5c500695e99fe984dfc39dac36c3f"
24
  },
25
+ "best_model_checkpoint": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/checkpoint-3100",
26
+ "global_step": 3300,
27
  "train_metrics": {
28
+ "train_runtime": 18489.879,
29
+ "train_samples_per_second": 1.428,
30
+ "train_steps_per_second": 0.178,
31
  "total_flos": 0.0,
32
+ "train_loss": 0.0004697396774788627
33
  },
34
+ "final_adapter_dir": "/root/workspace/Shaer/grpo/outputs/train/shaer_grpo_20260411_223409/final_adapter"
35
  }
train.log CHANGED
@@ -2713,3 +2713,4 @@
2713
  2026-04-12 03:43:36,813 | INFO | train_grpo_train | metrics_logged mode=train step=3300
2714
  2026-04-12 03:44:57,274 | INFO | train_grpo_train | metrics_logged mode=eval step=3300
2715
  2026-04-12 03:45:00,970 | INFO | train_grpo_train | metrics_logged mode=train step=3300
 
 
2713
  2026-04-12 03:43:36,813 | INFO | train_grpo_train | metrics_logged mode=train step=3300
2714
  2026-04-12 03:44:57,274 | INFO | train_grpo_train | metrics_logged mode=eval step=3300
2715
  2026-04-12 03:45:00,970 | INFO | train_grpo_train | metrics_logged mode=train step=3300
2716
+ 2026-04-12 03:46:19,803 | INFO | train_grpo_train | pushing final adapter to hub repo=Shaer-AI/Shaer-adapters-grpo
train_stdout.log CHANGED
@@ -10362,3 +10362,1281 @@ The tokenizer has new PAD/BOS/EOS tokens that differ from the model config and g
10362
 
10363
  ...ots/arabic_gate_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 98.8kB / 98.8kB
10364
 
10365
  .../meter_by_meter_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.06MB / 1.06MB
10366
 
10367
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 756kB / 756kB
 
 
 
 
 
10368
  ..._223409/generations.jsonl: 8%|β–Š | 47.5MB / 614MB 
 
 
10369
  ..._223409/generations.jsonl: 8%|β–Š | 47.5MB / 614MB 
 
 
10370
  ..._223409/generations.jsonl: 15%|β–ˆβ– | 90.6MB / 614MB 
 
 
10371
  ..._223409/generations.jsonl: 22%|β–ˆβ–ˆβ– | 136MB / 614MB 
 
 
10372
  ..._223409/generations.jsonl: 29%|β–ˆβ–ˆβ–‰ | 177MB / 614MB 
 
 
10373
  ..._223409/generations.jsonl: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 284MB / 614MB 
 
 
 
10374
  ..._223409/generations.jsonl: 52%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 321MB / 614MB 
 
 
 
10375
  ..._223409/generations.jsonl: 60%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 366MB / 614MB 
 
 
10376
  ..._223409/generations.jsonl: 67%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 413MB / 614MB 
 
 
10377
  ..._223409/generations.jsonl: 85%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 519MB / 614MB 
 
 
 
10378
  ..._223409/generations.jsonl: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 560MB / 614MB 
 
 
 
 
10379
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 53.5MB / 53.8MB 
 
 
 
 
10380
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 670kB / 673kB 
 
 
 
 
 
10381
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 27.1kB / 27.2kB 
 
 
10382
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 613MB / 614MB 
 
 
 
10383
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 53.5MB / 53.8MB 
 
 
 
 
10384
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 670kB / 673kB 
 
 
 
 
 
10385
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 27.1kB / 27.2kB 
 
 
 
10386
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 613MB / 614MB 
 
 
 
10387
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 53.5MB / 53.8MB 
 
 
 
 
10388
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 670kB / 673kB 
 
 
 
 
 
10389
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 27.1kB / 27.2kB 
 
 
10390
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
10391
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB 
 
 
 
 
10392
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB 
 
 
 
 
 
10393
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB 
 
 
 
10394
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
10395
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB 
 
 
 
 
10396
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB 
 
 
 
 
 
10397
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB 
 
 
10398
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
10399
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB 
 
 
 
 
10400
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB 
 
 
 
 
 
10401
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB 
 
 
10402
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
10403
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB 
 
 
 
 
10404
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB 
 
 
 
 
 
10405
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB 
 
 
10406
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB
 
10407
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB
 
10408
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB
 
10409
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB
 
 
 
 
10410
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB 
 
 
 
10411
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB 
 
 
10412
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB 
 
 
 
10413
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB 
 
 
 
10414
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB 
 
 
 
10415
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB 
 
 
10416
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB 
 
 
 
10417
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB 
 
 
10418
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB
 
10419
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB
 
 
 
 
 
10420
  ..._223409/training_args.bin: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 7.50kB / 7.50kB 
 
 
 
10421
  ...plots/arabic_gate_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 81.1kB / 81.1kB 
 
 
 
 
10422
  ...ots/arabic_gate_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 98.8kB / 98.8kB 
 
 
 
 
 
10423
  ...l_adapter/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
 
 
 
 
10424
  ...adapter/training_args.bin: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 7.50kB / 7.50kB 
 
 
 
 
 
 
 
10425
  ...1_223409/plots/kl_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 24.6kB / 24.6kB 
 
 
 
 
 
 
 
 
10426
  ...223409/plots/kl_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 33.4kB / 33.4kB 
 
 
 
 
 
 
 
 
 
10427
  .../meter_by_meter_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.06MB / 1.06MB 
 
 
 
 
 
 
 
 
 
 
10428
  ...rd_panels_train_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 350kB / 350kB 
 
 
 
 
 
 
 
 
 
 
 
10429
  ...adapter_model.safetensors: 10%|β–ˆ | 64.0MB / 640MB 
 
 
10430
  ..._223409/training_args.bin: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 7.50kB / 7.50kB 
 
 
 
10431
  ...plots/arabic_gate_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 81.1kB / 81.1kB 
 
 
 
 
10432
  ...ots/arabic_gate_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 98.8kB / 98.8kB 
 
 
 
 
 
10433
  ...l_adapter/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
 
 
 
 
10434
  ...adapter/training_args.bin: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 7.50kB / 7.50kB 
 
 
 
 
 
 
 
10435
  ...1_223409/plots/kl_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 24.6kB / 24.6kB 
 
 
 
 
 
 
 
 
10436
  ...223409/plots/kl_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 33.4kB / 33.4kB 
 
 
 
 
 
 
 
 
 
10437
  .../meter_by_meter_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.06MB / 1.06MB 
 
 
 
 
 
 
 
 
 
 
10438
  ...rd_panels_train_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 350kB / 350kB 
 
 
 
 
 
 
 
 
 
 
 
10439
  [+ 8 files] : 18%|β–ˆβ–Š | 440MB / 2.42GB 
 
 
10440
  ...rd_panels_train_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 350kB / 350kB 
 
 
 
10441
  ...adapter_model.safetensors: 20%|β–ˆβ–ˆ | 128MB / 640MB 
 
 
 
 
10442
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
 
10443
  ...adapter_model.safetensors: 19%|β–ˆβ–‰ | 120MB / 640MB 
 
 
 
 
 
 
10444
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
10445
  ...409/all_generations.jsonl: 20%|β–ˆβ–‰ | 120MB / 614MB 
 
 
 
 
 
 
 
 
10446
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10447
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10448
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10449
  [+ 1 files] : 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 107MB / 107MB 
 
 
10450
  ...adapter_model.safetensors: 28%|β–ˆβ–ˆβ–Š | 176MB / 640MB 
 
 
 
10451
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10452
  ...adapter_model.safetensors: 28%|β–ˆβ–ˆβ–Š | 176MB / 640MB 
 
 
 
 
 
10453
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10454
  ...409/all_generations.jsonl: 29%|β–ˆβ–ˆβ–Š | 176MB / 614MB 
 
 
 
 
 
 
 
10455
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10456
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10457
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10458
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10459
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10460
  ...adapter_model.safetensors: 38%|β–ˆβ–ˆβ–ˆβ–Š | 240MB / 640MB 
 
 
 
10461
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10462
  ...adapter_model.safetensors: 38%|β–ˆβ–ˆβ–ˆβ–Š | 240MB / 640MB 
 
 
 
 
 
10463
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10464
  ...409/all_generations.jsonl: 38%|β–ˆβ–ˆβ–ˆβ–Š | 232MB / 614MB 
 
 
 
 
 
 
 
10465
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10466
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10467
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10468
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10469
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10470
  ...adapter_model.safetensors: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 296MB / 640MB 
 
 
 
10471
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10472
  ...adapter_model.safetensors: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 296MB / 640MB 
 
 
 
 
 
10473
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10474
  ...409/all_generations.jsonl: 47%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 288MB / 614MB 
 
 
 
 
 
 
 
10475
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10476
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10477
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10478
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10479
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10480
  ...adapter_model.safetensors: 55%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 352MB / 640MB 
 
 
 
10481
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10482
  ...adapter_model.safetensors: 55%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 352MB / 640MB 
 
 
 
 
 
10483
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10484
  ...409/all_generations.jsonl: 56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 344MB / 614MB 
 
 
 
 
 
 
 
10485
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10486
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10487
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10488
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10489
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10490
  ...adapter_model.safetensors: 64%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 408MB / 640MB 
 
 
 
10491
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10492
  ...adapter_model.safetensors: 64%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 408MB / 640MB 
 
 
 
 
 
10493
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10494
  ...409/all_generations.jsonl: 65%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 400MB / 614MB 
 
 
 
 
 
 
 
10495
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10496
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10497
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10498
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10499
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10500
  ...adapter_model.safetensors: 73%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 464MB / 640MB 
 
 
 
10501
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10502
  ...adapter_model.safetensors: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 472MB / 640MB 
 
 
 
 
 
10503
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10504
  ...409/all_generations.jsonl: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 456MB / 614MB 
 
 
 
 
 
 
 
10505
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10506
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10507
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10508
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10509
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10510
  ...adapter_model.safetensors: 83%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 528MB / 640MB 
 
 
 
10511
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10512
  ...adapter_model.safetensors: 83%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 528MB / 640MB 
 
 
 
 
 
10513
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10514
  ...409/all_generations.jsonl: 85%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 520MB / 614MB 
 
 
 
 
 
 
 
10515
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10516
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10517
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10518
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10519
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10520
  ...adapter_model.safetensors: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 584MB / 640MB 
 
 
 
10521
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10522
  ...adapter_model.safetensors: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 584MB / 640MB 
 
 
 
 
 
10523
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10524
  ...409/all_generations.jsonl: 94%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 576MB / 614MB 
 
 
 
 
 
 
 
10525
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10526
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10527
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10528
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10529
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10530
  ...adapter_model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 640MB / 640MB 
 
 
 
10531
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10532
  ...adapter_model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 640MB / 640MB 
 
 
 
 
 
10533
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10534
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
 
 
 
 
10535
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10536
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10537
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10538
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10539
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
10540
  ...adapter_model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 640MB / 640MB 
 
 
 
10541
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
 
 
 
 
10542
  ...adapter_model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 640MB / 640MB 
 
 
 
 
 
10543
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10544
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
 
 
 
 
10545
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10546
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
10547
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
10548
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
 
 
 
10549
  [+ 3 files] : 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.61MB / 2.61MB 
 
 
 
10550
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
10551
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
 
10552
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
10553
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10554
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
10555
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10556
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
 
 
 
 
 
 
 
10557
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB 
 
 
 
 
 
 
 
 
 
 
10558
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB 
 
 
 
 
 
 
 
 
 
 
 
10559
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB 
 
 
10560
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
10561
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
 
10562
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
10563
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10564
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
10565
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10566
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
 
 
 
 
 
 
 
10567
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB 
 
 
 
 
 
 
 
 
 
 
10568
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB 
 
 
 
 
 
 
 
 
 
 
 
10569
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB 
 
 
10570
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
10571
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
 
10572
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
10573
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10574
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
10575
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10576
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
 
 
 
 
 
 
 
10577
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB 
 
 
 
 
 
 
 
 
 
 
10578
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB 
 
 
 
 
 
 
 
 
 
 
 
10579
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB 
 
 
10580
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
10581
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
 
 
 
 
10582
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
10583
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
10584
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
10585
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
 
 
 
 
 
 
 
 
10586
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
 
 
 
 
 
 
 
 
 
10587
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB 
 
 
 
 
 
 
 
 
 
 
10588
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB 
 
 
 
 
 
 
 
 
 
 
 
10589
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB 
 
 
10590
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
 
10591
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB
 
10592
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
 
10593
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
 
10594
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
 
10595
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
 
10596
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB
 
10597
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB
 
10598
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB
 
10599
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB
 
10362
 
10363
  ...ots/arabic_gate_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 98.8kB / 98.8kB
10364
 
10365
  .../meter_by_meter_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.06MB / 1.06MB
10366
 
10367
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 756kB / 756kB
10368
+ No files have been modified since last commit. Skipping to prevent empty commit.
10369
+
10370
+
10371
+
10372
+
10373
  ..._223409/generations.jsonl: 8%|β–Š | 47.5MB / 614MB 
10374
+
10375
+
10376
  ..._223409/generations.jsonl: 8%|β–Š | 47.5MB / 614MB 
10377
+
10378
+
10379
  ..._223409/generations.jsonl: 15%|β–ˆβ– | 90.6MB / 614MB 
10380
+
10381
+
10382
  ..._223409/generations.jsonl: 22%|β–ˆβ–ˆβ– | 136MB / 614MB 
10383
+
10384
+
10385
  ..._223409/generations.jsonl: 29%|β–ˆβ–ˆβ–‰ | 177MB / 614MB 
10386
+
10387
+
10388
  ..._223409/generations.jsonl: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 284MB / 614MB 
10389
+
10390
+
10391
+
10392
  ..._223409/generations.jsonl: 52%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 321MB / 614MB 
10393
+
10394
+
10395
+
10396
  ..._223409/generations.jsonl: 60%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 366MB / 614MB 
10397
+
10398
+
10399
  ..._223409/generations.jsonl: 67%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 413MB / 614MB 
10400
+
10401
+
10402
  ..._223409/generations.jsonl: 85%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 519MB / 614MB 
10403
+
10404
+
10405
+
10406
  ..._223409/generations.jsonl: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 560MB / 614MB 
10407
+
10408
+
10409
+
10410
+
10411
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 53.5MB / 53.8MB 
10412
+
10413
+
10414
+
10415
+
10416
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 670kB / 673kB 
10417
+
10418
+
10419
+
10420
+
10421
+
10422
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 27.1kB / 27.2kB 
10423
+
10424
+
10425
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 613MB / 614MB 
10426
+
10427
+
10428
+
10429
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 53.5MB / 53.8MB 
10430
+
10431
+
10432
+
10433
+
10434
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 670kB / 673kB 
10435
+
10436
+
10437
+
10438
+
10439
+
10440
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 27.1kB / 27.2kB 
10441
+
10442
+
10443
+
10444
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 613MB / 614MB 
10445
+
10446
+
10447
+
10448
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 53.5MB / 53.8MB 
10449
+
10450
+
10451
+
10452
+
10453
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 670kB / 673kB 
10454
+
10455
+
10456
+
10457
+
10458
+
10459
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 27.1kB / 27.2kB 
10460
+
10461
+
10462
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
10463
+
10464
+
10465
+
10466
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB 
10467
+
10468
+
10469
+
10470
+
10471
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB 
10472
+
10473
+
10474
+
10475
+
10476
+
10477
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB 
10478
+
10479
+
10480
+
10481
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
10482
+
10483
+
10484
+
10485
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB 
10486
+
10487
+
10488
+
10489
+
10490
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB 
10491
+
10492
+
10493
+
10494
+
10495
+
10496
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB 
10497
+
10498
+
10499
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
10500
+
10501
+
10502
+
10503
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB 
10504
+
10505
+
10506
+
10507
+
10508
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB 
10509
+
10510
+
10511
+
10512
+
10513
+
10514
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB 
10515
+
10516
+
10517
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
10518
+
10519
+
10520
+
10521
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB 
10522
+
10523
+
10524
+
10525
+
10526
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB 
10527
+
10528
+
10529
+
10530
+
10531
+
10532
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB 
10533
+
10534
+
10535
  ..._223409/generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB
10536
+
10537
  ...23409/generations.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 53.8MB / 53.8MB
10538
+
10539
  ...11_223409/metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 673kB / 673kB
10540
+
10541
  ...409/reward_curves_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.2kB / 27.2kB
10542
+
10543
+
10544
+
10545
+
10546
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB 
10547
+
10548
+
10549
+
10550
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB 
10551
+
10552
+
10553
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB 
10554
+
10555
+
10556
+
10557
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB 
10558
+
10559
+
10560
+
10561
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB 
10562
+
10563
+
10564
+
10565
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB 
10566
+
10567
+
10568
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB 
10569
+
10570
+
10571
+
10572
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB 
10573
+
10574
+
10575
  ...107/chain_metrics.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 982kB / 982kB
10576
+
10577
  ...7/chain_reward_curves.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 27.8kB / 27.8kB
10578
+ 2026-04-12 03:46:19,803 | INFO | train_grpo_train | pushing final adapter to hub repo=Shaer-AI/Shaer-adapters-grpo
10579
+
10580
+
10581
+
10582
+
10583
  ..._223409/training_args.bin: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 7.50kB / 7.50kB 
10584
+
10585
+
10586
+
10587
  ...plots/arabic_gate_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 81.1kB / 81.1kB 
10588
+
10589
+
10590
+
10591
+
10592
  ...ots/arabic_gate_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 98.8kB / 98.8kB 
10593
+
10594
+
10595
+
10596
+
10597
+
10598
  ...l_adapter/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
10599
+
10600
+
10601
+
10602
+
10603
+
10604
+
10605
  ...adapter/training_args.bin: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 7.50kB / 7.50kB 
10606
+
10607
+
10608
+
10609
+
10610
+
10611
+
10612
+
10613
  ...1_223409/plots/kl_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 24.6kB / 24.6kB 
10614
+
10615
+
10616
+
10617
+
10618
+
10619
+
10620
+
10621
+
10622
  ...223409/plots/kl_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 33.4kB / 33.4kB 
10623
+
10624
+
10625
+
10626
+
10627
+
10628
+
10629
+
10630
+
10631
+
10632
  .../meter_by_meter_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.06MB / 1.06MB 
10633
+
10634
+
10635
+
10636
+
10637
+
10638
+
10639
+
10640
+
10641
+
10642
+
10643
  ...rd_panels_train_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 350kB / 350kB 
10644
+
10645
+
10646
+
10647
+
10648
+
10649
+
10650
+
10651
+
10652
+
10653
+
10654
+
10655
  ...adapter_model.safetensors: 10%|β–ˆ | 64.0MB / 640MB 
10656
+
10657
+
10658
  ..._223409/training_args.bin: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 7.50kB / 7.50kB 
10659
+
10660
+
10661
+
10662
  ...plots/arabic_gate_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 81.1kB / 81.1kB 
10663
+
10664
+
10665
+
10666
+
10667
  ...ots/arabic_gate_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 98.8kB / 98.8kB 
10668
+
10669
+
10670
+
10671
+
10672
+
10673
  ...l_adapter/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
10674
+
10675
+
10676
+
10677
+
10678
+
10679
+
10680
  ...adapter/training_args.bin: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 7.50kB / 7.50kB 
10681
+
10682
+
10683
+
10684
+
10685
+
10686
+
10687
+
10688
  ...1_223409/plots/kl_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 24.6kB / 24.6kB 
10689
+
10690
+
10691
+
10692
+
10693
+
10694
+
10695
+
10696
+
10697
  ...223409/plots/kl_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 33.4kB / 33.4kB 
10698
+
10699
+
10700
+
10701
+
10702
+
10703
+
10704
+
10705
+
10706
+
10707
  .../meter_by_meter_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.06MB / 1.06MB 
10708
+
10709
+
10710
+
10711
+
10712
+
10713
+
10714
+
10715
+
10716
+
10717
+
10718
  ...rd_panels_train_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 350kB / 350kB 
10719
+
10720
+
10721
+
10722
+
10723
+
10724
+
10725
+
10726
+
10727
+
10728
+
10729
+
10730
  [+ 8 files] : 18%|β–ˆβ–Š | 440MB / 2.42GB 
10731
+
10732
+
10733
  ...rd_panels_train_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 350kB / 350kB 
10734
+
10735
+
10736
+
10737
  ...adapter_model.safetensors: 20%|β–ˆβ–ˆ | 128MB / 640MB 
10738
+
10739
+
10740
+
10741
+
10742
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
10743
+
10744
+
10745
+
10746
+
10747
+
10748
  ...adapter_model.safetensors: 19%|β–ˆβ–‰ | 120MB / 640MB 
10749
+
10750
+
10751
+
10752
+
10753
+
10754
+
10755
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10756
+
10757
+
10758
+
10759
+
10760
+
10761
+
10762
+
10763
  ...409/all_generations.jsonl: 20%|β–ˆβ–‰ | 120MB / 614MB 
10764
+
10765
+
10766
+
10767
+
10768
+
10769
+
10770
+
10771
+
10772
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10773
+
10774
+
10775
+
10776
+
10777
+
10778
+
10779
+
10780
+
10781
+
10782
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10783
+
10784
+
10785
+
10786
+
10787
+
10788
+
10789
+
10790
+
10791
+
10792
+
10793
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10794
+
10795
+
10796
+
10797
+
10798
+
10799
+
10800
+
10801
+
10802
+
10803
+
10804
+
10805
  [+ 1 files] : 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 107MB / 107MB 
10806
+
10807
+
10808
  ...adapter_model.safetensors: 28%|β–ˆβ–ˆβ–Š | 176MB / 640MB 
10809
+
10810
+
10811
+
10812
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
10813
+
10814
+
10815
+
10816
+
10817
  ...adapter_model.safetensors: 28%|β–ˆβ–ˆβ–Š | 176MB / 640MB 
10818
+
10819
+
10820
+
10821
+
10822
+
10823
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10824
+
10825
+
10826
+
10827
+
10828
+
10829
+
10830
  ...409/all_generations.jsonl: 29%|β–ˆβ–ˆβ–Š | 176MB / 614MB 
10831
+
10832
+
10833
+
10834
+
10835
+
10836
+
10837
+
10838
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10839
+
10840
+
10841
+
10842
+
10843
+
10844
+
10845
+
10846
+
10847
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10848
+
10849
+
10850
+
10851
+
10852
+
10853
+
10854
+
10855
+
10856
+
10857
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10858
+
10859
+
10860
+
10861
+
10862
+
10863
+
10864
+
10865
+
10866
+
10867
+
10868
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10869
+
10870
+
10871
+
10872
+
10873
+
10874
+
10875
+
10876
+
10877
+
10878
+
10879
+
10880
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
10881
+
10882
+
10883
  ...adapter_model.safetensors: 38%|β–ˆβ–ˆβ–ˆβ–Š | 240MB / 640MB 
10884
+
10885
+
10886
+
10887
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
10888
+
10889
+
10890
+
10891
+
10892
  ...adapter_model.safetensors: 38%|β–ˆβ–ˆβ–ˆβ–Š | 240MB / 640MB 
10893
+
10894
+
10895
+
10896
+
10897
+
10898
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10899
+
10900
+
10901
+
10902
+
10903
+
10904
+
10905
  ...409/all_generations.jsonl: 38%|β–ˆβ–ˆβ–ˆβ–Š | 232MB / 614MB 
10906
+
10907
+
10908
+
10909
+
10910
+
10911
+
10912
+
10913
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10914
+
10915
+
10916
+
10917
+
10918
+
10919
+
10920
+
10921
+
10922
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10923
+
10924
+
10925
+
10926
+
10927
+
10928
+
10929
+
10930
+
10931
+
10932
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10933
+
10934
+
10935
+
10936
+
10937
+
10938
+
10939
+
10940
+
10941
+
10942
+
10943
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10944
+
10945
+
10946
+
10947
+
10948
+
10949
+
10950
+
10951
+
10952
+
10953
+
10954
+
10955
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
10956
+
10957
+
10958
  ...adapter_model.safetensors: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 296MB / 640MB 
10959
+
10960
+
10961
+
10962
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
10963
+
10964
+
10965
+
10966
+
10967
  ...adapter_model.safetensors: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 296MB / 640MB 
10968
+
10969
+
10970
+
10971
+
10972
+
10973
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10974
+
10975
+
10976
+
10977
+
10978
+
10979
+
10980
  ...409/all_generations.jsonl: 47%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 288MB / 614MB 
10981
+
10982
+
10983
+
10984
+
10985
+
10986
+
10987
+
10988
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10989
+
10990
+
10991
+
10992
+
10993
+
10994
+
10995
+
10996
+
10997
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
10998
+
10999
+
11000
+
11001
+
11002
+
11003
+
11004
+
11005
+
11006
+
11007
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11008
+
11009
+
11010
+
11011
+
11012
+
11013
+
11014
+
11015
+
11016
+
11017
+
11018
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11019
+
11020
+
11021
+
11022
+
11023
+
11024
+
11025
+
11026
+
11027
+
11028
+
11029
+
11030
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11031
+
11032
+
11033
  ...adapter_model.safetensors: 55%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 352MB / 640MB 
11034
+
11035
+
11036
+
11037
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
11038
+
11039
+
11040
+
11041
+
11042
  ...adapter_model.safetensors: 55%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 352MB / 640MB 
11043
+
11044
+
11045
+
11046
+
11047
+
11048
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11049
+
11050
+
11051
+
11052
+
11053
+
11054
+
11055
  ...409/all_generations.jsonl: 56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 344MB / 614MB 
11056
+
11057
+
11058
+
11059
+
11060
+
11061
+
11062
+
11063
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11064
+
11065
+
11066
+
11067
+
11068
+
11069
+
11070
+
11071
+
11072
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11073
+
11074
+
11075
+
11076
+
11077
+
11078
+
11079
+
11080
+
11081
+
11082
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11083
+
11084
+
11085
+
11086
+
11087
+
11088
+
11089
+
11090
+
11091
+
11092
+
11093
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11094
+
11095
+
11096
+
11097
+
11098
+
11099
+
11100
+
11101
+
11102
+
11103
+
11104
+
11105
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11106
+
11107
+
11108
  ...adapter_model.safetensors: 64%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 408MB / 640MB 
11109
+
11110
+
11111
+
11112
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
11113
+
11114
+
11115
+
11116
+
11117
  ...adapter_model.safetensors: 64%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 408MB / 640MB 
11118
+
11119
+
11120
+
11121
+
11122
+
11123
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11124
+
11125
+
11126
+
11127
+
11128
+
11129
+
11130
  ...409/all_generations.jsonl: 65%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 400MB / 614MB 
11131
+
11132
+
11133
+
11134
+
11135
+
11136
+
11137
+
11138
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11139
+
11140
+
11141
+
11142
+
11143
+
11144
+
11145
+
11146
+
11147
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11148
+
11149
+
11150
+
11151
+
11152
+
11153
+
11154
+
11155
+
11156
+
11157
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11158
+
11159
+
11160
+
11161
+
11162
+
11163
+
11164
+
11165
+
11166
+
11167
+
11168
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11169
+
11170
+
11171
+
11172
+
11173
+
11174
+
11175
+
11176
+
11177
+
11178
+
11179
+
11180
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11181
+
11182
+
11183
  ...adapter_model.safetensors: 73%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 464MB / 640MB 
11184
+
11185
+
11186
+
11187
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
11188
+
11189
+
11190
+
11191
+
11192
  ...adapter_model.safetensors: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 472MB / 640MB 
11193
+
11194
+
11195
+
11196
+
11197
+
11198
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11199
+
11200
+
11201
+
11202
+
11203
+
11204
+
11205
  ...409/all_generations.jsonl: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 456MB / 614MB 
11206
+
11207
+
11208
+
11209
+
11210
+
11211
+
11212
+
11213
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11214
+
11215
+
11216
+
11217
+
11218
+
11219
+
11220
+
11221
+
11222
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11223
+
11224
+
11225
+
11226
+
11227
+
11228
+
11229
+
11230
+
11231
+
11232
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11233
+
11234
+
11235
+
11236
+
11237
+
11238
+
11239
+
11240
+
11241
+
11242
+
11243
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11244
+
11245
+
11246
+
11247
+
11248
+
11249
+
11250
+
11251
+
11252
+
11253
+
11254
+
11255
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11256
+
11257
+
11258
  ...adapter_model.safetensors: 83%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 528MB / 640MB 
11259
+
11260
+
11261
+
11262
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
11263
+
11264
+
11265
+
11266
+
11267
  ...adapter_model.safetensors: 83%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 528MB / 640MB 
11268
+
11269
+
11270
+
11271
+
11272
+
11273
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11274
+
11275
+
11276
+
11277
+
11278
+
11279
+
11280
  ...409/all_generations.jsonl: 85%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 520MB / 614MB 
11281
+
11282
+
11283
+
11284
+
11285
+
11286
+
11287
+
11288
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11289
+
11290
+
11291
+
11292
+
11293
+
11294
+
11295
+
11296
+
11297
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11298
+
11299
+
11300
+
11301
+
11302
+
11303
+
11304
+
11305
+
11306
+
11307
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11308
+
11309
+
11310
+
11311
+
11312
+
11313
+
11314
+
11315
+
11316
+
11317
+
11318
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11319
+
11320
+
11321
+
11322
+
11323
+
11324
+
11325
+
11326
+
11327
+
11328
+
11329
+
11330
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11331
+
11332
+
11333
  ...adapter_model.safetensors: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 584MB / 640MB 
11334
+
11335
+
11336
+
11337
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
11338
+
11339
+
11340
+
11341
+
11342
  ...adapter_model.safetensors: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 584MB / 640MB 
11343
+
11344
+
11345
+
11346
+
11347
+
11348
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11349
+
11350
+
11351
+
11352
+
11353
+
11354
+
11355
  ...409/all_generations.jsonl: 94%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 576MB / 614MB 
11356
+
11357
+
11358
+
11359
+
11360
+
11361
+
11362
+
11363
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11364
+
11365
+
11366
+
11367
+
11368
+
11369
+
11370
+
11371
+
11372
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11373
+
11374
+
11375
+
11376
+
11377
+
11378
+
11379
+
11380
+
11381
+
11382
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11383
+
11384
+
11385
+
11386
+
11387
+
11388
+
11389
+
11390
+
11391
+
11392
+
11393
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11394
+
11395
+
11396
+
11397
+
11398
+
11399
+
11400
+
11401
+
11402
+
11403
+
11404
+
11405
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11406
+
11407
+
11408
  ...adapter_model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 640MB / 640MB 
11409
+
11410
+
11411
+
11412
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
11413
+
11414
+
11415
+
11416
+
11417
  ...adapter_model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 640MB / 640MB 
11418
+
11419
+
11420
+
11421
+
11422
+
11423
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11424
+
11425
+
11426
+
11427
+
11428
+
11429
+
11430
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
11431
+
11432
+
11433
+
11434
+
11435
+
11436
+
11437
+
11438
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11439
+
11440
+
11441
+
11442
+
11443
+
11444
+
11445
+
11446
+
11447
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11448
+
11449
+
11450
+
11451
+
11452
+
11453
+
11454
+
11455
+
11456
+
11457
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11458
+
11459
+
11460
+
11461
+
11462
+
11463
+
11464
+
11465
+
11466
+
11467
+
11468
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11469
+
11470
+
11471
+
11472
+
11473
+
11474
+
11475
+
11476
+
11477
+
11478
+
11479
+
11480
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11481
+
11482
+
11483
  ...adapter_model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 640MB / 640MB 
11484
+
11485
+
11486
+
11487
  ...ward_panels_train_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 342kB / 342kB 
11488
+
11489
+
11490
+
11491
+
11492
  ...adapter_model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 640MB / 640MB 
11493
+
11494
+
11495
+
11496
+
11497
+
11498
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11499
+
11500
+
11501
+
11502
+
11503
+
11504
+
11505
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
11506
+
11507
+
11508
+
11509
+
11510
+
11511
+
11512
+
11513
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11514
+
11515
+
11516
+
11517
+
11518
+
11519
+
11520
+
11521
+
11522
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11523
+
11524
+
11525
+
11526
+
11527
+
11528
+
11529
+
11530
+
11531
+
11532
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11533
+
11534
+
11535
+
11536
+
11537
+
11538
+
11539
+
11540
+
11541
+
11542
+
11543
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11544
+
11545
+
11546
+
11547
+
11548
+
11549
+
11550
+
11551
+
11552
+
11553
+
11554
+
11555
  [+ 3 files] : 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.61MB / 2.61MB 
11556
+
11557
+
11558
+
11559
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11560
+
11561
+
11562
+
11563
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
11564
+
11565
+
11566
+
11567
+
11568
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11569
+
11570
+
11571
+
11572
+
11573
+
11574
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11575
+
11576
+
11577
+
11578
+
11579
+
11580
+
11581
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11582
+
11583
+
11584
+
11585
+
11586
+
11587
+
11588
+
11589
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11590
+
11591
+
11592
+
11593
+
11594
+
11595
+
11596
+
11597
+
11598
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11599
+
11600
+
11601
+
11602
+
11603
+
11604
+
11605
+
11606
+
11607
+
11608
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB 
11609
+
11610
+
11611
+
11612
+
11613
+
11614
+
11615
+
11616
+
11617
+
11618
+
11619
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB 
11620
+
11621
+
11622
+
11623
+
11624
+
11625
+
11626
+
11627
+
11628
+
11629
+
11630
+
11631
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB 
11632
+
11633
+
11634
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11635
+
11636
+
11637
+
11638
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
11639
+
11640
+
11641
+
11642
+
11643
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11644
+
11645
+
11646
+
11647
+
11648
+
11649
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11650
+
11651
+
11652
+
11653
+
11654
+
11655
+
11656
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11657
+
11658
+
11659
+
11660
+
11661
+
11662
+
11663
+
11664
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11665
+
11666
+
11667
+
11668
+
11669
+
11670
+
11671
+
11672
+
11673
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11674
+
11675
+
11676
+
11677
+
11678
+
11679
+
11680
+
11681
+
11682
+
11683
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB 
11684
+
11685
+
11686
+
11687
+
11688
+
11689
+
11690
+
11691
+
11692
+
11693
+
11694
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB 
11695
+
11696
+
11697
+
11698
+
11699
+
11700
+
11701
+
11702
+
11703
+
11704
+
11705
+
11706
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB 
11707
+
11708
+
11709
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11710
+
11711
+
11712
+
11713
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
11714
+
11715
+
11716
+
11717
+
11718
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11719
+
11720
+
11721
+
11722
+
11723
+
11724
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11725
+
11726
+
11727
+
11728
+
11729
+
11730
+
11731
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11732
+
11733
+
11734
+
11735
+
11736
+
11737
+
11738
+
11739
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11740
+
11741
+
11742
+
11743
+
11744
+
11745
+
11746
+
11747
+
11748
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11749
+
11750
+
11751
+
11752
+
11753
+
11754
+
11755
+
11756
+
11757
+
11758
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB 
11759
+
11760
+
11761
+
11762
+
11763
+
11764
+
11765
+
11766
+
11767
+
11768
+
11769
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB 
11770
+
11771
+
11772
+
11773
+
11774
+
11775
+
11776
+
11777
+
11778
+
11779
+
11780
+
11781
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB 
11782
+
11783
+
11784
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11785
+
11786
+
11787
+
11788
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB 
11789
+
11790
+
11791
+
11792
+
11793
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11794
+
11795
+
11796
+
11797
+
11798
+
11799
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11800
+
11801
+
11802
+
11803
+
11804
+
11805
+
11806
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11807
+
11808
+
11809
+
11810
+
11811
+
11812
+
11813
+
11814
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB 
11815
+
11816
+
11817
+
11818
+
11819
+
11820
+
11821
+
11822
+
11823
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB 
11824
+
11825
+
11826
+
11827
+
11828
+
11829
+
11830
+
11831
+
11832
+
11833
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB 
11834
+
11835
+
11836
+
11837
+
11838
+
11839
+
11840
+
11841
+
11842
+
11843
+
11844
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB 
11845
+
11846
+
11847
+
11848
+
11849
+
11850
+
11851
+
11852
+
11853
+
11854
+
11855
+
11856
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB 
11857
+
11858
+
11859
  ...unt_adherence_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
11860
+
11861
  ...409/all_generations.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 614MB / 614MB
11862
+
11863
  ..._arabic_clean_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
11864
+
11865
  .../reward_meter_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
11866
+
11867
  ...tal_composite_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
11868
+
11869
  ...epeat_penalty_debug.jsonl: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 106MB / 106MB
11870
+
11871
  ...11_223409/tokenizer.model: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.23MB / 1.23MB
11872
+
11873
  ...ts/meter_by_meter_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 754kB / 754kB
11874
+
11875
  ...ard_panels_eval_chain.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 318kB / 318kB
11876
+
11877
  ...eward_panels_eval_run.png: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 310kB / 310kB