kangdawei committed on
Commit
1fe3afb
·
verified ·
1 Parent(s): 468868e

Training in progress, step 500

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83f6e433e6707b91809656a1e7cba206a4da91466f5c6ca3ccef9a19f985d279
3
  size 3554214752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afd9333507eed970c20ed3a3c435ac53593432de3be813e6cf1b138c06a438b7
3
  size 3554214752
reward_data/all_rewards.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3a245404d28266d115b4c6fe39b8bb677ce1b309ec7fbc38d7475274529a491
3
- size 390127795
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:555b53d2bae2130eeadb5f522c7a4cd2ce8d7192f3becead04e946f9c40ed721
3
+ size 407266796
reward_plots/advantage_plot_step_450.png ADDED
reward_plots/advantage_plot_step_460.png ADDED
reward_plots/advantage_plot_step_470.png ADDED
reward_plots/advantage_plot_step_480.png ADDED
reward_plots/advantage_plot_step_490.png ADDED
reward_plots/reward_comparison_step_450.png ADDED
reward_plots/reward_comparison_step_460.png ADDED
reward_plots/reward_comparison_step_470.png ADDED
reward_plots/reward_comparison_step_480.png ADDED
reward_plots/reward_comparison_step_490.png ADDED
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a22fc1d522a0b79c9b8f3177e4ca4948438e8211a9c52684b08a9001db881319
3
  size 8504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90f11d4fd97b2eca8c10ca216d8a817cb13fbf9aacf4df10df7ebeed7606d514
3
  size 8504