Pramodith committed on
Commit
121a6c0
·
verified ·
1 Parent(s): a0a2655

Uploaded using `kernel-builder`.

Browse files
Files changed (1) hide show
  1. README.md +6 -6
README.md CHANGED
@@ -285,40 +285,40 @@ shape, mean over 100 iterations. Baseline runs once after warmup.
285
 
286
  <picture>
287
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/bnpo_loss_eager/bnpo_loss_eager_dark_animation.svg">
288
- <img width="80%" src="benchmark_results/bnpo_loss_eager/bnpo_loss_eager_light_animation.svg" alt="BNPO loss latency vs eager PyTorch">
289
  </picture>
290
 
291
  ### BNPO Loss vs torch.compile
292
 
293
  <picture>
294
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/bnpo_loss_compiled/bnpo_loss_compiled_dark_animation.svg">
295
- <img width="80%" src="benchmark_results/bnpo_loss_compiled/bnpo_loss_compiled_light_animation.svg" alt="BNPO loss latency vs torch.compile">
296
  </picture>
297
 
298
  ### GRPO Loss vs eager PyTorch
299
 
300
  <picture>
301
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/grpo_loss_eager/grpo_loss_eager_dark_animation.svg">
302
- <img width="80%" src="benchmark_results/grpo_loss_eager/grpo_loss_eager_light_animation.svg" alt="GRPO loss latency vs eager PyTorch">
303
  </picture>
304
 
305
  ### GRPO Loss vs torch.compile
306
 
307
  <picture>
308
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/grpo_loss_compiled/grpo_loss_compiled_dark_animation.svg">
309
- <img width="80%" src="benchmark_results/grpo_loss_compiled/grpo_loss_compiled_light_animation.svg" alt="GRPO loss latency vs torch.compile">
310
  </picture>
311
 
312
  ### Reverse KL vs eager PyTorch
313
 
314
  <picture>
315
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/reverse_kl_eager/reverse_kl_eager_dark_animation.svg">
316
- <img width="80%" src="benchmark_results/reverse_kl_eager/reverse_kl_eager_light_animation.svg" alt="Reverse KL latency vs eager PyTorch">
317
  </picture>
318
 
319
  ### Reverse KL vs torch.compile
320
 
321
  <picture>
322
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/reverse_kl_compiled/reverse_kl_compiled_dark_animation.svg">
323
- <img width="80%" src="benchmark_results/reverse_kl_compiled/reverse_kl_compiled_light_animation.svg" alt="Reverse KL latency vs torch.compile">
324
  </picture>
 
285
 
286
  <picture>
287
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/bnpo_loss_eager/bnpo_loss_eager_dark_animation.svg">
288
+ <img width="90%" src="benchmark_results/bnpo_loss_eager/bnpo_loss_eager_light_animation.svg" alt="BNPO loss latency vs eager PyTorch">
289
  </picture>
290
 
291
  ### BNPO Loss vs torch.compile
292
 
293
  <picture>
294
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/bnpo_loss_compiled/bnpo_loss_compiled_dark_animation.svg">
295
+ <img width="90%" src="benchmark_results/bnpo_loss_compiled/bnpo_loss_compiled_light_animation.svg" alt="BNPO loss latency vs torch.compile">
296
  </picture>
297
 
298
  ### GRPO Loss vs eager PyTorch
299
 
300
  <picture>
301
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/grpo_loss_eager/grpo_loss_eager_dark_animation.svg">
302
+ <img width="90%" src="benchmark_results/grpo_loss_eager/grpo_loss_eager_light_animation.svg" alt="GRPO loss latency vs eager PyTorch">
303
  </picture>
304
 
305
  ### GRPO Loss vs torch.compile
306
 
307
  <picture>
308
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/grpo_loss_compiled/grpo_loss_compiled_dark_animation.svg">
309
+ <img width="90%" src="benchmark_results/grpo_loss_compiled/grpo_loss_compiled_light_animation.svg" alt="GRPO loss latency vs torch.compile">
310
  </picture>
311
 
312
  ### Reverse KL vs eager PyTorch
313
 
314
  <picture>
315
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/reverse_kl_eager/reverse_kl_eager_dark_animation.svg">
316
+ <img width="90%" src="benchmark_results/reverse_kl_eager/reverse_kl_eager_light_animation.svg" alt="Reverse KL latency vs eager PyTorch">
317
  </picture>
318
 
319
  ### Reverse KL vs torch.compile
320
 
321
  <picture>
322
  <source media="(prefers-color-scheme: dark)" srcset="benchmark_results/reverse_kl_compiled/reverse_kl_compiled_dark_animation.svg">
323
+ <img width="90%" src="benchmark_results/reverse_kl_compiled/reverse_kl_compiled_light_animation.svg" alt="Reverse KL latency vs torch.compile">
324
  </picture>