winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_80_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 19, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_5e-06_beta_0_80_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 19, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_6400_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_160_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_3840_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 1
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_11520_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_1280_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_12800_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_320_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_2560_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_10240_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_5120_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_640_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_7680_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-06_beta_0_8960_all_37_epoch_1_layer_all Text Generation • 8B • Updated Nov 17, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_7680_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_6400_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_12800_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_8960_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_5120_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_320_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_1280_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_80_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_11520_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 1
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_2560_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_640_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_3840_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_10240_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 2
winnieyangwannan/entity_grpo_Llama-3.1-8B-Instruct_lora_0_lr_1e-05_beta_0_160_all_37_epoch_3_layer_all Text Generation • 8B • Updated Nov 16, 2025 • 1
winnieyangwannan/evwc_Qwen2.5-VL-7B-Instruct_mlp-down_pnas_layer_18_6_all_37_0.001_1280_15 Image-Text-to-Text • 8B • Updated Sep 23, 2025 • 2