Upload exp_phase8_reasoning_grounded_rl_t1_r128_alpha1_s2_20260506_203542/best.pt with huggingface_hub 47f1043 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_FIXED_BIGLR_gspo_FIXED_BIGLR_20260506_045433/best.pt with huggingface_hub 56bc1f0 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_FIXED_1k_gspo_FIXED_1k_20260506_041329/best.pt with huggingface_hub 32e1ed2 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_FIXED_1k_gspo_FIXED_1k_20260506_041329/best.pt with huggingface_hub 7447eba verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_BIGLR_s2_gspo_BIGLR_s2_20260506_035116/best.pt with huggingface_hub ff3ce22 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_BIGLR_s2_gspo_BIGLR_s2_20260506_035116/best.pt with huggingface_hub 18512fc verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_BIGLR_gspo_BIGLR_20260506_033533/best.pt with huggingface_hub 7c0723f verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_BIGLR_gspo_BIGLR_20260506_033533/best.pt with huggingface_hub fcdfad4 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_BIGLR_1k_gspo_BIGLR_1k_20260506_035238/best.pt with huggingface_hub aa09b98 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_gspo_BIGLR_1k_gspo_BIGLR_1k_20260506_035238/best.pt with huggingface_hub d46b22b verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_grpo_BIGLR_grpo_BIGLR_20260506_035116/best.pt with huggingface_hub 74f9bb2 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_grpo_BIGLR_grpo_BIGLR_20260506_035116/best.pt with huggingface_hub a575289 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_dapo_BIGLR_s2_dapo_BIGLR_s2_20260506_042733/best.pt with huggingface_hub 254eb23 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_dapo_BIGLR_s2_dapo_BIGLR_s2_20260506_042733/best.pt with huggingface_hub 09dbd6e verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_dapo_BIGLR_dapo_BIGLR_20260506_035116/best.pt with huggingface_hub c3955a6 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_dapo_BIGLR_dapo_BIGLR_20260506_035116/best.pt with huggingface_hub 7e0eecf verified explcre commited on 11 days ago
Upload exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s2_par_20260506_221253/log.jsonl with huggingface_hub c66ff97 verified explcre commited on 11 days ago
Upload exp_phase8_reasoning_grounded_rl_t1_r128_alpha1_s2_20260506_203542/log.jsonl with huggingface_hub f658d35 verified explcre commited on 11 days ago
Upload exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s2_par_20260506_221253/best.pt with huggingface_hub 211cd8f verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_dapo_BIGLR_1k_dapo_BIGLR_1k_20260506_035301/best.pt with huggingface_hub 0588aba verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pb_dapo_BIGLR_1k_dapo_BIGLR_1k_20260506_035301/best.pt with huggingface_hub 5b710b8 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s3_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub 3d3fa1d verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s3_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub 914a444 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s3_20260506_125416/motif_score_postRL_multinom_t1.5.json with huggingface_hub 8e1581a verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s3_20260506_125416/motif_score_postRL_multinom_t1.5.json with huggingface_hub 193317a verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s2_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub 91f50b5 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s2_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub 7083b6e verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s2_20260506_125416/motif_score_postRL_multinom_t1.5.json with huggingface_hub 7e71b84 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s2_20260506_125416/motif_score_postRL_multinom_t1.5.json with huggingface_hub 4f4fd8a verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_grpo_20260506_125418/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub d22bb5c verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_grpo_20260506_125418/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub 40eb93a verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_grpo_20260506_125418/motif_score_postRL_multinom_t1.5.json with huggingface_hub 99dd475 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_grpo_20260506_125418/motif_score_postRL_multinom_t1.5.json with huggingface_hub cd547e4 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_dapo_s2_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub ec17908 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_dapo_s2_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub d84bc9a verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_dapo_s2_20260506_125416/motif_score_postRL_multinom_t1.5.json with huggingface_hub 3d39b48 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_dapo_s2_20260506_125416/motif_score_postRL_multinom_t1.5.json with huggingface_hub 8d257f9 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_dapo_20260506_125418/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub 47e6c90 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_dapo_20260506_125418/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub c8102aa verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_dapo_20260506_125418/motif_score_postRL_multinom_t1.5.json with huggingface_hub 11375e8 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_dapo_20260506_125418/motif_score_postRL_multinom_t1.5.json with huggingface_hub e464dd3 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_20260506_124633/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub 2fff47e verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_20260506_124633/motif_score_postRL_multinom_t1.5_AUDIT.json with huggingface_hub ef55af8 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_20260506_124633/motif_score_postRL_multinom_t1.5.json with huggingface_hub 84157e8 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_20260506_124633/motif_score_postRL_multinom_t1.5.json with huggingface_hub 533c2a2 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s3_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.md with huggingface_hub dfd761e verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s3_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.md with huggingface_hub 04d3fd8 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s3_20260506_125416/motif_score_postRL_multinom_t1.5.md with huggingface_hub a8bf318 verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s3_20260506_125416/motif_score_postRL_multinom_t1.5.md with huggingface_hub 464eb2f verified explcre commited on 11 days ago
Upload cycle_70_lab_L0/exp_rl_pathb_650m_FULL_AUDIT_gspo_s2_20260506_125416/motif_score_postRL_multinom_t1.5_AUDIT.md with huggingface_hub 358acb2 verified explcre commited on 11 days ago