{
  "action_in_proj_cfg": {
    "_target_": "alpamayo_r1.models.action_in_proj.PerWaypointActionInProjV2",
    "hidden_size": 512,
    "max_freq": 100.0,
    "num_enc_layers": 2,
    "num_fourier_feats": 20
  },
  "action_out_proj_cfg": {
    "_target_": "torch.nn.Linear"
  },
  "action_space_cfg": {
    "_target_": "alpamayo_r1.action_space.UnicycleAccelCurvatureActionSpace",
    "a_lambda": 0.0001,
    "a_ridge": 0.0001,
    "accel_bounds": [
      -9.8,
      9.8
    ],
    "accel_mean": 0.02902694707164455,
    "accel_std": 0.6810426736454882,
    "curvature_bounds": [
      -0.33,
      0.33
    ],
    "curvature_mean": 0.0002692167976330542,
    "curvature_std": 0.026148280660833106,
    "dt": 0.1,
    "kappa_lambda": 0.0001,
    "kappa_ridge": 0.0001,
    "n_waypoints": 64,
    "theta_lambda": 1e-06,
    "theta_ridge": 1e-08,
    "v_lambda": 1e-06,
    "v_ridge": 0.0001
  },
  "add_special_tokens": true,
  "architectures": [
    "AlpamayoR1"
  ],
  "attn_implementation": null,
  "diffusion_cfg": {
    "_target_": "alpamayo_r1.diffusion.flow_matching.FlowMatching",
    "int_method": "euler",
    "x_dims": "???"
  },
  "dtype": "float16",
  "expert_cfg": {
    "dtype": "bfloat16",
    "head_dim": 128,
    "hidden_size": 2048,
    "intermediate_size": 8256,
    "num_attention_heads": 16
  },
  "expert_non_causal_attention": true,
  "hist_traj_tokenizer_cfg": {
    "_target_": "alpamayo_r1.models.delta_tokenizer.DeltaTrajectoryTokenizer"
  },
  "keep_same_dtype": true,
  "max_pixels": 196608,
  "min_pixels": 163840,
  "model_dtype": "bfloat16",
  "model_type": "alpamayo_r1",
  "quantization_config": {
    "_load_in_4bit": true,
    "_load_in_8bit": false,
    "bnb_4bit_compute_dtype": "float32",
    "bnb_4bit_quant_storage": "uint8",
    "bnb_4bit_quant_type": "fp4",
    "bnb_4bit_use_double_quant": false,
    "llm_int8_enable_fp32_cpu_offload": false,
    "llm_int8_has_fp16_weight": false,
    "llm_int8_skip_modules": null,
    "llm_int8_threshold": 6.0,
    "load_in_4bit": true,
    "load_in_8bit": false,
    "quant_method": "bitsandbytes"
  },
  "tokens_per_future_traj": 128,
  "tokens_per_history_traj": 48,
  "traj_token_ids": {
    "future": 155685,
    "future_end": 155683,
    "future_start": 155681,
    "history": 155684,
    "history_end": 155676,
    "history_start": 155674
  },
  "traj_token_start_idx": 151669,
  "traj_tokenizer_cfg": {
    "_recursive_": false,
    "_target_": "alpamayo_r1.action_space.discrete_action_space.DiscreteTrajectoryTokenizer",
    "action_space_cfg": {
      "_target_": "alpamayo_r1.action_space.UnicycleAccelCurvatureActionSpace",
      "a_lambda": 0.0001,
      "a_ridge": 0.0001,
      "accel_bounds": [
        -9.8,
        9.8
      ],
      "accel_mean": 0.02902694707164455,
      "accel_std": 0.6810426736454882,
      "curvature_bounds": [
        -0.33,
        0.33
      ],
      "curvature_mean": 0.0002692167976330542,
      "curvature_std": 0.026148280660833106,
      "dt": 0.1,
      "kappa_lambda": 0.0001,
      "kappa_ridge": 0.0001,
      "n_waypoints": 64,
      "theta_lambda": 1e-06,
      "theta_ridge": 1e-08,
      "v_lambda": 1e-06,
      "v_ridge": 0.0001
    },
    "dims_max": [
      10,
      10
    ],
    "dims_min": [
      -10,
      -10
    ],
    "num_bins": 3000
  },
  "traj_vocab_size": 4000,
  "transformers_version": "4.57.3",
  "vlm_backend": "qwenvl3",
  "vlm_name_or_path": "Qwen/Qwen3-VL-8B-Instruct",
  "vocab_size": 155697
}