{ "action_in_proj_cfg": { "_target_": "alpamayo_r1.models.action_in_proj.PerWaypointActionInProjV2", "hidden_size": 512, "max_freq": 100.0, "num_enc_layers": 2, "num_fourier_feats": 20 }, "action_out_proj_cfg": { "_target_": "torch.nn.Linear" }, "action_space_cfg": { "_target_": "alpamayo_r1.action_space.UnicycleAccelCurvatureActionSpace", "a_lambda": 0.0001, "a_ridge": 0.0001, "accel_bounds": [ -9.8, 9.8 ], "accel_mean": 0.02902694707164455, "accel_std": 0.6810426736454882, "curvature_bounds": [ -0.33, 0.33 ], "curvature_mean": 0.0002692167976330542, "curvature_std": 0.026148280660833106, "dt": 0.1, "kappa_lambda": 0.0001, "kappa_ridge": 0.0001, "n_waypoints": 64, "theta_lambda": 1e-06, "theta_ridge": 1e-08, "v_lambda": 1e-06, "v_ridge": 0.0001 }, "add_special_tokens": true, "architectures": [ "AlpamayoR1" ], "attn_implementation": "flash_attention_2", "diffusion_cfg": { "_target_": "alpamayo_r1.diffusion.flow_matching.FlowMatching", "int_method": "euler", "x_dims": "???" }, "dtype": "bfloat16", "expert_cfg": { "dtype": "bfloat16", "head_dim": 128, "hidden_size": 2048, "intermediate_size": 8256, "num_attention_heads": 16 }, "expert_non_causal_attention": true, "hist_traj_tokenizer_cfg": { "_target_": "alpamayo_r1.models.delta_tokenizer.DeltaTrajectoryTokenizer" }, "keep_same_dtype": true, "max_pixels": 196608, "min_pixels": 163840, "model_dtype": "bfloat16", "model_type": "alpamayo_r1", "tokens_per_future_traj": 128, "tokens_per_history_traj": 48, "traj_token_ids": { "future": 155685, "future_end": 155683, "future_start": 155681, "history": 155684, "history_end": 155676, "history_start": 155674 }, "traj_token_start_idx": 151669, "traj_tokenizer_cfg": { "_recursive_": false, "_target_": "alpamayo_r1.action_space.discrete_action_space.DiscreteTrajectoryTokenizer", "action_space_cfg": { "_target_": "alpamayo_r1.action_space.UnicycleAccelCurvatureActionSpace", "a_lambda": 0.0001, "a_ridge": 0.0001, "accel_bounds": [ -9.8, 9.8 ], "accel_mean": 0.02902694707164455, "accel_std": 0.6810426736454882, "curvature_bounds": [ -0.33, 0.33 ], "curvature_mean": 0.0002692167976330542, "curvature_std": 0.026148280660833106, "dt": 0.1, "kappa_lambda": 0.0001, "kappa_ridge": 0.0001, "n_waypoints": 64, "theta_lambda": 1e-06, "theta_ridge": 1e-08, "v_lambda": 1e-06, "v_ridge": 0.0001 }, "dims_max": [ 10, 10 ], "dims_min": [ -10, -10 ], "num_bins": 3000 }, "traj_vocab_size": 4000, "transformers_version": "4.57.1", "vlm_backend": "qwenvl3", "vocab_size": 155697 }