Safetensors
alpamayo_r1
Alpamayo-R1-10B / config.json
BorisIvanovic's picture
Update config.json (#2)
fdf4c01 verified
{
"action_in_proj_cfg": {
"_target_": "alpamayo_r1.models.action_in_proj.PerWaypointActionInProjV2",
"hidden_size": 512,
"max_freq": 100.0,
"num_enc_layers": 2,
"num_fourier_feats": 20
},
"action_out_proj_cfg": {
"_target_": "torch.nn.Linear"
},
"action_space_cfg": {
"_target_": "alpamayo_r1.action_space.UnicycleAccelCurvatureActionSpace",
"a_lambda": 0.0001,
"a_ridge": 0.0001,
"accel_bounds": [
-9.8,
9.8
],
"accel_mean": 0.02902694707164455,
"accel_std": 0.6810426736454882,
"curvature_bounds": [
-0.33,
0.33
],
"curvature_mean": 0.0002692167976330542,
"curvature_std": 0.026148280660833106,
"dt": 0.1,
"kappa_lambda": 0.0001,
"kappa_ridge": 0.0001,
"n_waypoints": 64,
"theta_lambda": 1e-06,
"theta_ridge": 1e-08,
"v_lambda": 1e-06,
"v_ridge": 0.0001
},
"add_special_tokens": true,
"architectures": [
"AlpamayoR1"
],
"attn_implementation": "flash_attention_2",
"diffusion_cfg": {
"_target_": "alpamayo_r1.diffusion.flow_matching.FlowMatching",
"int_method": "euler",
"x_dims": "???"
},
"dtype": "bfloat16",
"expert_cfg": {
"dtype": "bfloat16",
"head_dim": 128,
"hidden_size": 2048,
"intermediate_size": 8256,
"num_attention_heads": 16
},
"expert_non_causal_attention": true,
"hist_traj_tokenizer_cfg": {
"_target_": "alpamayo_r1.models.delta_tokenizer.DeltaTrajectoryTokenizer"
},
"keep_same_dtype": true,
"max_pixels": 196608,
"min_pixels": 163840,
"model_dtype": "bfloat16",
"model_type": "alpamayo_r1",
"tokens_per_future_traj": 128,
"tokens_per_history_traj": 48,
"traj_token_ids": {
"future": 155685,
"future_end": 155683,
"future_start": 155681,
"history": 155684,
"history_end": 155676,
"history_start": 155674
},
"traj_token_start_idx": 151669,
"traj_tokenizer_cfg": {
"_recursive_": false,
"_target_": "alpamayo_r1.action_space.discrete_action_space.DiscreteTrajectoryTokenizer",
"action_space_cfg": {
"_target_": "alpamayo_r1.action_space.UnicycleAccelCurvatureActionSpace",
"a_lambda": 0.0001,
"a_ridge": 0.0001,
"accel_bounds": [
-9.8,
9.8
],
"accel_mean": 0.02902694707164455,
"accel_std": 0.6810426736454882,
"curvature_bounds": [
-0.33,
0.33
],
"curvature_mean": 0.0002692167976330542,
"curvature_std": 0.026148280660833106,
"dt": 0.1,
"kappa_lambda": 0.0001,
"kappa_ridge": 0.0001,
"n_waypoints": 64,
"theta_lambda": 1e-06,
"theta_ridge": 1e-08,
"v_lambda": 1e-06,
"v_ridge": 0.0001
},
"dims_max": [
10,
10
],
"dims_min": [
-10,
-10
],
"num_bins": 3000
},
"traj_vocab_size": 4000,
"transformers_version": "4.57.1",
"vlm_backend": "qwenvl3",
"vocab_size": 155697
}