gpt2vla-tiny / config.json
jellyho's picture
Update config.json
e6b58a9 verified
{
"BC": true,
"action_dim": null,
"action_len": null,
"action_levels": 2,
"action_vocab_size": 256,
"activation_function": "gelu_new",
"attn_pdrop": 0.1,
"backbone_layers": -1,
"bos_token_id": 50256,
"ema_freq": 5,
"ema_tau": 0.005,
"embd_pdrop": 0.1,
"eos_token_id": 50256,
"gamma": 0.98,
"global_normalization": null,
"image_encoder_hidden_dim": 512,
"image_size": null,
"initializer_range": 0.02,
"layer_norm_epsilon": 1e-05,
"model_type": "GPT2VLA",
"n_embd": 128,
"n_head": 4,
"n_inner": 512,
"n_layer": 3,
"n_positions": 1024,
"normalization": null,
"postprocess_logits": "sigmoid",
"q_loss_fn": "mse",
"reorder_and_upcast_attn": false,
"resid_pdrop": 0.1,
"scale_attn_by_inverse_layer_idx": false,
"scale_attn_weights": true,
"sentence_encoder_hidden_dim": 384,
"state_dim": null,
"stopping_token": "|",
"summary_activation": null,
"summary_first_dropout": 0.1,
"summary_proj_to_labels": true,
"summary_type": "cls_index",
"summary_use_proj": true,
"tokenizer": "FAST",
"tokenizer_path": "physical-intelligence/fast",
"transformers_version": "4.50.0.dev0",
"use_cache": true,
"use_dual_q_head": false,
"use_ema": false,
"use_mc_returns": true,
"use_new_q_head": false,
"use_state": true,
"vocab_size": 50257,
"vocab_start": null
}