openvla-maniskill / config.json
P1oris's picture
Upload config
f33bdd1 verified
raw
history blame
3.37 kB
{
"arch_specifier": "no-align+fused-gelu-mlp",
"auto_map": {
"AutoConfig": "configuration_prismatic.OpenVLAConfig"
},
"hf_llm_id": "meta-llama/Llama-2-7b-hf",
"image_resize_strategy": "resize-naive",
"image_sizes": [
224,
224
],
"llm_backbone_id": "llama2-7b-pure",
"llm_max_length": 2048,
"model_type": "openvla",
"n_action_bins": 256,
"norm_stats": {
"maniskill_push_cube": {
"action": {
"mask": [
true,
true,
true,
true,
true,
true,
false
],
"max": [
0.47712400555610657,
0.2541411817073822,
0.04444180056452751,
0.924456000328064,
0.5537124276161194,
0.5364292860031128,
-0.18357177078723907
],
"mean": [
0.017237788066267967,
0.0016865554498508573,
-0.08430713415145874,
-0.0007431917474605143,
-0.025497792288661003,
-0.0010811244137585163,
-0.9999881982803345
],
"min": [
-0.2606317400932312,
-0.2698182761669159,
-0.5802842974662781,
-0.05909932777285576,
-0.8009798526763916,
-0.18609920144081116,
-1.0
],
"q01": [
-0.20719055607914924,
-0.14252015054225922,
-0.29591195851564406,
-0.036601713225245476,
-0.2631440430879593,
-0.0376842637732625,
-1.0
],
"q99": [
0.20013775676488874,
0.1397389918565747,
0.008089204132556885,
0.02753601264208554,
0.1532172134518619,
0.04092058923095453,
-1.0
],
"std": [
0.09168525040149689,
0.04248384013772011,
0.08058354258537292,
0.010035122744739056,
0.08161655068397522,
0.012614610604941845,
0.003108547069132328
]
},
"num_trajectories": 999,
"num_transitions": 68978,
"proprio": {
"max": [
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0
],
"mean": [
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0
],
"min": [
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0
],
"q01": [
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0
],
"q99": [
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0
],
"std": [
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0
]
}
}
},
"output_projector_states": false,
"pad_to_multiple_of": 64,
"pad_token_id": 32000,
"text_config": {
"model_type": "llama"
},
"timm_model_ids": [
"vit_large_patch14_reg4_dinov2.lvd142m",
"vit_so400m_patch14_siglip_224"
],
"timm_override_act_layers": [
null,
null
],
"torch_dtype": "bfloat16",
"transformers_version": "4.46.2",
"use_fused_vision_backbone": true,
"vision_backbone_id": "dinosiglip-vit-so-224px"
}