{
  "pred_head_dropout_prob": 0.1,
  "attention_probs_dropout_prob": 0.1,
  "finetuning_task": null,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "image_feat_size": 768,
  "image_prob_size": 1000,
  "angle_feat_size": 4,
  "obj_feat_size": 768,
  "obj_prob_size": 1000,
  "img_feature_type": "imagenet",
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "num_l_layers": 9,
  "num_x_layers": 4,
  "num_pano_layers": 2,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "max_action_steps": 100,
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "num_labels": 2,
  "output_attentions": false,
  "output_hidden_states": false,
  "pruned_heads": {},
  "torchscript": false,
  "type_vocab_size": 2,
  "update_lang_bert": true,
  "vocab_size": 30522,
  "use_lang2visn_attn": true,
  "graph_sprels": true,
  "glocal_fuse": true,
  "lang_bert_name": "bert-base-uncased"
}