Update activation dropout

This commit is contained in:
Qian Liu 2022-02-24 12:53:15 +00:00 committed by huggingface-web
parent e195be4528
commit a1180b7b52
1 changed file with 73 additions and 74 deletions

View File

@@ -1,74 +1,73 @@
{ {
"_name_or_path": "tapex-base", "_name_or_path": "bart-base",
"activation_dropout": 0.1, "activation_dropout": 0.0,
"activation_function": "gelu", "activation_function": "gelu",
"add_bias_logits": false, "add_bias_logits": false,
"add_final_layer_norm": false, "add_final_layer_norm": false,
"architectures": [ "architectures": [
"BartModel" "BartModel"
], ],
"attention_dropout": 0.1, "attention_dropout": 0.1,
"bos_token_id": 0, "bos_token_id": 0,
"classif_dropout": 0.1, "classifier_dropout": 0.0,
"classifier_dropout": 0.0, "d_model": 768,
"d_model": 768, "decoder_attention_heads": 12,
"decoder_attention_heads": 12, "decoder_ffn_dim": 3072,
"decoder_ffn_dim": 3072, "decoder_layerdrop": 0.0,
"decoder_layerdrop": 0.0, "decoder_layers": 6,
"decoder_layers": 6, "decoder_start_token_id": 2,
"decoder_start_token_id": 2, "dropout": 0.1,
"dropout": 0.1, "early_stopping": true,
"early_stopping": true, "encoder_attention_heads": 12,
"encoder_attention_heads": 12, "encoder_ffn_dim": 3072,
"encoder_ffn_dim": 3072, "encoder_layerdrop": 0.0,
"encoder_layerdrop": 0.0, "encoder_layers": 6,
"encoder_layers": 6, "eos_token_id": 2,
"eos_token_id": 2, "forced_eos_token_id": 2,
"forced_eos_token_id": 2, "gradient_checkpointing": false,
"gradient_checkpointing": false, "id2label": {
"id2label": { "0": "LABEL_0",
"0": "LABEL_0", "1": "LABEL_1",
"1": "LABEL_1", "2": "LABEL_2"
"2": "LABEL_2" },
}, "init_std": 0.02,
"init_std": 0.02, "is_encoder_decoder": true,
"is_encoder_decoder": true, "label2id": {
"label2id": { "LABEL_0": 0,
"LABEL_0": 0, "LABEL_1": 1,
"LABEL_1": 1, "LABEL_2": 2
"LABEL_2": 2 },
}, "max_position_embeddings": 1024,
"max_position_embeddings": 1024, "model_type": "bart",
"model_type": "bart", "no_repeat_ngram_size": 3,
"no_repeat_ngram_size": 3, "normalize_before": false,
"normalize_before": false, "normalize_embedding": true,
"normalize_embedding": true, "num_beams": 4,
"num_beams": 4, "num_hidden_layers": 6,
"num_hidden_layers": 6, "pad_token_id": 1,
"pad_token_id": 1, "scale_embedding": false,
"scale_embedding": false, "task_specific_params": {
"task_specific_params": { "summarization": {
"summarization": { "length_penalty": 1.0,
"length_penalty": 1.0, "max_length": 128,
"max_length": 128, "min_length": 12,
"min_length": 12, "num_beams": 4
"num_beams": 4 },
}, "summarization_cnn": {
"summarization_cnn": { "length_penalty": 2.0,
"length_penalty": 2.0, "max_length": 142,
"max_length": 142, "min_length": 56,
"min_length": 56, "num_beams": 4
"num_beams": 4 },
}, "summarization_xsum": {
"summarization_xsum": { "length_penalty": 1.0,
"length_penalty": 1.0, "max_length": 62,
"max_length": 62, "min_length": 11,
"min_length": 11, "num_beams": 6
"num_beams": 6 }
} },
}, "torch_dtype": "float32",
"torch_dtype": "float32", "transformers_version": "4.12.0.dev0",
"transformers_version": "4.12.0.dev0", "use_cache": true,
"use_cache": true, "vocab_size": 50265
"vocab_size": 50265 }
}