diff --git a/config.json b/config.json index 405ba56..2de7319 100644 --- a/config.json +++ b/config.json @@ -1,4 +1,5 @@ { + "_name_or_path": "./", "activation_dropout": 0.1, "activation_function": "relu", "add_bias_logits": false, @@ -9,18 +10,23 @@ "attention_dropout": 0.1, "bos_token_id": 0, "classif_dropout": 0.0, + "classifier_dropout": 0.0, "d_model": 1024, "decoder_attention_heads": 16, "decoder_ffn_dim": 4096, "decoder_layerdrop": 0.0, "decoder_layers": 16, + "decoder_start_token_id": 0, + "do_blenderbot_90_layernorm": false, "dropout": 0.1, "encoder_attention_heads": 16, "encoder_ffn_dim": 4096, "encoder_layerdrop": 0.0, "encoder_layers": 16, "eos_token_id": 1, - "extra_pos_embeddings": 1, + "extra_pos_embeddings": 0, + "force_bos_token_to_be_generated": false, + "gradient_checkpointing": false, "id2label": { "0": "LABEL_0", "1": "LABEL_1", @@ -44,5 +50,7 @@ "pad_token_id": 0, "scale_embedding": true, "static_position_embeddings": true, + "transformers_version": "4.2.0dev0", + "use_cache": true, "vocab_size": 96103 } diff --git a/tf_model.h5 b/tf_model.h5 new file mode 100644 index 0000000..f70cb47 --- /dev/null +++ b/tf_model.h5 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4411d0ec75cc3504b3081e190d4fc52b0fe4a42f2f1cde4b016202c8355905bd +size 2279695208