From 899fa3ee8006648e3597110c9de1ccce285694ff Mon Sep 17 00:00:00 2001 From: Moritz Laurer Date: Sun, 5 Dec 2021 16:18:20 +0000 Subject: [PATCH] add model --- config.json | 45 +++++++++++++++++++++++++++++++++++++++++++++ pytorch_model.bin | 3 +++ 2 files changed, 48 insertions(+) create mode 100644 config.json create mode 100644 pytorch_model.bin diff --git a/config.json b/config.json new file mode 100644 index 0000000..57806d1 --- /dev/null +++ b/config.json @@ -0,0 +1,45 @@ +{ + "_name_or_path": "./results/nli-few-shot/xnli/mDeBERTa-v3-base/mDeBERTa-v3-base-mnli-xnli", + "architectures": [ + "DebertaV2ForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "entailment", + "1": "neutral", + "2": "contradiction" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "contradiction": 2, + "entailment": 0, + "neutral": 1 + }, + "layer_norm_eps": 1e-07, + "max_position_embeddings": 512, + "max_relative_positions": -1, + "model_type": "deberta-v2", + "norm_rel_ebd": "layer_norm", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "pad_token_id": 0, + "pooler_dropout": 0, + "pooler_hidden_act": "gelu", + "pooler_hidden_size": 768, + "pos_att_type": [ + "p2c", + "c2p" + ], + "position_biased_input": false, + "position_buckets": 256, + "relative_attention": true, + "share_att_key": true, + "torch_dtype": "float32", + "transformers_version": "4.12.5", + "type_vocab_size": 0, + "vocab_size": 251000 +} diff --git a/pytorch_model.bin b/pytorch_model.bin new file mode 100644 index 0000000..552c334 --- /dev/null +++ b/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41a7c036b017f7daf61250807dd8c7c8d66c84859e02da02083ec3178939d026 +size 1115330795