diff --git a/config.json b/config.json new file mode 100644 index 0000000..4f2b30f --- /dev/null +++ b/config.json @@ -0,0 +1,38 @@ +{ + "architectures": [ + "LongformerForQuestionAnswering" + ], + "attention_mode": "longformer", + "attention_probs_dropout_prob": 0.1, + "attention_window": [ + 512, + 512, + 512, + 512, + 512, + 512, + 512, + 512, + 512, + 512, + 512, + 512 + ], + "bos_token_id": 0, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "ignore_attention_mask": false, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 4098, + "model_type": "longformer", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "pad_token_id": 1, + "sep_token_id": 2, + "type_vocab_size": 1, + "vocab_size": 50265 +}