diff --git a/config.json b/config.json new file mode 100644 index 0000000..d82497e --- /dev/null +++ b/config.json @@ -0,0 +1,26 @@ +{ + "activation_dropout": 0.0, + "activation_function": "relu", + "architectures": [ + "OPTModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "d_model": 2048, + "do_layer_norm_before": true, + "dropout": 0.1, + "eos_token_id": 2, + "ffn_dim": 8192, + "init_std": 0.02, + "layerdrop": 0.0, + "max_position_embeddings": 2048, + "model_type": "opt", + "num_attention_heads": 32, + "num_hidden_layers": 24, + "pad_token_id": 1, + "torch_dtype": "float16", + "transformers_version": "4.19.0.dev0", + "use_cache": true, + "vocab_size": 50272, + "word_embed_proj_dim": 2048 +} diff --git a/pytorch_model.bin b/pytorch_model.bin new file mode 100644 index 0000000..e9aab1c --- /dev/null +++ b/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b777a0670f416a2dde4075ace465cb0e453df30d2ef0a674b8b8486c013e2000 +size 2631628157