diff --git a/config.json b/config.json index 0738121..b294553 100644 --- a/config.json +++ b/config.json @@ -1,4 +1,5 @@ { + "_name_or_path": "opt-1.3b", "activation_dropout": 0.0, "activation_function": "relu", "architectures": [ @@ -6,23 +7,22 @@ ], "attention_dropout": 0.0, "bos_token_id": 2, - "hidden_size": 2048, "do_layer_norm_before": true, "dropout": 0.1, "eos_token_id": 2, "ffn_dim": 8192, - + "hidden_size": 2048, "init_std": 0.02, "layerdrop": 0.0, "max_position_embeddings": 2048, + "model_type": "opt", "num_attention_heads": 32, "num_hidden_layers": 24, "pad_token_id": 1, + "prefix": "", "torch_dtype": "float16", - "transformers_version": "4.19.0.dev0", - + "transformers_version": "4.20.0.dev0", "use_cache": true, "vocab_size": 50272, - "word_embed_proj_dim": 2048, - "prefix": "" + "word_embed_proj_dim": 2048 } diff --git a/tf_model.h5 b/tf_model.h5 index 54ccb14..d7a3f79 100644 --- a/tf_model.h5 +++ b/tf_model.h5 @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cab5d1b7b11900213091184b559d3201ddaeaa4a2c12bef4ae14a90ceee7113c -size 5263424312 +oid sha256:774f854fb3f9f6723cfec007648e34f33457144ebdbd0b361a6edbef2777f371 +size 2631916344