From 918ad376364058dee23512629bc385380c98e57d Mon Sep 17 00:00:00 2001 From: valhalla Date: Tue, 15 Mar 2022 14:34:01 +0100 Subject: [PATCH] add TF model --- config.json | 14 +++++++++----- tf_model.h5 | 3 +++ 2 files changed, 12 insertions(+), 5 deletions(-) create mode 100644 tf_model.h5 diff --git a/config.json b/config.json index 05e8cf2..614ae4f 100644 --- a/config.json +++ b/config.json @@ -13,24 +13,28 @@ "model_type": "gptj", "n_embd": 4096, "n_head": 16, + "n_inner": null, "n_layer": 28, "n_positions": 2048, + "resid_pdrop": 0.0, "rotary": true, "rotary_dim": 64, + "scale_attn_weights": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "summary_type": "cls_index", "summary_use_proj": true, - "transformers_version": "4.10.0.dev0", - "tokenizer_class": "GPT2Tokenizer", "task_specific_params": { "text-generation": { "do_sample": true, - "temperature": 1.0, - "max_length": 50 + "max_length": 50, + "temperature": 1.0 } }, + "tie_word_embeddings": false, + "tokenizer_class": "GPT2Tokenizer", + "transformers_version": "4.18.0.dev0", "use_cache": true, "vocab_size": 50400 -} \ No newline at end of file +} diff --git a/tf_model.h5 b/tf_model.h5 new file mode 100644 index 0000000..dbcc9b1 --- /dev/null +++ b/tf_model.h5 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99958d6ecfdab80e1feaa577a0750e247ed5129984f91d819aeac4bd5c9fb08 +size 24203955064