diff --git a/config.json b/config.json new file mode 100644 index 0000000..032298d --- /dev/null +++ b/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "/home/patrick/hugging_face/t5/t5-v1_1-base", + "architectures": [ + "T5ForConditionalGeneration" + ], + "d_ff": 2048, + "d_kv": 64, + "d_model": 768, + "decoder_start_token_id": 0, + "dropout_rate": 0.1, + "eos_token_id": 1, + "feed_forward_proj": "gated-gelu", + "initializer_factor": 1.0, + "is_encoder_decoder": true, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "num_decoder_layers": 12, + "num_heads": 12, + "num_layers": 12, + "output_past": true, + "pad_token_id": 0, + "relative_attention_num_buckets": 32, + "tie_word_embeddings": false, + "vocab_size": 32128 +} diff --git a/pytorch_model.bin b/pytorch_model.bin new file mode 100644 index 0000000..259426a --- /dev/null +++ b/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d51351caeff6b750968985458a25b74622657f492c01cc62dbf3a61074725eb +size 990441433 diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..881bdbf --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1 @@ +{"eos_token": "", "unk_token": "", "pad_token": "", "additional_special_tokens": ["", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", ""]} \ No newline at end of file diff --git a/spiece.model b/spiece.model new file mode 100644 index 0000000..4e28ff6 Binary files /dev/null and b/spiece.model differ diff --git a/tf_model.h5 b/tf_model.h5 new file mode 100644 index 0000000..3cfd332 --- /dev/null +++ b/tf_model.h5 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda737bfc489aa0a81619c4f3bb42768e777dd55197127662cef4afb60cbec5d +size 990878928 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..b114c31 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1 @@ +{"eos_token": "", "unk_token": "", "pad_token": "", "extra_ids": 100, "additional_special_tokens": ["", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", "", ""], "model_max_length": 512, "name_or_path": "t5-small"} \ No newline at end of file