chinese_llama_vicuna_tokenizer/config.json

25 lines
586 B
JSON
Raw Normal View History

2023-06-08 10:45:26 +00:00
{
2023-06-08 11:02:11 +00:00
"_name_or_path": "decapoda-research/llama-7b-hf",
2023-06-08 10:45:26 +00:00
"architectures": [
2023-06-08 11:02:11 +00:00
"LLaMAForCausalLM"
2023-06-08 10:45:26 +00:00
],
2023-06-08 11:02:11 +00:00
"bos_token_id": 0,
"eos_token_id": 1,
"hidden_act": "silu",
2023-06-08 10:45:26 +00:00
"hidden_size": 4096,
2023-06-08 11:02:11 +00:00
"initializer_range": 0.02,
"intermediate_size": 11008,
"max_position_embeddings": 2048,
2023-06-08 10:45:26 +00:00
"max_sequence_length": 2048,
2023-06-08 11:02:11 +00:00
"model_type": "llama",
2023-06-08 10:45:26 +00:00
"num_attention_heads": 32,
2023-06-08 11:02:11 +00:00
"num_hidden_layers": 32,
"pad_token_id": -1,
"rms_norm_eps": 1e-06,
"tie_word_embeddings": false,
2023-06-08 10:45:26 +00:00
"torch_dtype": "float16",
"transformers_version": "4.29.2",
"use_cache": true,
2023-06-08 11:02:11 +00:00
"vocab_size": 32000
2023-06-08 10:45:26 +00:00
}