Initial commit

This commit is contained in:
Rubèn Tito 2023-02-21 07:57:14 +00:00 committed by huggingface-web
parent 10269d43c0
commit 803eaf825d
8 changed files with 150558 additions and 0 deletions

40
config.json Normal file
View File

@ -0,0 +1,40 @@
{
"_name_or_path": "microsoft/layoutlmv3-base",
"architectures": [
"LayoutLMv3ForQuestionAnswering"
],
"attention_probs_dropout_prob": 0.1,
"bos_token_id": 0,
"classifier_dropout": null,
"coordinate_size": 128,
"eos_token_id": 2,
"has_relative_attention_bias": true,
"has_spatial_attention_bias": true,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"initializer_range": 0.02,
"input_size": 224,
"intermediate_size": 3072,
"layer_norm_eps": 1e-05,
"max_2d_position_embeddings": 1024,
"max_position_embeddings": 514,
"max_rel_2d_pos": 256,
"max_rel_pos": 128,
"model_type": "layoutlmv3",
"num_attention_heads": 12,
"num_channels": 3,
"num_hidden_layers": 12,
"pad_token_id": 1,
"patch_size": 16,
"rel_2d_pos_bins": 64,
"rel_pos_bins": 32,
"second_input_size": 112,
"shape_size": 128,
"text_embed": true,
"torch_dtype": "float32",
"transformers_version": "4.21.3",
"type_vocab_size": 1,
"visual_embed": true,
"vocab_size": 50265
}

50001
merges.txt Normal file

File diff suppressed because it is too large Load Diff

20
preprocessor_config.json Normal file
View File

@ -0,0 +1,20 @@
{
"apply_ocr": false,
"do_normalize": true,
"do_resize": true,
"feature_extractor_type": "LayoutLMv3FeatureExtractor",
"image_mean": [
0.5,
0.5,
0.5
],
"image_std": [
0.5,
0.5,
0.5
],
"ocr_lang": null,
"processor_class": "LayoutLMv3Processor",
"resample": 2,
"size": 224
}

BIN
pytorch_model.bin (Stored with Git LFS) Normal file

Binary file not shown.

51
special_tokens_map.json Normal file
View File

@ -0,0 +1,51 @@
{
"bos_token": {
"content": "<s>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"cls_token": {
"content": "<s>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"eos_token": {
"content": "</s>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"mask_token": {
"content": "<mask>",
"lstrip": true,
"normalized": true,
"rstrip": false,
"single_word": false
},
"pad_token": {
"content": "<pad>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"sep_token": {
"content": "</s>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"unk_token": {
"content": "<unk>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
}
}

100355
tokenizer.json Normal file

File diff suppressed because it is too large Load Diff

87
tokenizer_config.json Normal file
View File

@ -0,0 +1,87 @@
{
"add_prefix_space": true,
"apply_ocr": false,
"bos_token": {
"__type": "AddedToken",
"content": "<s>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"cls_token": {
"__type": "AddedToken",
"content": "<s>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"cls_token_box": [
0,
0,
0,
0
],
"eos_token": {
"__type": "AddedToken",
"content": "</s>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"errors": "replace",
"mask_token": {
"__type": "AddedToken",
"content": "<mask>",
"lstrip": true,
"normalized": true,
"rstrip": false,
"single_word": false
},
"model_max_length": 512,
"name_or_path": "microsoft/layoutlmv3-base",
"only_label_first_subword": true,
"pad_token": {
"__type": "AddedToken",
"content": "<pad>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"pad_token_box": [
0,
0,
0,
0
],
"pad_token_label": -100,
"processor_class": "LayoutLMv3Processor",
"sep_token": {
"__type": "AddedToken",
"content": "</s>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
},
"sep_token_box": [
0,
0,
0,
0
],
"special_tokens_map_file": null,
"tokenizer_class": "LayoutLMv3Tokenizer",
"trim_offsets": true,
"unk_token": {
"__type": "AddedToken",
"content": "<unk>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
}
}

1
vocab.json Normal file

File diff suppressed because one or more lines are too long