Compare commits

..

No commits in common. "81916d20eef75766aeae71b9487fd615017b0413" and "4e134ddf6f3b0065014c45e6c864cc7cf4bf34ad" have entirely different histories.

3 changed files with 61 additions and 85 deletions

View File

@@ -2,10 +2,10 @@
language: en language: en
tags: tags:
- tapas - tapas
- table-question-answering - question-answering
license: apache-2.0 license: apache-2.0
datasets: datasets:
- msr_sqa - sqa
--- ---
# TAPAS base model fine-tuned on Sequential Question Answering (SQA) # TAPAS base model fine-tuned on Sequential Question Answering (SQA)
@@ -19,23 +19,6 @@ The other (non-default) version which can be used is:
Disclaimer: The team releasing TAPAS did not write a model card for this model so this model card has been written by Disclaimer: The team releasing TAPAS did not write a model card for this model so this model card has been written by
the Hugging Face team and contributors. the Hugging Face team and contributors.
## Results on SQA - Dev Accuracy
Size | Reset | Dev Accuracy | Link
-------- | --------| -------- | ----
LARGE | noreset | 0.7223 | [tapas-large-finetuned-sqa (absolute pos embeddings)](https://huggingface.co/google/tapas-large-finetuned-sqa/tree/no_reset)
LARGE | reset | 0.7289 | [tapas-large-finetuned-sqa](https://huggingface.co/google/tapas-large-finetuned-sqa/tree/main)
**BASE** | **noreset** | **0.6737** | [tapas-base-finetuned-sqa (absolute pos embeddings)](https://huggingface.co/google/tapas-base-finetuned-sqa/tree/no_reset)
**BASE** | **reset** | **0.6874** | [tapas-base-finetuned-sqa](https://huggingface.co/google/tapas-base-finetuned-sqa/tree/main)
MEDIUM | noreset | 0.6464 | [tapas-medium-finetuned-sqa (absolute pos embeddings)](https://huggingface.co/google/tapas-medium-finetuned-sqa/tree/no_reset)
MEDIUM | reset | 0.6561 | [tapas-medium-finetuned-sqa](https://huggingface.co/google/tapas-medium-finetuned-sqa/tree/main)
SMALL | noreset | 0.5876 | [tapas-small-finetuned-sqa (absolute pos embeddings)](https://huggingface.co/google/tapas-small-finetuned-sqa/tree/no_reset)
SMALL | reset | 0.6155 | [tapas-small-finetuned-sqa](https://huggingface.co/google/tapas-small-finetuned-sqa/tree/main)
MINI | noreset | 0.4574 | [tapas-mini-finetuned-sqa (absolute pos embeddings)](https://huggingface.co/google/tapas-mini-finetuned-sqa/tree/no_reset)
MINI | reset | 0.5148 | [tapas-mini-finetuned-sqa](https://huggingface.co/google/tapas-mini-finetuned-sqa/tree/main)
TINY | noreset | 0.2004 | [tapas-tiny-finetuned-sqa (absolute pos embeddings)](https://huggingface.co/google/tapas-tiny-finetuned-sqa/tree/no_reset)
TINY | reset | 0.2375 | [tapas-tiny-finetuned-sqa](https://huggingface.co/google/tapas-tiny-finetuned-sqa/tree/main)
## Model description ## Model description
TAPAS is a BERT-like transformers model pretrained on a large corpus of English data from Wikipedia in a self-supervised fashion. TAPAS is a BERT-like transformers model pretrained on a large corpus of English data from Wikipedia in a self-supervised fashion.

View File

@@ -1,63 +1,59 @@
{ {
"_name_or_path": "google/tapas-base-finetuned-sqa", "aggregation_loss_weight": 1.0,
"aggregation_labels": null, "aggregation_temperature": 1.0,
"aggregation_loss_weight": 1.0, "allow_empty_column_selection": false,
"aggregation_temperature": 1.0, "answer_loss_cutoff": null,
"allow_empty_column_selection": false, "answer_loss_importance": 1.0,
"answer_loss_cutoff": null, "architectures": [
"answer_loss_importance": 1.0, "TapasForQuestionAnswering"
"architectures": [ ],
"TapasForQuestionAnswering" "attention_probs_dropout_prob": 0.1,
], "average_approximation_function": "ratio",
"attention_probs_dropout_prob": 0.1, "average_logits_per_cell": false,
"average_approximation_function": "ratio", "cell_selection_preference": null,
"average_logits_per_cell": false, "disable_per_token_loss": false,
"cell_selection_preference": null, "gradient_checkpointing": false,
"disable_per_token_loss": false, "hidden_act": "gelu",
"gradient_checkpointing": false, "hidden_dropout_prob": 0.1,
"hidden_act": "gelu", "hidden_size": 768,
"hidden_dropout_prob": 0.1, "huber_loss_delta": null,
"hidden_size": 768, "init_cell_selection_weights_to_zero": false,
"huber_loss_delta": null, "initializer_range": 0.02,
"init_cell_selection_weights_to_zero": false, "intermediate_size": 3072,
"initializer_range": 0.02, "layer_norm_eps": 1e-12,
"intermediate_size": 3072, "max_num_columns": 32,
"layer_norm_eps": 1e-12, "max_num_rows": 64,
"max_num_columns": 32, "max_position_embeddings": 1024,
"max_num_rows": 64, "model_type": "tapas",
"max_position_embeddings": 1024, "num_aggregation_labels": 0,
"model_type": "tapas", "num_attention_heads": 12,
"no_aggregation_label_index": null, "num_hidden_layers": 12,
"num_aggregation_labels": 0, "pad_token_id": 0,
"num_attention_heads": 12, "positive_label_weight": 10.0,
"num_hidden_layers": 12, "reset_position_index_per_cell": true,
"pad_token_id": 0, "select_one_column": true,
"positive_label_weight": 10.0, "softmax_temperature": 1.0,
"reset_position_index_per_cell": true, "type_vocab_size": [
"select_one_column": true, 3,
"softmax_temperature": 1.0, 256,
"transformers_version": "4.13.0.dev0", 256,
"type_vocab_size": [ 2,
3, 256,
256, 256,
256, 10
2, ],
256, "type_vocab_sizes": [
256, 3,
10 256,
], 256,
"type_vocab_sizes": [ 2,
3, 256,
256, 256,
256, 10
2, ],
256, "use_answer_as_supervision": null,
256, "use_gumbel_for_aggregation": false,
10 "use_gumbel_for_cells": false,
], "use_normalized_answer_loss": false,
"use_answer_as_supervision": null, "vocab_size": 30522
"use_gumbel_for_aggregation": false, }
"use_gumbel_for_cells": false,
"use_normalized_answer_loss": false,
"vocab_size": 30522
}

BIN
tf_model.h5 (Stored with Git LFS)

Binary file not shown.