Compare commits

...

10 Commits

Author SHA1 Message Date
Joao Gante 8d8ffc158a Adding generation config file(s) 2023-01-24 16:42:49 +00:00
lewtun c4455b515a Add evaluation results on the 3.0.0 config of cnn_dailymail (#5)
- Add evaluation results on the 3.0.0 config of cnn_dailymail (0a2da9e6569b4095d580a2f3089a505b03ad6d0a)
- Merge branch 'main' into pr/5 (32e122dd99389517fdae89aa8fd85127cb72617f)


Co-authored-by: Evaluation Bot <autoevaluator@users.noreply.huggingface.co>
2022-08-17 13:20:35 +00:00
lewtun b047d6a04d Add evaluation results on xsum dataset (#2)
- Add evaluation results on xsum dataset (5607f0182d43ebd582201f345d8167e2d0921260)
- Merge branch 'main' into pr/2 (dddd426cc6b2832527019a254827ecca1a8f3dfb)


Co-authored-by: Evaluation Bot <autoevaluator@users.noreply.huggingface.co>
2022-08-17 13:02:38 +00:00
lewtun 5a17152529 Add evaluation results on samsum dataset (#1)
- Add evaluation results on samsum dataset (81814d81846806cad273e3cd251efbd0f0ef1848)


Co-authored-by: Evaluation Bot <autoevaluator@users.noreply.huggingface.co>
2022-08-17 12:53:41 +00:00
patil-suraj a0aa5531c0 add flax model 2021-09-14 07:25:41 +00:00
Anthony Moi 2e5571fec5
Update tokenizer.json
Fixes a bug with offset tracking: https://github.com/huggingface/transformers/issues/9637
2021-02-01 12:39:02 -05:00
Patrick von Platen ef6460fcf1 upload model 2021-01-10 18:55:22 +00:00
Patrick von Platen 02a9253be8 Update special_tokens_map.json 2020-11-25 22:47:35 +00:00
Patrick von Platen b6b67ab33a Pegasus has word mask token called "MASK2" in paper 2020-11-25 22:42:44 +00:00
system 48d7b60021 Update config.json 2020-09-13 22:31:16 +00:00
7 changed files with 133 additions and 2 deletions

1
.gitattributes vendored
View File

@@ -6,3 +6,4 @@
*.tar.gz filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text

102
README.md
View File

@@ -2,6 +2,108 @@
language: en
tags:
- summarization
model-index:
- name: google/pegasus-xsum
results:
- task:
type: summarization
name: Summarization
dataset:
name: samsum
type: samsum
config: samsum
split: train
metrics:
- name: ROUGE-1
type: rouge
value: 21.8096
verified: true
- name: ROUGE-2
type: rouge
value: 4.2525
verified: true
- name: ROUGE-L
type: rouge
value: 17.4469
verified: true
- name: ROUGE-LSUM
type: rouge
value: 18.8907
verified: true
- name: loss
type: loss
value: 3.0317161083221436
verified: true
- name: gen_len
type: gen_len
value: 20.3122
verified: true
- task:
type: summarization
name: Summarization
dataset:
name: xsum
type: xsum
config: default
split: test
metrics:
- name: ROUGE-1
type: rouge
value: 46.8623
verified: true
- name: ROUGE-2
type: rouge
value: 24.4533
verified: true
- name: ROUGE-L
type: rouge
value: 39.0548
verified: true
- name: ROUGE-LSUM
type: rouge
value: 39.0994
verified: true
- name: loss
type: loss
value: 1.5717021226882935
verified: true
- name: gen_len
type: gen_len
value: 22.8821
verified: true
- task:
type: summarization
name: Summarization
dataset:
name: cnn_dailymail
type: cnn_dailymail
config: 3.0.0
split: test
metrics:
- name: ROUGE-1
type: rouge
value: 22.2062
verified: true
- name: ROUGE-2
type: rouge
value: 7.6701
verified: true
- name: ROUGE-L
type: rouge
value: 15.4046
verified: true
- name: ROUGE-LSUM
type: rouge
value: 19.2182
verified: true
- name: loss
type: loss
value: 2.681241273880005
verified: true
- name: gen_len
type: gen_len
value: 25.0234
verified: true
---
### Pegasus Models

config.json
View File

@@ -1,4 +1,5 @@
{
"_name_or_path": "./",
"activation_dropout": 0.1,
"activation_function": "relu",
"add_bias_logits": false,
@@ -9,18 +10,24 @@
"attention_dropout": 0.1,
"bos_token_id": 0,
"classif_dropout": 0.0,
"classifier_dropout": 0.0,
"d_model": 1024,
"decoder_attention_heads": 16,
"decoder_ffn_dim": 4096,
"decoder_layerdrop": 0.0,
"decoder_layers": 16,
"decoder_start_token_id": 0,
"do_blenderbot_90_layernorm": false,
"dropout": 0.1,
"encoder_attention_heads": 16,
"encoder_ffn_dim": 4096,
"encoder_layerdrop": 0.0,
"encoder_layers": 16,
"eos_token_id": 1,
"extra_pos_embeddings": 1,
"extra_pos_embeddings": 0,
"force_bos_token_to_be_generated": false,
"forced_eos_token_id": 1,
"gradient_checkpointing": false,
"id2label": {
"0": "LABEL_0",
"1": "LABEL_1",
@@ -33,7 +40,7 @@
"LABEL_1": 1,
"LABEL_2": 2
},
- "length_penalty": 0.8,
+ "length_penalty": 0.6,
"max_length": 64,
"max_position_embeddings": 512,
"model_type": "pegasus",
@@ -44,5 +51,7 @@
"pad_token_id": 0,
"scale_embedding": true,
"static_position_embeddings": true,
"transformers_version": "4.11.0.dev0",
"use_cache": true,
"vocab_size": 96103
}

BIN
flax_model.msgpack (Stored with Git LFS) Normal file

Binary file not shown.

12
generation_config.json Normal file
View File

@@ -0,0 +1,12 @@
{
"_from_model_config": true,
"bos_token_id": 0,
"decoder_start_token_id": 0,
"eos_token_id": 1,
"forced_eos_token_id": 1,
"length_penalty": 0.6,
"max_length": 64,
"num_beams": 8,
"pad_token_id": 0,
"transformers_version": "4.27.0.dev0"
}

BIN
tf_model.h5 (Stored with Git LFS) Normal file

Binary file not shown.

1
tokenizer.json Normal file

File diff suppressed because one or more lines are too long