Compare commits
10 Commits
cb696e15ff
...
8d8ffc158a
Author | SHA1 | Date |
---|---|---|
|
8d8ffc158a | |
|
c4455b515a | |
|
b047d6a04d | |
|
5a17152529 | |
|
a0aa5531c0 | |
|
2e5571fec5 | |
|
ef6460fcf1 | |
|
02a9253be8 | |
|
b6b67ab33a | |
|
48d7b60021 |
|
@ -6,3 +6,4 @@
|
|||
*.tar.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
|
|
102
README.md
102
README.md
|
@ -2,6 +2,108 @@
|
|||
language: en
|
||||
tags:
|
||||
- summarization
|
||||
model-index:
|
||||
- name: google/pegasus-xsum
|
||||
results:
|
||||
- task:
|
||||
type: summarization
|
||||
name: Summarization
|
||||
dataset:
|
||||
name: samsum
|
||||
type: samsum
|
||||
config: samsum
|
||||
split: train
|
||||
metrics:
|
||||
- name: ROUGE-1
|
||||
type: rouge
|
||||
value: 21.8096
|
||||
verified: true
|
||||
- name: ROUGE-2
|
||||
type: rouge
|
||||
value: 4.2525
|
||||
verified: true
|
||||
- name: ROUGE-L
|
||||
type: rouge
|
||||
value: 17.4469
|
||||
verified: true
|
||||
- name: ROUGE-LSUM
|
||||
type: rouge
|
||||
value: 18.8907
|
||||
verified: true
|
||||
- name: loss
|
||||
type: loss
|
||||
value: 3.0317161083221436
|
||||
verified: true
|
||||
- name: gen_len
|
||||
type: gen_len
|
||||
value: 20.3122
|
||||
verified: true
|
||||
- task:
|
||||
type: summarization
|
||||
name: Summarization
|
||||
dataset:
|
||||
name: xsum
|
||||
type: xsum
|
||||
config: default
|
||||
split: test
|
||||
metrics:
|
||||
- name: ROUGE-1
|
||||
type: rouge
|
||||
value: 46.8623
|
||||
verified: true
|
||||
- name: ROUGE-2
|
||||
type: rouge
|
||||
value: 24.4533
|
||||
verified: true
|
||||
- name: ROUGE-L
|
||||
type: rouge
|
||||
value: 39.0548
|
||||
verified: true
|
||||
- name: ROUGE-LSUM
|
||||
type: rouge
|
||||
value: 39.0994
|
||||
verified: true
|
||||
- name: loss
|
||||
type: loss
|
||||
value: 1.5717021226882935
|
||||
verified: true
|
||||
- name: gen_len
|
||||
type: gen_len
|
||||
value: 22.8821
|
||||
verified: true
|
||||
- task:
|
||||
type: summarization
|
||||
name: Summarization
|
||||
dataset:
|
||||
name: cnn_dailymail
|
||||
type: cnn_dailymail
|
||||
config: 3.0.0
|
||||
split: test
|
||||
metrics:
|
||||
- name: ROUGE-1
|
||||
type: rouge
|
||||
value: 22.2062
|
||||
verified: true
|
||||
- name: ROUGE-2
|
||||
type: rouge
|
||||
value: 7.6701
|
||||
verified: true
|
||||
- name: ROUGE-L
|
||||
type: rouge
|
||||
value: 15.4046
|
||||
verified: true
|
||||
- name: ROUGE-LSUM
|
||||
type: rouge
|
||||
value: 19.2182
|
||||
verified: true
|
||||
- name: loss
|
||||
type: loss
|
||||
value: 2.681241273880005
|
||||
verified: true
|
||||
- name: gen_len
|
||||
type: gen_len
|
||||
value: 25.0234
|
||||
verified: true
|
||||
---
|
||||
|
||||
### Pegasus Models
|
||||
|
|
13
config.json
13
config.json
|
@ -1,4 +1,5 @@
|
|||
{
|
||||
"_name_or_path": "./",
|
||||
"activation_dropout": 0.1,
|
||||
"activation_function": "relu",
|
||||
"add_bias_logits": false,
|
||||
|
@ -9,18 +10,24 @@
|
|||
"attention_dropout": 0.1,
|
||||
"bos_token_id": 0,
|
||||
"classif_dropout": 0.0,
|
||||
"classifier_dropout": 0.0,
|
||||
"d_model": 1024,
|
||||
"decoder_attention_heads": 16,
|
||||
"decoder_ffn_dim": 4096,
|
||||
"decoder_layerdrop": 0.0,
|
||||
"decoder_layers": 16,
|
||||
"decoder_start_token_id": 0,
|
||||
"do_blenderbot_90_layernorm": false,
|
||||
"dropout": 0.1,
|
||||
"encoder_attention_heads": 16,
|
||||
"encoder_ffn_dim": 4096,
|
||||
"encoder_layerdrop": 0.0,
|
||||
"encoder_layers": 16,
|
||||
"eos_token_id": 1,
|
||||
"extra_pos_embeddings": 1,
|
||||
"extra_pos_embeddings": 0,
|
||||
"force_bos_token_to_be_generated": false,
|
||||
"forced_eos_token_id": 1,
|
||||
"gradient_checkpointing": false,
|
||||
"id2label": {
|
||||
"0": "LABEL_0",
|
||||
"1": "LABEL_1",
|
||||
|
@ -33,7 +40,7 @@
|
|||
"LABEL_1": 1,
|
||||
"LABEL_2": 2
|
||||
},
|
||||
"length_penalty": 0.8,
|
||||
"length_penalty": 0.6,
|
||||
"max_length": 64,
|
||||
"max_position_embeddings": 512,
|
||||
"model_type": "pegasus",
|
||||
|
@ -44,5 +51,7 @@
|
|||
"pad_token_id": 0,
|
||||
"scale_embedding": true,
|
||||
"static_position_embeddings": true,
|
||||
"transformers_version": "4.11.0.dev0",
|
||||
"use_cache": true,
|
||||
"vocab_size": 96103
|
||||
}
|
||||
|
|
Binary file not shown.
|
@ -0,0 +1,12 @@
|
|||
{
|
||||
"_from_model_config": true,
|
||||
"bos_token_id": 0,
|
||||
"decoder_start_token_id": 0,
|
||||
"eos_token_id": 1,
|
||||
"forced_eos_token_id": 1,
|
||||
"length_penalty": 0.6,
|
||||
"max_length": 64,
|
||||
"num_beams": 8,
|
||||
"pad_token_id": 0,
|
||||
"transformers_version": "4.27.0.dev0"
|
||||
}
|
Binary file not shown.
File diff suppressed because one or more lines are too long
Loading…
Reference in New Issue