Compare commits
10 Commits
cb696e15ff
...
8d8ffc158a
Author | SHA1 | Date |
---|---|---|
|
8d8ffc158a | |
|
c4455b515a | |
|
b047d6a04d | |
|
5a17152529 | |
|
a0aa5531c0 | |
|
2e5571fec5 | |
|
ef6460fcf1 | |
|
02a9253be8 | |
|
b6b67ab33a | |
|
48d7b60021 |
|
@ -6,3 +6,4 @@
|
||||||
*.tar.gz filter=lfs diff=lfs merge=lfs -text
|
*.tar.gz filter=lfs diff=lfs merge=lfs -text
|
||||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||||
|
|
102
README.md
102
README.md
|
@ -2,6 +2,108 @@
|
||||||
language: en
|
language: en
|
||||||
tags:
|
tags:
|
||||||
- summarization
|
- summarization
|
||||||
|
model-index:
|
||||||
|
- name: google/pegasus-xsum
|
||||||
|
results:
|
||||||
|
- task:
|
||||||
|
type: summarization
|
||||||
|
name: Summarization
|
||||||
|
dataset:
|
||||||
|
name: samsum
|
||||||
|
type: samsum
|
||||||
|
config: samsum
|
||||||
|
split: train
|
||||||
|
metrics:
|
||||||
|
- name: ROUGE-1
|
||||||
|
type: rouge
|
||||||
|
value: 21.8096
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-2
|
||||||
|
type: rouge
|
||||||
|
value: 4.2525
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-L
|
||||||
|
type: rouge
|
||||||
|
value: 17.4469
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-LSUM
|
||||||
|
type: rouge
|
||||||
|
value: 18.8907
|
||||||
|
verified: true
|
||||||
|
- name: loss
|
||||||
|
type: loss
|
||||||
|
value: 3.0317161083221436
|
||||||
|
verified: true
|
||||||
|
- name: gen_len
|
||||||
|
type: gen_len
|
||||||
|
value: 20.3122
|
||||||
|
verified: true
|
||||||
|
- task:
|
||||||
|
type: summarization
|
||||||
|
name: Summarization
|
||||||
|
dataset:
|
||||||
|
name: xsum
|
||||||
|
type: xsum
|
||||||
|
config: default
|
||||||
|
split: test
|
||||||
|
metrics:
|
||||||
|
- name: ROUGE-1
|
||||||
|
type: rouge
|
||||||
|
value: 46.8623
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-2
|
||||||
|
type: rouge
|
||||||
|
value: 24.4533
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-L
|
||||||
|
type: rouge
|
||||||
|
value: 39.0548
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-LSUM
|
||||||
|
type: rouge
|
||||||
|
value: 39.0994
|
||||||
|
verified: true
|
||||||
|
- name: loss
|
||||||
|
type: loss
|
||||||
|
value: 1.5717021226882935
|
||||||
|
verified: true
|
||||||
|
- name: gen_len
|
||||||
|
type: gen_len
|
||||||
|
value: 22.8821
|
||||||
|
verified: true
|
||||||
|
- task:
|
||||||
|
type: summarization
|
||||||
|
name: Summarization
|
||||||
|
dataset:
|
||||||
|
name: cnn_dailymail
|
||||||
|
type: cnn_dailymail
|
||||||
|
config: 3.0.0
|
||||||
|
split: test
|
||||||
|
metrics:
|
||||||
|
- name: ROUGE-1
|
||||||
|
type: rouge
|
||||||
|
value: 22.2062
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-2
|
||||||
|
type: rouge
|
||||||
|
value: 7.6701
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-L
|
||||||
|
type: rouge
|
||||||
|
value: 15.4046
|
||||||
|
verified: true
|
||||||
|
- name: ROUGE-LSUM
|
||||||
|
type: rouge
|
||||||
|
value: 19.2182
|
||||||
|
verified: true
|
||||||
|
- name: loss
|
||||||
|
type: loss
|
||||||
|
value: 2.681241273880005
|
||||||
|
verified: true
|
||||||
|
- name: gen_len
|
||||||
|
type: gen_len
|
||||||
|
value: 25.0234
|
||||||
|
verified: true
|
||||||
---
|
---
|
||||||
|
|
||||||
### Pegasus Models
|
### Pegasus Models
|
||||||
|
|
13
config.json
13
config.json
|
@ -1,4 +1,5 @@
|
||||||
{
|
{
|
||||||
|
"_name_or_path": "./",
|
||||||
"activation_dropout": 0.1,
|
"activation_dropout": 0.1,
|
||||||
"activation_function": "relu",
|
"activation_function": "relu",
|
||||||
"add_bias_logits": false,
|
"add_bias_logits": false,
|
||||||
|
@ -9,18 +10,24 @@
|
||||||
"attention_dropout": 0.1,
|
"attention_dropout": 0.1,
|
||||||
"bos_token_id": 0,
|
"bos_token_id": 0,
|
||||||
"classif_dropout": 0.0,
|
"classif_dropout": 0.0,
|
||||||
|
"classifier_dropout": 0.0,
|
||||||
"d_model": 1024,
|
"d_model": 1024,
|
||||||
"decoder_attention_heads": 16,
|
"decoder_attention_heads": 16,
|
||||||
"decoder_ffn_dim": 4096,
|
"decoder_ffn_dim": 4096,
|
||||||
"decoder_layerdrop": 0.0,
|
"decoder_layerdrop": 0.0,
|
||||||
"decoder_layers": 16,
|
"decoder_layers": 16,
|
||||||
|
"decoder_start_token_id": 0,
|
||||||
|
"do_blenderbot_90_layernorm": false,
|
||||||
"dropout": 0.1,
|
"dropout": 0.1,
|
||||||
"encoder_attention_heads": 16,
|
"encoder_attention_heads": 16,
|
||||||
"encoder_ffn_dim": 4096,
|
"encoder_ffn_dim": 4096,
|
||||||
"encoder_layerdrop": 0.0,
|
"encoder_layerdrop": 0.0,
|
||||||
"encoder_layers": 16,
|
"encoder_layers": 16,
|
||||||
"eos_token_id": 1,
|
"eos_token_id": 1,
|
||||||
"extra_pos_embeddings": 1,
|
"extra_pos_embeddings": 0,
|
||||||
|
"force_bos_token_to_be_generated": false,
|
||||||
|
"forced_eos_token_id": 1,
|
||||||
|
"gradient_checkpointing": false,
|
||||||
"id2label": {
|
"id2label": {
|
||||||
"0": "LABEL_0",
|
"0": "LABEL_0",
|
||||||
"1": "LABEL_1",
|
"1": "LABEL_1",
|
||||||
|
@ -33,7 +40,7 @@
|
||||||
"LABEL_1": 1,
|
"LABEL_1": 1,
|
||||||
"LABEL_2": 2
|
"LABEL_2": 2
|
||||||
},
|
},
|
||||||
"length_penalty": 0.8,
|
"length_penalty": 0.6,
|
||||||
"max_length": 64,
|
"max_length": 64,
|
||||||
"max_position_embeddings": 512,
|
"max_position_embeddings": 512,
|
||||||
"model_type": "pegasus",
|
"model_type": "pegasus",
|
||||||
|
@ -44,5 +51,7 @@
|
||||||
"pad_token_id": 0,
|
"pad_token_id": 0,
|
||||||
"scale_embedding": true,
|
"scale_embedding": true,
|
||||||
"static_position_embeddings": true,
|
"static_position_embeddings": true,
|
||||||
|
"transformers_version": "4.11.0.dev0",
|
||||||
|
"use_cache": true,
|
||||||
"vocab_size": 96103
|
"vocab_size": 96103
|
||||||
}
|
}
|
||||||
|
|
Binary file not shown.
|
@ -0,0 +1,12 @@
|
||||||
|
{
|
||||||
|
"_from_model_config": true,
|
||||||
|
"bos_token_id": 0,
|
||||||
|
"decoder_start_token_id": 0,
|
||||||
|
"eos_token_id": 1,
|
||||||
|
"forced_eos_token_id": 1,
|
||||||
|
"length_penalty": 0.6,
|
||||||
|
"max_length": 64,
|
||||||
|
"num_beams": 8,
|
||||||
|
"pad_token_id": 0,
|
||||||
|
"transformers_version": "4.27.0.dev0"
|
||||||
|
}
|
Binary file not shown.
File diff suppressed because one or more lines are too long
Loading…
Reference in New Issue