Compare commits
No commits in common. "8d8ffc158a3bee9fbb03afacdfc347c823c5ec8b" and "cb696e15ff082c217317b0c2c712a32354664941" have entirely different histories.
8d8ffc158a
...
cb696e15ff
|
@ -6,4 +6,3 @@
|
||||||
*.tar.gz filter=lfs diff=lfs merge=lfs -text
|
*.tar.gz filter=lfs diff=lfs merge=lfs -text
|
||||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
|
||||||
|
|
102
README.md
102
README.md
|
@ -2,108 +2,6 @@
|
||||||
language: en
|
language: en
|
||||||
tags:
|
tags:
|
||||||
- summarization
|
- summarization
|
||||||
model-index:
|
|
||||||
- name: google/pegasus-xsum
|
|
||||||
results:
|
|
||||||
- task:
|
|
||||||
type: summarization
|
|
||||||
name: Summarization
|
|
||||||
dataset:
|
|
||||||
name: samsum
|
|
||||||
type: samsum
|
|
||||||
config: samsum
|
|
||||||
split: train
|
|
||||||
metrics:
|
|
||||||
- name: ROUGE-1
|
|
||||||
type: rouge
|
|
||||||
value: 21.8096
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-2
|
|
||||||
type: rouge
|
|
||||||
value: 4.2525
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-L
|
|
||||||
type: rouge
|
|
||||||
value: 17.4469
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-LSUM
|
|
||||||
type: rouge
|
|
||||||
value: 18.8907
|
|
||||||
verified: true
|
|
||||||
- name: loss
|
|
||||||
type: loss
|
|
||||||
value: 3.0317161083221436
|
|
||||||
verified: true
|
|
||||||
- name: gen_len
|
|
||||||
type: gen_len
|
|
||||||
value: 20.3122
|
|
||||||
verified: true
|
|
||||||
- task:
|
|
||||||
type: summarization
|
|
||||||
name: Summarization
|
|
||||||
dataset:
|
|
||||||
name: xsum
|
|
||||||
type: xsum
|
|
||||||
config: default
|
|
||||||
split: test
|
|
||||||
metrics:
|
|
||||||
- name: ROUGE-1
|
|
||||||
type: rouge
|
|
||||||
value: 46.8623
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-2
|
|
||||||
type: rouge
|
|
||||||
value: 24.4533
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-L
|
|
||||||
type: rouge
|
|
||||||
value: 39.0548
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-LSUM
|
|
||||||
type: rouge
|
|
||||||
value: 39.0994
|
|
||||||
verified: true
|
|
||||||
- name: loss
|
|
||||||
type: loss
|
|
||||||
value: 1.5717021226882935
|
|
||||||
verified: true
|
|
||||||
- name: gen_len
|
|
||||||
type: gen_len
|
|
||||||
value: 22.8821
|
|
||||||
verified: true
|
|
||||||
- task:
|
|
||||||
type: summarization
|
|
||||||
name: Summarization
|
|
||||||
dataset:
|
|
||||||
name: cnn_dailymail
|
|
||||||
type: cnn_dailymail
|
|
||||||
config: 3.0.0
|
|
||||||
split: test
|
|
||||||
metrics:
|
|
||||||
- name: ROUGE-1
|
|
||||||
type: rouge
|
|
||||||
value: 22.2062
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-2
|
|
||||||
type: rouge
|
|
||||||
value: 7.6701
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-L
|
|
||||||
type: rouge
|
|
||||||
value: 15.4046
|
|
||||||
verified: true
|
|
||||||
- name: ROUGE-LSUM
|
|
||||||
type: rouge
|
|
||||||
value: 19.2182
|
|
||||||
verified: true
|
|
||||||
- name: loss
|
|
||||||
type: loss
|
|
||||||
value: 2.681241273880005
|
|
||||||
verified: true
|
|
||||||
- name: gen_len
|
|
||||||
type: gen_len
|
|
||||||
value: 25.0234
|
|
||||||
verified: true
|
|
||||||
---
|
---
|
||||||
|
|
||||||
### Pegasus Models
|
### Pegasus Models
|
||||||
|
|
13
config.json
13
config.json
|
@ -1,5 +1,4 @@
|
||||||
{
|
{
|
||||||
"_name_or_path": "./",
|
|
||||||
"activation_dropout": 0.1,
|
"activation_dropout": 0.1,
|
||||||
"activation_function": "relu",
|
"activation_function": "relu",
|
||||||
"add_bias_logits": false,
|
"add_bias_logits": false,
|
||||||
|
@ -10,24 +9,18 @@
|
||||||
"attention_dropout": 0.1,
|
"attention_dropout": 0.1,
|
||||||
"bos_token_id": 0,
|
"bos_token_id": 0,
|
||||||
"classif_dropout": 0.0,
|
"classif_dropout": 0.0,
|
||||||
"classifier_dropout": 0.0,
|
|
||||||
"d_model": 1024,
|
"d_model": 1024,
|
||||||
"decoder_attention_heads": 16,
|
"decoder_attention_heads": 16,
|
||||||
"decoder_ffn_dim": 4096,
|
"decoder_ffn_dim": 4096,
|
||||||
"decoder_layerdrop": 0.0,
|
"decoder_layerdrop": 0.0,
|
||||||
"decoder_layers": 16,
|
"decoder_layers": 16,
|
||||||
"decoder_start_token_id": 0,
|
|
||||||
"do_blenderbot_90_layernorm": false,
|
|
||||||
"dropout": 0.1,
|
"dropout": 0.1,
|
||||||
"encoder_attention_heads": 16,
|
"encoder_attention_heads": 16,
|
||||||
"encoder_ffn_dim": 4096,
|
"encoder_ffn_dim": 4096,
|
||||||
"encoder_layerdrop": 0.0,
|
"encoder_layerdrop": 0.0,
|
||||||
"encoder_layers": 16,
|
"encoder_layers": 16,
|
||||||
"eos_token_id": 1,
|
"eos_token_id": 1,
|
||||||
"extra_pos_embeddings": 0,
|
"extra_pos_embeddings": 1,
|
||||||
"force_bos_token_to_be_generated": false,
|
|
||||||
"forced_eos_token_id": 1,
|
|
||||||
"gradient_checkpointing": false,
|
|
||||||
"id2label": {
|
"id2label": {
|
||||||
"0": "LABEL_0",
|
"0": "LABEL_0",
|
||||||
"1": "LABEL_1",
|
"1": "LABEL_1",
|
||||||
|
@ -40,7 +33,7 @@
|
||||||
"LABEL_1": 1,
|
"LABEL_1": 1,
|
||||||
"LABEL_2": 2
|
"LABEL_2": 2
|
||||||
},
|
},
|
||||||
"length_penalty": 0.6,
|
"length_penalty": 0.8,
|
||||||
"max_length": 64,
|
"max_length": 64,
|
||||||
"max_position_embeddings": 512,
|
"max_position_embeddings": 512,
|
||||||
"model_type": "pegasus",
|
"model_type": "pegasus",
|
||||||
|
@ -51,7 +44,5 @@
|
||||||
"pad_token_id": 0,
|
"pad_token_id": 0,
|
||||||
"scale_embedding": true,
|
"scale_embedding": true,
|
||||||
"static_position_embeddings": true,
|
"static_position_embeddings": true,
|
||||||
"transformers_version": "4.11.0.dev0",
|
|
||||||
"use_cache": true,
|
|
||||||
"vocab_size": 96103
|
"vocab_size": 96103
|
||||||
}
|
}
|
||||||
|
|
BIN
flax_model.msgpack (Stored with Git LFS)
BIN
flax_model.msgpack (Stored with Git LFS)
Binary file not shown.
|
@ -1,12 +0,0 @@
|
||||||
{
|
|
||||||
"_from_model_config": true,
|
|
||||||
"bos_token_id": 0,
|
|
||||||
"decoder_start_token_id": 0,
|
|
||||||
"eos_token_id": 1,
|
|
||||||
"forced_eos_token_id": 1,
|
|
||||||
"length_penalty": 0.6,
|
|
||||||
"max_length": 64,
|
|
||||||
"num_beams": 8,
|
|
||||||
"pad_token_id": 0,
|
|
||||||
"transformers_version": "4.27.0.dev0"
|
|
||||||
}
|
|
BIN
tf_model.h5 (Stored with Git LFS)
BIN
tf_model.h5 (Stored with Git LFS)
Binary file not shown.
File diff suppressed because one or more lines are too long
Loading…
Reference in New Issue