Compare commits
10 Commits
265d5b42b8
...
791c5260a7
Author | SHA1 | Date |
---|---|---|
|
791c5260a7 | |
|
84e3c23618 | |
|
e3e8a282c7 | |
|
77b3fda6c0 | |
|
2db0a0e1cc | |
|
0961f713b9 | |
|
3767886f2b | |
|
7848658c7e | |
|
2a02222200 | |
|
f5bddca01e |
|
@ -10,16 +10,16 @@ tags:
|
||||||
license: mit
|
license: mit
|
||||||
pipeline_tag: zero-shot-classification
|
pipeline_tag: zero-shot-classification
|
||||||
datasets:
|
datasets:
|
||||||
- xlni
|
- xnli
|
||||||
metrics:
|
metrics:
|
||||||
- accuracy
|
- accuracy
|
||||||
---
|
---
|
||||||
|
|
||||||
# camembert-base-xlni
|
# camembert-base-xnli
|
||||||
|
|
||||||
## Model description
|
## Model description
|
||||||
|
|
||||||
Camembert-base model fine-tuned on the French part of the XLNI dataset. <br>
|
Camembert-base model fine-tuned on the French part of the XNLI dataset. <br>
|
||||||
One of the few Zero-Shot classification models working on French 🇫🇷
|
One of the few Zero-Shot classification models working on French 🇫🇷
|
||||||
|
|
||||||
## Intended uses & limitations
|
## Intended uses & limitations
|
||||||
|
@ -70,7 +70,7 @@ prob_label_is_true[0].tolist() * 100
|
||||||
|
|
||||||
## Training data
|
## Training data
|
||||||
|
|
||||||
Training data is the French fold of the [XLNI](https://research.fb.com/publications/xnli-evaluating-cross-lingual-sentence-representations/) dataset released in 2018 by Facebook. <br>
|
Training data is the French fold of the [XNLI](https://research.fb.com/publications/xnli-evaluating-cross-lingual-sentence-representations/) dataset released in 2018 by Facebook. <br>
|
||||||
Available with great ease using the ```datasets``` library :
|
Available with great ease using the ```datasets``` library :
|
||||||
|
|
||||||
```python
|
```python
|
||||||
|
@ -86,6 +86,7 @@ Main training parameters :
|
||||||
- ```num_train_epochs = 4```
|
- ```num_train_epochs = 4```
|
||||||
- ```batch_size = 12``` (limited by GPU-memory)
|
- ```batch_size = 12``` (limited by GPU-memory)
|
||||||
- ```weight_decay = 0.01```
|
- ```weight_decay = 0.01```
|
||||||
|
- ```metric_for_best_model = "eval_accuracy"```
|
||||||
|
|
||||||
## Eval results
|
## Eval results
|
||||||
|
|
||||||
|
|
10
config.json
10
config.json
|
@ -11,16 +11,16 @@
|
||||||
"hidden_dropout_prob": 0.1,
|
"hidden_dropout_prob": 0.1,
|
||||||
"hidden_size": 768,
|
"hidden_size": 768,
|
||||||
"id2label": {
|
"id2label": {
|
||||||
"0": "contradiction",
|
"0": "entailment",
|
||||||
"1": "neutral",
|
"1": "neutral",
|
||||||
"2": "entailment"
|
"2": "contradiction"
|
||||||
},
|
},
|
||||||
"initializer_range": 0.02,
|
"initializer_range": 0.02,
|
||||||
"intermediate_size": 3072,
|
"intermediate_size": 3072,
|
||||||
"label2id": {
|
"label2id": {
|
||||||
"contradiction": 0,
|
"entailment": 0,
|
||||||
"neutral": 1,
|
"neutral": 1,
|
||||||
"entailment": 2
|
"contradiction": 2
|
||||||
},
|
},
|
||||||
"layer_norm_eps": 1e-05,
|
"layer_norm_eps": 1e-05,
|
||||||
"max_position_embeddings": 514,
|
"max_position_embeddings": 514,
|
||||||
|
@ -30,7 +30,7 @@
|
||||||
"output_past": true,
|
"output_past": true,
|
||||||
"pad_token_id": 1,
|
"pad_token_id": 1,
|
||||||
"position_embedding_type": "absolute",
|
"position_embedding_type": "absolute",
|
||||||
"transformers_version": "4.4.2",
|
"transformers_version": "4.3.3",
|
||||||
"type_vocab_size": 1,
|
"type_vocab_size": 1,
|
||||||
"use_cache": true,
|
"use_cache": true,
|
||||||
"vocab_size": 32005
|
"vocab_size": 32005
|
||||||
|
|
Binary file not shown.
Loading…
Reference in New Issue