Commit
·
3e271d0
1
Parent(s):
198d0d6
add model
Browse files- .ipynb_checkpoints/README-checkpoint.md +33 -0
- config.json +2 -2
- pytorch_model.bin +2 -2
.ipynb_checkpoints/README-checkpoint.md
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
pipeline_tag: text-classification
|
| 3 |
+
tags:
|
| 4 |
+
- natural-language-inference
|
| 5 |
+
- misogyny
|
| 6 |
+
language: en
|
| 7 |
+
license: apache-2.0
|
| 8 |
+
widget:
|
| 9 |
+
- text: "Las mascarillas causan hipoxia. Wearing masks is harmful to human health"
|
| 10 |
+
example_title: "Natural Language Inference"
|
| 11 |
+
---
|
| 12 |
+
|
| 13 |
+
# bertweet-base-multi-mami
|
| 14 |
+
This is a fine-tuned XLM-RoBERTa model for natural language inference. It has been trained on a massive amount of data following the ANLI training pipeline. We include data from:
|
| 15 |
+
- [mnli](https://cims.nyu.edu/~sbowman/multinli/) {train, dev and test}
|
| 16 |
+
- [snli](https://nlp.stanford.edu/projects/snli/) {train, dev and test}
|
| 17 |
+
- [xnli](https://github.com/facebookresearch/XNLI) {train, dev and test}
|
| 18 |
+
- [fever](https://fever.ai/resources.html) {train, dev and test}
|
| 19 |
+
- [anli](https://github.com/facebookresearch/anli) {train}
|
| 20 |
+
|
| 21 |
+
The model is validated on ANLI training sets, including R1, R2 and R3. The following results can be expected on the testing splits.
|
| 22 |
+
|Split|Accuracy|
|
| 23 |
+
|-|-|
|
| 24 |
+
|R1|0.6610|
|
| 25 |
+
|R2|0.4990|
|
| 26 |
+
|R3|0.4425|
|
| 27 |
+
|
| 28 |
+
# Multilabels
|
| 29 |
+
label2id={
|
| 30 |
+
"contradiction": 0,
|
| 31 |
+
"entailment": 1,
|
| 32 |
+
"neutral": 2,
|
| 33 |
+
}
|
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "xlm-roberta-large",
|
| 3 |
"architectures": [
|
| 4 |
"XLMRobertaForSequenceClassification"
|
| 5 |
],
|
|
@@ -31,7 +31,7 @@
|
|
| 31 |
"pad_token_id": 1,
|
| 32 |
"position_embedding_type": "absolute",
|
| 33 |
"torch_dtype": "float32",
|
| 34 |
-
"transformers_version": "4.
|
| 35 |
"type_vocab_size": 1,
|
| 36 |
"use_cache": true,
|
| 37 |
"vocab_size": 250002
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "xlm-roberta-large-snli_mnli_xnli_fever_r1_r2_r3",
|
| 3 |
"architectures": [
|
| 4 |
"XLMRobertaForSequenceClassification"
|
| 5 |
],
|
|
|
|
| 31 |
"pad_token_id": 1,
|
| 32 |
"position_embedding_type": "absolute",
|
| 33 |
"torch_dtype": "float32",
|
| 34 |
+
"transformers_version": "4.12.3",
|
| 35 |
"type_vocab_size": 1,
|
| 36 |
"use_cache": true,
|
| 37 |
"vocab_size": 250002
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7cce651115ecbb97dc077f548c5e3d0183737e3f88bbf55275b9ac69efd0c1d
|
| 3 |
+
size 2239732653
|