Commit
·
4e0a36a
1
Parent(s):
e7669ea
Add verifyToken field to verify evaluation results are produced by Hugging Face's automatic model evaluator (#2)
Browse files
- Add verifyToken field to verify evaluation results are produced by Hugging Face's automatic model evaluator (a24d3948669aa14f8c1514cf258e91cb4060598d)
Co-authored-by: Evaluation Bot <[email protected]>
README.md
CHANGED
|
@@ -12,16 +12,16 @@ model-index:
|
|
| 12 |
- name: roberta-base-qnli
|
| 13 |
results:
|
| 14 |
- task:
|
| 15 |
-
name: Text Classification
|
| 16 |
type: text-classification
|
|
|
|
| 17 |
dataset:
|
| 18 |
name: GLUE QNLI
|
| 19 |
type: glue
|
| 20 |
args: qnli
|
| 21 |
metrics:
|
| 22 |
-
-
|
| 23 |
-
type: accuracy
|
| 24 |
value: 0.9245835621453414
|
|
|
|
| 25 |
- task:
|
| 26 |
type: natural-language-inference
|
| 27 |
name: Natural Language Inference
|
|
@@ -31,30 +31,36 @@ model-index:
|
|
| 31 |
config: qnli
|
| 32 |
split: validation
|
| 33 |
metrics:
|
| 34 |
-
-
|
| 35 |
-
type: accuracy
|
| 36 |
value: 0.924400512538898
|
|
|
|
| 37 |
verified: true
|
| 38 |
-
|
| 39 |
-
|
| 40 |
value: 0.9171997157071784
|
|
|
|
| 41 |
verified: true
|
| 42 |
-
|
| 43 |
-
|
| 44 |
value: 0.9348062296269467
|
|
|
|
| 45 |
verified: true
|
| 46 |
-
|
| 47 |
-
|
| 48 |
value: 0.9744865501321541
|
|
|
|
| 49 |
verified: true
|
| 50 |
-
|
| 51 |
-
|
| 52 |
value: 0.9259192825112107
|
|
|
|
| 53 |
verified: true
|
| 54 |
-
|
| 55 |
-
|
| 56 |
value: 0.2990749478340149
|
|
|
|
| 57 |
verified: true
|
|
|
|
| 58 |
---
|
| 59 |
|
| 60 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
|
|
|
| 12 |
- name: roberta-base-qnli
|
| 13 |
results:
|
| 14 |
- task:
|
|
|
|
| 15 |
type: text-classification
|
| 16 |
+
name: Text Classification
|
| 17 |
dataset:
|
| 18 |
name: GLUE QNLI
|
| 19 |
type: glue
|
| 20 |
args: qnli
|
| 21 |
metrics:
|
| 22 |
+
- type: accuracy
|
|
|
|
| 23 |
value: 0.9245835621453414
|
| 24 |
+
name: Accuracy
|
| 25 |
- task:
|
| 26 |
type: natural-language-inference
|
| 27 |
name: Natural Language Inference
|
|
|
|
| 31 |
config: qnli
|
| 32 |
split: validation
|
| 33 |
metrics:
|
| 34 |
+
- type: accuracy
|
|
|
|
| 35 |
value: 0.924400512538898
|
| 36 |
+
name: Accuracy
|
| 37 |
verified: true
|
| 38 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNmE1ZDY2YTAzNDFiNDdlMGFlNjk2OTkyNjVlMjgwNDJjMzBlMzkwMGZjOWNhZmY2OWFiZjVmOGZlZmU5OGUxNCIsInZlcnNpb24iOjF9._WT9aiP0YGqyVIBSqUt5E6MT6EjB8g2ol_xbl0d1RGLev-eYtACpvAex_qckbXcxqFSENjVqtGx24MqXvQZyAA
|
| 39 |
+
- type: precision
|
| 40 |
value: 0.9171997157071784
|
| 41 |
+
name: Precision
|
| 42 |
verified: true
|
| 43 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNDg3ZGEwNTNmZjc2ZDNmZGY5NzgzMDRlMzBiODc0ZDY2NDE5NDRiYzNmYzg4YzQ5ZGM0MmI0ODA5NjQ3OTcxMiIsInZlcnNpb24iOjF9.CCCWPcZ3Ut8yjdal-62KxakOqVF7Vfj_A6etOxRV4pUa1WSpdOtK4BobR59tJKtfUw_l-h32EMMGQK0ZQBNCAA
|
| 44 |
+
- type: recall
|
| 45 |
value: 0.9348062296269467
|
| 46 |
+
name: Recall
|
| 47 |
verified: true
|
| 48 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZDI0OTNkOWQ2NGYzYTQ5ZDcwNjk1NDJhYTMzNWQ2ZTkyZDcxZTA5OTFkZTNjZDBmMGZjMDQ4YmI2M2Y3ZWE2YSIsInZlcnNpb24iOjF9.gfgQq9FgLkOA4cBylEAVoJZLupqglQusjnpyd3MAk1zxLeFhYSQOiRmjjW2nPNV2cJM43bR4XPsqePWzWimzDA
|
| 49 |
+
- type: auc
|
| 50 |
value: 0.9744865501321541
|
| 51 |
+
name: AUC
|
| 52 |
verified: true
|
| 53 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiODkyODMyZTRmYTIxYmFjNWM3MWI3ZjBhOWExNDkzMjc5MGM2NmNlYmE5NjI0NDU1NjlmYTJkZWNjMDA5ZjhkMiIsInZlcnNpb24iOjF9._CNFbnkR7n2CDTj2lIc6zGSWCFCEJ0V4sj7JZ44xL_cxILp5-m7Y-Dmi43Hk19FaBLfRzdmK9UD-BScNn_vsBw
|
| 54 |
+
- type: f1
|
| 55 |
value: 0.9259192825112107
|
| 56 |
+
name: F1
|
| 57 |
verified: true
|
| 58 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOWVjN2E1YWNkMDgyMTk0Yjc2ZGFhYzJjNjFkY2VmNmU0NjNjZWQ3N2ZhYzgzNTg2N2FlNmY4YmMyYzJkNjFhOSIsInZlcnNpb24iOjF9.I1dkHU12MMeZerjCJ8JfBMyaR1fCEHvTZfpZN-hD2hTITjgkFcTFC_jFvydSwzKo7yX0ztA5ID3qqgW4qD7bAQ
|
| 59 |
+
- type: loss
|
| 60 |
value: 0.2990749478340149
|
| 61 |
+
name: loss
|
| 62 |
verified: true
|
| 63 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZTM2ZjAwOWNjNWE3NjcwYTVmZTIyY2YzNGI3Mzk5ZjM0YjVmYjg3ODA4Mjc3NWViMDkxMDlmZWRiNTdiOGNjMCIsInZlcnNpb24iOjF9.ODKlAkIeFLR4XiugSVARPvDgVUf6bQas9gSm8r_Q8xzZISaVIOUKNs2Z7kq443LiBBulvBoPaapNPpwkBbMkAw
|
| 64 |
---
|
| 65 |
|
| 66 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|