Add verifyToken field to verify that evaluation results are produced by Hugging Face's automatic model evaluator

Beep boop, I am a bot from Hugging Face's automatic model evaluator 👋! We've added a new `verifyToken` field to your evaluation results to verify that they are produced by the model evaluator. Accept this PR to ensure that your results remain listed as **verified** on the [Hub leaderboard](https://huggingface.co/spaces/autoevaluate/leaderboards).

Files changed (1)

README.md +25 -19

README.md CHANGED Viewed

@@ -2,6 +2,13 @@
 license: mit
 tags:
 - generated_from_trainer
 model-index:
 - name: rob-base-superqa
   results:
@@ -14,14 +21,16 @@ model-index:
       config: adversarialQA
       split: validation
     metrics:
-    - name: Exact Match
-      type: exact_match
       value: 43.8667
       verified: true
-    - name: F1
-      type: f1
       value: 55.135
       verified: true
   - task:
       type: question-answering
       name: Question Answering
@@ -31,14 +40,16 @@ model-index:
       config: squad_v2
       split: validation
     metrics:
-    - name: Exact Match
-      type: exact_match
       value: 79.2432
       verified: true
-    - name: F1
-      type: f1
       value: 82.336
       verified: true
   - task:
       type: question-answering
       name: Question Answering
@@ -48,21 +59,16 @@ model-index:
       config: default
       split: validation
     metrics:
-    - name: Exact Match
-      type: exact_match
       value: 78.8581
       verified: true
-    - name: F1
-      type: f1
       value: 82.8261
       verified: true
-task:
-- question-answering
-datasets:
-- squad_v2
-- quoref
-- adversarial_qa
-- duorc
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You

 license: mit
 tags:
 - generated_from_trainer
+datasets:
+- squad_v2
+- quoref
+- adversarial_qa
+- duorc
+task:
+- question-answering
 model-index:
 - name: rob-base-superqa
   results:
       config: adversarialQA
       split: validation
     metrics:
+    - type: exact_match
       value: 43.8667
+      name: Exact Match
       verified: true
+      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzIxMWZiZWM1MTJmMGIxM2I5NTFjNGI5OTJiNDdjODQ3NDNkYjRkYTI3ZmZkNGVmMGYzZDk5MTZhNDE4YzI1YiIsInZlcnNpb24iOjF9.QAj_iwD0yN2woSbGAN9xVRKoDKxldZbleFeJr77P2s7xWQBsKCuY0b5-2WIL79EcTCChvjNITeriPXqz8mGMAw
+    - type: f1
       value: 55.135
+      name: F1
       verified: true
+      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjJkMzZjNTVhZTI5OTVhNTU4NDcyMjM1ZWJiODVjNzBhODRmZjlmMjE0MDUzMmU4NzNlNzA5NjgyODdkNTJmZSIsInZlcnNpb24iOjF9.O0KoLquXYbF3P2PGCFW8bxYEVe_yDW-WzEqpOmbIs_e9v4tcygH19ZUYFjMDFSll91SPJ2oIbVovsUISYuknCg
   - task:
       type: question-answering
       name: Question Answering
       config: squad_v2
       split: validation
     metrics:
+    - type: exact_match
       value: 79.2432
+      name: Exact Match
       verified: true
+      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjBjZjhjMTMzMzZhOTg1OGYyZDY2MzZjYmQ4NmNlNWI5MWNmNTBiZjY1Njg0YTYyMmRlNzlkZDU1NTZjOWM5ZCIsInZlcnNpb24iOjF9.1vo9JoASJ_zvOVa4lTRMNPljUvMon-E6QOZ1n_KFQBMtRvRY883ECudhAzb5LGpLntyM2EN5bfyfTQ6dfjjsDg
+    - type: f1
       value: 82.336
+      name: F1
       verified: true
+      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOWFiZGMyMzkwOTlkMWVkZmExNjdkZTM1YjRkYzRkZDlhOGZlMjEwMGNjNjJhYjM5MjZlNDI3ZDEyNmViOGYyOSIsInZlcnNpb24iOjF9.f3xlhop8hXWCCWFXWZgyK9r8Cy5KE3gPgYNV3bRN78teN_hjYH5sDl4wMTMcPU-bsPX70_wvsuvU-r95ByF4Bg
   - task:
       type: question-answering
       name: Question Answering
       config: default
       split: validation
     metrics:
+    - type: exact_match
       value: 78.8581
+      name: Exact Match
       verified: true
+      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZjMyYTAxOWJhYTM5YWNmNGFhZDg3NTIwN2UxN2RhYzQxYzFiODJjYTcyZTk5MGMwODNhMzA3Nzc3MDQzYjcwMiIsInZlcnNpb24iOjF9.FSNswUf1Y5ZnlS0fSm-lxsA1klUphzfDhfj00U5benVd0QiYvyeqRclC7Pw8B3RV9Oe1cZzfeDDA5fXY2A5JBw
+    - type: f1
       value: 82.8261
+      name: F1
       verified: true
+      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNWQyMTNhZTc0MTdiMzNiNzc3YzhkNTk5ZWRkMWZlYjc4ZGU3YTFkNDkyZDg0NWFiYzFhMGQyMzZjYjcwNTE1YSIsInZlcnNpb24iOjF9.9waqQm_EBPo41pdOMmoY6r_-K7-3zUxt1AB4ndHTY50S5k5yyub8NdCJz09hBhbRd1_-1t3UT5p8HnFjAjF9DQ
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You