prabhatkr commited on
Commit
5e56315
·
verified ·
1 Parent(s): 7cf9efc

Upload README.md with huggingface_hub

Browse files
Files changed (1) hide show
  1. README.md +9 -9
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  type: text2text-generation
23
  name: Table Preservation
24
  dataset:
25
- name: -RAGBench
26
  type: G4KMU/t2-ragbench
27
  metrics:
28
  - type: accuracy
@@ -32,7 +32,7 @@ model-index:
32
  type: text-retrieval
33
  name: Multi-Doc Synthesis
34
  dataset:
35
- name: FRAMES
36
  type: google/frames-benchmark
37
  metrics:
38
  - type: accuracy
@@ -42,7 +42,7 @@ model-index:
42
  type: visual-question-answering
43
  name: Visual Reasoning
44
  dataset:
45
- name: FinRAGBench-V
46
  type: FinRAGBench/FinRAGBench-V
47
  metrics:
48
  - type: accuracy
@@ -52,7 +52,7 @@ model-index:
52
  type: text-classification
53
  name: Anti-Hallucination
54
  dataset:
55
- name: RGB
56
  type: THUDM/RGB
57
  metrics:
58
  - type: accuracy
@@ -62,7 +62,7 @@ model-index:
62
  type: tabular-classification
63
  name: End-to-End Latency
64
  dataset:
65
- name: Scale Benchmark
66
  type: FastMemory/Scale
67
  metrics:
68
  - type: accuracy
@@ -72,7 +72,7 @@ model-index:
72
  type: text-retrieval
73
  name: Multi-hop Routing
74
  dataset:
75
- name: GraphRAG-Bench
76
  type: GraphRAG-Bench/GraphRAG-Bench
77
  metrics:
78
  - type: accuracy
@@ -82,7 +82,7 @@ model-index:
82
  type: text-retrieval
83
  name: E-Commerce Graph
84
  dataset:
85
- name: STaRK-Prime
86
  type: snap-stanford/stark
87
  metrics:
88
  - type: accuracy
@@ -92,7 +92,7 @@ model-index:
92
  type: question-answering
93
  name: Biomedical Compliance
94
  dataset:
95
- name: BiomixQA
96
  type: kg-rag/BiomixQA
97
  metrics:
98
  - type: accuracy
@@ -102,7 +102,7 @@ model-index:
102
  type: text-generation
103
  name: Pipeline Eval (RAGAS)
104
  dataset:
105
- name: RAGAS Framework
106
  type: ragas/ragas-eval
107
  metrics:
108
  - type: accuracy
 
22
  type: text2text-generation
23
  name: Table Preservation
24
  dataset:
25
+ name: G4KMU/t2-ragbench
26
  type: G4KMU/t2-ragbench
27
  metrics:
28
  - type: accuracy
 
32
  type: text-retrieval
33
  name: Multi-Doc Synthesis
34
  dataset:
35
+ name: google/frames-benchmark
36
  type: google/frames-benchmark
37
  metrics:
38
  - type: accuracy
 
42
  type: visual-question-answering
43
  name: Visual Reasoning
44
  dataset:
45
+ name: FinRAGBench/FinRAGBench-V
46
  type: FinRAGBench/FinRAGBench-V
47
  metrics:
48
  - type: accuracy
 
52
  type: text-classification
53
  name: Anti-Hallucination
54
  dataset:
55
+ name: THUDM/RGB
56
  type: THUDM/RGB
57
  metrics:
58
  - type: accuracy
 
62
  type: tabular-classification
63
  name: End-to-End Latency
64
  dataset:
65
+ name: FastMemory/Scale
66
  type: FastMemory/Scale
67
  metrics:
68
  - type: accuracy
 
72
  type: text-retrieval
73
  name: Multi-hop Routing
74
  dataset:
75
+ name: GraphRAG-Bench/GraphRAG-Bench
76
  type: GraphRAG-Bench/GraphRAG-Bench
77
  metrics:
78
  - type: accuracy
 
82
  type: text-retrieval
83
  name: E-Commerce Graph
84
  dataset:
85
+ name: snap-stanford/stark
86
  type: snap-stanford/stark
87
  metrics:
88
  - type: accuracy
 
92
  type: question-answering
93
  name: Biomedical Compliance
94
  dataset:
95
+ name: kg-rag/BiomixQA
96
  type: kg-rag/BiomixQA
97
  metrics:
98
  - type: accuracy
 
102
  type: text-generation
103
  name: Pipeline Eval (RAGAS)
104
  dataset:
105
+ name: ragas/ragas-eval
106
  type: ragas/ragas-eval
107
  metrics:
108
  - type: accuracy