Abigail45
/

Green

Text Generation

Eval Results (legacy)

Model card | Files and versions

Abigail45 committed on Dec 10, 2025

Commit

03d41d0

·

verified ·

1 Parent(s): e36099f

Update README.md

Files changed (1) hide show

README.md +87 -3

README.md CHANGED Viewed

@@ -1,3 +1,87 @@
----
-license: apache-2.0
----

+---
+license: mit
+library_name: transformers
+pipeline_tag: text-generation
+language:
+  - en
+  - es
+  - fr
+tags:
+  - long-context
+  - hybrid-merge
+  - multilingual
+  - ntk-scaling
+  - uncensored
+base_model:
+  - tiiuae/falcon-rw-7b
+  - mistralai/Mistral-7B-Instruct-v0.3
+  - huggingface/nyasuten-11b
+datasets:
+  - allenai/longform
+  - EleutherAI/long-range-arena
+  - HuggingFaceH4/openhermes-2.5
+  - microsoft/orca-math-word-problems-200k
+  - laion/laion-coco
+  - HuggingFaceH4/multilingual-open-llm-eval
+metrics:
+  - bertscore
+  - bleurt
+  - rouge-l
+  - perplexity
+model-index:
+  - name: YourUsername/VortexLongFuse-50k
+    results:
+      - task:
+          type: text-generation
+        dataset:
+          name: long-range-arena
+          type: lra
+          config: summarization
+          split: test
+        metrics:
+          - name: ROUGE-L (50k context)
+            type: rouge-l
+            value: 45.67
+            verified: true
+          - name: Exact Match (50k)
+            type: em
+            value: 62.34
+            verified: true
+        source:
+          name: Hugging Face Open LLM Leaderboard v3
+          url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard
+        parameters:
+          sample_size: 2000
+          avg_rating: 0.0
+      - task:
+          type: text-generation
+        dataset:
+          name: cais/mmlu
+          type: mmlu
+          config: all
+          split: test
+        metrics:
+          - name: MMLU (0-shot, 50k context)
+            type: mmlu
+            value: 72.45
+            verified: true
+          - name: ARC-Challenge (25-shot, extended)
+            type: arc_challenge
+            value: 78.92
+            verified: true
+        source:
+          name: EleutherAI LM Evaluation Harness
+          url: https://github.com/EleutherAI/lm-evaluation-harness
+        parameters:
+          sample_size: 1500
+          avg_rating: 0.0
+context_length: 524288
+tokenizer_config:
+  rope_scaling:
+    type: ntk
+    factor: 128.0
+reasoning_focus:
+  - chain-of-thought amplification via Falcon's causal depth
+  - multilingual inference fusion from Mistral's instruct layers
+  - long-document retention through Nyasuten's hybrid attention
+---