Spaces:

bethgelab
/

lm-similarity

Sleeping

App Files Files Community

Joschka Strueber committed on Feb 6

Commit

5c5dc6a

1 Parent(s): 64b132e

[Add, Fix] add list of ungated models

Browse files

Files changed (2) hide show

src/dataloading.py +3 -4
src/models.txt +457 -0

src/dataloading.py CHANGED Viewed

@@ -10,7 +10,7 @@ def get_leaderboard_models_reload():
     # Load prechecked models
     try:
-        ungated_models = set(line.strip() for line in open("models.txt"))
     except FileNotFoundError:
         ungated_models = set()
@@ -47,7 +47,7 @@ def get_leaderboard_models_reload():
     print(f"Number of models: {len(models)}")
     # Save model list as txt file
-    with open("models.txt", "w") as f:
         for model in models:
             f.write(model + "\n")
@@ -56,7 +56,7 @@ def get_leaderboard_models_reload():
 def get_leaderboard_models():
     # Load prechecked (ungated) models
-    with open("models.txt", "r") as f:
         ungated_models = [line.strip() for line in f]
     return sorted(ungated_models)
@@ -140,4 +140,3 @@ def load_run_data_cached(model_name, dataset_name):
 if __name__ == "__main__":
     get_leaderboard_models_reload()

     # Load prechecked models
     try:
+        ungated_models = set(line.strip() for line in open("src/models.txt"))
     except FileNotFoundError:
         ungated_models = set()
     print(f"Number of models: {len(models)}")
     # Save model list as txt file
+    with open("src/models.txt", "w") as f:
         for model in models:
             f.write(model + "\n")
 def get_leaderboard_models():
     # Load prechecked (ungated) models
+    with open("src/models.txt", "r") as f:
         ungated_models = [line.strip() for line in f]
     return sorted(ungated_models)
 if __name__ == "__main__":
     get_leaderboard_models_reload()

src/models.txt ADDED Viewed

	@@ -0,0 +1,457 @@

+Pinkstack/SuperThoughts-CoT-14B-16k-o1-QwQ
+prithivMLmods/QwQ-LCoT-14B-Conversational
+pankajmathur/orca_mini_phi-4
+01-ai/Yi-34B
+Deci/DeciLM-7B
+Qwen/Qwen1.5-7B
+meta-llama/Meta-Llama-3-8B-Instruct
+mistralai/Mistral-7B-v0.1
+microsoft/Phi-3-mini-4k-instruct
+01-ai/Yi-1.5-9B-Chat
+LLM360/K2
+01-ai/Yi-1.5-9B
+meta-llama/Meta-Llama-3-8B
+google/gemma-7b
+google/recurrentgemma-2b
+databricks/dbrx-base
+meta-llama/Meta-Llama-3-70B-Instruct
+HuggingFaceH4/zephyr-7b-beta
+HuggingFaceH4/zephyr-7b-alpha
+mistralai/Mistral-7B-v0.3
+mlabonne/AlphaMonarch-7B
+mlabonne/Beyonder-4x7B-v3
+01-ai/Yi-1.5-6B-Chat
+01-ai/Yi-1.5-6B
+01-ai/Yi-1.5-9B-32K
+01-ai/Yi-6B
+stabilityai/stablelm-2-zephyr-1_6b
+stabilityai/stablelm-2-1_6b-chat
+01-ai/Yi-6B-Chat
+stabilityai/stablelm-zephyr-3b
+01-ai/Yi-1.5-9B-Chat-16K
+stabilityai/stablelm-2-1_6b
+allenai/OLMo-7B-hf
+allenai/OLMo-7B-Instruct-hf
+allenai/OLMo-1.7-7B-hf
+Qwen/Qwen1.5-0.5B
+mistral-community/Mixtral-8x22B-v0.1
+01-ai/Yi-1.5-34B
+01-ai/Yi-1.5-34B-32K
+01-ai/Yi-34B-Chat
+microsoft/phi-1
+meta-llama/Llama-2-7b-chat-hf
+meta-llama/Llama-2-7b-hf
+meta-llama/Llama-2-70b-chat-hf
+meta-llama/Meta-Llama-3-70B
+meta-llama/Llama-2-70b-hf
+microsoft/phi-1_5
+microsoft/phi-2
+Qwen/Qwen2-1.5B
+Qwen/Qwen2-0.5B
+google/gemma-2b
+mlabonne/NeuralDaredevil-8B-abliterated
+Qwen/Qwen2-7B
+HuggingFaceH4/zephyr-7b-gemma-v0.1
+stabilityai/stablelm-2-12b-chat
+Qwen/Qwen2-7B-Instruct
+Qwen/Qwen1.5-4B-Chat
+Qwen/Qwen1.5-0.5B-Chat
+Qwen/Qwen1.5-1.8B-Chat
+Qwen/Qwen1.5-14B-Chat
+Qwen/Qwen1.5-7B-Chat
+meta-llama/Llama-2-13b-chat-hf
+Qwen/Qwen1.5-1.8B
+Qwen/Qwen1.5-14B
+tiiuae/falcon-7b
+databricks/dolly-v2-7b
+Qwen/Qwen1.5-MoE-A2.7B
+Qwen/Qwen1.5-MoE-A2.7B-Chat
+01-ai/Yi-1.5-34B-Chat
+01-ai/Yi-34B-200K
+abacusai/Smaug-34B-v0.1
+abacusai/Smaug-72B-v0.1
+google/gemma-7b-it
+HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1
+google/gemma-2b-it
+google/gemma-1.1-2b-it
+google/gemma-1.1-7b-it
+mistralai/Mistral-7B-Instruct-v0.1
+google/recurrentgemma-2b-it
+mlabonne/OrpoLlama-3-8B
+mlabonne/phixtral-2x2_8
+Qwen/Qwen2-1.5B-Instruct
+stabilityai/stablelm-2-12b
+Qwen/Qwen1.5-4B
+stabilityai/stablelm-3b-4e1t
+microsoft/Phi-3-medium-4k-instruct
+Qwen/Qwen2-0.5B-Instruct
+deepseek-ai/deepseek-llm-7b-chat
+microsoft/Phi-3-small-128k-instruct
+mistral-community/Mistral-7B-v0.2
+meta-llama/Llama-2-13b-hf
+CohereForAI/aya-23-8B
+databricks/dolly-v2-3b
+databricks/dolly-v2-12b
+deepseek-ai/deepseek-moe-16b-chat
+mistralai/Mistral-7B-Instruct-v0.3
+deepseek-ai/deepseek-moe-16b-base
+microsoft/DialoGPT-medium
+mistralai/Mixtral-8x7B-Instruct-v0.1
+deepseek-ai/deepseek-llm-7b-base
+databricks/dolly-v1-6b
+mistralai/Mixtral-8x7B-v0.1
+CohereForAI/c4ai-command-r-v01
+CohereForAI/aya-23-35B
+mistral-community/mixtral-8x22B-v0.3
+tiiuae/falcon-40b-instruct
+tiiuae/falcon-40b
+CohereForAI/c4ai-command-r-plus
+microsoft/Orca-2-7b
+Qwen/Qwen1.5-110B-Chat
+allenai/OLMo-1B-hf
+microsoft/Orca-2-13b
+LLM360/K2-Chat
+mistralai/Mixtral-8x22B-v0.1
+microsoft/Phi-3-mini-128k-instruct
+Qwen/Qwen2-72B-Instruct
+Qwen/Qwen1.5-110B
+Qwen/Qwen1.5-32B-Chat
+Qwen/Qwen2-72B
+deepseek-ai/deepseek-llm-67b-chat
+Qwen/Qwen1.5-32B
+NousResearch/Yarn-Llama-2-13b-128k
+google/recurrentgemma-9b
+google/recurrentgemma-9b-it
+pankajmathur/orca_mini_7b
+meta-llama/Meta-Llama-3.1-8B
+01-ai/Yi-1.5-34B-Chat-16K
+meta-llama/Meta-Llama-3.1-70B
+HuggingFaceTB/SmolLM-1.7B
+mlabonne/Daredevil-8B
+HuggingFaceTB/SmolLM-1.7B-Instruct
+HuggingFaceTB/SmolLM-135M-Instruct
+HuggingFaceTB/SmolLM-135M
+HuggingFaceTB/SmolLM-360M-Instruct
+HuggingFaceTB/SmolLM-360M
+meta-llama/Meta-Llama-3.1-8B-Instruct
+mistralai/Mistral-Nemo-Instruct-2407
+mistralai/Mistral-Nemo-Base-2407
+meta-llama/Meta-Llama-3.1-70B-Instruct
+mlabonne/NeuralBeagle14-7B
+mlabonne/Daredevil-8B-abliterated
+tiiuae/falcon-mamba-7b
+BAAI/Infinity-Instruct-3M-0613-Llama3-70B
+google/flan-t5-small
+stabilityai/StableBeluga2
+google/gemma-2-2b-it
+google/gemma-2-2b
+abacusai/Smaug-Llama-3-70B-Instruct-32K
+abacusai/Smaug-Qwen2-72B-Instruct
+0-hero/Matter-0.2-7B-DPO
+google/flan-t5-xl
+abacusai/Llama-3-Smaug-8B
+DeepMount00/Llama-3-8b-Ita
+google/codegemma-1.1-2b
+Qwen/Qwen2-57B-A14B-Instruct
+microsoft/Phi-3.5-mini-instruct
+microsoft/Phi-3.5-MoE-instruct
+nvidia/Mistral-NeMo-Minitron-8B-Base
+google/gemma-2-27b-it
+google/gemma-2-27b
+google/flan-t5-base
+google/flan-t5-large
+google/flan-t5-xxl
+google/flan-ul2
+AALF/gemma-2-27b-it-SimPO-37K
+microsoft/Phi-3-medium-128k-instruct
+microsoft/Phi-3-small-8k-instruct
+mlabonne/ChimeraLlama-3-8B-v3
+mlabonne/ChimeraLlama-3-8B-v2
+abacusai/Smaug-Mixtral-v0.1
+abacusai/Dracarys-72B-Instruct
+abacusai/Liberated-Qwen1.5-14B
+CoolSpring/Qwen2-0.5B-Abyme
+abacusai/bigstral-12b-32k
+google/mt5-small
+google/mt5-base
+google/umt5-base
+google/switch-base-8
+mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated
+google/mt5-xxl
+abacusai/bigyi-15b
+Qwen/Qwen2.5-7B-Instruct
+Qwen/Qwen2.5-7B
+Qwen/Qwen2.5-14B-Instruct
+Qwen/Qwen2.5-14B
+mistralai/Mistral-Small-Instruct-2409
+Qwen/Qwen2.5-3B-Instruct
+Qwen/Qwen2.5-32B-Instruct
+Qwen/Qwen2.5-0.5B-Instruct
+Qwen/Qwen2.5-0.5B
+Qwen/Qwen2.5-1.5B
+Qwen/Qwen2.5-1.5B-Instruct
+Qwen/Qwen2.5-3B
+Qwen/Qwen2.5-32B
+Qwen/Qwen2.5-72B-Instruct
+Qwen/Qwen2.5-72B
+Qwen/Qwen2.5-Coder-7B-Instruct
+Qwen/Qwen2.5-Math-7B-Instruct
+CohereForAI/c4ai-command-r-plus-08-2024
+Qwen/Qwen2-Math-7B
+1TuanPham/T-VisStar-7B-v0.1
+Qwen/Qwen2.5-Coder-7B
+Qwen/Qwen2-Math-72B-Instruct
+meta-llama/Llama-3.2-1B-Instruct
+meta-llama/Llama-3.2-1B
+meta-llama/Llama-3.2-3B-Instruct
+meta-llama/Llama-3.2-3B
+mlabonne/BigQwen2.5-Echo-47B-Instruct
+nvidia/Llama-3.1-Minitron-4B-Depth-Base
+nvidia/Nemotron-Mini-4B-Instruct
+nvidia/Minitron-4B-Base
+nvidia/Minitron-8B-Base
+AALF/gemma-2-27b-it-SimPO-37K-100steps
+Qwen/Qwen2.5-Math-7B
+Goekdeniz-Guelmez/Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v2
+mistralai/Codestral-22B-v0.1
+Qwen/Qwen2.5-Math-72B-Instruct
+mlabonne/BigQwen2.5-52B-Instruct
+Cran-May/T.E-8.1
+allenai/OLMoE-1B-7B-0924
+allenai/OLMoE-1B-7B-0924-Instruct
+zelk12/recoilme-gemma-2-Ataraxy-9B-v0.1
+nvidia/Mistral-NeMo-Minitron-8B-Instruct
+zelk12/recoilme-gemma-2-Gutenberg-Doppel-9B-v0.1
+google/gemma-2-2b-jpn-it
+zelk12/recoilme-gemma-2-Ataraxy-9B-v0.2
+AtAndDev/Qwen2.5-1.5B-continuous-learnt
+mlabonne/Hermes-3-Llama-3.1-70B-lorablated
+nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
+Gunulhona/Gemma-Ko-Merge-PEFT
+DeepAutoAI/d2nwg_causal_gpt2
+BlackBeenie/llama-3.1-8B-Galore-openassistant-guanaco
+DeepMount00/Lexora-Lite-3B
+Qwen/Qwen2-VL-7B-Instruct
+Qwen/Qwen2-VL-72B-Instruct
+TinyLlama/TinyLlama-1.1B-Chat-v0.5
+Marsouuu/lareneg1_78B-ECE-PRYMMAL-Martial
+OpenBuddy/openbuddy-nemotron-70b-v23.1-131k
+CohereForAI/aya-expanse-8b
+CohereForAI/aya-expanse-32b
+CultriX/Qwen2.5-14B-MegaMerge-pt2
+PJMixers-Dev/LLaMa-3.2-Instruct-JankMix-v0.2-SFT-HailMary-v0.1-KTO-3B
+BramVanroy/fietje-2
+BramVanroy/fietje-2-chat
+BramVanroy/GEITje-7B-ultra
+Gunulhona/Gemma-Ko-Merge
+BramVanroy/fietje-2-instruct
+CombinHorizon/Rombos-Qwen2.5-7B-Inst-BaseMerge-TIES
+DreadPoor/Aspire_1.3-8B_model-stock
+HuggingFaceTB/SmolLM2-135M
+HuggingFaceTB/SmolLM2-135M-Instruct
+HuggingFaceTB/SmolLM2-360M
+HuggingFaceTB/SmolLM2-1.7B
+HuggingFaceTB/SmolLM2-1.7B-Instruct
+3rd-Degree-Burn/Llama-3.1-8B-Squareroot-v1
+BlackBeenie/Neos-Gemma-2-9b
+BlackBeenie/Neos-Llama-3.1-base
+Qwen/Qwen2.5-Coder-14B-Instruct
+Qwen/Qwen2.5-Coder-14B
+HuggingFaceTB/SmolLM2-360M-Instruct
+Dans-DiscountModels/Mistral-7b-v0.3-Test-E0.7
+Goekdeniz-Guelmez/Josiefied-Qwen2.5-0.5B-Instruct-abliterated-v1
+BlackBeenie/Bloslain-8B-v0.2
+3rd-Degree-Burn/L-3.1-Science-Writer-8B
+CultriX/SeQwence-14B-v5
+Aurel9/testmerge-7b
+CultriX/SeQwence-14B
+mistralai/Mistral-Large-Instruct-2411
+AALF/FuseChat-Llama-3.1-8B-Instruct-preview
+GoToCompany/llama3-8b-cpt-sahabatai-v1-instruct
+AALF/FuseChat-Llama-3.1-8B-SFT-preview
+allenai/Llama-3.1-Tulu-3-8B
+allenai/Llama-3.1-Tulu-3-8B-DPO
+allenai/Llama-3.1-Tulu-3-8B-SFT
+allenai/Llama-3.1-Tulu-3-8B-RM
+FlofloB/10k_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit
+nvidia/OpenMath2-Llama3.1-8B
+CultriX/Qwestion-14B
+FlofloB/10k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit
+FlofloB/40k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit
+AGI-0/smartllama3.1-8B-001
+Delta-Vector/Control-8B-V1.1
+Junhoee/Qwen-Megumin
+Dans-DiscountModels/mistral-7b-test-merged
+CultriX/SeQwence-14Bv1
+CultriX/SeQwence-14B-EvolMerge
+CultriX/SeQwence-14B-EvolMergev1
+BlackBeenie/Neos-Phi-3-14B-v0.1
+CultriX/SeQwence-14Bv3
+DreadPoor/Sweetened_Condensed_Milk-8B-Model_Stock
+allenai/Llama-3.1-Tulu-3-70B-SFT
+allenai/Llama-3.1-Tulu-3-70B
+allenai/Llama-3.1-Tulu-3-70B-DPO
+Qwen/QwQ-32B-Preview
+Norquinal/Bravo
+JackFram/llama-68m
+JackFram/llama-160m
+mistralai/Ministral-8B-Instruct-2410
+DreadPoor/Matryoshka-8B-LINEAR
+ClaudioItaly/intelligence-cod-rag-7b-v3
+MaziyarPanahi/calme-3.2-instruct-78b
+meta-llama/Llama-3.3-70B-Instruct
+DreadPoor/remember_to_breathe-8b-Model-Stock
+Corianas/Neural-Mistral-7B
+nvidia/Hymba-1.5B-Base
+nvidia/Hymba-1.5B-Instruct
+CombinHorizon/Josiefied-abliteratedV4-Qwen2.5-14B-Inst-BaseMerge-TIES
+CombinHorizon/huihui-ai-abliteratedV2-Qwen2.5-14B-Inst-BaseMerge-TIES
+meta-llama/Llama-3.1-8B
+CombinHorizon/huihui-ai-abliterated-Qwen2.5-32B-Inst-BaseMerge-TIES
+CultriX/SeQwence-14Bv2
+AuraIndustries/Aura-8B
+DRXD1000/Atlas-7B
+Qwen/Qwen2.5-Coder-32B-Instruct
+Qwen/Qwen2.5-Coder-32B
+LGAI-EXAONE/EXAONE-3.5-7.8B-Instruct
+Goekdeniz-Guelmez/josie-7b-v6.0-step2000
+Corianas/Quokka_2.7b
+tiiuae/Falcon3-7B-Base
+tiiuae/Falcon3-10B-Base
+tiiuae/Falcon3-Mamba-7B-Base
+tiiuae/Falcon3-3B-Base
+tiiuae/Falcon3-Mamba-7B-Instruct
+tiiuae/Falcon3-1B-Base
+tiiuae/Falcon3-1B-Instruct
+tiiuae/Falcon3-3B-Instruct
+tiiuae/Falcon3-10B-Instruct
+tiiuae/Falcon3-7B-Instruct
+Alsebay/Qwen2.5-7B-test-novelist
+AuraIndustries/Aura-4B
+T145/ZEUS-8B-V8
+EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Empathy
+Aashraf995/Creative-7B-nerd
+Aashraf995/Qwen-Evo-7B
+Aashraf995/QwenStock-14B
+Aashraf995/Gemma-Evo-10B
+AuraIndustries/Aura-MoE-2x4B
+Bllossom/llama-3.2-Korean-Bllossom-AICA-5B
+AuraIndustries/Aura-MoE-2x4B-v2
+HelpingAI/Cipher-20B
+HPAI-BSC/Qwen2.5-Aloe-Beta-7B
+DreadPoor/Again-8B-Model_Stock
+PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B
+DreadPoor/Elusive_Dragon_Heart-8B-LINEAR
+CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct-2412
+CultriX/Qwen2.5-14B-Emerged
+CultriX/Qwen2.5-14B-Wernickev3
+CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct
+CohereForAI/c4ai-command-r7b-12-2024
+EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Logic
+CombinHorizon/zetasepic-abliteratedV2-Qwen2.5-32B-Inst-BaseMerge-TIES
+NyxKrage/Microsoft_Phi-4
+DreadPoor/Casuar-9B-Model_Stock
+CultriX/Qwen2.5-14B-Unity
+CultriX/Qwen2.5-14B-Broca
+CultriX/Qwenfinity-2.5-14B
+CultriX/Qwen2.5-14B-Brocav7
+CultriX/Qwen2.5-14B-Brocav3
+CultriX/Qwen2.5-14B-Brocav6
+CultriX/Qwen2.5-14B-FinalMerge
+ContactDoctor/Bio-Medical-Llama-3-8B
+Daemontatox/RA_Reasoner
+Daemontatox/PathfinderAI
+JayHyeon/Qwen-0.5B-eDPO-5epoch
+JayHyeon/Qwen-0.5B-IRPO-5epoch
+JayHyeon/Qwen-0.5B-DPO-5epoch
+JayHyeon/Qwen2.5-0.5B-Instruct-SFT
+JayHyeon/Qwen2.5-0.5B-Instruct-SFT-IRPO-1epoch_v1
+DreadPoor/UNTESTED-VENN_1.2-8B-Model_Stock
+JayHyeon/Qwen2.5-0.5B-SFT-1e-4
+Daemontatox/AetherTOT
+Daemontatox/PixelParse_AI
+DavieLion/Llama-3.2-1B-SPIN-iter3
+JayHyeon/Qwen2.5-0.5B-SFT-2e-4-3ep
+Daemontatox/RA_Reasoner2.0
+Daemontatox/AetherSett
+Daemontatox/Sphinx2.0
+Daemontatox/PathFinderAI2.0
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam_2ep
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam_1ep
+DreadPoor/Happy_New_Year-8B-Model_Stock
+Daemontatox/TinySphinx2.0
+Daemontatox/SphinX
+Daemontatox/PathFinderAi3.0
+Daemontatox/NemoR
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_2ep_0alp_0lam
+Ahdoot/StructuredThinker-v0.3-MoreStructure
+Daemontatox/RA2.0
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-2ep_0alp_0lam
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-2ep_1alp_0lam
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-1ep_1alp_0lam
+DebateLabKIT/Llama-3.1-Argunaut-1-8B-SFT
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-3ep_0alp_0lam
+Daemontatox/MawaredT1
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-1ep_1alp_0lam
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-3ep_1alp_0lam
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-3ep_0alp_0lam
+DreadPoor/Derivative-8B-Model_Stock
+Alepach/notHumpback-M1
+Alepach/notHumpback-M0
+Danielbrdz/Barcenas-10b
+Ahdoot/Test_StealthThinker
+FuseAI/FuseChat-Llama-3.1-8B-Instruct
+JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-2ep_0alp_0lam
+DreadPoor/Derivative_V2_ALT-8B-Model_Stock
+DreadPoor/Derivative_V2-8B-Model_Stock
+Daemontatox/CogitoZ14
+Goekdeniz-Guelmez/josie-7b-v6.0
+Goekdeniz-Guelmez/josie-3b-v6.0
+allenai/OLMo-2-1124-7B-Instruct
+DreadPoor/Derivative_V3-8B-Model_Stock
+Daemontatox/CogitoZ
+microsoft/phi-4
+FlofloB/smollm2-135M_pretrained_200k_fineweb_uncovai_selected
+JayHyeon/Qwen_0.5-DPO_5e-7-2ep_0alp_0lam
+JayHyeon/Qwen_0.5-DPO_5e-7-1ep_0alp_0lam
+JayHyeon/Qwen_0.5-DPOP_5e-7-2ep_0alp_5lam
+JayHyeon/Qwen_0.5-DPOP_5e-7-3ep_0alp_5lam
+JayHyeon/Qwen_0.5-DPOP_5e-7-1ep_0alp_5lam
+JayHyeon/Qwen_0.5-DPO_3e-6-2ep_0alp_0lam
+JayHyeon/Qwen_0.5-DPO_3e-6-1ep_0alp_0lam
+JayHyeon/Qwen_0.5-DPOP_3e-6-2ep_0alp_5lam
+JayHyeon/Qwen_0.5-IRPO_3e-6-2ep_1alp_0lam
+JayHyeon/Qwen_0.5-IRPO_3e-6-3ep_1alp_0lam
+JayHyeon/Qwen_0.5-DPOP_3e-6-3ep_0alp_5lam
+JayHyeon/Qwen_0.5-IRPO_3e-6-1ep_1alp_0lam
+JayHyeon/Qwen_0.5-MDPO_0.3_5e-7-3ep_0alp_0lam
+JayHyeon/Qwen_0.5-MDPO_0.3_3e-6-3ep_0alp_0lam
+JayHyeon/Qwen_0.5-MDPO_0.7_5e-7-3ep_0alp_0lam
+JayHyeon/Qwen_0.5-MDPO_0.7_3e-6-3ep_0alp_0lam
+Sakalti/Neptuno-Alpha
+FlofloB/smollm2-135M_pretrained_400k_fineweb_uncovai_selected
+FlofloB/smollm2-135M_pretrained_600k_fineweb_uncovai_selected
+DreadPoor/BaeZel_V3-8B-Model_Stock
+Daemontatox/AetherUncensored
+FlofloB/smollm2-135M_pretrained_1400k_fineweb_uncovai_selected
+CultriX/Qwen2.5-14B-BrocaV9
+DavidAU/Gemma-The-Writer-J.GutenBerg-10B
+OpenBuddy/openbuddy-llama3.3-70b-v24.1-131k
+deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
+deepseek-ai/DeepSeek-R1-Distill-Llama-8B
+deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
+deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
+deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
+deepseek-ai/DeepSeek-R1-Distill-Llama-70B
+nvidia/AceMath-1.5B-Instruct
+nvidia/AceMath-7B-RM
+nvidia/AceMath-7B-Instruct
+nvidia/AceInstruct-1.5B
+nvidia/AceInstruct-7B
+nvidia/AceInstruct-72B
+nvidia/AceMath-72B-Instruct
+Qwen/Qwen2.5-7B-Instruct-1M
+Qwen/Qwen2.5-14B-Instruct-1M
+nvidia/AceMath-72B-RM
+mistralai/Mistral-Small-24B-Base-2501
+meta-llama/Llama-3.1-8B-Instruct