Spaces:

bethgelab
/

lm-similarity

Running

Joschka Strueber

[Add, Ref] Add more info and table on metric, move model list to data/

b90e0d3 8 days ago

14.2 kB

	Pinkstack/SuperThoughts-CoT-14B-16k-o1-QwQ
	prithivMLmods/QwQ-LCoT-14B-Conversational
	pankajmathur/orca_mini_phi-4
	01-ai/Yi-34B
	Deci/DeciLM-7B
	Qwen/Qwen1.5-7B
	meta-llama/Meta-Llama-3-8B-Instruct
	mistralai/Mistral-7B-v0.1
	microsoft/Phi-3-mini-4k-instruct
	01-ai/Yi-1.5-9B-Chat
	LLM360/K2
	01-ai/Yi-1.5-9B
	meta-llama/Meta-Llama-3-8B
	google/gemma-7b
	google/recurrentgemma-2b
	databricks/dbrx-base
	meta-llama/Meta-Llama-3-70B-Instruct
	HuggingFaceH4/zephyr-7b-beta
	HuggingFaceH4/zephyr-7b-alpha
	mistralai/Mistral-7B-v0.3
	mlabonne/AlphaMonarch-7B
	mlabonne/Beyonder-4x7B-v3
	01-ai/Yi-1.5-6B-Chat
	01-ai/Yi-1.5-6B
	01-ai/Yi-1.5-9B-32K
	01-ai/Yi-6B
	stabilityai/stablelm-2-zephyr-1_6b
	stabilityai/stablelm-2-1_6b-chat
	01-ai/Yi-6B-Chat
	stabilityai/stablelm-zephyr-3b
	01-ai/Yi-1.5-9B-Chat-16K
	stabilityai/stablelm-2-1_6b
	allenai/OLMo-7B-hf
	allenai/OLMo-7B-Instruct-hf
	allenai/OLMo-1.7-7B-hf
	Qwen/Qwen1.5-0.5B
	mistral-community/Mixtral-8x22B-v0.1
	01-ai/Yi-1.5-34B
	01-ai/Yi-1.5-34B-32K
	01-ai/Yi-34B-Chat
	microsoft/phi-1
	meta-llama/Llama-2-7b-chat-hf
	meta-llama/Llama-2-7b-hf
	meta-llama/Llama-2-70b-chat-hf
	meta-llama/Meta-Llama-3-70B
	meta-llama/Llama-2-70b-hf
	microsoft/phi-1_5
	microsoft/phi-2
	Qwen/Qwen2-1.5B
	Qwen/Qwen2-0.5B
	google/gemma-2b
	mlabonne/NeuralDaredevil-8B-abliterated
	Qwen/Qwen2-7B
	HuggingFaceH4/zephyr-7b-gemma-v0.1
	stabilityai/stablelm-2-12b-chat
	Qwen/Qwen2-7B-Instruct
	Qwen/Qwen1.5-4B-Chat
	Qwen/Qwen1.5-0.5B-Chat
	Qwen/Qwen1.5-1.8B-Chat
	Qwen/Qwen1.5-14B-Chat
	Qwen/Qwen1.5-7B-Chat
	meta-llama/Llama-2-13b-chat-hf
	Qwen/Qwen1.5-1.8B
	Qwen/Qwen1.5-14B
	tiiuae/falcon-7b
	databricks/dolly-v2-7b
	Qwen/Qwen1.5-MoE-A2.7B
	Qwen/Qwen1.5-MoE-A2.7B-Chat
	01-ai/Yi-1.5-34B-Chat
	01-ai/Yi-34B-200K
	abacusai/Smaug-34B-v0.1
	abacusai/Smaug-72B-v0.1
	google/gemma-7b-it
	HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1
	google/gemma-2b-it
	google/gemma-1.1-2b-it
	google/gemma-1.1-7b-it
	mistralai/Mistral-7B-Instruct-v0.1
	google/recurrentgemma-2b-it
	mlabonne/OrpoLlama-3-8B
	mlabonne/phixtral-2x2_8
	Qwen/Qwen2-1.5B-Instruct
	stabilityai/stablelm-2-12b
	Qwen/Qwen1.5-4B
	stabilityai/stablelm-3b-4e1t
	microsoft/Phi-3-medium-4k-instruct
	Qwen/Qwen2-0.5B-Instruct
	deepseek-ai/deepseek-llm-7b-chat
	microsoft/Phi-3-small-128k-instruct
	mistral-community/Mistral-7B-v0.2
	meta-llama/Llama-2-13b-hf
	CohereForAI/aya-23-8B
	databricks/dolly-v2-3b
	databricks/dolly-v2-12b
	deepseek-ai/deepseek-moe-16b-chat
	mistralai/Mistral-7B-Instruct-v0.3
	deepseek-ai/deepseek-moe-16b-base
	microsoft/DialoGPT-medium
	mistralai/Mixtral-8x7B-Instruct-v0.1
	deepseek-ai/deepseek-llm-7b-base
	databricks/dolly-v1-6b
	mistralai/Mixtral-8x7B-v0.1
	CohereForAI/c4ai-command-r-v01
	CohereForAI/aya-23-35B
	mistral-community/mixtral-8x22B-v0.3
	tiiuae/falcon-40b-instruct
	tiiuae/falcon-40b
	CohereForAI/c4ai-command-r-plus
	microsoft/Orca-2-7b
	Qwen/Qwen1.5-110B-Chat
	allenai/OLMo-1B-hf
	microsoft/Orca-2-13b
	LLM360/K2-Chat
	mistralai/Mixtral-8x22B-v0.1
	microsoft/Phi-3-mini-128k-instruct
	Qwen/Qwen2-72B-Instruct
	Qwen/Qwen1.5-110B
	Qwen/Qwen1.5-32B-Chat
	Qwen/Qwen2-72B
	deepseek-ai/deepseek-llm-67b-chat
	Qwen/Qwen1.5-32B
	NousResearch/Yarn-Llama-2-13b-128k
	google/recurrentgemma-9b
	google/recurrentgemma-9b-it
	pankajmathur/orca_mini_7b
	meta-llama/Meta-Llama-3.1-8B
	01-ai/Yi-1.5-34B-Chat-16K
	meta-llama/Meta-Llama-3.1-70B
	HuggingFaceTB/SmolLM-1.7B
	mlabonne/Daredevil-8B
	HuggingFaceTB/SmolLM-1.7B-Instruct
	HuggingFaceTB/SmolLM-135M-Instruct
	HuggingFaceTB/SmolLM-135M
	HuggingFaceTB/SmolLM-360M-Instruct
	HuggingFaceTB/SmolLM-360M
	meta-llama/Meta-Llama-3.1-8B-Instruct
	mistralai/Mistral-Nemo-Instruct-2407
	mistralai/Mistral-Nemo-Base-2407
	meta-llama/Meta-Llama-3.1-70B-Instruct
	mlabonne/NeuralBeagle14-7B
	mlabonne/Daredevil-8B-abliterated
	tiiuae/falcon-mamba-7b
	BAAI/Infinity-Instruct-3M-0613-Llama3-70B
	google/flan-t5-small
	stabilityai/StableBeluga2
	google/gemma-2-2b-it
	google/gemma-2-2b
	abacusai/Smaug-Llama-3-70B-Instruct-32K
	abacusai/Smaug-Qwen2-72B-Instruct
	0-hero/Matter-0.2-7B-DPO
	google/flan-t5-xl
	abacusai/Llama-3-Smaug-8B
	DeepMount00/Llama-3-8b-Ita
	google/codegemma-1.1-2b
	Qwen/Qwen2-57B-A14B-Instruct
	microsoft/Phi-3.5-mini-instruct
	microsoft/Phi-3.5-MoE-instruct
	nvidia/Mistral-NeMo-Minitron-8B-Base
	google/gemma-2-27b-it
	google/gemma-2-27b
	google/flan-t5-base
	google/flan-t5-large
	google/flan-t5-xxl
	google/flan-ul2
	AALF/gemma-2-27b-it-SimPO-37K
	microsoft/Phi-3-medium-128k-instruct
	microsoft/Phi-3-small-8k-instruct
	mlabonne/ChimeraLlama-3-8B-v3
	mlabonne/ChimeraLlama-3-8B-v2
	abacusai/Smaug-Mixtral-v0.1
	abacusai/Dracarys-72B-Instruct
	abacusai/Liberated-Qwen1.5-14B
	CoolSpring/Qwen2-0.5B-Abyme
	abacusai/bigstral-12b-32k
	google/mt5-small
	google/mt5-base
	google/umt5-base
	google/switch-base-8
	mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated
	google/mt5-xxl
	abacusai/bigyi-15b
	Qwen/Qwen2.5-7B-Instruct
	Qwen/Qwen2.5-7B
	Qwen/Qwen2.5-14B-Instruct
	Qwen/Qwen2.5-14B
	mistralai/Mistral-Small-Instruct-2409
	Qwen/Qwen2.5-3B-Instruct
	Qwen/Qwen2.5-32B-Instruct
	Qwen/Qwen2.5-0.5B-Instruct
	Qwen/Qwen2.5-0.5B
	Qwen/Qwen2.5-1.5B
	Qwen/Qwen2.5-1.5B-Instruct
	Qwen/Qwen2.5-3B
	Qwen/Qwen2.5-32B
	Qwen/Qwen2.5-72B-Instruct
	Qwen/Qwen2.5-72B
	Qwen/Qwen2.5-Coder-7B-Instruct
	Qwen/Qwen2.5-Math-7B-Instruct
	CohereForAI/c4ai-command-r-plus-08-2024
	Qwen/Qwen2-Math-7B
	1TuanPham/T-VisStar-7B-v0.1
	Qwen/Qwen2.5-Coder-7B
	Qwen/Qwen2-Math-72B-Instruct
	meta-llama/Llama-3.2-1B-Instruct
	meta-llama/Llama-3.2-1B
	meta-llama/Llama-3.2-3B-Instruct
	meta-llama/Llama-3.2-3B
	mlabonne/BigQwen2.5-Echo-47B-Instruct
	nvidia/Llama-3.1-Minitron-4B-Depth-Base
	nvidia/Nemotron-Mini-4B-Instruct
	nvidia/Minitron-4B-Base
	nvidia/Minitron-8B-Base
	AALF/gemma-2-27b-it-SimPO-37K-100steps
	Qwen/Qwen2.5-Math-7B
	Goekdeniz-Guelmez/Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v2
	mistralai/Codestral-22B-v0.1
	Qwen/Qwen2.5-Math-72B-Instruct
	mlabonne/BigQwen2.5-52B-Instruct
	Cran-May/T.E-8.1
	allenai/OLMoE-1B-7B-0924
	allenai/OLMoE-1B-7B-0924-Instruct
	zelk12/recoilme-gemma-2-Ataraxy-9B-v0.1
	nvidia/Mistral-NeMo-Minitron-8B-Instruct
	zelk12/recoilme-gemma-2-Gutenberg-Doppel-9B-v0.1
	google/gemma-2-2b-jpn-it
	zelk12/recoilme-gemma-2-Ataraxy-9B-v0.2
	AtAndDev/Qwen2.5-1.5B-continuous-learnt
	mlabonne/Hermes-3-Llama-3.1-70B-lorablated
	nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
	Gunulhona/Gemma-Ko-Merge-PEFT
	DeepAutoAI/d2nwg_causal_gpt2
	BlackBeenie/llama-3.1-8B-Galore-openassistant-guanaco
	DeepMount00/Lexora-Lite-3B
	Qwen/Qwen2-VL-7B-Instruct
	Qwen/Qwen2-VL-72B-Instruct
	TinyLlama/TinyLlama-1.1B-Chat-v0.5
	Marsouuu/lareneg1_78B-ECE-PRYMMAL-Martial
	OpenBuddy/openbuddy-nemotron-70b-v23.1-131k
	CohereForAI/aya-expanse-8b
	CohereForAI/aya-expanse-32b
	CultriX/Qwen2.5-14B-MegaMerge-pt2
	PJMixers-Dev/LLaMa-3.2-Instruct-JankMix-v0.2-SFT-HailMary-v0.1-KTO-3B
	BramVanroy/fietje-2
	BramVanroy/fietje-2-chat
	BramVanroy/GEITje-7B-ultra
	Gunulhona/Gemma-Ko-Merge
	BramVanroy/fietje-2-instruct
	CombinHorizon/Rombos-Qwen2.5-7B-Inst-BaseMerge-TIES
	DreadPoor/Aspire_1.3-8B_model-stock
	HuggingFaceTB/SmolLM2-135M
	HuggingFaceTB/SmolLM2-135M-Instruct
	HuggingFaceTB/SmolLM2-360M
	HuggingFaceTB/SmolLM2-1.7B
	HuggingFaceTB/SmolLM2-1.7B-Instruct
	3rd-Degree-Burn/Llama-3.1-8B-Squareroot-v1
	BlackBeenie/Neos-Gemma-2-9b
	BlackBeenie/Neos-Llama-3.1-base
	Qwen/Qwen2.5-Coder-14B-Instruct
	Qwen/Qwen2.5-Coder-14B
	HuggingFaceTB/SmolLM2-360M-Instruct
	Dans-DiscountModels/Mistral-7b-v0.3-Test-E0.7
	Goekdeniz-Guelmez/Josiefied-Qwen2.5-0.5B-Instruct-abliterated-v1
	BlackBeenie/Bloslain-8B-v0.2
	3rd-Degree-Burn/L-3.1-Science-Writer-8B
	CultriX/SeQwence-14B-v5
	Aurel9/testmerge-7b
	CultriX/SeQwence-14B
	mistralai/Mistral-Large-Instruct-2411
	AALF/FuseChat-Llama-3.1-8B-Instruct-preview
	GoToCompany/llama3-8b-cpt-sahabatai-v1-instruct
	AALF/FuseChat-Llama-3.1-8B-SFT-preview
	allenai/Llama-3.1-Tulu-3-8B
	allenai/Llama-3.1-Tulu-3-8B-DPO
	allenai/Llama-3.1-Tulu-3-8B-SFT
	allenai/Llama-3.1-Tulu-3-8B-RM
	FlofloB/10k_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit
	nvidia/OpenMath2-Llama3.1-8B
	CultriX/Qwestion-14B
	FlofloB/10k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit
	FlofloB/40k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit
	AGI-0/smartllama3.1-8B-001
	Delta-Vector/Control-8B-V1.1
	Junhoee/Qwen-Megumin
	Dans-DiscountModels/mistral-7b-test-merged
	CultriX/SeQwence-14Bv1
	CultriX/SeQwence-14B-EvolMerge
	CultriX/SeQwence-14B-EvolMergev1
	BlackBeenie/Neos-Phi-3-14B-v0.1
	CultriX/SeQwence-14Bv3
	DreadPoor/Sweetened_Condensed_Milk-8B-Model_Stock
	allenai/Llama-3.1-Tulu-3-70B-SFT
	allenai/Llama-3.1-Tulu-3-70B
	allenai/Llama-3.1-Tulu-3-70B-DPO
	Qwen/QwQ-32B-Preview
	Norquinal/Bravo
	JackFram/llama-68m
	JackFram/llama-160m
	mistralai/Ministral-8B-Instruct-2410
	DreadPoor/Matryoshka-8B-LINEAR
	ClaudioItaly/intelligence-cod-rag-7b-v3
	MaziyarPanahi/calme-3.2-instruct-78b
	meta-llama/Llama-3.3-70B-Instruct
	DreadPoor/remember_to_breathe-8b-Model-Stock
	Corianas/Neural-Mistral-7B
	nvidia/Hymba-1.5B-Base
	nvidia/Hymba-1.5B-Instruct
	CombinHorizon/Josiefied-abliteratedV4-Qwen2.5-14B-Inst-BaseMerge-TIES
	CombinHorizon/huihui-ai-abliteratedV2-Qwen2.5-14B-Inst-BaseMerge-TIES
	meta-llama/Llama-3.1-8B
	CombinHorizon/huihui-ai-abliterated-Qwen2.5-32B-Inst-BaseMerge-TIES
	CultriX/SeQwence-14Bv2
	AuraIndustries/Aura-8B
	DRXD1000/Atlas-7B
	Qwen/Qwen2.5-Coder-32B-Instruct
	Qwen/Qwen2.5-Coder-32B
	LGAI-EXAONE/EXAONE-3.5-7.8B-Instruct
	Goekdeniz-Guelmez/josie-7b-v6.0-step2000
	Corianas/Quokka_2.7b
	tiiuae/Falcon3-7B-Base
	tiiuae/Falcon3-10B-Base
	tiiuae/Falcon3-Mamba-7B-Base
	tiiuae/Falcon3-3B-Base
	tiiuae/Falcon3-Mamba-7B-Instruct
	tiiuae/Falcon3-1B-Base
	tiiuae/Falcon3-1B-Instruct
	tiiuae/Falcon3-3B-Instruct
	tiiuae/Falcon3-10B-Instruct
	tiiuae/Falcon3-7B-Instruct
	Alsebay/Qwen2.5-7B-test-novelist
	AuraIndustries/Aura-4B
	T145/ZEUS-8B-V8
	EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Empathy
	Aashraf995/Creative-7B-nerd
	Aashraf995/Qwen-Evo-7B
	Aashraf995/QwenStock-14B
	Aashraf995/Gemma-Evo-10B
	AuraIndustries/Aura-MoE-2x4B
	Bllossom/llama-3.2-Korean-Bllossom-AICA-5B
	AuraIndustries/Aura-MoE-2x4B-v2
	HelpingAI/Cipher-20B
	HPAI-BSC/Qwen2.5-Aloe-Beta-7B
	DreadPoor/Again-8B-Model_Stock
	PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B
	DreadPoor/Elusive_Dragon_Heart-8B-LINEAR
	CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct-2412
	CultriX/Qwen2.5-14B-Emerged
	CultriX/Qwen2.5-14B-Wernickev3
	CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct
	CohereForAI/c4ai-command-r7b-12-2024
	EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Logic
	CombinHorizon/zetasepic-abliteratedV2-Qwen2.5-32B-Inst-BaseMerge-TIES
	NyxKrage/Microsoft_Phi-4
	DreadPoor/Casuar-9B-Model_Stock
	CultriX/Qwen2.5-14B-Unity
	CultriX/Qwen2.5-14B-Broca
	CultriX/Qwenfinity-2.5-14B
	CultriX/Qwen2.5-14B-Brocav7
	CultriX/Qwen2.5-14B-Brocav3
	CultriX/Qwen2.5-14B-Brocav6
	CultriX/Qwen2.5-14B-FinalMerge
	ContactDoctor/Bio-Medical-Llama-3-8B
	Daemontatox/RA_Reasoner
	Daemontatox/PathfinderAI
	JayHyeon/Qwen-0.5B-eDPO-5epoch
	JayHyeon/Qwen-0.5B-IRPO-5epoch
	JayHyeon/Qwen-0.5B-DPO-5epoch
	JayHyeon/Qwen2.5-0.5B-Instruct-SFT
	JayHyeon/Qwen2.5-0.5B-Instruct-SFT-IRPO-1epoch_v1
	DreadPoor/UNTESTED-VENN_1.2-8B-Model_Stock
	JayHyeon/Qwen2.5-0.5B-SFT-1e-4
	Daemontatox/AetherTOT
	Daemontatox/PixelParse_AI
	DavieLion/Llama-3.2-1B-SPIN-iter3
	JayHyeon/Qwen2.5-0.5B-SFT-2e-4-3ep
	Daemontatox/RA_Reasoner2.0
	Daemontatox/AetherSett
	Daemontatox/Sphinx2.0
	Daemontatox/PathFinderAI2.0
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam_2ep
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam_1ep
	DreadPoor/Happy_New_Year-8B-Model_Stock
	Daemontatox/TinySphinx2.0
	Daemontatox/SphinX
	Daemontatox/PathFinderAi3.0
	Daemontatox/NemoR
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_2ep_0alp_0lam
	Ahdoot/StructuredThinker-v0.3-MoreStructure
	Daemontatox/RA2.0
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-2ep_0alp_0lam
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-2ep_1alp_0lam
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-1ep_1alp_0lam
	DebateLabKIT/Llama-3.1-Argunaut-1-8B-SFT
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-3ep_0alp_0lam
	Daemontatox/MawaredT1
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-1ep_1alp_0lam
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-3ep_1alp_0lam
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-3ep_0alp_0lam
	DreadPoor/Derivative-8B-Model_Stock
	Alepach/notHumpback-M1
	Alepach/notHumpback-M0
	Danielbrdz/Barcenas-10b
	Ahdoot/Test_StealthThinker
	FuseAI/FuseChat-Llama-3.1-8B-Instruct
	JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-2ep_0alp_0lam
	DreadPoor/Derivative_V2_ALT-8B-Model_Stock
	DreadPoor/Derivative_V2-8B-Model_Stock
	Daemontatox/CogitoZ14
	Goekdeniz-Guelmez/josie-7b-v6.0
	Goekdeniz-Guelmez/josie-3b-v6.0
	allenai/OLMo-2-1124-7B-Instruct
	DreadPoor/Derivative_V3-8B-Model_Stock
	Daemontatox/CogitoZ
	microsoft/phi-4
	FlofloB/smollm2-135M_pretrained_200k_fineweb_uncovai_selected
	JayHyeon/Qwen_0.5-DPO_5e-7-2ep_0alp_0lam
	JayHyeon/Qwen_0.5-DPO_5e-7-1ep_0alp_0lam
	JayHyeon/Qwen_0.5-DPOP_5e-7-2ep_0alp_5lam
	JayHyeon/Qwen_0.5-DPOP_5e-7-3ep_0alp_5lam
	JayHyeon/Qwen_0.5-DPOP_5e-7-1ep_0alp_5lam
	JayHyeon/Qwen_0.5-DPO_3e-6-2ep_0alp_0lam
	JayHyeon/Qwen_0.5-DPO_3e-6-1ep_0alp_0lam
	JayHyeon/Qwen_0.5-DPOP_3e-6-2ep_0alp_5lam
	JayHyeon/Qwen_0.5-IRPO_3e-6-2ep_1alp_0lam
	JayHyeon/Qwen_0.5-IRPO_3e-6-3ep_1alp_0lam
	JayHyeon/Qwen_0.5-DPOP_3e-6-3ep_0alp_5lam
	JayHyeon/Qwen_0.5-IRPO_3e-6-1ep_1alp_0lam
	JayHyeon/Qwen_0.5-MDPO_0.3_5e-7-3ep_0alp_0lam
	JayHyeon/Qwen_0.5-MDPO_0.3_3e-6-3ep_0alp_0lam
	JayHyeon/Qwen_0.5-MDPO_0.7_5e-7-3ep_0alp_0lam
	JayHyeon/Qwen_0.5-MDPO_0.7_3e-6-3ep_0alp_0lam
	Sakalti/Neptuno-Alpha
	FlofloB/smollm2-135M_pretrained_400k_fineweb_uncovai_selected
	FlofloB/smollm2-135M_pretrained_600k_fineweb_uncovai_selected
	DreadPoor/BaeZel_V3-8B-Model_Stock
	Daemontatox/AetherUncensored
	FlofloB/smollm2-135M_pretrained_1400k_fineweb_uncovai_selected
	CultriX/Qwen2.5-14B-BrocaV9
	DavidAU/Gemma-The-Writer-J.GutenBerg-10B
	OpenBuddy/openbuddy-llama3.3-70b-v24.1-131k
	deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
	deepseek-ai/DeepSeek-R1-Distill-Llama-8B
	deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
	deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
	deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
	deepseek-ai/DeepSeek-R1-Distill-Llama-70B
	nvidia/AceMath-1.5B-Instruct
	nvidia/AceMath-7B-RM
	nvidia/AceMath-7B-Instruct
	nvidia/AceInstruct-1.5B
	nvidia/AceInstruct-7B
	nvidia/AceInstruct-72B
	nvidia/AceMath-72B-Instruct
	Qwen/Qwen2.5-7B-Instruct-1M
	Qwen/Qwen2.5-14B-Instruct-1M
	nvidia/AceMath-72B-RM
	mistralai/Mistral-Small-24B-Base-2501
	meta-llama/Llama-3.1-8B-Instruct