Spaces:
Running
Running
Pinkstack/SuperThoughts-CoT-14B-16k-o1-QwQ | |
prithivMLmods/QwQ-LCoT-14B-Conversational | |
pankajmathur/orca_mini_phi-4 | |
01-ai/Yi-34B | |
Deci/DeciLM-7B | |
Qwen/Qwen1.5-7B | |
meta-llama/Meta-Llama-3-8B-Instruct | |
mistralai/Mistral-7B-v0.1 | |
microsoft/Phi-3-mini-4k-instruct | |
01-ai/Yi-1.5-9B-Chat | |
LLM360/K2 | |
01-ai/Yi-1.5-9B | |
meta-llama/Meta-Llama-3-8B | |
google/gemma-7b | |
google/recurrentgemma-2b | |
databricks/dbrx-base | |
meta-llama/Meta-Llama-3-70B-Instruct | |
HuggingFaceH4/zephyr-7b-beta | |
HuggingFaceH4/zephyr-7b-alpha | |
mistralai/Mistral-7B-v0.3 | |
mlabonne/AlphaMonarch-7B | |
mlabonne/Beyonder-4x7B-v3 | |
01-ai/Yi-1.5-6B-Chat | |
01-ai/Yi-1.5-6B | |
01-ai/Yi-1.5-9B-32K | |
01-ai/Yi-6B | |
stabilityai/stablelm-2-zephyr-1_6b | |
stabilityai/stablelm-2-1_6b-chat | |
01-ai/Yi-6B-Chat | |
stabilityai/stablelm-zephyr-3b | |
01-ai/Yi-1.5-9B-Chat-16K | |
stabilityai/stablelm-2-1_6b | |
allenai/OLMo-7B-hf | |
allenai/OLMo-7B-Instruct-hf | |
allenai/OLMo-1.7-7B-hf | |
Qwen/Qwen1.5-0.5B | |
mistral-community/Mixtral-8x22B-v0.1 | |
01-ai/Yi-1.5-34B | |
01-ai/Yi-1.5-34B-32K | |
01-ai/Yi-34B-Chat | |
microsoft/phi-1 | |
meta-llama/Llama-2-7b-chat-hf | |
meta-llama/Llama-2-7b-hf | |
meta-llama/Llama-2-70b-chat-hf | |
meta-llama/Meta-Llama-3-70B | |
meta-llama/Llama-2-70b-hf | |
microsoft/phi-1_5 | |
microsoft/phi-2 | |
Qwen/Qwen2-1.5B | |
Qwen/Qwen2-0.5B | |
google/gemma-2b | |
mlabonne/NeuralDaredevil-8B-abliterated | |
Qwen/Qwen2-7B | |
HuggingFaceH4/zephyr-7b-gemma-v0.1 | |
stabilityai/stablelm-2-12b-chat | |
Qwen/Qwen2-7B-Instruct | |
Qwen/Qwen1.5-4B-Chat | |
Qwen/Qwen1.5-0.5B-Chat | |
Qwen/Qwen1.5-1.8B-Chat | |
Qwen/Qwen1.5-14B-Chat | |
Qwen/Qwen1.5-7B-Chat | |
meta-llama/Llama-2-13b-chat-hf | |
Qwen/Qwen1.5-1.8B | |
Qwen/Qwen1.5-14B | |
tiiuae/falcon-7b | |
databricks/dolly-v2-7b | |
Qwen/Qwen1.5-MoE-A2.7B | |
Qwen/Qwen1.5-MoE-A2.7B-Chat | |
01-ai/Yi-1.5-34B-Chat | |
01-ai/Yi-34B-200K | |
abacusai/Smaug-34B-v0.1 | |
abacusai/Smaug-72B-v0.1 | |
google/gemma-7b-it | |
HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1 | |
google/gemma-2b-it | |
google/gemma-1.1-2b-it | |
google/gemma-1.1-7b-it | |
mistralai/Mistral-7B-Instruct-v0.1 | |
google/recurrentgemma-2b-it | |
mlabonne/OrpoLlama-3-8B | |
mlabonne/phixtral-2x2_8 | |
Qwen/Qwen2-1.5B-Instruct | |
stabilityai/stablelm-2-12b | |
Qwen/Qwen1.5-4B | |
stabilityai/stablelm-3b-4e1t | |
microsoft/Phi-3-medium-4k-instruct | |
Qwen/Qwen2-0.5B-Instruct | |
deepseek-ai/deepseek-llm-7b-chat | |
microsoft/Phi-3-small-128k-instruct | |
mistral-community/Mistral-7B-v0.2 | |
meta-llama/Llama-2-13b-hf | |
CohereForAI/aya-23-8B | |
databricks/dolly-v2-3b | |
databricks/dolly-v2-12b | |
deepseek-ai/deepseek-moe-16b-chat | |
mistralai/Mistral-7B-Instruct-v0.3 | |
deepseek-ai/deepseek-moe-16b-base | |
microsoft/DialoGPT-medium | |
mistralai/Mixtral-8x7B-Instruct-v0.1 | |
deepseek-ai/deepseek-llm-7b-base | |
databricks/dolly-v1-6b | |
mistralai/Mixtral-8x7B-v0.1 | |
CohereForAI/c4ai-command-r-v01 | |
CohereForAI/aya-23-35B | |
mistral-community/mixtral-8x22B-v0.3 | |
tiiuae/falcon-40b-instruct | |
tiiuae/falcon-40b | |
CohereForAI/c4ai-command-r-plus | |
microsoft/Orca-2-7b | |
Qwen/Qwen1.5-110B-Chat | |
allenai/OLMo-1B-hf | |
microsoft/Orca-2-13b | |
LLM360/K2-Chat | |
mistralai/Mixtral-8x22B-v0.1 | |
microsoft/Phi-3-mini-128k-instruct | |
Qwen/Qwen2-72B-Instruct | |
Qwen/Qwen1.5-110B | |
Qwen/Qwen1.5-32B-Chat | |
Qwen/Qwen2-72B | |
deepseek-ai/deepseek-llm-67b-chat | |
Qwen/Qwen1.5-32B | |
NousResearch/Yarn-Llama-2-13b-128k | |
google/recurrentgemma-9b | |
google/recurrentgemma-9b-it | |
pankajmathur/orca_mini_7b | |
meta-llama/Meta-Llama-3.1-8B | |
01-ai/Yi-1.5-34B-Chat-16K | |
meta-llama/Meta-Llama-3.1-70B | |
HuggingFaceTB/SmolLM-1.7B | |
mlabonne/Daredevil-8B | |
HuggingFaceTB/SmolLM-1.7B-Instruct | |
HuggingFaceTB/SmolLM-135M-Instruct | |
HuggingFaceTB/SmolLM-135M | |
HuggingFaceTB/SmolLM-360M-Instruct | |
HuggingFaceTB/SmolLM-360M | |
meta-llama/Meta-Llama-3.1-8B-Instruct | |
mistralai/Mistral-Nemo-Instruct-2407 | |
mistralai/Mistral-Nemo-Base-2407 | |
meta-llama/Meta-Llama-3.1-70B-Instruct | |
mlabonne/NeuralBeagle14-7B | |
mlabonne/Daredevil-8B-abliterated | |
tiiuae/falcon-mamba-7b | |
BAAI/Infinity-Instruct-3M-0613-Llama3-70B | |
google/flan-t5-small | |
stabilityai/StableBeluga2 | |
google/gemma-2-2b-it | |
google/gemma-2-2b | |
abacusai/Smaug-Llama-3-70B-Instruct-32K | |
abacusai/Smaug-Qwen2-72B-Instruct | |
0-hero/Matter-0.2-7B-DPO | |
google/flan-t5-xl | |
abacusai/Llama-3-Smaug-8B | |
DeepMount00/Llama-3-8b-Ita | |
google/codegemma-1.1-2b | |
Qwen/Qwen2-57B-A14B-Instruct | |
microsoft/Phi-3.5-mini-instruct | |
microsoft/Phi-3.5-MoE-instruct | |
nvidia/Mistral-NeMo-Minitron-8B-Base | |
google/gemma-2-27b-it | |
google/gemma-2-27b | |
google/flan-t5-base | |
google/flan-t5-large | |
google/flan-t5-xxl | |
google/flan-ul2 | |
AALF/gemma-2-27b-it-SimPO-37K | |
microsoft/Phi-3-medium-128k-instruct | |
microsoft/Phi-3-small-8k-instruct | |
mlabonne/ChimeraLlama-3-8B-v3 | |
mlabonne/ChimeraLlama-3-8B-v2 | |
abacusai/Smaug-Mixtral-v0.1 | |
abacusai/Dracarys-72B-Instruct | |
abacusai/Liberated-Qwen1.5-14B | |
CoolSpring/Qwen2-0.5B-Abyme | |
abacusai/bigstral-12b-32k | |
google/mt5-small | |
google/mt5-base | |
google/umt5-base | |
google/switch-base-8 | |
mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated | |
google/mt5-xxl | |
abacusai/bigyi-15b | |
Qwen/Qwen2.5-7B-Instruct | |
Qwen/Qwen2.5-7B | |
Qwen/Qwen2.5-14B-Instruct | |
Qwen/Qwen2.5-14B | |
mistralai/Mistral-Small-Instruct-2409 | |
Qwen/Qwen2.5-3B-Instruct | |
Qwen/Qwen2.5-32B-Instruct | |
Qwen/Qwen2.5-0.5B-Instruct | |
Qwen/Qwen2.5-0.5B | |
Qwen/Qwen2.5-1.5B | |
Qwen/Qwen2.5-1.5B-Instruct | |
Qwen/Qwen2.5-3B | |
Qwen/Qwen2.5-32B | |
Qwen/Qwen2.5-72B-Instruct | |
Qwen/Qwen2.5-72B | |
Qwen/Qwen2.5-Coder-7B-Instruct | |
Qwen/Qwen2.5-Math-7B-Instruct | |
CohereForAI/c4ai-command-r-plus-08-2024 | |
Qwen/Qwen2-Math-7B | |
1TuanPham/T-VisStar-7B-v0.1 | |
Qwen/Qwen2.5-Coder-7B | |
Qwen/Qwen2-Math-72B-Instruct | |
meta-llama/Llama-3.2-1B-Instruct | |
meta-llama/Llama-3.2-1B | |
meta-llama/Llama-3.2-3B-Instruct | |
meta-llama/Llama-3.2-3B | |
mlabonne/BigQwen2.5-Echo-47B-Instruct | |
nvidia/Llama-3.1-Minitron-4B-Depth-Base | |
nvidia/Nemotron-Mini-4B-Instruct | |
nvidia/Minitron-4B-Base | |
nvidia/Minitron-8B-Base | |
AALF/gemma-2-27b-it-SimPO-37K-100steps | |
Qwen/Qwen2.5-Math-7B | |
Goekdeniz-Guelmez/Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v2 | |
mistralai/Codestral-22B-v0.1 | |
Qwen/Qwen2.5-Math-72B-Instruct | |
mlabonne/BigQwen2.5-52B-Instruct | |
Cran-May/T.E-8.1 | |
allenai/OLMoE-1B-7B-0924 | |
allenai/OLMoE-1B-7B-0924-Instruct | |
zelk12/recoilme-gemma-2-Ataraxy-9B-v0.1 | |
nvidia/Mistral-NeMo-Minitron-8B-Instruct | |
zelk12/recoilme-gemma-2-Gutenberg-Doppel-9B-v0.1 | |
google/gemma-2-2b-jpn-it | |
zelk12/recoilme-gemma-2-Ataraxy-9B-v0.2 | |
AtAndDev/Qwen2.5-1.5B-continuous-learnt | |
mlabonne/Hermes-3-Llama-3.1-70B-lorablated | |
nvidia/Llama-3.1-Nemotron-70B-Instruct-HF | |
Gunulhona/Gemma-Ko-Merge-PEFT | |
DeepAutoAI/d2nwg_causal_gpt2 | |
BlackBeenie/llama-3.1-8B-Galore-openassistant-guanaco | |
DeepMount00/Lexora-Lite-3B | |
Qwen/Qwen2-VL-7B-Instruct | |
Qwen/Qwen2-VL-72B-Instruct | |
TinyLlama/TinyLlama-1.1B-Chat-v0.5 | |
Marsouuu/lareneg1_78B-ECE-PRYMMAL-Martial | |
OpenBuddy/openbuddy-nemotron-70b-v23.1-131k | |
CohereForAI/aya-expanse-8b | |
CohereForAI/aya-expanse-32b | |
CultriX/Qwen2.5-14B-MegaMerge-pt2 | |
PJMixers-Dev/LLaMa-3.2-Instruct-JankMix-v0.2-SFT-HailMary-v0.1-KTO-3B | |
BramVanroy/fietje-2 | |
BramVanroy/fietje-2-chat | |
BramVanroy/GEITje-7B-ultra | |
Gunulhona/Gemma-Ko-Merge | |
BramVanroy/fietje-2-instruct | |
CombinHorizon/Rombos-Qwen2.5-7B-Inst-BaseMerge-TIES | |
DreadPoor/Aspire_1.3-8B_model-stock | |
HuggingFaceTB/SmolLM2-135M | |
HuggingFaceTB/SmolLM2-135M-Instruct | |
HuggingFaceTB/SmolLM2-360M | |
HuggingFaceTB/SmolLM2-1.7B | |
HuggingFaceTB/SmolLM2-1.7B-Instruct | |
3rd-Degree-Burn/Llama-3.1-8B-Squareroot-v1 | |
BlackBeenie/Neos-Gemma-2-9b | |
BlackBeenie/Neos-Llama-3.1-base | |
Qwen/Qwen2.5-Coder-14B-Instruct | |
Qwen/Qwen2.5-Coder-14B | |
HuggingFaceTB/SmolLM2-360M-Instruct | |
Dans-DiscountModels/Mistral-7b-v0.3-Test-E0.7 | |
Goekdeniz-Guelmez/Josiefied-Qwen2.5-0.5B-Instruct-abliterated-v1 | |
BlackBeenie/Bloslain-8B-v0.2 | |
3rd-Degree-Burn/L-3.1-Science-Writer-8B | |
CultriX/SeQwence-14B-v5 | |
Aurel9/testmerge-7b | |
CultriX/SeQwence-14B | |
mistralai/Mistral-Large-Instruct-2411 | |
AALF/FuseChat-Llama-3.1-8B-Instruct-preview | |
GoToCompany/llama3-8b-cpt-sahabatai-v1-instruct | |
AALF/FuseChat-Llama-3.1-8B-SFT-preview | |
allenai/Llama-3.1-Tulu-3-8B | |
allenai/Llama-3.1-Tulu-3-8B-DPO | |
allenai/Llama-3.1-Tulu-3-8B-SFT | |
allenai/Llama-3.1-Tulu-3-8B-RM | |
FlofloB/10k_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit | |
nvidia/OpenMath2-Llama3.1-8B | |
CultriX/Qwestion-14B | |
FlofloB/10k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit | |
FlofloB/40k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit | |
AGI-0/smartllama3.1-8B-001 | |
Delta-Vector/Control-8B-V1.1 | |
Junhoee/Qwen-Megumin | |
Dans-DiscountModels/mistral-7b-test-merged | |
CultriX/SeQwence-14Bv1 | |
CultriX/SeQwence-14B-EvolMerge | |
CultriX/SeQwence-14B-EvolMergev1 | |
BlackBeenie/Neos-Phi-3-14B-v0.1 | |
CultriX/SeQwence-14Bv3 | |
DreadPoor/Sweetened_Condensed_Milk-8B-Model_Stock | |
allenai/Llama-3.1-Tulu-3-70B-SFT | |
allenai/Llama-3.1-Tulu-3-70B | |
allenai/Llama-3.1-Tulu-3-70B-DPO | |
Qwen/QwQ-32B-Preview | |
Norquinal/Bravo | |
JackFram/llama-68m | |
JackFram/llama-160m | |
mistralai/Ministral-8B-Instruct-2410 | |
DreadPoor/Matryoshka-8B-LINEAR | |
ClaudioItaly/intelligence-cod-rag-7b-v3 | |
MaziyarPanahi/calme-3.2-instruct-78b | |
meta-llama/Llama-3.3-70B-Instruct | |
DreadPoor/remember_to_breathe-8b-Model-Stock | |
Corianas/Neural-Mistral-7B | |
nvidia/Hymba-1.5B-Base | |
nvidia/Hymba-1.5B-Instruct | |
CombinHorizon/Josiefied-abliteratedV4-Qwen2.5-14B-Inst-BaseMerge-TIES | |
CombinHorizon/huihui-ai-abliteratedV2-Qwen2.5-14B-Inst-BaseMerge-TIES | |
meta-llama/Llama-3.1-8B | |
CombinHorizon/huihui-ai-abliterated-Qwen2.5-32B-Inst-BaseMerge-TIES | |
CultriX/SeQwence-14Bv2 | |
AuraIndustries/Aura-8B | |
DRXD1000/Atlas-7B | |
Qwen/Qwen2.5-Coder-32B-Instruct | |
Qwen/Qwen2.5-Coder-32B | |
LGAI-EXAONE/EXAONE-3.5-7.8B-Instruct | |
Goekdeniz-Guelmez/josie-7b-v6.0-step2000 | |
Corianas/Quokka_2.7b | |
tiiuae/Falcon3-7B-Base | |
tiiuae/Falcon3-10B-Base | |
tiiuae/Falcon3-Mamba-7B-Base | |
tiiuae/Falcon3-3B-Base | |
tiiuae/Falcon3-Mamba-7B-Instruct | |
tiiuae/Falcon3-1B-Base | |
tiiuae/Falcon3-1B-Instruct | |
tiiuae/Falcon3-3B-Instruct | |
tiiuae/Falcon3-10B-Instruct | |
tiiuae/Falcon3-7B-Instruct | |
Alsebay/Qwen2.5-7B-test-novelist | |
AuraIndustries/Aura-4B | |
T145/ZEUS-8B-V8 | |
EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Empathy | |
Aashraf995/Creative-7B-nerd | |
Aashraf995/Qwen-Evo-7B | |
Aashraf995/QwenStock-14B | |
Aashraf995/Gemma-Evo-10B | |
AuraIndustries/Aura-MoE-2x4B | |
Bllossom/llama-3.2-Korean-Bllossom-AICA-5B | |
AuraIndustries/Aura-MoE-2x4B-v2 | |
HelpingAI/Cipher-20B | |
HPAI-BSC/Qwen2.5-Aloe-Beta-7B | |
DreadPoor/Again-8B-Model_Stock | |
PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B | |
DreadPoor/Elusive_Dragon_Heart-8B-LINEAR | |
CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct-2412 | |
CultriX/Qwen2.5-14B-Emerged | |
CultriX/Qwen2.5-14B-Wernickev3 | |
CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct | |
CohereForAI/c4ai-command-r7b-12-2024 | |
EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Logic | |
CombinHorizon/zetasepic-abliteratedV2-Qwen2.5-32B-Inst-BaseMerge-TIES | |
NyxKrage/Microsoft_Phi-4 | |
DreadPoor/Casuar-9B-Model_Stock | |
CultriX/Qwen2.5-14B-Unity | |
CultriX/Qwen2.5-14B-Broca | |
CultriX/Qwenfinity-2.5-14B | |
CultriX/Qwen2.5-14B-Brocav7 | |
CultriX/Qwen2.5-14B-Brocav3 | |
CultriX/Qwen2.5-14B-Brocav6 | |
CultriX/Qwen2.5-14B-FinalMerge | |
ContactDoctor/Bio-Medical-Llama-3-8B | |
Daemontatox/RA_Reasoner | |
Daemontatox/PathfinderAI | |
JayHyeon/Qwen-0.5B-eDPO-5epoch | |
JayHyeon/Qwen-0.5B-IRPO-5epoch | |
JayHyeon/Qwen-0.5B-DPO-5epoch | |
JayHyeon/Qwen2.5-0.5B-Instruct-SFT | |
JayHyeon/Qwen2.5-0.5B-Instruct-SFT-IRPO-1epoch_v1 | |
DreadPoor/UNTESTED-VENN_1.2-8B-Model_Stock | |
JayHyeon/Qwen2.5-0.5B-SFT-1e-4 | |
Daemontatox/AetherTOT | |
Daemontatox/PixelParse_AI | |
DavieLion/Llama-3.2-1B-SPIN-iter3 | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-4-3ep | |
Daemontatox/RA_Reasoner2.0 | |
Daemontatox/AetherSett | |
Daemontatox/Sphinx2.0 | |
Daemontatox/PathFinderAI2.0 | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam_2ep | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam_1ep | |
DreadPoor/Happy_New_Year-8B-Model_Stock | |
Daemontatox/TinySphinx2.0 | |
Daemontatox/SphinX | |
Daemontatox/PathFinderAi3.0 | |
Daemontatox/NemoR | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_2ep_0alp_0lam | |
Ahdoot/StructuredThinker-v0.3-MoreStructure | |
Daemontatox/RA2.0 | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-2ep_0alp_0lam | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-2ep_1alp_0lam | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-1ep_1alp_0lam | |
DebateLabKIT/Llama-3.1-Argunaut-1-8B-SFT | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-3ep_0alp_0lam | |
Daemontatox/MawaredT1 | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-1ep_1alp_0lam | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-3ep_1alp_0lam | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-3ep_0alp_0lam | |
DreadPoor/Derivative-8B-Model_Stock | |
Alepach/notHumpback-M1 | |
Alepach/notHumpback-M0 | |
Danielbrdz/Barcenas-10b | |
Ahdoot/Test_StealthThinker | |
FuseAI/FuseChat-Llama-3.1-8B-Instruct | |
JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-2ep_0alp_0lam | |
DreadPoor/Derivative_V2_ALT-8B-Model_Stock | |
DreadPoor/Derivative_V2-8B-Model_Stock | |
Daemontatox/CogitoZ14 | |
Goekdeniz-Guelmez/josie-7b-v6.0 | |
Goekdeniz-Guelmez/josie-3b-v6.0 | |
allenai/OLMo-2-1124-7B-Instruct | |
DreadPoor/Derivative_V3-8B-Model_Stock | |
Daemontatox/CogitoZ | |
microsoft/phi-4 | |
FlofloB/smollm2-135M_pretrained_200k_fineweb_uncovai_selected | |
JayHyeon/Qwen_0.5-DPO_5e-7-2ep_0alp_0lam | |
JayHyeon/Qwen_0.5-DPO_5e-7-1ep_0alp_0lam | |
JayHyeon/Qwen_0.5-DPOP_5e-7-2ep_0alp_5lam | |
JayHyeon/Qwen_0.5-DPOP_5e-7-3ep_0alp_5lam | |
JayHyeon/Qwen_0.5-DPOP_5e-7-1ep_0alp_5lam | |
JayHyeon/Qwen_0.5-DPO_3e-6-2ep_0alp_0lam | |
JayHyeon/Qwen_0.5-DPO_3e-6-1ep_0alp_0lam | |
JayHyeon/Qwen_0.5-DPOP_3e-6-2ep_0alp_5lam | |
JayHyeon/Qwen_0.5-IRPO_3e-6-2ep_1alp_0lam | |
JayHyeon/Qwen_0.5-IRPO_3e-6-3ep_1alp_0lam | |
JayHyeon/Qwen_0.5-DPOP_3e-6-3ep_0alp_5lam | |
JayHyeon/Qwen_0.5-IRPO_3e-6-1ep_1alp_0lam | |
JayHyeon/Qwen_0.5-MDPO_0.3_5e-7-3ep_0alp_0lam | |
JayHyeon/Qwen_0.5-MDPO_0.3_3e-6-3ep_0alp_0lam | |
JayHyeon/Qwen_0.5-MDPO_0.7_5e-7-3ep_0alp_0lam | |
JayHyeon/Qwen_0.5-MDPO_0.7_3e-6-3ep_0alp_0lam | |
Sakalti/Neptuno-Alpha | |
FlofloB/smollm2-135M_pretrained_400k_fineweb_uncovai_selected | |
FlofloB/smollm2-135M_pretrained_600k_fineweb_uncovai_selected | |
DreadPoor/BaeZel_V3-8B-Model_Stock | |
Daemontatox/AetherUncensored | |
FlofloB/smollm2-135M_pretrained_1400k_fineweb_uncovai_selected | |
CultriX/Qwen2.5-14B-BrocaV9 | |
DavidAU/Gemma-The-Writer-J.GutenBerg-10B | |
OpenBuddy/openbuddy-llama3.3-70b-v24.1-131k | |
deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | |
deepseek-ai/DeepSeek-R1-Distill-Llama-8B | |
deepseek-ai/DeepSeek-R1-Distill-Qwen-7B | |
deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B | |
deepseek-ai/DeepSeek-R1-Distill-Qwen-32B | |
deepseek-ai/DeepSeek-R1-Distill-Llama-70B | |
nvidia/AceMath-1.5B-Instruct | |
nvidia/AceMath-7B-RM | |
nvidia/AceMath-7B-Instruct | |
nvidia/AceInstruct-1.5B | |
nvidia/AceInstruct-7B | |
nvidia/AceInstruct-72B | |
nvidia/AceMath-72B-Instruct | |
Qwen/Qwen2.5-7B-Instruct-1M | |
Qwen/Qwen2.5-14B-Instruct-1M | |
nvidia/AceMath-72B-RM | |
mistralai/Mistral-Small-24B-Base-2501 | |
meta-llama/Llama-3.1-8B-Instruct | |