@@ -490,24 +490,24 @@ <h2>Supported models</h2>
490490 <p>28 architectures across 16 model families. Load any GGUF model from HuggingFace.</p>
491491 </div>
492492 <div class="model-grid">
493- <div class="model-card"><div class="name">Gemma 3/3n</div><div class="status prod">Production</div></div>
494- <div class="model-card"><div class="name">Llama 3/4</div><div class="status prod">Production</div></div>
495- <div class="model-card"><div class="name">Qwen 2.5</div><div class="status prod">Production</div></div>
496- <div class="model-card"><div class="name">Mistral/Mixtral</div><div class="status prod">Production</div></div>
497- <div class="model-card"><div class="name">Phi 3/4</div><div class="status prod">Production</div></div>
493+ <div class="model-card"><div class="name">Gemma 3/3n</div><div class="status prod">Transformer</div></div>
494+ <div class="model-card"><div class="name">Llama 3/4</div><div class="status prod">Transformer</div></div>
495+ <div class="model-card"><div class="name">Qwen 2.5</div><div class="status prod">Transformer</div></div>
496+ <div class="model-card"><div class="name">Mistral/Mixtral</div><div class="status prod">Transformer + MoE</div></div>
497+ <div class="model-card"><div class="name">Phi 3/4</div><div class="status prod">Transformer</div></div>
498498 <div class="model-card"><div class="name">DeepSeek V3</div><div class="status prod">MLA + MoE</div></div>
499- <div class="model-card"><div class="name">GPT-2</div><div class="status prod">TinyStories</div></div>
500- <div class="model-card"><div class="name">Nemotron-H</div><div class="status">Hybrid Mamba+ MoE</div></div>
501- <div class="model-card"><div class="name">MiniMax M2</div><div class="status">Sigmoid MoE</div></div>
502- <div class="model-card"><div class="name">Command R</div><div class="status prod">Production</div></div>
503- <div class="model-card"><div class="name">Falcon</div><div class="status prod">Production</div></div>
504- <div class="model-card"><div class="name">RWKV</div><div class="status">Linear attention</div></div>
505- <div class="model-card"><div class="name">Mamba/Mamba 3</div><div class="status">State space</div></div>
506- <div class="model-card"><div class="name">Jamba</div><div class="status">Hybrid SSM</div></div>
507- <div class="model-card"><div class="name">Whisper</div><div class="status">Audio</div></div>
508- <div class="model-card"><div class="name">LLaVA/Qwen-VL</div><div class="status">Vision-language</div></div>
509- <div class="model-card"><div class="name">BERT</div><div class="status">Encoder</div></div>
510- <div class="model-card"><div class="name">Granite TS</div><div class="status">Time series</div></div>
499+ <div class="model-card"><div class="name">GPT-2</div><div class="status prod">Transformer</div></div>
500+ <div class="model-card"><div class="name">Nemotron-H</div><div class="status prod">Hybrid Mamba + MoE</div></div>
501+ <div class="model-card"><div class="name">MiniMax M2</div><div class="status prod">Sigmoid MoE</div></div>
502+ <div class="model-card"><div class="name">Command R</div><div class="status prod">Transformer</div></div>
503+ <div class="model-card"><div class="name">Falcon</div><div class="status prod">Transformer</div></div>
504+ <div class="model-card"><div class="name">RWKV</div><div class="status prod">Linear attention</div></div>
505+ <div class="model-card"><div class="name">Mamba/Mamba 3</div><div class="status prod">State space model</div></div>
506+ <div class="model-card"><div class="name">Jamba</div><div class="status prod">Hybrid SSM + Transformer</div></div>
507+ <div class="model-card"><div class="name">Whisper</div><div class="status prod">Audio transcription</div></div>
508+ <div class="model-card"><div class="name">LLaVA/Qwen-VL</div><div class="status prod">Vision-language</div></div>
509+ <div class="model-card"><div class="name">BERT</div><div class="status prod">Encoder</div></div>
510+ <div class="model-card"><div class="name">Granite TS</div><div class="status prod">Time series</div></div>
511511 </div>
512512 <div style="text-align:center;margin-top:32px">
513513 <p style="color:var(--fg3);font-size:.875rem">Uses GGUF as the sole model format. Compatible with llama.cpp, Ollama, LM Studio, and GPT4All model files.</p>
0 commit comments