Files
odysseus/services/hwfit/data/hf_models.json
2026-06-02 12:15:47 +09:00

19046 lines
473 KiB
JSON

[
{
"name": "echarlaix/tiny-random-PhiForCausalLM",
"provider": "echarlaix",
"parameter_count": "80K",
"parameters_raw": 80074,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 512,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi",
"hf_downloads": 24984,
"hf_likes": 0,
"release_date": "2024-03-29",
"_discovered": true
},
{
"name": "peft-internal-testing/tiny-random-GPT2LMHeadModel",
"provider": "peft-internal-testing",
"parameter_count": "83K",
"parameters_raw": 83161,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 512,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt2",
"hf_downloads": 37534,
"hf_likes": 0,
"release_date": "2025-11-17",
"_discovered": true
},
{
"name": "peft-internal-testing/tiny-random-gpt2",
"provider": "peft-internal-testing",
"parameter_count": "112K",
"parameters_raw": 111968,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 512,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt2",
"hf_downloads": 28458,
"hf_likes": 0,
"release_date": "2025-11-17",
"_discovered": true
},
{
"name": "peft-internal-testing/tiny-random-GPTJForCausalLM",
"provider": "peft-internal-testing",
"parameter_count": "129K",
"parameters_raw": 129184,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 512,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gptj",
"hf_downloads": 38953,
"hf_likes": 0,
"release_date": "2025-11-17",
"_discovered": true
},
{
"name": "allenai/Olmo-3-7B-Instruct",
"provider": "allenai",
"parameter_count": "528K",
"parameters_raw": 528384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 101787,
"hf_likes": 118,
"release_date": "2025-11-19",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/Olmo-3-7B-Instruct-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "allenai/Olmo-3-7B-Think",
"provider": "allenai",
"parameter_count": "528K",
"parameters_raw": 528384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 44414,
"hf_likes": 88,
"release_date": "2025-11-18",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/Olmo-3-7B-Think-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "allenai/Olmo-3-7B-Think-DPO",
"provider": "allenai",
"parameter_count": "528K",
"parameters_raw": 528384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 21555,
"hf_likes": 7,
"release_date": "2025-11-18",
"_discovered": true
},
{
"name": "MaxJeblick/llama2-0b-unit-test",
"provider": "maxjeblick",
"parameter_count": "771K",
"parameters_raw": 770940,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 1024,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 48409,
"hf_likes": 2,
"release_date": "2023-10-25",
"_discovered": true
},
{
"name": "peft-internal-testing/tiny-random-OPTForCausalLM",
"provider": "peft-internal-testing",
"parameter_count": "812K",
"parameters_raw": 812404,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 100,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "opt",
"hf_downloads": 388627,
"hf_likes": 0,
"release_date": "2025-11-13",
"_discovered": true
},
{
"name": "hmellor/tiny-random-LlamaForCausalLM",
"provider": "hmellor",
"parameter_count": "1M",
"parameters_raw": 1062992,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 1295572,
"hf_likes": 0,
"release_date": "2025-04-29",
"_discovered": true
},
{
"name": "peft-internal-testing/tiny-dummy-qwen2",
"provider": "peft-internal-testing",
"parameter_count": "1M",
"parameters_raw": 1217480,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 102441,
"hf_likes": 0,
"release_date": "2024-07-04",
"_discovered": true
},
{
"name": "SimpleStories/SimpleStories-1.25M",
"provider": "simplestories",
"parameter_count": "1M",
"parameters_raw": 1245824,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 512,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 86406,
"hf_likes": 1,
"release_date": "2025-04-22",
"_discovered": true
},
{
"name": "optimum-intel-internal-testing/tiny-random-Phi3ForCausalLM",
"provider": "optimum-intel-internal-testing",
"parameter_count": "2M",
"parameters_raw": 2072736,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 22058,
"hf_likes": 0,
"release_date": "2025-10-21",
"_discovered": true
},
{
"name": "llamafactory/tiny-random-qwen3",
"provider": "llamafactory",
"parameter_count": "2M",
"parameters_raw": 2439264,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Lightweight, edge deployment",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 47369,
"hf_likes": 0,
"release_date": "2026-01-06",
"_discovered": true
},
{
"name": "tiny-random/qwen3-next-moe",
"provider": "tiny-random",
"parameter_count": "3M",
"parameters_raw": 2839160,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Lightweight, edge deployment",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 27920,
"hf_likes": 4,
"release_date": "2025-09-12",
"is_moe": true,
"num_experts": 32,
"active_experts": 10,
"active_parameters": 984828,
"_discovered": true
},
{
"name": "llamafactory/tiny-random-Llama-3",
"provider": "llamafactory",
"parameter_count": "4M",
"parameters_raw": 4112464,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 950276,
"hf_likes": 3,
"release_date": "2024-06-07",
"_discovered": true
},
{
"name": "Maykeye/TinyLLama-v0",
"provider": "maykeye",
"parameter_count": "5M",
"parameters_raw": 4621392,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 32384,
"hf_likes": 43,
"release_date": "2023-07-08",
"_discovered": true
},
{
"name": "optimum-intel-internal-testing/tiny-random-gpt-oss-mxfp4",
"provider": "optimum-intel-internal-testing",
"parameter_count": "7M",
"parameters_raw": 6865444,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_oss",
"hf_downloads": 27904,
"hf_likes": 0,
"release_date": "2025-10-21",
"is_moe": true,
"num_experts": 32,
"active_experts": 4,
"active_parameters": 1158540,
"_discovered": true
},
{
"name": "hmellor/tiny-random-Gemma2ForCausalLM",
"provider": "hmellor",
"parameter_count": "8M",
"parameters_raw": 8438816,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma2",
"hf_downloads": 339841,
"hf_likes": 0,
"release_date": "2025-04-29",
"_discovered": true
},
{
"name": "michaelbenayoun/llama-2-tiny-4kv-heads-4layers-random",
"provider": "michaelbenayoun",
"parameter_count": "9M",
"parameters_raw": 8537216,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 52387,
"hf_likes": 0,
"release_date": "2024-03-28",
"_discovered": true
},
{
"name": "tiiuae/falcon-mamba-tiny-dev",
"provider": "TII",
"parameter_count": "9M",
"parameters_raw": 8765056,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "falcon_mamba",
"hf_downloads": 21730,
"hf_likes": 2,
"release_date": "2024-10-13",
"_discovered": true
},
{
"name": "arnir0/Tiny-LLM",
"provider": "arnir0",
"parameter_count": "13M",
"parameters_raw": 12988992,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 1024,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 54600,
"hf_likes": 45,
"release_date": "2024-11-03",
"_discovered": true
},
{
"name": "EleutherAI/pythia-14m",
"provider": "eleutherai",
"parameter_count": "14M",
"parameters_raw": 14067712,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 33322,
"hf_likes": 0,
"release_date": "2026-02-24",
"_discovered": true
},
{
"name": "hmellor/tiny-random-BambaForCausalLM",
"provider": "hmellor",
"parameter_count": "33M",
"parameters_raw": 33110760,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "bamba",
"hf_downloads": 173798,
"hf_likes": 0,
"release_date": "2025-04-29",
"_discovered": true
},
{
"name": "erwanf/gpt2-mini",
"provider": "erwanf",
"parameter_count": "39M",
"parameters_raw": 38604288,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 512,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt2",
"hf_downloads": 391187,
"hf_likes": 2,
"release_date": "2024-06-23",
"_discovered": true
},
{
"name": "EleutherAI/pythia-14m-deduped",
"provider": "eleutherai",
"parameter_count": "39M",
"parameters_raw": 39233560,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 69404,
"hf_likes": 28,
"release_date": "2023-07-19",
"_discovered": true
},
{
"name": "hyper-accel/tiny-random-llama",
"provider": "hyper-accel",
"parameter_count": "73M",
"parameters_raw": 73271808,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 44649,
"hf_likes": 0,
"release_date": "2025-02-10",
"_discovered": true
},
{
"name": "RedHatAI/SmolLM-135M-Instruct-quantized.w8a16",
"provider": "redhatai",
"parameter_count": "83M",
"parameters_raw": 83356260,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 20835,
"hf_likes": 0,
"release_date": "2024-08-22",
"_discovered": true
},
{
"name": "tiiuae/Falcon-H1-Tiny-90M-Instruct",
"provider": "TII",
"parameter_count": "91M",
"parameters_raw": 91131072,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "falcon_h1",
"hf_downloads": 301062,
"hf_likes": 33,
"release_date": "2026-01-12",
"_discovered": true
},
{
"name": "EleutherAI/pythia-70m-deduped",
"provider": "eleutherai",
"parameter_count": "96M",
"parameters_raw": 95592496,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 613928,
"hf_likes": 27,
"release_date": "2023-02-13",
"_discovered": true
},
{
"name": "gratefulasi/lumeleto",
"provider": "gratefulasi",
"parameter_count": "124M",
"parameters_raw": 124439808,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 1024,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt2",
"hf_downloads": 47679,
"hf_likes": 1,
"release_date": "2025-04-24",
"_discovered": true
},
{
"name": "peft-internal-testing/opt-125m",
"provider": "peft-internal-testing",
"parameter_count": "125M",
"parameters_raw": 125239296,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "opt",
"hf_downloads": 232784,
"hf_likes": 0,
"release_date": "2025-11-19",
"_discovered": true
},
{
"name": "state-spaces/mamba-130m-hf",
"provider": "state-spaces",
"parameter_count": "129M",
"parameters_raw": 129135360,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mamba",
"hf_downloads": 161407,
"hf_likes": 68,
"release_date": "2024-03-06",
"_discovered": true
},
{
"name": "HuggingFaceTB/SmolLM2-135M",
"provider": "huggingfacetb",
"parameter_count": "135M",
"parameters_raw": 134515008,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 954486,
"hf_likes": 168,
"release_date": "2024-10-31",
"_discovered": true
},
{
"name": "HuggingFaceTB/SmolLM2-135M-Instruct",
"provider": "huggingfacetb",
"parameter_count": "135M",
"parameters_raw": 134515008,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 603656,
"hf_likes": 295,
"release_date": "2024-10-31",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/SmolLM2-135M-Instruct-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/SmolLM2-135M-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "HuggingFaceTB/SmolLM-135M-Instruct",
"provider": "huggingfacetb",
"parameter_count": "135M",
"parameters_raw": 134515008,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 359214,
"hf_likes": 133,
"release_date": "2024-07-15",
"_discovered": true
},
{
"name": "HuggingFaceTB/SmolLM-135M",
"provider": "huggingfacetb",
"parameter_count": "135M",
"parameters_raw": 134515008,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 156129,
"hf_likes": 249,
"release_date": "2024-07-14",
"_discovered": true
},
{
"name": "nomic-ai/nomic-embed-text-v1.5",
"provider": "Nomic",
"parameter_count": "137M",
"parameters_raw": 137000000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "F16",
"context_length": 8192,
"use_case": "Text embeddings for RAG",
"pipeline_tag": "feature-extraction",
"architecture": "nomic_bert",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "EleutherAI/gpt-neo-125m",
"provider": "eleutherai",
"parameter_count": "150M",
"parameters_raw": 150364416,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neo",
"hf_downloads": 100060,
"hf_likes": 227,
"release_date": "2022-03-02",
"_discovered": true
},
{
"name": "JackFram/llama-160m",
"provider": "jackfram",
"parameter_count": "162M",
"parameters_raw": 162417792,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 46025,
"hf_likes": 36,
"release_date": "2023-05-26",
"_discovered": true
},
{
"name": "microsoft/DialoGPT-small",
"provider": "Microsoft",
"parameter_count": "176M",
"parameters_raw": 175620096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 1024,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt2",
"hf_downloads": 58248,
"hf_likes": 143,
"release_date": "2022-03-02",
"_discovered": true
},
{
"name": "lmstudio-community/LFM2.5-1.2B-Instruct-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "183M",
"parameters_raw": 182975232,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 441394,
"hf_likes": 1,
"release_date": "2026-01-07",
"_discovered": true
},
{
"name": "rinna/japanese-gpt-neox-small",
"provider": "rinna",
"parameter_count": "204M",
"parameters_raw": 203611008,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 457560,
"hf_likes": 15,
"release_date": "2022-08-31",
"_discovered": true
},
{
"name": "EleutherAI/pythia-160m-deduped",
"provider": "eleutherai",
"parameter_count": "213M",
"parameters_raw": 212654688,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 82245,
"hf_likes": 3,
"release_date": "2023-02-08",
"_discovered": true
},
{
"name": "Vamsi/T5_Paraphrase_Paws",
"provider": "vamsi",
"parameter_count": "223M",
"parameters_raw": 222903936,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 512,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "t5",
"hf_downloads": 83813,
"hf_likes": 40,
"release_date": "2022-03-02",
"_discovered": true
},
{
"name": "TitanML/tiny-mixtral",
"provider": "titanml",
"parameter_count": "247M",
"parameters_raw": 246961152,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mixtral",
"hf_downloads": 100054,
"hf_likes": 2,
"release_date": "2024-04-24",
"is_moe": true,
"num_experts": 8,
"active_experts": 2,
"active_parameters": 71001329,
"_discovered": true
},
{
"name": "lmstudio-community/LFM2.5-1.2B-Instruct-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "256M",
"parameters_raw": 256113408,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 441834,
"hf_likes": 4,
"release_date": "2026-01-07",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-1.7B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "269M",
"parameters_raw": 268944384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 25290,
"hf_likes": 0,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "google/t5gemma-s-s-prefixlm",
"provider": "Google",
"parameter_count": "313M",
"parameters_raw": 312517632,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "t5gemma",
"hf_downloads": 41131,
"hf_likes": 2,
"release_date": "2025-06-19",
"_discovered": true
},
{
"name": "lmstudio-community/LFM2.5-1.2B-Instruct-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "329M",
"parameters_raw": 329251584,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 449901,
"hf_likes": 2,
"release_date": "2026-01-07",
"_discovered": true
},
{
"name": "lmstudio-community/LFM2-1.2B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "329M",
"parameters_raw": 329251584,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 26421,
"hf_likes": 4,
"release_date": "2025-07-14",
"_discovered": true
},
{
"name": "LiquidAI/LFM2-ColBERT-350M",
"provider": "Liquid AI",
"parameter_count": "353M",
"parameters_raw": 353322752,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Semantic search, sentence similarity",
"pipeline_tag": "sentence-similarity",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2-350M",
"provider": "liquidai",
"parameter_count": "354M",
"parameters_raw": 354483968,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 41124,
"hf_likes": 235,
"release_date": "2025-07-10",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/LFM2-350M-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "HuggingFaceTB/SmolLM2-360M",
"provider": "huggingfacetb",
"parameter_count": "362M",
"parameters_raw": 361821120,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 36444,
"hf_likes": 87,
"release_date": "2024-10-31",
"_discovered": true
},
{
"name": "LiquidAI/LFM2-350M-Extract",
"provider": "Liquid AI",
"parameter_count": "354M",
"parameters_raw": 354483968,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Data extraction, structured output",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2-350M-Math",
"provider": "Liquid AI",
"parameter_count": "354M",
"parameters_raw": 354483968,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Math reasoning, chain-of-thought",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2-350M-ENJP-MT",
"provider": "Liquid AI",
"parameter_count": "354M",
"parameters_raw": 354483968,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "English-Japanese translation",
"pipeline_tag": "translation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2-350M-PII-Extract-JP",
"provider": "Liquid AI",
"parameter_count": "354M",
"parameters_raw": 354483968,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "PII extraction, Japanese",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2-350M-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "354M",
"parameters_raw": 354483968,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "mlx-8bit",
"context_length": 128000,
"use_case": "Lightweight, edge deployment",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2-350M-MLX-bf16",
"provider": "lmstudio-community",
"parameter_count": "354M",
"parameters_raw": 354483968,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.7,
"quantization": "BF16",
"context_length": 128000,
"use_case": "Lightweight, edge deployment",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "HuggingFaceTB/SmolLM-360M-Instruct",
"provider": "huggingfacetb",
"parameter_count": "362M",
"parameters_raw": 361821120,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 26935,
"hf_likes": 83,
"release_date": "2024-07-15",
"_discovered": true
},
{
"name": "openbmb/MiniCPM4-0.5B",
"provider": "openbmb",
"parameter_count": "434M",
"parameters_raw": 433873920,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 28889,
"hf_likes": 77,
"release_date": "2025-06-05",
"_discovered": true
},
{
"name": "LiquidAI/LFM2-VL-450M",
"provider": "Liquid AI",
"parameter_count": "451M",
"parameters_raw": 450822656,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "image-text-to-text",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/Qwen3-1.7B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "484M",
"parameters_raw": 484000768,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 28313,
"hf_likes": 1,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-0.5B-Instruct",
"provider": "Alibaba",
"parameter_count": "494M",
"parameters_raw": 494032768,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 6992099,
"hf_likes": 470,
"release_date": "2024-09-16",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-0.5B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
"provider": "Alibaba",
"parameter_count": "494M",
"parameters_raw": 494032768,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1408034,
"hf_likes": 65,
"release_date": "2024-11-06",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/Qwen2.5-Coder-0.5B-Instruct-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Qwen2.5-Coder-0.5B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-0.5B",
"provider": "Alibaba",
"parameter_count": "494M",
"parameters_raw": 494032768,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1200041,
"hf_likes": 378,
"release_date": "2024-09-15",
"_discovered": true
},
{
"name": "Qwen/Qwen2-0.5B-Instruct",
"provider": "Alibaba",
"parameter_count": "494M",
"parameters_raw": 494032768,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 259334,
"hf_likes": 200,
"release_date": "2024-06-03",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2-0.5B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Gensyn/Qwen2.5-0.5B-Instruct",
"provider": "gensyn",
"parameter_count": "494M",
"parameters_raw": 494032768,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 106514,
"hf_likes": 33,
"release_date": "2025-03-28",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-0.5B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-Coder-0.5B",
"provider": "Alibaba",
"parameter_count": "494M",
"parameters_raw": 494032768,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 64868,
"hf_likes": 44,
"release_date": "2024-11-08",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-Coder-0.5B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "EleutherAI/pythia-410m",
"provider": "eleutherai",
"parameter_count": "506M",
"parameters_raw": 505997504,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 88847,
"hf_likes": 36,
"release_date": "2023-02-13",
"_discovered": true
},
{
"name": "EleutherAI/pythia-410m-deduped",
"provider": "eleutherai",
"parameter_count": "506M",
"parameters_raw": 505997504,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 32196,
"hf_likes": 20,
"release_date": "2023-02-13",
"_discovered": true
},
{
"name": "h2oai/h2o-danube3-500m-chat",
"provider": "h2oai",
"parameter_count": "514M",
"parameters_raw": 513590784,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 31122,
"hf_likes": 39,
"release_date": "2024-07-04",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/h2o-danube3-500m-chat-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "tiiuae/Falcon-H1-0.5B-Base",
"provider": "TII",
"parameter_count": "521M",
"parameters_raw": 521411104,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "falcon_h1",
"hf_downloads": 25562,
"hf_likes": 16,
"release_date": "2025-05-01",
"_discovered": true
},
{
"name": "RedHatAI/Qwen3-30B-A3B-Instruct-2507-speculator.eagle3",
"provider": "redhatai",
"parameter_count": "522M",
"parameters_raw": 522152832,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 115085,
"hf_likes": 1,
"release_date": "2025-12-12",
"_discovered": true
},
{
"name": "z-lab/Qwen3-4B-DFlash-b16",
"provider": "z-lab",
"parameter_count": "537M",
"parameters_raw": 537427200,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 25679,
"hf_likes": 22,
"release_date": "2026-01-04",
"_discovered": true
},
{
"name": "bigscience/bloomz-560m",
"provider": "bigscience",
"parameter_count": "559M",
"parameters_raw": 559214592,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "bloom",
"hf_downloads": 1303926,
"hf_likes": 137,
"release_date": "2022-10-08",
"_discovered": true
},
{
"name": "bigscience/bloom-560m",
"provider": "bigscience",
"parameter_count": "559M",
"parameters_raw": 559214592,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "bloom",
"hf_downloads": 134778,
"hf_likes": 371,
"release_date": "2022-05-19",
"_discovered": true
},
{
"name": "Qwen/Qwen3-4B-MLX-4bit",
"provider": "Alibaba",
"parameter_count": "566M",
"parameters_raw": 565828096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 74343,
"hf_likes": 26,
"release_date": "2025-05-23",
"_discovered": true
},
{
"name": "google/t5gemma-b-b-ul2",
"provider": "Google",
"parameter_count": "591M",
"parameters_raw": 591490560,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "t5gemma",
"hf_downloads": 39788,
"hf_likes": 2,
"release_date": "2025-06-19",
"_discovered": true
},
{
"name": "google/t5gemma-b-b-prefixlm",
"provider": "Google",
"parameter_count": "591M",
"parameters_raw": 591490560,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"pipeline_tag": "text-generation",
"architecture": "t5gemma",
"hf_downloads": 1187971,
"hf_likes": 13,
"release_date": "2025-06-19",
"_discovered": true
},
{
"name": "lmstudio-community/Phi-4-mini-reasoning-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "600M",
"parameters_raw": 599546880,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 43404,
"hf_likes": 3,
"release_date": "2025-05-01",
"_discovered": true
},
{
"name": "Qwen/Qwen1.5-0.5B-Chat",
"provider": "Alibaba",
"parameter_count": "620M",
"parameters_raw": 619570176,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 87380,
"hf_likes": 92,
"release_date": "2024-01-31",
"_discovered": true
},
{
"name": "Qwen/Qwen1.5-0.5B",
"provider": "Alibaba",
"parameter_count": "620M",
"parameters_raw": 619570176,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 26651,
"hf_likes": 173,
"release_date": "2024-01-22",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-4B-Thinking-2507-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "629M",
"parameters_raw": 628676096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 95794,
"hf_likes": 10,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-4B-Instruct-2507-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "629M",
"parameters_raw": 628676096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 66279,
"hf_likes": 3,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-4B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "629M",
"parameters_raw": 628676096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 21982,
"hf_likes": 1,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "LiquidAI/LFM2-700M",
"provider": "Liquid AI",
"parameter_count": "742M",
"parameters_raw": 742489344,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Lightweight, edge deployment",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2-700M-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "742M",
"parameters_raw": 742489344,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "mlx-8bit",
"context_length": 128000,
"use_case": "Lightweight, edge deployment",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2-700M-MLX-bf16",
"provider": "lmstudio-community",
"parameter_count": "742M",
"parameters_raw": 742489344,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.8,
"min_vram_gb": 1.5,
"quantization": "BF16",
"context_length": 128000,
"use_case": "Lightweight, edge deployment",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "Qwen/Qwen3-0.6B",
"provider": "Alibaba",
"parameter_count": "752M",
"parameters_raw": 751632384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 11310453,
"hf_likes": 1120,
"release_date": "2025-04-27",
"gguf_sources": [
{
"repo": "unsloth/Qwen3-0.6B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3Guard-Gen-0.6B",
"provider": "Alibaba",
"parameter_count": "752M",
"parameters_raw": 751632384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 146728,
"hf_likes": 62,
"release_date": "2025-09-23",
"_discovered": true
},
{
"name": "Qwen/Qwen3-0.6B-FP8",
"provider": "Alibaba",
"parameter_count": "752M",
"parameters_raw": 751659264,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1648717,
"hf_likes": 57,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-4B-Instruct-2507-MLX-5bit",
"provider": "lmstudio-community",
"parameter_count": "754M",
"parameters_raw": 754372096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 62740,
"hf_likes": 0,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "h2oai/h2ovl-mississippi-800m",
"provider": "h2oai",
"parameter_count": "826M",
"parameters_raw": 826295808,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "h2ovl_chat",
"hf_downloads": 1014882,
"hf_likes": 39,
"release_date": "2024-10-16",
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-0.8B",
"provider": "Alibaba",
"parameter_count": "873M",
"parameters_raw": 873438784,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 93448,
"hf_likes": 208,
"release_date": "2026-02-28",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-0.8B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3.5-0.8B-Base",
"provider": "Alibaba",
"parameter_count": "873M",
"parameters_raw": 873438784,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 4680,
"hf_likes": 37,
"release_date": "2026-02-28"
},
{
"name": "lmstudio-community/Qwen3-4B-Thinking-2507-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "880M",
"parameters_raw": 880068096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 91703,
"hf_likes": 2,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-4B-Instruct-2507-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "880M",
"parameters_raw": 880068096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 62883,
"hf_likes": 0,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "Joaoffg/ELM",
"provider": "joaoffg",
"parameter_count": "903M",
"parameters_raw": 902891520,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 339775,
"hf_likes": 2,
"release_date": "2024-05-29",
"_discovered": true
},
{
"name": "RedHatAI/Qwen3-8B-speculator.eagle3",
"provider": "redhatai",
"parameter_count": "1.0B",
"parameters_raw": 1022037632,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 76636,
"hf_likes": 2,
"release_date": "2025-09-19",
"_discovered": true
},
{
"name": "EleutherAI/pythia-1b",
"provider": "eleutherai",
"parameter_count": "1.1B",
"parameters_raw": 1078891008,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 27818,
"hf_likes": 43,
"release_date": "2023-03-10",
"_discovered": true
},
{
"name": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
"provider": "Community",
"parameter_count": "1.1B",
"parameters_raw": 1100048384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 1870099,
"hf_likes": 1538,
"release_date": "2023-12-30"
},
{
"name": "nm-testing/tinyllama-oneshot-w8w8-test-static-shape-change",
"provider": "nm-testing",
"parameter_count": "1.1B",
"parameters_raw": 1100048692,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 31348,
"hf_likes": 0,
"release_date": "2024-06-12",
"_discovered": true
},
{
"name": "bigcode/gpt_bigcode-santacoder",
"provider": "BigCode",
"parameter_count": "1.1B",
"parameters_raw": 1124886528,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_bigcode",
"hf_downloads": 49973,
"hf_likes": 26,
"release_date": "2023-04-06",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-4B-Thinking-2507-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "1.1B",
"parameters_raw": 1131460096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 93477,
"hf_likes": 7,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-4B-Instruct-2507-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "1.1B",
"parameters_raw": 1131460096,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 63832,
"hf_likes": 1,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "LiquidAI/LFM2.5-1.2B-Instruct",
"provider": "liquidai",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 116655,
"hf_likes": 516,
"release_date": "2026-01-06",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/LFM2.5-1.2B-Instruct-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "lmstudio-community/LFM2-1.2B-MLX-bf16",
"provider": "lmstudio-community",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 26071,
"hf_likes": 6,
"release_date": "2025-07-14",
"_discovered": true
},
{
"name": "LiquidAI/LFM2-1.2B",
"provider": "Liquid AI",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2.5-1.2B-Base",
"provider": "Liquid AI",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2.5-1.2B-Thinking",
"provider": "Liquid AI",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Advanced reasoning, chain-of-thought",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2.5-1.2B-JP",
"provider": "Liquid AI",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Japanese language, multilingual chat",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2-1.2B-Tool",
"provider": "Liquid AI",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Tool calling, function calling",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2-1.2B-RAG",
"provider": "Liquid AI",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Retrieval-augmented generation",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2-1.2B-Extract",
"provider": "Liquid AI",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Data extraction, structured output",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2.5-1.2B-Thinking-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.2,
"min_vram_gb": 1.2,
"quantization": "mlx-8bit",
"context_length": 128000,
"use_case": "Advanced reasoning, chain-of-thought",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2.5-1.2B-Thinking-MLX-bf16",
"provider": "lmstudio-community",
"parameter_count": "1.2B",
"parameters_raw": 1170340608,
"min_ram_gb": 2.6,
"recommended_ram_gb": 4.4,
"min_vram_gb": 2.4,
"quantization": "BF16",
"context_length": 128000,
"use_case": "Advanced reasoning, chain-of-thought",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "allenai/OLMo-1B-hf",
"provider": "allenai",
"parameter_count": "1.2B",
"parameters_raw": 1176764416,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo",
"hf_downloads": 23538,
"hf_likes": 26,
"release_date": "2024-04-12",
"_discovered": true
},
{
"name": "Zyphra/Zamba2-1.2B-instruct",
"provider": "zyphra",
"parameter_count": "1.2B",
"parameters_raw": 1215064704,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "zamba2",
"hf_downloads": 72584,
"hf_likes": 30,
"release_date": "2024-09-19",
"_discovered": true
},
{
"name": "meta-llama/Llama-3.2-1B",
"provider": "Meta",
"parameter_count": "1.2B",
"parameters_raw": 1235814400,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 1453836,
"hf_likes": 2306,
"release_date": "2024-09-18"
},
{
"name": "hmellor/Ilama-3.2-1B",
"provider": "hmellor",
"parameter_count": "1.2B",
"parameters_raw": 1235814400,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "ilama",
"hf_downloads": 89998,
"hf_likes": 0,
"release_date": "2025-07-22",
"_discovered": true
},
{
"name": "warshanks/Jan-nano-AWQ",
"provider": "warshanks",
"parameter_count": "1.3B",
"parameters_raw": 1264206840,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.6,
"quantization": "AWQ-4bit",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 99084,
"hf_likes": 3,
"release_date": "2025-07-12",
"_discovered": true,
"format": "awq"
},
{
"name": "LGAI-EXAONE/EXAONE-4.0-1.2B",
"provider": "lgai-exaone",
"parameter_count": "1.3B",
"parameters_raw": 1279391488,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.7,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "exaone4",
"hf_downloads": 100975,
"hf_likes": 172,
"release_date": "2025-07-11"
},
{
"name": "lmstudio-community/DeepSeek-R1-0528-Qwen3-8B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "1.3B",
"parameters_raw": 1280062464,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.7,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 348365,
"hf_likes": 7,
"release_date": "2025-05-29",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-8B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "1.3B",
"parameters_raw": 1280062464,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.7,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 39201,
"hf_likes": 2,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "pfnet/plamo-2-1b",
"provider": "pfnet",
"parameter_count": "1.3B",
"parameters_raw": 1291441920,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.7,
"quantization": "Q4_K_M",
"context_length": 10485760,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "plamo2",
"hf_downloads": 63725,
"hf_likes": 38,
"release_date": "2025-02-05",
"_discovered": true
},
{
"name": "EleutherAI/gpt-neo-1.3B",
"provider": "eleutherai",
"parameter_count": "1.4B",
"parameters_raw": 1365907456,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.7,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neo",
"hf_downloads": 48440,
"hf_likes": 324,
"release_date": "2022-03-02",
"_discovered": true
},
{
"name": "microsoft/phi-1_5",
"provider": "Microsoft",
"parameter_count": "1.4B",
"parameters_raw": 1418270720,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.7,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi",
"hf_downloads": 152337,
"hf_likes": 1355,
"release_date": "2023-09-10",
"_discovered": true
},
{
"name": "starvector/starvector-1b-im2svg",
"provider": "starvector",
"parameter_count": "1.4B",
"parameters_raw": 1434095620,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.7,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "starvector",
"hf_downloads": 38196,
"hf_likes": 184,
"release_date": "2025-01-11",
"_discovered": true
},
{
"name": "allenai/OLMo-2-0425-1B",
"provider": "allenai",
"parameter_count": "1.5B",
"parameters_raw": 1484916736,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo2",
"hf_downloads": 533223,
"hf_likes": 70,
"release_date": "2025-04-17",
"_discovered": true
},
{
"name": "allenai/OLMo-2-0425-1B-Instruct",
"provider": "allenai",
"parameter_count": "1.5B",
"parameters_raw": 1484916736,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo2",
"hf_downloads": 38389,
"hf_likes": 56,
"release_date": "2025-04-29",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/OLMo-2-0425-1B-Instruct-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "RedHatAI/Llama-3.2-1B-Instruct-FP8",
"provider": "redhatai",
"parameter_count": "1.5B",
"parameters_raw": 1498482912,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 814349,
"hf_likes": 3,
"release_date": "2024-09-26",
"_discovered": true
},
{
"name": "RedHatAI/Llama-3.2-1B-Instruct-FP8-dynamic",
"provider": "redhatai",
"parameter_count": "1.5B",
"parameters_raw": 1498859520,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 1823969,
"hf_likes": 3,
"release_date": "2024-09-25",
"_discovered": true
},
{
"name": "LiquidAI/LFM2-Audio-1.5B",
"provider": "Liquid AI",
"parameter_count": "1.5B",
"parameters_raw": 1500000000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Speech-to-speech, ASR, TTS",
"pipeline_tag": "audio-to-audio",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2.5-Audio-1.5B",
"provider": "Liquid AI",
"parameter_count": "1.5B",
"parameters_raw": 1500000000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Speech-to-speech, ASR, TTS",
"pipeline_tag": "audio-to-audio",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "EleutherAI/pythia-1.4b",
"provider": "eleutherai",
"parameter_count": "1.5B",
"parameters_raw": 1515311488,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 27804,
"hf_likes": 26,
"release_date": "2023-02-09",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-Coder-1.5B-Instruct",
"provider": "Alibaba",
"parameter_count": "1.5B",
"parameters_raw": 1543714304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1789513,
"hf_likes": 107,
"release_date": "2024-09-18",
"gguf_sources": [
{
"repo": "unsloth/Qwen2.5-Coder-1.5B-Instruct-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Qwen2.5-Coder-1.5B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-1.5B-Instruct",
"provider": "Alibaba",
"parameter_count": "1.5B",
"parameters_raw": 1543714304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 7037921,
"hf_likes": 627,
"release_date": "2024-09-17",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-1.5B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2-1.5B-Instruct",
"provider": "Alibaba",
"parameter_count": "1.5B",
"parameters_raw": 1543714304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 3508972,
"hf_likes": 161,
"release_date": "2024-06-03",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-Math-1.5B",
"provider": "Alibaba",
"parameter_count": "1.5B",
"parameters_raw": 1543714304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1064952,
"hf_likes": 102,
"release_date": "2024-09-16",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-1.5B",
"provider": "Alibaba",
"parameter_count": "1.5B",
"parameters_raw": 1543714304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 431369,
"hf_likes": 166,
"release_date": "2024-09-15",
"_discovered": true
},
{
"name": "Qwen/Qwen2-1.5B",
"provider": "Alibaba",
"parameter_count": "1.5B",
"parameters_raw": 1543714304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 114016,
"hf_likes": 99,
"release_date": "2024-05-31",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-Math-1.5B-Instruct",
"provider": "Alibaba",
"parameter_count": "1.5B",
"parameters_raw": 1543714304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 80310,
"hf_likes": 54,
"release_date": "2024-09-16",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-Math-1.5B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "RedHatAI/Qwen2-1.5B-Instruct-FP8",
"provider": "redhatai",
"parameter_count": "1.5B",
"parameters_raw": 1543714304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 24030,
"hf_likes": 0,
"release_date": "2024-06-14",
"_discovered": true
},
{
"name": "KiteFishAI/Minnow-Math-1.5B",
"provider": "kitefishai",
"parameter_count": "1.6B",
"parameters_raw": 1633781760,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 147620,
"hf_likes": 1,
"release_date": "2026-02-12",
"_discovered": true
},
{
"name": "LiquidAI/LFM2-VL-1.6B",
"provider": "Liquid AI",
"parameter_count": "1.6B",
"parameters_raw": 1584804000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "image-text-to-text",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2.5-VL-1.6B",
"provider": "Liquid AI",
"parameter_count": "1.6B",
"parameters_raw": 1596625904,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "image-text-to-text",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2.5-VL-1.6B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "1.6B",
"parameters_raw": 1596625904,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "mlx-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "image-text-to-text",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2.5-VL-1.6B-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "1.6B",
"parameters_raw": 1596625904,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.2,
"min_vram_gb": 1.2,
"quantization": "mlx-6bit",
"context_length": 32768,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "image-text-to-text",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "lmstudio-community/LFM2.5-VL-1.6B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "1.6B",
"parameters_raw": 1596625904,
"min_ram_gb": 1.8,
"recommended_ram_gb": 3.0,
"min_vram_gb": 1.6,
"quantization": "mlx-8bit",
"context_length": 32768,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "image-text-to-text",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "stabilityai/stablelm-2-1_6b-chat",
"provider": "Stability AI",
"parameter_count": "1.6B",
"parameters_raw": 1644515328,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.8,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "stablelm",
"hf_downloads": 955,
"hf_likes": 34,
"release_date": "2024-04-08"
},
{
"name": "HuggingFaceTB/SmolLM-1.7B",
"provider": "huggingfacetb",
"parameter_count": "1.7B",
"parameters_raw": 1711376384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 63387,
"hf_likes": 180,
"release_date": "2024-07-14",
"_discovered": true
},
{
"name": "HuggingFaceTB/SmolLM2-1.7B",
"provider": "huggingfacetb",
"parameter_count": "1.7B",
"parameters_raw": 1711376384,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 25638,
"hf_likes": 144,
"release_date": "2024-10-30",
"_discovered": true
},
{
"name": "cyankiwi/Nanbeige4.1-3B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "3.0B",
"parameters_raw": 3000000000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "AWQ-8bit",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 49220,
"hf_likes": 2,
"release_date": "2026-02-15",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen3-1.7B-Base",
"provider": "Alibaba",
"parameter_count": "1.7B",
"parameters_raw": 1720574976,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 295900,
"hf_likes": 64,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-1.7B-MLX-bf16",
"provider": "lmstudio-community",
"parameter_count": "1.7B",
"parameters_raw": 1720574976,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 24714,
"hf_likes": 2,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "bigscience/bloom-1b7",
"provider": "bigscience",
"parameter_count": "1.7B",
"parameters_raw": 1722408960,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "bloom",
"hf_downloads": 38813,
"hf_likes": 122,
"release_date": "2022-05-19",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-1.5B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "1.8B",
"parameters_raw": 1777088000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 727989,
"hf_likes": 6,
"release_date": "2024-09-17",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2.5-Coder-1.5B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "1.8B",
"parameters_raw": 1777088000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 164152,
"hf_likes": 4,
"release_date": "2024-09-20",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2-1.5B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "1.8B",
"parameters_raw": 1777088000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 24850,
"hf_likes": 9,
"release_date": "2024-06-06",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2-1.5B-Instruct-GPTQ-Int4",
"provider": "Alibaba",
"parameter_count": "1.8B",
"parameters_raw": 1777675776,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "GPTQ-Int4",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 24724,
"hf_likes": 5,
"release_date": "2024-06-06",
"_discovered": true,
"format": "gptq"
},
{
"name": "RedHatAI/Qwen2.5-1.5B-quantized.w8a8",
"provider": "redhatai",
"parameter_count": "1.8B",
"parameters_raw": 1777733120,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1091974,
"hf_likes": 2,
"release_date": "2024-10-09",
"_discovered": true
},
{
"name": "Qwen/Qwen1.5-1.8B-Chat",
"provider": "Alibaba",
"parameter_count": "1.8B",
"parameters_raw": 1836828672,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 72445,
"hf_likes": 73,
"release_date": "2024-01-30",
"_discovered": true
},
{
"name": "jonathanli/induction-vl2-mdl-fswd7-20000-720p-proj-256-var",
"provider": "jonathanli",
"parameter_count": "1.9B",
"parameters_raw": 1940015872,
"min_ram_gb": 1.1,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.0,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "induction_vl2",
"hf_downloads": 24886,
"hf_likes": 0,
"release_date": "2026-02-01",
"_discovered": true
},
{
"name": "cyankiwi/granite-4.0-h-tiny-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 1997098800,
"min_ram_gb": 1.1,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.0,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granitemoehybrid",
"hf_downloads": 63040,
"hf_likes": 2,
"release_date": "2025-10-13",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 277721550,
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen3-1.7B-FP8",
"provider": "Alibaba",
"parameter_count": "2.0B",
"parameters_raw": 2031825920,
"min_ram_gb": 1.1,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.0,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 47050,
"hf_likes": 35,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "h2oai/h2ovl-mississippi-2b",
"provider": "h2oai",
"parameter_count": "2.2B",
"parameters_raw": 2152317440,
"min_ram_gb": 1.2,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "h2ovl_chat",
"hf_downloads": 1007240,
"hf_likes": 42,
"release_date": "2024-10-15",
"_discovered": true
},
{
"name": "warshanks/Qwen3-8B-abliterated-AWQ",
"provider": "warshanks",
"parameter_count": "8.2B",
"parameters_raw": 8190735872,
"min_ram_gb": 3.2,
"recommended_ram_gb": 6.4,
"min_vram_gb": 5.3,
"quantization": "AWQ-4bit",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 25559,
"hf_likes": 0,
"release_date": "2025-07-27",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen3.5-2B",
"provider": "Alibaba",
"parameter_count": "2.3B",
"parameters_raw": 2274069824,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.1,
"min_vram_gb": 1.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 46974,
"hf_likes": 115,
"release_date": "2026-02-28",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-2B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3.5-2B-Base",
"provider": "Alibaba",
"parameter_count": "2.3B",
"parameters_raw": 2274069824,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.1,
"min_vram_gb": 1.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 3336,
"hf_likes": 33,
"release_date": "2026-02-28"
},
{
"name": "lmstudio-community/Phi-4-reasoning-plus-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "2.3B",
"parameters_raw": 2290897920,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.1,
"min_vram_gb": 1.2,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 28622,
"hf_likes": 1,
"release_date": "2025-05-01",
"_discovered": true
},
{
"name": "lmstudio-community/DeepSeek-R1-0528-Qwen3-8B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "2.3B",
"parameters_raw": 2303865856,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.1,
"min_vram_gb": 1.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 333300,
"hf_likes": 13,
"release_date": "2025-05-29",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-8B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "2.3B",
"parameters_raw": 2303865856,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.1,
"min_vram_gb": 1.2,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 37222,
"hf_likes": 2,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-14B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "2.3B",
"parameters_raw": 2307906560,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.1,
"min_vram_gb": 1.2,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 46163,
"hf_likes": 5,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen2.5-Coder-14B-Instruct-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "2.3B",
"parameters_raw": 2308527104,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.1,
"min_vram_gb": 1.2,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 92774,
"hf_likes": 2,
"release_date": "2024-11-11",
"_discovered": true
},
{
"name": "google/gemma-1.1-2b-it",
"provider": "Google",
"parameter_count": "2.5B",
"parameters_raw": 2506172416,
"min_ram_gb": 1.4,
"recommended_ram_gb": 2.3,
"min_vram_gb": 1.3,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma",
"hf_downloads": 66616,
"hf_likes": 171,
"release_date": "2024-03-26",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/gemma-1.1-2b-it-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "LiquidAI/LFM2-2.6B",
"provider": "liquidai",
"parameter_count": "2.6B",
"parameters_raw": 2569272320,
"min_ram_gb": 1.4,
"recommended_ram_gb": 2.4,
"min_vram_gb": 1.3,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 25773,
"hf_likes": 180,
"release_date": "2025-09-22",
"_discovered": true
},
{
"name": "LiquidAI/LFM2-2.6B-Exp",
"provider": "Liquid AI",
"parameter_count": "2.6B",
"parameters_raw": 2569272320,
"min_ram_gb": 1.4,
"recommended_ram_gb": 2.4,
"min_vram_gb": 1.3,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Instruction following, math, knowledge",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "LiquidAI/LFM2-2.6B-Transcript",
"provider": "Liquid AI",
"parameter_count": "2.6B",
"parameters_raw": 2569272320,
"min_ram_gb": 1.4,
"recommended_ram_gb": 2.4,
"min_vram_gb": 1.3,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Meeting transcription, summarization",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "google/gemma-2-2b-it",
"provider": "Google",
"parameter_count": "2.6B",
"parameters_raw": 2614341376,
"min_ram_gb": 1.5,
"recommended_ram_gb": 2.4,
"min_vram_gb": 1.3,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Lightweight, edge deployment",
"pipeline_tag": "text-generation",
"architecture": "gemma2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "bartowski/gemma-2-2b-it-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Efficient-Large-Model/gemma-2-2b-it",
"provider": "efficient-large-model",
"parameter_count": "2.6B",
"parameters_raw": 2614341888,
"min_ram_gb": 1.5,
"recommended_ram_gb": 2.4,
"min_vram_gb": 1.3,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma2",
"hf_downloads": 50419,
"hf_likes": 3,
"release_date": "2024-12-12",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/gemma-2-2b-it-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "EleutherAI/gpt-neo-2.7B",
"provider": "eleutherai",
"parameter_count": "2.7B",
"parameters_raw": 2718416384,
"min_ram_gb": 1.5,
"recommended_ram_gb": 2.5,
"min_vram_gb": 1.4,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neo",
"hf_downloads": 23217,
"hf_likes": 501,
"release_date": "2022-03-02",
"_discovered": true
},
{
"name": "microsoft/phi-2",
"provider": "Microsoft",
"parameter_count": "2.8B",
"parameters_raw": 2779683840,
"min_ram_gb": 1.6,
"recommended_ram_gb": 2.6,
"min_vram_gb": 1.4,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi",
"hf_downloads": 1651432,
"hf_likes": 3429,
"release_date": "2023-12-13",
"_discovered": true
},
{
"name": "stabilityai/stablelm-3b-4e1t",
"provider": "Stability AI",
"parameter_count": "2.8B",
"parameters_raw": 2795443200,
"min_ram_gb": 1.6,
"recommended_ram_gb": 2.6,
"min_vram_gb": 1.4,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "stablelm",
"hf_downloads": 24407,
"hf_likes": 312,
"release_date": "2023-09-29",
"_discovered": true
},
{
"name": "HuggingFaceTB/SmolLM3-3B",
"provider": "HuggingFace",
"parameter_count": "3B",
"parameters_raw": 3000000000,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.8,
"min_vram_gb": 1.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Lightweight, multilingual reasoning",
"pipeline_tag": "text-generation",
"architecture": "smollm",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-07-08",
"gguf_sources": [
{
"repo": "unsloth/SmolLM3-3B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "LiquidAI/LFM2-VL-3B",
"provider": "Liquid AI",
"parameter_count": "3.0B",
"parameters_raw": 2998975216,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.8,
"min_vram_gb": 1.5,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "image-text-to-text",
"architecture": "lfm2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "bigscience/bloom-3b",
"provider": "bigscience",
"parameter_count": "3.0B",
"parameters_raw": 3002557440,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.8,
"min_vram_gb": 1.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "bloom",
"hf_downloads": 30567,
"hf_likes": 94,
"release_date": "2022-05-19",
"_discovered": true
},
{
"name": "bigcode/starcoder2-3b",
"provider": "BigCode",
"parameter_count": "3.0B",
"parameters_raw": 3030371328,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.8,
"min_vram_gb": 1.6,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "starcoder2",
"hf_downloads": 97310,
"hf_likes": 216,
"release_date": "2023-11-29",
"_discovered": true
},
{
"name": "TechxGenus/gemma-1.1-2b-it-GPTQ",
"provider": "techxgenus",
"parameter_count": "3.0B",
"parameters_raw": 3031170048,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.8,
"min_vram_gb": 1.6,
"quantization": "GPTQ-Int4",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma",
"hf_downloads": 20793,
"hf_likes": 1,
"release_date": "2024-04-07",
"_discovered": true,
"format": "gptq"
},
{
"name": "Qwen/Qwen2.5-3B-Instruct",
"provider": "Alibaba",
"parameter_count": "3.1B",
"parameters_raw": 3085938688,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.9,
"min_vram_gb": 1.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 6598470,
"hf_likes": 409,
"release_date": "2024-09-17",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-3B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-3B",
"provider": "Alibaba",
"parameter_count": "3.1B",
"parameters_raw": 3085938688,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.9,
"min_vram_gb": 1.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 297679,
"hf_likes": 172,
"release_date": "2024-09-15",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-3B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-Coder-3B-Instruct",
"provider": "Alibaba",
"parameter_count": "3.1B",
"parameters_raw": 3085938688,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.9,
"min_vram_gb": 1.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 126989,
"hf_likes": 96,
"release_date": "2024-11-06",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/Qwen2.5-Coder-3B-Instruct-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Qwen2.5-Coder-3B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Salesforce/xLAM-2-3b-fc-r",
"provider": "salesforce",
"parameter_count": "3.1B",
"parameters_raw": 3085938688,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.9,
"min_vram_gb": 1.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 44516,
"hf_likes": 16,
"release_date": "2025-03-27",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-Coder-3B",
"provider": "Alibaba",
"parameter_count": "3.1B",
"parameters_raw": 3085938688,
"min_ram_gb": 1.7,
"recommended_ram_gb": 2.9,
"min_vram_gb": 1.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 42540,
"hf_likes": 40,
"release_date": "2024-11-08",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-Coder-3B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "meta-llama/Llama-3.2-3B",
"provider": "Meta",
"parameter_count": "3.2B",
"parameters_raw": 3212749824,
"min_ram_gb": 1.8,
"recommended_ram_gb": 3.0,
"min_vram_gb": 1.6,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 1409393,
"hf_likes": 702,
"release_date": "2024-09-18"
},
{
"name": "ibm-research/PowerMoE-3b",
"provider": "ibm-research",
"parameter_count": "3.4B",
"parameters_raw": 3374286336,
"min_ram_gb": 1.9,
"recommended_ram_gb": 3.1,
"min_vram_gb": 1.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granitemoe",
"hf_downloads": 399266,
"hf_likes": 17,
"release_date": "2024-08-14",
"is_moe": true,
"num_experts": 40,
"active_experts": 8,
"active_parameters": 809828716,
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-3B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "3.4B",
"parameters_raw": 3397103616,
"min_ram_gb": 1.9,
"recommended_ram_gb": 3.2,
"min_vram_gb": 1.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 38262,
"hf_likes": 16,
"release_date": "2024-09-17",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2.5-Coder-3B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "3.4B",
"parameters_raw": 3397103616,
"min_ram_gb": 1.9,
"recommended_ram_gb": 3.2,
"min_vram_gb": 1.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 21964,
"hf_likes": 5,
"release_date": "2024-11-09",
"_discovered": true,
"format": "awq"
},
{
"name": "ibm-granite/granite-3b-code-base-2k",
"provider": "ibm-granite",
"parameter_count": "3.5B",
"parameters_raw": 3482503680,
"min_ram_gb": 1.9,
"recommended_ram_gb": 3.2,
"min_vram_gb": 1.8,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 73193,
"hf_likes": 37,
"release_date": "2024-04-23",
"_discovered": true
},
{
"name": "ibm-research/PowerLM-3b",
"provider": "ibm-research",
"parameter_count": "3.5B",
"parameters_raw": 3512017152,
"min_ram_gb": 2.0,
"recommended_ram_gb": 3.3,
"min_vram_gb": 1.8,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granite",
"hf_downloads": 30013,
"hf_likes": 20,
"release_date": "2024-08-14",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-VL-3B-Instruct",
"provider": "Alibaba",
"parameter_count": "3.8B",
"parameters_raw": 3754622976,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.5,
"min_vram_gb": 1.9,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Instruction following, chat",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen2_5_vl",
"hf_downloads": 2621650,
"hf_likes": 623,
"release_date": "2025-01-26",
"gguf_sources": [
{
"repo": "unsloth/Qwen2.5-VL-3B-Instruct-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "microsoft/Phi-tiny-MoE-instruct",
"provider": "Microsoft",
"parameter_count": "3.8B",
"parameters_raw": 3755220288,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.5,
"min_vram_gb": 1.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phimoe",
"hf_downloads": 310211,
"hf_likes": 31,
"release_date": "2025-06-23",
"is_moe": true,
"num_experts": 16,
"active_experts": 2,
"active_parameters": 633693422,
"_discovered": true
},
{
"name": "llm-jp/llm-jp-3-3.7b-instruct",
"provider": "llm-jp",
"parameter_count": "3.8B",
"parameters_raw": 3782913024,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.5,
"min_vram_gb": 1.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 810462,
"hf_likes": 13,
"release_date": "2024-09-23",
"_discovered": true
},
{
"name": "microsoft/Phi-4-mini-reasoning",
"provider": "Microsoft",
"parameter_count": "3.8B",
"parameters_raw": 3800000000,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.5,
"min_vram_gb": 1.9,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Lightweight reasoning",
"pipeline_tag": "text-generation",
"architecture": "phi4",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-04-01",
"gguf_sources": [
{
"repo": "unsloth/Phi-4-mini-reasoning-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "microsoft/phi-3-mini-4k-instruct",
"provider": "Microsoft",
"parameter_count": "3.8B",
"parameters_raw": 3821000000,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.6,
"min_vram_gb": 2.0,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Lightweight, edge deployment",
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "bartowski/phi-3-mini-4k-instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "microsoft/Phi-3.5-mini-instruct",
"provider": "Microsoft",
"parameter_count": "3.8B",
"parameters_raw": 3821000000,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.6,
"min_vram_gb": 2.0,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Lightweight, long context",
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "bartowski/Phi-3.5-mini-instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "zstanjj/HTML-Pruner-Phi-3.8B",
"provider": "zstanjj",
"parameter_count": "3.8B",
"parameters_raw": 3821079552,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.6,
"min_vram_gb": 2.0,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 88805,
"hf_likes": 18,
"release_date": "2024-10-16",
"_discovered": true
},
{
"name": "Sreenington/Phi-3-mini-4k-instruct-AWQ",
"provider": "sreenington",
"parameter_count": "3.8B",
"parameters_raw": 3821079552,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.6,
"min_vram_gb": 2.0,
"quantization": "AWQ-4bit",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 40949,
"hf_likes": 5,
"release_date": "2024-05-05",
"_discovered": true,
"format": "awq"
},
{
"name": "numind/NuExtract-1.5",
"provider": "numind",
"parameter_count": "3.8B",
"parameters_raw": 3821079552,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.6,
"min_vram_gb": 2.0,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 31247,
"hf_likes": 243,
"release_date": "2024-09-26",
"_discovered": true
},
{
"name": "kaitchup/Phi-3-mini-4k-instruct-gptq-4bit",
"provider": "kaitchup",
"parameter_count": "3.8B",
"parameters_raw": 3822095360,
"min_ram_gb": 2.1,
"recommended_ram_gb": 3.6,
"min_vram_gb": 2.0,
"quantization": "GPTQ-Int4",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 881144,
"hf_likes": 2,
"release_date": "2024-04-25",
"_discovered": true,
"format": "gptq"
},
{
"name": "Nanbeige/Nanbeige4.1-3B",
"provider": "nanbeige",
"parameter_count": "3.9B",
"parameters_raw": 3933637120,
"min_ram_gb": 2.2,
"recommended_ram_gb": 3.7,
"min_vram_gb": 2.0,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 417673,
"hf_likes": 941,
"release_date": "2026-02-10",
"_discovered": true
},
{
"name": "google/gemma-3n-E2B-it",
"provider": "Google",
"parameter_count": "4B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.2,
"recommended_ram_gb": 3.7,
"min_vram_gb": 2.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Multimodal, on-device (effective 2B)",
"pipeline_tag": "image-text-to-text",
"architecture": "gemma3n",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-06-25",
"gguf_sources": [
{
"repo": "unsloth/gemma-3n-E2B-it-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3-4B-Base",
"provider": "Alibaba",
"parameter_count": "4.0B",
"parameters_raw": 4022468096,
"min_ram_gb": 2.2,
"recommended_ram_gb": 3.7,
"min_vram_gb": 2.1,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 548989,
"hf_likes": 81,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "Qwen/Qwen3-4B-AWQ",
"provider": "Alibaba",
"parameter_count": "4.0B",
"parameters_raw": 4022468096,
"min_ram_gb": 2.2,
"recommended_ram_gb": 3.7,
"min_vram_gb": 2.1,
"quantization": "AWQ-4bit",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 344398,
"hf_likes": 25,
"release_date": "2025-05-05",
"_discovered": true,
"format": "awq"
},
{
"name": "typhoon-ai/typhoon2.5-qwen3-4b",
"provider": "typhoon-ai",
"parameter_count": "4.0B",
"parameters_raw": 4022468096,
"min_ram_gb": 2.2,
"recommended_ram_gb": 3.7,
"min_vram_gb": 2.1,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 51135,
"hf_likes": 2,
"release_date": "2025-09-23",
"_discovered": true
},
{
"name": "JunHowie/Qwen3-4B-Instruct-2507-GPTQ-Int4",
"provider": "junhowie",
"parameter_count": "4.0B",
"parameters_raw": 4022468096,
"min_ram_gb": 2.2,
"recommended_ram_gb": 3.7,
"min_vram_gb": 2.1,
"quantization": "GPTQ-Int4",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 36817,
"hf_likes": 2,
"release_date": "2025-09-01",
"_discovered": true,
"format": "gptq"
},
{
"name": "TIGER-Lab/VLM2Vec-Full",
"provider": "tiger-lab",
"parameter_count": "4.1B",
"parameters_raw": 4146621440,
"min_ram_gb": 2.3,
"recommended_ram_gb": 3.9,
"min_vram_gb": 2.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi3_v",
"hf_downloads": 64160,
"hf_likes": 28,
"release_date": "2024-10-08",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-14B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "4.2B",
"parameters_raw": 4153891840,
"min_ram_gb": 2.3,
"recommended_ram_gb": 3.9,
"min_vram_gb": 2.1,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 42084,
"hf_likes": 1,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen2.5-Coder-14B-Instruct-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "4.2B",
"parameters_raw": 4154676224,
"min_ram_gb": 2.3,
"recommended_ram_gb": 3.9,
"min_vram_gb": 2.1,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 82050,
"hf_likes": 1,
"release_date": "2024-11-11",
"_discovered": true
},
{
"name": "Qwen/Qwen3-4B-SafeRL",
"provider": "Alibaba",
"parameter_count": "4.4B",
"parameters_raw": 4411424256,
"min_ram_gb": 2.5,
"recommended_ram_gb": 4.1,
"min_vram_gb": 2.3,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 53732,
"hf_likes": 41,
"release_date": "2025-09-30",
"_discovered": true
},
{
"name": "Qwen/Qwen3-4B-Instruct-2507-FP8",
"provider": "Alibaba",
"parameter_count": "4.4B",
"parameters_raw": 4411646016,
"min_ram_gb": 2.5,
"recommended_ram_gb": 4.1,
"min_vram_gb": 2.3,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 507765,
"hf_likes": 69,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "Qwen/Qwen3-4B-FP8",
"provider": "Alibaba",
"parameter_count": "4.4B",
"parameters_raw": 4411646016,
"min_ram_gb": 2.5,
"recommended_ram_gb": 4.1,
"min_vram_gb": 2.3,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 250469,
"hf_likes": 38,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "nvidia/Nemotron-H-4B-Base-8K",
"provider": "nvidia",
"parameter_count": "4.5B",
"parameters_raw": 4489223040,
"min_ram_gb": 2.5,
"recommended_ram_gb": 4.2,
"min_vram_gb": 2.3,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 40602,
"hf_likes": 5,
"release_date": "2025-03-20",
"_discovered": true
},
{
"name": "nvidia/Nemotron-H-4B-Instruct-128K",
"provider": "nvidia",
"parameter_count": "4.5B",
"parameters_raw": 4489223040,
"min_ram_gb": 2.5,
"recommended_ram_gb": 4.2,
"min_vram_gb": 2.3,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 38647,
"hf_likes": 8,
"release_date": "2025-04-15",
"_discovered": true
},
{
"name": "stelterlab/Qwen3-Coder-30B-A3B-Instruct-AWQ",
"provider": "stelterlab",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 10.9,
"recommended_ram_gb": 21.8,
"min_vram_gb": 18.2,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 63349,
"hf_likes": 4,
"release_date": "2025-07-31",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3300000000,
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen3.5-4B",
"provider": "Alibaba",
"parameter_count": "4.7B",
"parameters_raw": 4659865088,
"min_ram_gb": 2.6,
"recommended_ram_gb": 4.3,
"min_vram_gb": 2.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 99087,
"hf_likes": 202,
"release_date": "2026-02-27",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-4B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3.5-4B-Base",
"provider": "Alibaba",
"parameter_count": "4.7B",
"parameters_raw": 4659865088,
"min_ram_gb": 2.6,
"recommended_ram_gb": 4.3,
"min_vram_gb": 2.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 3593,
"hf_likes": 38,
"release_date": "2026-02-27"
},
{
"name": "nvidia/Qwen3-8B-NVFP4",
"provider": "nvidia",
"parameter_count": "4.7B",
"parameters_raw": 4717851648,
"min_ram_gb": 2.6,
"recommended_ram_gb": 4.4,
"min_vram_gb": 2.4,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 32743,
"hf_likes": 14,
"release_date": "2025-09-09",
"_discovered": true
},
{
"name": "speakleash/Bielik-4.5B-v3.0-Instruct",
"provider": "speakleash",
"parameter_count": "4.8B",
"parameters_raw": 4757260288,
"min_ram_gb": 2.7,
"recommended_ram_gb": 4.4,
"min_vram_gb": 2.4,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 43008,
"hf_likes": 27,
"release_date": "2025-04-18",
"_discovered": true
},
{
"name": "XLabs-AI/xflux_text_encoders",
"provider": "xlabs-ai",
"parameter_count": "4.8B",
"parameters_raw": 4762310656,
"min_ram_gb": 2.7,
"recommended_ram_gb": 4.4,
"min_vram_gb": 2.4,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "t5",
"hf_downloads": 162123,
"hf_likes": 21,
"release_date": "2024-08-11",
"_discovered": true
},
{
"name": "stelterlab/NVIDIA-Nemotron-3-Nano-30B-A3B-AWQ",
"provider": "stelterlab",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 10.9,
"recommended_ram_gb": 21.8,
"min_vram_gb": 18.2,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 38947,
"hf_likes": 4,
"release_date": "2026-01-31",
"_discovered": true,
"format": "awq",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3300000000
},
{
"name": "lmstudio-community/Qwen3-32B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "5.1B",
"parameters_raw": 5119652864,
"min_ram_gb": 2.9,
"recommended_ram_gb": 4.8,
"min_vram_gb": 2.6,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 26287,
"hf_likes": 4,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen2.5-Coder-32B-Instruct-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "5.1B",
"parameters_raw": 5120300032,
"min_ram_gb": 2.9,
"recommended_ram_gb": 4.8,
"min_vram_gb": 2.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 44413,
"hf_likes": 6,
"release_date": "2024-11-11",
"_discovered": true
},
{
"name": "lmstudio-community/QwQ-32B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "5.1B",
"parameters_raw": 5120300032,
"min_ram_gb": 2.9,
"recommended_ram_gb": 4.8,
"min_vram_gb": 2.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 32595,
"hf_likes": 0,
"release_date": "2025-03-05",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-Coder-30B-A3B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 3.0,
"recommended_ram_gb": 4.9,
"min_vram_gb": 2.7,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 135548,
"hf_likes": 40,
"release_date": "2025-08-01",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-30B-A3B-Instruct-2507-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 3.0,
"recommended_ram_gb": 4.9,
"min_vram_gb": 2.7,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 85989,
"hf_likes": 30,
"release_date": "2025-07-29",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/MiroThinker-v1.5-30B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 3.0,
"recommended_ram_gb": 4.9,
"min_vram_gb": 2.7,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 20465,
"hf_likes": 3,
"release_date": "2026-01-06",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 580405768,
"_discovered": true,
"format": "awq"
},
{
"name": "01-ai/Yi-6B-Chat",
"provider": "01.ai",
"parameter_count": "6.1B",
"parameters_raw": 6061035520,
"min_ram_gb": 3.4,
"recommended_ram_gb": 5.6,
"min_vram_gb": 3.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 15481,
"hf_likes": 70,
"release_date": "2023-11-22"
},
{
"name": "arcee-ai/Trinity-Nano-Preview",
"provider": "arcee-ai",
"parameter_count": "6.1B",
"parameters_raw": 6120003328,
"min_ram_gb": 3.4,
"recommended_ram_gb": 5.7,
"min_vram_gb": 3.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "afmoe",
"hf_downloads": 22294,
"hf_likes": 67,
"release_date": "2025-12-01",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 669375358,
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.7-Flash-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "6.4B",
"parameters_raw": 6407095318,
"min_ram_gb": 3.6,
"recommended_ram_gb": 6.0,
"min_vram_gb": 3.3,
"quantization": "AWQ-4bit",
"context_length": 202752,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe_lite",
"hf_downloads": 217691,
"hf_likes": 46,
"release_date": "2026-01-19",
"_discovered": true,
"format": "awq"
},
{
"name": "lmsys/vicuna-7b-v1.5",
"provider": "LMSYS",
"parameter_count": "7.0B",
"parameters_raw": 6738415616,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.4,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "tartuNLP/Llammas-base-p1-GPT-4o-human-error-mix-paragraph-GEC",
"provider": "tartunlp",
"parameter_count": "6.7B",
"parameters_raw": 6738415616,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 36045,
"hf_likes": 0,
"release_date": "2025-02-11",
"_discovered": true
},
{
"name": "meta-llama/Llama-2-7b-hf",
"provider": "Meta",
"parameter_count": "6.7B",
"parameters_raw": 6738417664,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 617643,
"hf_likes": 2272,
"release_date": "2023-07-13",
"_discovered": true
},
{
"name": "huggyllama/llama-7b",
"provider": "huggyllama",
"parameter_count": "6.7B",
"parameters_raw": 6738417664,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 103505,
"hf_likes": 354,
"release_date": "2023-04-03",
"_discovered": true
},
{
"name": "NousResearch/Llama-2-7b-hf",
"provider": "NousResearch",
"parameter_count": "6.7B",
"parameters_raw": 6738417664,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 81336,
"hf_likes": 171,
"release_date": "2023-07-18",
"_discovered": true
},
{
"name": "NousResearch/Llama-2-7b-chat-hf",
"provider": "NousResearch",
"parameter_count": "6.7B",
"parameters_raw": 6738417664,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 20573,
"hf_likes": 194,
"release_date": "2023-07-18",
"_discovered": true
},
{
"name": "meta-llama/CodeLlama-7b-Instruct-hf",
"provider": "Meta",
"parameter_count": "6.7B",
"parameters_raw": 6738546688,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 5404,
"hf_likes": 59,
"release_date": "2024-03-13"
},
{
"name": "codellama/CodeLlama-7b-Instruct-hf",
"provider": "codellama",
"parameter_count": "6.7B",
"parameters_raw": 6738546688,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 65896,
"hf_likes": 254,
"release_date": "2023-08-24",
"_discovered": true
},
{
"name": "codellama/CodeLlama-7b-hf",
"provider": "codellama",
"parameter_count": "6.7B",
"parameters_raw": 6738546688,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 54518,
"hf_likes": 375,
"release_date": "2023-08-24",
"_discovered": true
},
{
"name": "deepseek-ai/deepseek-coder-6.7b-instruct",
"provider": "DeepSeek",
"parameter_count": "6.7B",
"parameters_raw": 6740512768,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 97176,
"hf_likes": 478,
"release_date": "2023-10-29",
"_discovered": true
},
{
"name": "deepseek-ai/deepseek-coder-6.7b-base",
"provider": "DeepSeek",
"parameter_count": "6.7B",
"parameters_raw": 6740512768,
"min_ram_gb": 3.8,
"recommended_ram_gb": 6.3,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 28134,
"hf_likes": 122,
"release_date": "2023-10-23",
"_discovered": true
},
{
"name": "allenai/OLMoE-1B-7B-0125",
"provider": "allenai",
"parameter_count": "6.9B",
"parameters_raw": 6919161856,
"min_ram_gb": 3.9,
"recommended_ram_gb": 6.4,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmoe",
"hf_downloads": 42434,
"hf_likes": 35,
"release_date": "2025-01-21",
"is_moe": true,
"num_experts": 64,
"active_experts": 8,
"active_parameters": 1167608556,
"_discovered": true
},
{
"name": "allenai/OLMoE-1B-7B-0125-Instruct",
"provider": "allenai",
"parameter_count": "6.9B",
"parameters_raw": 6919161856,
"min_ram_gb": 3.9,
"recommended_ram_gb": 6.4,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmoe",
"hf_downloads": 35624,
"hf_likes": 58,
"release_date": "2025-01-27",
"is_moe": true,
"num_experts": 64,
"active_experts": 8,
"active_parameters": 1167608556,
"_discovered": true
},
{
"name": "EleutherAI/pythia-6.9b",
"provider": "eleutherai",
"parameter_count": "7.0B",
"parameters_raw": 6991520256,
"min_ram_gb": 3.9,
"recommended_ram_gb": 6.5,
"min_vram_gb": 3.6,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 20516,
"hf_likes": 59,
"release_date": "2023-02-14",
"_discovered": true
},
{
"name": "openchat/openchat-3.5-0106",
"provider": "OpenChat",
"parameter_count": "7.0B",
"parameters_raw": 7000000000,
"min_ram_gb": 3.9,
"recommended_ram_gb": 6.5,
"min_vram_gb": 3.6,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "XiaomiMiMo/MiMo-7B-RL",
"provider": "Xiaomi",
"parameter_count": "7.0B",
"parameters_raw": 7000000000,
"min_ram_gb": 3.9,
"recommended_ram_gb": 6.5,
"min_vram_gb": 3.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Advanced reasoning, math and code",
"pipeline_tag": "text-generation",
"architecture": "mimo",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-05-01"
},
{
"name": "microsoft/Orca-2-7b",
"provider": "Microsoft",
"parameter_count": "7.0B",
"parameters_raw": 7016400896,
"min_ram_gb": 3.9,
"recommended_ram_gb": 6.5,
"min_vram_gb": 3.6,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Reasoning, step-by-step solutions",
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "omni-research/Tarsier-7b",
"provider": "omni-research",
"parameter_count": "7.1B",
"parameters_raw": 7063427072,
"min_ram_gb": 3.9,
"recommended_ram_gb": 6.6,
"min_vram_gb": 3.6,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llava",
"hf_downloads": 49581,
"hf_likes": 25,
"release_date": "2024-07-04",
"_discovered": true
},
{
"name": "bigcode/starcoder2-7b",
"provider": "BigCode",
"parameter_count": "7.2B",
"parameters_raw": 7173923840,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "starcoder2",
"hf_downloads": 19199,
"hf_likes": 208,
"release_date": "2024-02-20"
},
{
"name": "tiiuae/falcon-7b-instruct",
"provider": "TII",
"parameter_count": "7.2B",
"parameters_raw": 7217189760,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "falcon",
"hf_downloads": 47656,
"hf_likes": 1031,
"release_date": "2023-04-25"
},
{
"name": "HuggingFaceH4/zephyr-7b-beta",
"provider": "HuggingFace",
"parameter_count": "7.2B",
"parameters_raw": 7241732096,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 107437,
"hf_likes": 1834,
"release_date": "2023-10-26"
},
{
"name": "mistralai/Mistral-7B-Instruct-v0.2",
"provider": "Mistral AI",
"parameter_count": "7.2B",
"parameters_raw": 7241732096,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 2920309,
"hf_likes": 3088,
"release_date": "2023-12-11",
"_discovered": true
},
{
"name": "speakleash/Bielik-7B-Instruct-v0.1",
"provider": "speakleash",
"parameter_count": "7.2B",
"parameters_raw": 7241732096,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 101914,
"hf_likes": 63,
"release_date": "2024-03-30",
"_discovered": true
},
{
"name": "prometheus-eval/prometheus-7b-v2.0",
"provider": "prometheus-eval",
"parameter_count": "7.2B",
"parameters_raw": 7241732096,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 54661,
"hf_likes": 100,
"release_date": "2024-02-13",
"_discovered": true
},
{
"name": "Salesforce/xLAM-7b-r",
"provider": "salesforce",
"parameter_count": "7.2B",
"parameters_raw": 7241732096,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 38045,
"hf_likes": 32,
"release_date": "2024-08-28",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/xLAM-7b-r-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Intel/neural-chat-7b-v3-3",
"provider": "intel",
"parameter_count": "7.2B",
"parameters_raw": 7241732096,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 27068,
"hf_likes": 80,
"release_date": "2023-12-09",
"_discovered": true
},
{
"name": "Featherless-Chat-Models/Mistral-7B-Instruct-v0.2",
"provider": "featherless-chat-models",
"parameter_count": "7.2B",
"parameters_raw": 7241732096,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 26186,
"hf_likes": 0,
"release_date": "2025-05-08",
"_discovered": true
},
{
"name": "augmxnt/shisa-gamma-7b-v1",
"provider": "augmxnt",
"parameter_count": "7.2B",
"parameters_raw": 7241732096,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 20213,
"hf_likes": 18,
"release_date": "2023-12-23",
"_discovered": true
},
{
"name": "dphn/dolphin-2.6-mistral-7b",
"provider": "dphn",
"parameter_count": "7.2B",
"parameters_raw": 7241740288,
"min_ram_gb": 4.0,
"recommended_ram_gb": 6.7,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 60305,
"hf_likes": 105,
"release_date": "2023-12-27",
"_discovered": true
},
{
"name": "mistralai/Mistral-7B-Instruct-v0.3",
"provider": "Mistral AI",
"parameter_count": "7.2B",
"parameters_raw": 7248023552,
"min_ram_gb": 4.1,
"recommended_ram_gb": 6.8,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "unknown",
"architecture": "mistral",
"hf_downloads": 1540743,
"hf_likes": 2447,
"release_date": "2024-05-22",
"gguf_sources": [
{
"repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "allenai/wildguard",
"provider": "allenai",
"parameter_count": "7.2B",
"parameters_raw": 7248031744,
"min_ram_gb": 4.1,
"recommended_ram_gb": 6.8,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 23686,
"hf_likes": 38,
"release_date": "2024-06-15",
"_discovered": true
},
{
"name": "dphn/dolphin-2.9.3-mistral-7B-32k",
"provider": "dphn",
"parameter_count": "7.2B",
"parameters_raw": 7248039936,
"min_ram_gb": 4.1,
"recommended_ram_gb": 6.8,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 79357,
"hf_likes": 57,
"release_date": "2024-06-25",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/dolphin-2.9.3-mistral-7B-32k-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "thesven/Mistral-7B-Instruct-v0.3-GPTQ",
"provider": "thesven",
"parameter_count": "7.2B",
"parameters_raw": 7249399808,
"min_ram_gb": 4.1,
"recommended_ram_gb": 6.8,
"min_vram_gb": 3.7,
"quantization": "GPTQ-Int4",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 35763,
"hf_likes": 1,
"release_date": "2024-05-22",
"_discovered": true,
"format": "gptq"
},
{
"name": "allenai/Olmo-3-7B-Instruct-SFT",
"provider": "allenai",
"parameter_count": "7.3B",
"parameters_raw": 7298011136,
"min_ram_gb": 4.1,
"recommended_ram_gb": 6.8,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 134834,
"hf_likes": 4,
"release_date": "2025-11-17",
"_discovered": true
},
{
"name": "allenai/Olmo-3-1025-7B",
"provider": "allenai",
"parameter_count": "7.3B",
"parameters_raw": 7298011136,
"min_ram_gb": 4.1,
"recommended_ram_gb": 6.8,
"min_vram_gb": 3.7,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 71128,
"hf_likes": 54,
"release_date": "2025-09-12",
"_discovered": true
},
{
"name": "TechxGenus/starcoder2-7b-GPTQ",
"provider": "techxgenus",
"parameter_count": "7.4B",
"parameters_raw": 7400416256,
"min_ram_gb": 4.1,
"recommended_ram_gb": 6.9,
"min_vram_gb": 3.8,
"quantization": "GPTQ-Int4",
"context_length": 16384,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "starcoder2",
"hf_downloads": 36955,
"hf_likes": 2,
"release_date": "2024-03-22",
"_discovered": true,
"format": "gptq"
},
{
"name": "tiiuae/Falcon3-7B-Instruct",
"provider": "TII",
"parameter_count": "7.5B",
"parameters_raw": 7455550464,
"min_ram_gb": 4.2,
"recommended_ram_gb": 6.9,
"min_vram_gb": 3.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 18394,
"hf_likes": 76,
"release_date": "2024-11-29",
"gguf_sources": [
{
"repo": "bartowski/Falcon3-7B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-7B-Instruct",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 20736120,
"hf_likes": 1108,
"release_date": "2024-09-16",
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-7B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-Coder-7B-Instruct",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1575000,
"hf_likes": 659,
"release_date": "2024-09-17",
"gguf_sources": [
{
"repo": "unsloth/Qwen2.5-Coder-7B-Instruct-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Qwen2.5-Coder-7B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",
"provider": "DeepSeek",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 743941,
"hf_likes": 797,
"release_date": "2025-01-20",
"gguf_sources": [
{
"repo": "unsloth/DeepSeek-R1-Distill-Qwen-7B-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/DeepSeek-R1-Distill-Qwen-7B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-7B",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 2029944,
"hf_likes": 266,
"release_date": "2024-09-15",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-Coder-7B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1107387,
"hf_likes": 19,
"release_date": "2024-09-20",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2.5-Coder-7B-Instruct-GPTQ-Int4",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "GPTQ-Int4",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1066717,
"hf_likes": 13,
"release_date": "2024-09-20",
"_discovered": true,
"format": "gptq"
},
{
"name": "Qwen/Qwen2.5-Math-7B-Instruct",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 318106,
"hf_likes": 89,
"release_date": "2024-09-19",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-Math-7B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2-7B-Instruct",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 310355,
"hf_likes": 683,
"release_date": "2024-06-04",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2-7B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-Coder-7B",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 240132,
"hf_likes": 137,
"release_date": "2024-09-16",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-7B-Instruct-GPTQ-Int4",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "GPTQ-Int4",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 158122,
"hf_likes": 29,
"release_date": "2024-09-17",
"_discovered": true,
"format": "gptq"
},
{
"name": "Dream-org/Dream-v0-Instruct-7B",
"provider": "dream-org",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "Dream",
"hf_downloads": 73949,
"hf_likes": 154,
"release_date": "2025-04-03",
"_discovered": true
},
{
"name": "Qwen/Qwen2-7B",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 70734,
"hf_likes": 170,
"release_date": "2024-06-04",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-Math-7B",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 68238,
"hf_likes": 106,
"release_date": "2024-09-16",
"_discovered": true
},
{
"name": "DeepHat/DeepHat-V1-7B",
"provider": "deephat",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 63374,
"hf_likes": 111,
"release_date": "2025-04-25",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-7B-Instruct-1M",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 1010000,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 46699,
"hf_likes": 366,
"release_date": "2025-01-23",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-7B-Instruct-1M-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-7B-Instruct-GPTQ-Int8",
"provider": "Alibaba",
"parameter_count": "7.6B",
"parameters_raw": 7615616512,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "GPTQ-Int8",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 30708,
"hf_likes": 18,
"release_date": "2024-09-17",
"_discovered": true,
"format": "gptq"
},
{
"name": "microsoft/Phi-mini-MoE-instruct",
"provider": "Microsoft",
"parameter_count": "7.6B",
"parameters_raw": 7647632704,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.1,
"min_vram_gb": 3.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phimoe",
"hf_downloads": 69775,
"hf_likes": 30,
"release_date": "2025-06-23",
"is_moe": true,
"num_experts": 16,
"active_experts": 2,
"active_parameters": 1290538017,
"_discovered": true
},
{
"name": "Qwen/Qwen-7B-Chat",
"provider": "Alibaba",
"parameter_count": "7.7B",
"parameters_raw": 7721324544,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.2,
"min_vram_gb": 4.0,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen",
"hf_downloads": 195550,
"hf_likes": 787,
"release_date": "2023-08-03",
"_discovered": true
},
{
"name": "Qwen/Qwen-7B",
"provider": "Alibaba",
"parameter_count": "7.7B",
"parameters_raw": 7721324544,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.2,
"min_vram_gb": 4.0,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen",
"hf_downloads": 189346,
"hf_likes": 396,
"release_date": "2023-08-03",
"_discovered": true
},
{
"name": "Qwen/Qwen1.5-7B",
"provider": "Alibaba",
"parameter_count": "7.7B",
"parameters_raw": 7721324544,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.2,
"min_vram_gb": 4.0,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 75458,
"hf_likes": 56,
"release_date": "2024-01-22",
"_discovered": true
},
{
"name": "BSC-LT/salamandra-7b-instruct",
"provider": "bsc-lt",
"parameter_count": "7.8B",
"parameters_raw": 7768117248,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.2,
"min_vram_gb": 4.0,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 31017,
"hf_likes": 75,
"release_date": "2024-09-30",
"_discovered": true
},
{
"name": "kmhf/hf-moshiko",
"provider": "kmhf",
"parameter_count": "7.8B",
"parameters_raw": 7783880545,
"min_ram_gb": 4.3,
"recommended_ram_gb": 7.2,
"min_vram_gb": 4.0,
"quantization": "Q4_K_M",
"context_length": 3000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "moshi",
"hf_downloads": 123900,
"hf_likes": 0,
"release_date": "2024-09-27",
"_discovered": true
},
{
"name": "XiaomiMiMo/MiMo-7B-Base",
"provider": "xiaomimimo",
"parameter_count": "7.8B",
"parameters_raw": 7833409536,
"min_ram_gb": 4.4,
"recommended_ram_gb": 7.3,
"min_vram_gb": 4.0,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mimo",
"hf_downloads": 93937,
"hf_likes": 124,
"release_date": "2025-04-29",
"_discovered": true
},
{
"name": "google/gemma-3n-E4B-it",
"provider": "Google",
"parameter_count": "8B",
"parameters_raw": 8000000000,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Multimodal, on-device (effective 4B)",
"pipeline_tag": "image-text-to-text",
"architecture": "gemma3n",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-06-25",
"gguf_sources": [
{
"repo": "unsloth/gemma-3n-E4B-it-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "mistralai/Ministral-8B-Instruct-2410",
"provider": "Mistral AI",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "bartowski/Ministral-8B-Instruct-2410-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "meta-llama/Meta-Llama-3-8B",
"provider": "Meta",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 2463959,
"hf_likes": 6473,
"release_date": "2024-04-17",
"_discovered": true
},
{
"name": "meta-llama/Meta-Llama-3-8B-Instruct",
"provider": "Meta",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 1353966,
"hf_likes": 4391,
"release_date": "2024-04-17",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Meta-Llama-3-8B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "NousResearch/Hermes-3-Llama-3.1-8B",
"provider": "NousResearch",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 635984,
"hf_likes": 391,
"release_date": "2024-07-28",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Hermes-3-Llama-3.1-8B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "IlyaGusev/saiga_llama3_8b",
"provider": "ilyagusev",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 399621,
"hf_likes": 137,
"release_date": "2024-04-18",
"_discovered": true
},
{
"name": "NousResearch/Meta-Llama-3.1-8B-Instruct",
"provider": "NousResearch",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 207258,
"hf_likes": 39,
"release_date": "2024-07-24",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "meta-llama/Llama-Guard-3-8B",
"provider": "Meta",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 163719,
"hf_likes": 272,
"release_date": "2024-07-22",
"_discovered": true
},
{
"name": "nvidia/Llama-3.1-8B-Instruct-FP8",
"provider": "nvidia",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 93876,
"hf_likes": 32,
"release_date": "2024-08-29",
"_discovered": true
},
{
"name": "PatronusAI/Llama-3-Patronus-Lynx-8B-Instruct-v1.1",
"provider": "patronusai",
"parameter_count": "8.0B",
"parameters_raw": 8030261248,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 20626,
"hf_likes": 10,
"release_date": "2024-07-24",
"_discovered": true
},
{
"name": "RedHatAI/Meta-Llama-3.1-8B-Instruct-FP8",
"provider": "redhatai",
"parameter_count": "8.0B",
"parameters_raw": 8030261696,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 684729,
"hf_likes": 44,
"release_date": "2024-07-23",
"_discovered": true
},
{
"name": "RedHatAI/Meta-Llama-3.1-8B-FP8",
"provider": "redhatai",
"parameter_count": "8.0B",
"parameters_raw": 8030261696,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 200501,
"hf_likes": 10,
"release_date": "2024-07-31",
"_discovered": true
},
{
"name": "fdtn-ai/Foundation-Sec-1.1-8B-Instruct",
"provider": "fdtn-ai",
"parameter_count": "8.0B",
"parameters_raw": 8030326784,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 53389,
"hf_likes": 13,
"release_date": "2025-11-18",
"_discovered": true
},
{
"name": "lmms-lab/llava-onevision-qwen2-7b-ov",
"provider": "lmms-lab",
"parameter_count": "8.0B",
"parameters_raw": 8030348832,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"vision"
],
"pipeline_tag": "text-generation",
"architecture": "llava",
"hf_downloads": 133340,
"hf_likes": 62,
"release_date": "2024-06-29",
"_discovered": true
},
{
"name": "RedHatAI/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",
"provider": "redhatai",
"parameter_count": "8.0B",
"parameters_raw": 8031637504,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 36809,
"hf_likes": 30,
"release_date": "2024-07-26",
"_discovered": true
},
{
"name": "hugging-quants/Meta-Llama-3.1-8B-Instruct-GPTQ-INT4",
"provider": "hugging-quants",
"parameter_count": "8.0B",
"parameters_raw": 8031637504,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "GPTQ-Int4",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 27054,
"hf_likes": 41,
"release_date": "2024-07-24",
"_discovered": true,
"format": "gptq"
},
{
"name": "RedHatAI/Meta-Llama-3.1-8B-Instruct-FP8-dynamic",
"provider": "redhatai",
"parameter_count": "8.0B",
"parameters_raw": 8031637504,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 21204,
"hf_likes": 9,
"release_date": "2024-07-23",
"_discovered": true
},
{
"name": "ibm-granite/granite-3.3-8b-instruct",
"provider": "ibm-granite",
"parameter_count": "8.2B",
"parameters_raw": 8170864640,
"min_ram_gb": 4.6,
"recommended_ram_gb": 7.6,
"min_vram_gb": 4.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granite",
"hf_downloads": 65699,
"hf_likes": 153,
"release_date": "2025-04-09",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/granite-3.3-8b-instruct-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3-8B-Base",
"provider": "Alibaba",
"parameter_count": "8.2B",
"parameters_raw": 8190735360,
"min_ram_gb": 4.6,
"recommended_ram_gb": 7.6,
"min_vram_gb": 4.2,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 790734,
"hf_likes": 87,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "Qwen/Qwen3-8B-AWQ",
"provider": "Alibaba",
"parameter_count": "8.2B",
"parameters_raw": 8190735360,
"min_ram_gb": 4.6,
"recommended_ram_gb": 7.6,
"min_vram_gb": 4.2,
"quantization": "AWQ-4bit",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 327827,
"hf_likes": 37,
"release_date": "2025-05-03",
"_discovered": true,
"format": "awq"
},
{
"name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
"provider": "DeepSeek",
"parameter_count": "8.2B",
"parameters_raw": 8190735360,
"min_ram_gb": 4.6,
"recommended_ram_gb": 7.6,
"min_vram_gb": 4.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 148562,
"hf_likes": 1040,
"release_date": "2025-05-29",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "huihui-ai/Huihui-Qwen3-8B-abliterated-v2",
"provider": "huihui-ai",
"parameter_count": "8.2B",
"parameters_raw": 8190735360,
"min_ram_gb": 4.6,
"recommended_ram_gb": 7.6,
"min_vram_gb": 4.2,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 32025,
"hf_likes": 34,
"release_date": "2025-06-18",
"_discovered": true
},
{
"name": "Qwen/Qwen3-8B-FP8",
"provider": "Alibaba",
"parameter_count": "8.2B",
"parameters_raw": 8191159296,
"min_ram_gb": 4.6,
"recommended_ram_gb": 7.6,
"min_vram_gb": 4.2,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 196191,
"hf_likes": 57,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "nytopop/Qwen3-8B.w8a8",
"provider": "nytopop",
"parameter_count": "8.2B",
"parameters_raw": 8192136192,
"min_ram_gb": 4.6,
"recommended_ram_gb": 7.6,
"min_vram_gb": 4.2,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 33985,
"hf_likes": 1,
"release_date": "2025-04-29",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-VL-7B-Instruct",
"provider": "Alibaba",
"parameter_count": "8.3B",
"parameters_raw": 8292166656,
"min_ram_gb": 4.6,
"recommended_ram_gb": 7.7,
"min_vram_gb": 4.2,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Instruction following, chat",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen2_5_vl",
"hf_downloads": 4008802,
"hf_likes": 1462,
"release_date": "2025-01-26",
"gguf_sources": [
{
"repo": "unsloth/Qwen2.5-VL-7B-Instruct-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "LiquidAI/LFM2-8B-A1B",
"provider": "liquidai",
"parameter_count": "8.3B",
"parameters_raw": 8339929856,
"min_ram_gb": 4.7,
"recommended_ram_gb": 7.8,
"min_vram_gb": 4.3,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 47242,
"hf_likes": 328,
"release_date": "2025-10-07",
"is_moe": true,
"num_experts": 32,
"active_experts": 4,
"active_parameters": 1407363160,
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/LFM2-8B-A1B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "nvidia/Mistral-NeMo-Minitron-8B-Instruct",
"provider": "nvidia",
"parameter_count": "8.4B",
"parameters_raw": 8414105600,
"min_ram_gb": 4.7,
"recommended_ram_gb": 7.8,
"min_vram_gb": 4.3,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 55809,
"hf_likes": 82,
"release_date": "2024-10-02",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Mistral-NeMo-Minitron-8B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "01-ai/Yi-1.5-9B-Chat",
"provider": "01.ai",
"parameter_count": "8.8B",
"parameters_raw": 8829407232,
"min_ram_gb": 4.9,
"recommended_ram_gb": 8.2,
"min_vram_gb": 4.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 19975,
"hf_likes": 148,
"release_date": "2024-05-10",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Yi-1.5-9B-Chat-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "nvidia/NVIDIA-Nemotron-Nano-9B-v2-Base",
"provider": "nvidia",
"parameter_count": "8.9B",
"parameters_raw": 8888227328,
"min_ram_gb": 5.0,
"recommended_ram_gb": 8.3,
"min_vram_gb": 4.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 165722,
"hf_likes": 43,
"release_date": "2025-08-14",
"_discovered": true
},
{
"name": "nvidia/NVIDIA-Nemotron-Nano-9B-v2-Japanese",
"provider": "nvidia",
"parameter_count": "8.9B",
"parameters_raw": 8888227328,
"min_ram_gb": 5.0,
"recommended_ram_gb": 8.3,
"min_vram_gb": 4.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron_h",
"hf_downloads": 24028,
"hf_likes": 121,
"release_date": "2026-02-04",
"_discovered": true
},
{
"name": "nvidia/NVIDIA-Nemotron-Nano-9B-v2-FP8",
"provider": "nvidia",
"parameter_count": "8.9B",
"parameters_raw": 8888227432,
"min_ram_gb": 5.0,
"recommended_ram_gb": 8.3,
"min_vram_gb": 4.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron_h",
"hf_downloads": 70791,
"hf_likes": 7,
"release_date": "2025-09-22",
"_discovered": true
},
{
"name": "nvidia/NVIDIA-Nemotron-Nano-9B-v2",
"provider": "NVIDIA",
"parameter_count": "9B",
"parameters_raw": 9000000000,
"min_ram_gb": 5.0,
"recommended_ram_gb": 8.4,
"min_vram_gb": 4.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Hybrid Mamba2, reasoning",
"pipeline_tag": "text-generation",
"architecture": "nemotron",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-06-01"
},
{
"name": "lmstudio-community/Qwen3-32B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "9.2B",
"parameters_raw": 9214833664,
"min_ram_gb": 5.1,
"recommended_ram_gb": 8.6,
"min_vram_gb": 4.7,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 24718,
"hf_likes": 2,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "lmstudio-community/Qwen2.5-Coder-32B-Instruct-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "9.2B",
"parameters_raw": 9215644672,
"min_ram_gb": 5.1,
"recommended_ram_gb": 8.6,
"min_vram_gb": 4.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 41754,
"hf_likes": 3,
"release_date": "2024-11-11",
"_discovered": true
},
{
"name": "lmstudio-community/QwQ-32B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "9.2B",
"parameters_raw": 9215644672,
"min_ram_gb": 5.1,
"recommended_ram_gb": 8.6,
"min_vram_gb": 4.7,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 32269,
"hf_likes": 0,
"release_date": "2025-03-05",
"_discovered": true
},
{
"name": "google/gemma-2-9b-it",
"provider": "Google",
"parameter_count": "9.2B",
"parameters_raw": 9241705984,
"min_ram_gb": 5.2,
"recommended_ram_gb": 8.6,
"min_vram_gb": 4.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma2",
"hf_downloads": 180627,
"hf_likes": 775,
"release_date": "2024-06-24",
"gguf_sources": [
{
"repo": "bartowski/gemma-2-9b-it-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "zai-org/glm-4-9b-chat-hf",
"provider": "zai-org",
"parameter_count": "9.4B",
"parameters_raw": 9399951360,
"min_ram_gb": 5.3,
"recommended_ram_gb": 8.8,
"min_vram_gb": 4.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm",
"hf_downloads": 22553,
"hf_likes": 24,
"release_date": "2024-10-23",
"_discovered": true
},
{
"name": "THUDM/glm-4-9b-chat",
"provider": "thudm",
"parameter_count": "9.4B",
"parameters_raw": 9399951392,
"min_ram_gb": 5.3,
"recommended_ram_gb": 8.8,
"min_vram_gb": 4.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "unknown",
"architecture": "chatglm",
"hf_downloads": 190092,
"hf_likes": 702,
"release_date": "2024-06-04",
"gguf_sources": [
{
"repo": "bartowski/glm-4-9b-chat-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "zai-org/glm-4-9b",
"provider": "zai-org",
"parameter_count": "9.4B",
"parameters_raw": 9399951392,
"min_ram_gb": 5.3,
"recommended_ram_gb": 8.8,
"min_vram_gb": 4.8,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "chatglm",
"hf_downloads": 23550,
"hf_likes": 143,
"release_date": "2024-06-04",
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-9B",
"provider": "Alibaba",
"parameter_count": "9.7B",
"parameters_raw": 9653104368,
"min_ram_gb": 5.4,
"recommended_ram_gb": 9.0,
"min_vram_gb": 4.9,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 172298,
"hf_likes": 345,
"release_date": "2026-02-27",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-9B-GGUF",
"provider": "unsloth",
"file": "Qwen3.5-9B-Q4_K_M.gguf"
}
]
},
{
"name": "Qwen/Qwen3.5-9B-Base",
"provider": "Alibaba",
"parameter_count": "9.7B",
"parameters_raw": 9653104368,
"min_ram_gb": 5.4,
"recommended_ram_gb": 9.0,
"min_vram_gb": 4.9,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 5324,
"hf_likes": 38,
"release_date": "2026-02-26"
},
{
"name": "solidrust/gemma-2-9b-it-AWQ",
"provider": "solidrust",
"parameter_count": "10.2B",
"parameters_raw": 10159209984,
"min_ram_gb": 5.7,
"recommended_ram_gb": 9.5,
"min_vram_gb": 5.2,
"quantization": "AWQ-4bit",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma2",
"hf_downloads": 32664,
"hf_likes": 2,
"release_date": "2024-09-03",
"_discovered": true,
"format": "awq"
},
{
"name": "meta-llama/Llama-3.2-11B-Vision-Instruct",
"provider": "Meta",
"parameter_count": "11.0B",
"parameters_raw": 10665463808,
"min_ram_gb": 6.0,
"recommended_ram_gb": 9.9,
"min_vram_gb": 5.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "image-text-to-text",
"architecture": "llama",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "upstage/SOLAR-10.7B-Instruct-v1.0",
"provider": "Upstage",
"parameter_count": "10.7B",
"parameters_raw": 10700000000,
"min_ram_gb": 6.0,
"recommended_ram_gb": 10.0,
"min_vram_gb": 5.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "High-performance instruction following",
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "naver-hyperclovax/HyperCLOVAX-SEED-Omni-8B",
"provider": "naver-hyperclovax",
"parameter_count": "10.7B",
"parameters_raw": 10741664520,
"min_ram_gb": 6.0,
"recommended_ram_gb": 10.0,
"min_vram_gb": 5.5,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "vlm",
"hf_downloads": 102546,
"hf_likes": 181,
"release_date": "2025-12-23",
"_discovered": true
},
{
"name": "speakleash/Bielik-11B-v3.0-Instruct",
"provider": "speakleash",
"parameter_count": "11.2B",
"parameters_raw": 11168796672,
"min_ram_gb": 6.2,
"recommended_ram_gb": 10.4,
"min_vram_gb": 5.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 232376,
"hf_likes": 55,
"release_date": "2025-11-07",
"_discovered": true
},
{
"name": "cjvt/GaMS3-12B-Instruct",
"provider": "cjvt",
"parameter_count": "11.8B",
"parameters_raw": 11766034176,
"min_ram_gb": 6.6,
"recommended_ram_gb": 11.0,
"min_vram_gb": 6.0,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma3_text",
"hf_downloads": 26653,
"hf_likes": 1,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "EleutherAI/pythia-12b",
"provider": "eleutherai",
"parameter_count": "12.0B",
"parameters_raw": 11997067840,
"min_ram_gb": 6.7,
"recommended_ram_gb": 11.2,
"min_vram_gb": 6.1,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_neox",
"hf_downloads": 43453,
"hf_likes": 144,
"release_date": "2023-02-28",
"_discovered": true
},
{
"name": "google/gemma-3-12b-it",
"provider": "Google",
"parameter_count": "12B",
"parameters_raw": 12000000000,
"min_ram_gb": 6.7,
"recommended_ram_gb": 11.2,
"min_vram_gb": 6.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Multimodal, vision and text",
"pipeline_tag": "text-generation",
"architecture": "gemma3",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "unsloth/gemma-3-12b-it-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "mistralai/Mistral-Nemo-Instruct-2407",
"provider": "Mistral AI",
"parameter_count": "12.2B",
"parameters_raw": 12247076864,
"min_ram_gb": 6.8,
"recommended_ram_gb": 11.4,
"min_vram_gb": 6.3,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "unsloth/Mistral-Nemo-Instruct-2407-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Mistral-Nemo-Instruct-2407-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "casperhansen/mistral-nemo-instruct-2407-awq",
"provider": "casperhansen",
"parameter_count": "12.2B",
"parameters_raw": 12247782400,
"min_ram_gb": 6.8,
"recommended_ram_gb": 11.4,
"min_vram_gb": 6.3,
"quantization": "AWQ-4bit",
"context_length": 1024000,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 189490,
"hf_likes": 12,
"release_date": "2024-07-23",
"_discovered": true,
"format": "awq"
},
{
"name": "m8than/Mistral-Nemo-Instruct-2407-lenient-chatfix",
"provider": "m8than",
"parameter_count": "12.2B",
"parameters_raw": 12247782400,
"min_ram_gb": 6.8,
"recommended_ram_gb": 11.4,
"min_vram_gb": 6.3,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 25879,
"hf_likes": 0,
"release_date": "2025-05-06",
"_discovered": true
},
{
"name": "mixtao/MixTAO-7Bx2-MoE-v8.1",
"provider": "mixtao",
"parameter_count": "12.9B",
"parameters_raw": 12879138816,
"min_ram_gb": 7.2,
"recommended_ram_gb": 12.0,
"min_vram_gb": 6.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mixtral",
"hf_downloads": 20213,
"hf_likes": 55,
"release_date": "2024-02-26",
"is_moe": true,
"num_experts": 2,
"active_experts": 2,
"active_parameters": 12879138816,
"_discovered": true
},
{
"name": "microsoft/Orca-2-13b",
"provider": "Microsoft",
"parameter_count": "13.0B",
"parameters_raw": 13015864320,
"min_ram_gb": 7.3,
"recommended_ram_gb": 12.1,
"min_vram_gb": 6.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Reasoning, step-by-step solutions",
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "lmsys/vicuna-13b-v1.5",
"provider": "LMSYS",
"parameter_count": "13.0B",
"parameters_raw": 13015864320,
"min_ram_gb": 7.3,
"recommended_ram_gb": 12.1,
"min_vram_gb": 6.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "WizardLMTeam/WizardLM-13B-V1.2",
"provider": "WizardLM",
"parameter_count": "13.0B",
"parameters_raw": 13015864320,
"min_ram_gb": 7.3,
"recommended_ram_gb": 12.1,
"min_vram_gb": 6.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "cais/HarmBench-Llama-2-13b-cls",
"provider": "cais",
"parameter_count": "13.0B",
"parameters_raw": 13015864320,
"min_ram_gb": 7.3,
"recommended_ram_gb": 12.1,
"min_vram_gb": 6.7,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 30370,
"hf_likes": 27,
"release_date": "2024-02-03",
"_discovered": true
},
{
"name": "meta-llama/CodeLlama-13b-Instruct-hf",
"provider": "Meta",
"parameter_count": "13.0B",
"parameters_raw": 13016028160,
"min_ram_gb": 7.3,
"recommended_ram_gb": 12.1,
"min_vram_gb": 6.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 6450,
"hf_likes": 27,
"release_date": "2024-03-13"
},
{
"name": "microsoft/phi-4",
"provider": "Microsoft",
"parameter_count": "14B",
"parameters_raw": 14000000000,
"min_ram_gb": 7.8,
"recommended_ram_gb": 13.0,
"min_vram_gb": 7.2,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Reasoning, STEM, code generation",
"pipeline_tag": "text-generation",
"architecture": "phi",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "unsloth/phi-4-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/phi-4-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "microsoft/Phi-3-medium-14b-instruct",
"provider": "Microsoft",
"parameter_count": "14B",
"parameters_raw": 14000000000,
"min_ram_gb": 7.8,
"recommended_ram_gb": 13.0,
"min_vram_gb": 7.2,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Balanced performance and size",
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "microsoft/Phi-4-reasoning",
"provider": "Microsoft",
"parameter_count": "14B",
"parameters_raw": 14000000000,
"min_ram_gb": 7.8,
"recommended_ram_gb": 13.0,
"min_vram_gb": 7.2,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Advanced reasoning, math and code",
"pipeline_tag": "text-generation",
"architecture": "phi4",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-04-01",
"gguf_sources": [
{
"repo": "unsloth/Phi-4-reasoning-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "microsoft/Phi-4-multimodal-instruct",
"provider": "Microsoft",
"parameter_count": "14B",
"parameters_raw": 14000000000,
"min_ram_gb": 7.8,
"recommended_ram_gb": 13.0,
"min_vram_gb": 7.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Multimodal, vision and audio",
"pipeline_tag": "image-text-to-text",
"architecture": "phi4",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-04-01"
},
{
"name": "Qwen/Qwen-14B-Chat-Int4",
"provider": "Alibaba",
"parameter_count": "14.2B",
"parameters_raw": 14168796160,
"min_ram_gb": 7.9,
"recommended_ram_gb": 13.2,
"min_vram_gb": 7.3,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen",
"hf_downloads": 45732,
"hf_likes": 100,
"release_date": "2023-09-24",
"_discovered": true
},
{
"name": "Qwen/Qwen1.5-MoE-A2.7B",
"provider": "Alibaba",
"parameter_count": "14.3B",
"parameters_raw": 14315784192,
"min_ram_gb": 8.0,
"recommended_ram_gb": 13.3,
"min_vram_gb": 7.3,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2_moe",
"hf_downloads": 59931,
"hf_likes": 220,
"release_date": "2024-02-29",
"is_moe": true,
"num_experts": 60,
"active_experts": 4,
"active_parameters": 1622455541,
"_discovered": true
},
{
"name": "bullpoint/Qwen3-Coder-Next-AWQ-4bit",
"provider": "bullpoint",
"parameter_count": "14.4B",
"parameters_raw": 14444722944,
"min_ram_gb": 8.1,
"recommended_ram_gb": 13.5,
"min_vram_gb": 7.4,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 1226868,
"hf_likes": 14,
"release_date": "2026-02-03",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 990253467,
"_discovered": true,
"format": "awq"
},
{
"name": "stelterlab/phi-4-AWQ",
"provider": "stelterlab",
"parameter_count": "14.7B",
"parameters_raw": 14659507200,
"min_ram_gb": 8.2,
"recommended_ram_gb": 13.7,
"min_vram_gb": 7.5,
"quantization": "AWQ-4bit",
"context_length": 16384,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "phi3",
"hf_downloads": 55064,
"hf_likes": 4,
"release_date": "2025-01-11",
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-Next-80B-A3B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "80.0B",
"parameters_raw": 80000000000,
"min_ram_gb": 8.2,
"recommended_ram_gb": 13.7,
"min_vram_gb": 7.5,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 192744,
"hf_likes": 61,
"release_date": "2025-09-12",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-Next-80B-A3B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "80.0B",
"parameters_raw": 80000000000,
"min_ram_gb": 8.2,
"recommended_ram_gb": 13.7,
"min_vram_gb": 7.5,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 168561,
"hf_likes": 22,
"release_date": "2025-09-12",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen3-14B-AWQ",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14768307200,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "AWQ-4bit",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 258163,
"hf_likes": 57,
"release_date": "2025-05-01",
"_discovered": true,
"format": "awq"
},
{
"name": "OpenPipe/Qwen3-14B-Instruct",
"provider": "openpipe",
"parameter_count": "14.8B",
"parameters_raw": 14768307200,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 207053,
"hf_likes": 12,
"release_date": "2025-10-10",
"_discovered": true
},
{
"name": "Goekdeniz-Guelmez/Josiefied-Qwen3-14B-abliterated-v3",
"provider": "goekdeniz-guelmez",
"parameter_count": "14.8B",
"parameters_raw": 14768307200,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 55059,
"hf_likes": 24,
"release_date": "2025-05-12",
"_discovered": true
},
{
"name": "Qwen/Qwen3-14B-Base",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14768307200,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 50835,
"hf_likes": 49,
"release_date": "2025-04-28",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-14B-Instruct",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770000000,
"min_ram_gb": 8.2,
"recommended_ram_gb": 13.7,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-14B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen3-14B",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770000000,
"min_ram_gb": 8.2,
"recommended_ram_gb": 13.7,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "unsloth/Qwen3-14B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen2.5-Coder-14B-Instruct",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 491583,
"hf_likes": 142,
"release_date": "2024-11-06",
"gguf_sources": [
{
"repo": "unsloth/Qwen2.5-Coder-14B-Instruct-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Qwen2.5-Coder-14B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-14B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1077036,
"hf_likes": 27,
"release_date": "2024-09-17",
"_discovered": true,
"format": "awq"
},
{
"name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
"provider": "DeepSeek",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 761474,
"hf_likes": 608,
"release_date": "2025-01-20",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/DeepSeek-R1-Distill-Qwen-14B-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/DeepSeek-R1-Distill-Qwen-14B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-Coder-14B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 168345,
"hf_likes": 16,
"release_date": "2024-11-09",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2.5-14B",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 100307,
"hf_likes": 144,
"release_date": "2024-09-15",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-14B-Instruct-GPTQ-Int4",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "GPTQ-Int4",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 93325,
"hf_likes": 26,
"release_date": "2024-09-17",
"_discovered": true,
"format": "gptq"
},
{
"name": "Qwen/Qwen2.5-14B-Instruct-1M",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 1010000,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 54355,
"hf_likes": 334,
"release_date": "2025-01-23",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-14B-Instruct-1M-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "OpenDFM/ChemDFM-R-14B",
"provider": "opendfm",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 41195,
"hf_likes": 6,
"release_date": "2025-10-26",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-14B-Instruct-GPTQ-Int8",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "GPTQ-Int8",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 37961,
"hf_likes": 21,
"release_date": "2024-09-17",
"_discovered": true,
"format": "gptq"
},
{
"name": "Qwen/Qwen2.5-Coder-14B",
"provider": "Alibaba",
"parameter_count": "14.8B",
"parameters_raw": 14770033664,
"min_ram_gb": 8.3,
"recommended_ram_gb": 13.8,
"min_vram_gb": 7.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 27181,
"hf_likes": 66,
"release_date": "2024-11-08",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-Coder-14B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "WizardLMTeam/WizardCoder-15B-V1.0",
"provider": "WizardLM",
"parameter_count": "15.5B",
"parameters_raw": 15515334656,
"min_ram_gb": 8.7,
"recommended_ram_gb": 14.5,
"min_vram_gb": 7.9,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Code generation and completion",
"pipeline_tag": "text-generation",
"architecture": "starcoder",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "nvidia/Qwen3-30B-A3B-NVFP4",
"provider": "nvidia",
"parameter_count": "15.6B",
"parameters_raw": 15583623168,
"min_ram_gb": 8.7,
"recommended_ram_gb": 14.5,
"min_vram_gb": 8.0,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 63897,
"hf_likes": 24,
"release_date": "2025-07-08",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 1704458782,
"_discovered": true
},
{
"name": "NVFP4/Qwen3-Coder-30B-A3B-Instruct-FP4",
"provider": "nvfp4",
"parameter_count": "15.6B",
"parameters_raw": 15583623168,
"min_ram_gb": 8.7,
"recommended_ram_gb": 14.5,
"min_vram_gb": 8.0,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 25920,
"hf_likes": 11,
"release_date": "2025-08-05",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 1704458782,
"_discovered": true
},
{
"name": "bigcode/starcoder2-15b",
"provider": "BigCode",
"parameter_count": "15.7B",
"parameters_raw": 15700000000,
"min_ram_gb": 8.8,
"recommended_ram_gb": 14.6,
"min_vram_gb": 8.0,
"quantization": "Q4_K_M",
"context_length": 16384,
"use_case": "Code generation and completion",
"pipeline_tag": "text-generation",
"architecture": "starcoder2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct",
"provider": "DeepSeek",
"parameter_count": "16B",
"parameters_raw": 15700000000,
"min_ram_gb": 8.8,
"recommended_ram_gb": 14.6,
"min_vram_gb": 8.0,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Code generation and completion",
"pipeline_tag": "text-generation",
"architecture": "deepseek_v2",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 2400000000,
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "bartowski/DeepSeek-Coder-V2-Lite-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "deepseek-ai/DeepSeek-V2-Lite-Chat",
"provider": "DeepSeek",
"parameter_count": "15.7B",
"parameters_raw": 15706484224,
"min_ram_gb": 8.8,
"recommended_ram_gb": 14.6,
"min_vram_gb": 8.0,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v2",
"hf_downloads": 330400,
"hf_likes": 134,
"release_date": "2024-05-15",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 2184182961,
"_discovered": true
},
{
"name": "deepseek-ai/DeepSeek-V2-Lite",
"provider": "DeepSeek",
"parameter_count": "15.7B",
"parameters_raw": 15706484224,
"min_ram_gb": 8.8,
"recommended_ram_gb": 14.6,
"min_vram_gb": 8.0,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v2",
"hf_downloads": 194737,
"hf_likes": 167,
"release_date": "2024-05-15",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 2184182961,
"_discovered": true
},
{
"name": "RedHatAI/DeepSeek-Coder-V2-Lite-Instruct-FP8",
"provider": "redhatai",
"parameter_count": "15.7B",
"parameters_raw": 15706484224,
"min_ram_gb": 8.8,
"recommended_ram_gb": 14.6,
"min_vram_gb": 8.0,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v2",
"hf_downloads": 53780,
"hf_likes": 9,
"release_date": "2024-07-17",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 2184182961,
"_discovered": true
},
{
"name": "moonshotai/Moonlight-16B-A3B",
"provider": "moonshotai",
"parameter_count": "16.0B",
"parameters_raw": 15960111936,
"min_ram_gb": 8.9,
"recommended_ram_gb": 14.9,
"min_vram_gb": 8.2,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 45835,
"hf_likes": 108,
"release_date": "2025-02-22",
"is_moe": true,
"num_experts": 256,
"active_experts": 6,
"active_parameters": 1153367458,
"_discovered": true
},
{
"name": "moonshotai/Moonlight-16B-A3B-Instruct",
"provider": "moonshotai",
"parameter_count": "16.0B",
"parameters_raw": 15960111936,
"min_ram_gb": 8.9,
"recommended_ram_gb": 14.9,
"min_vram_gb": 8.2,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 38514,
"hf_likes": 192,
"release_date": "2025-02-22",
"is_moe": true,
"num_experts": 256,
"active_experts": 6,
"active_parameters": 1153367458,
"_discovered": true
},
{
"name": "inclusionAI/LLaDA2.1-mini",
"provider": "inclusionai",
"parameter_count": "16.3B",
"parameters_raw": 16255643392,
"min_ram_gb": 9.1,
"recommended_ram_gb": 15.1,
"min_vram_gb": 8.3,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llada2_moe",
"hf_downloads": 21824,
"hf_likes": 94,
"release_date": "2026-02-09",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 1295371577,
"_discovered": true
},
{
"name": "deepseek-ai/deepseek-moe-16b-base",
"provider": "DeepSeek",
"parameter_count": "16.4B",
"parameters_raw": 16375728128,
"min_ram_gb": 9.2,
"recommended_ram_gb": 15.3,
"min_vram_gb": 8.4,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek",
"hf_downloads": 22326,
"hf_likes": 139,
"release_date": "2024-01-08",
"_discovered": true
},
{
"name": "inclusionAI/Ling-lite",
"provider": "inclusionai",
"parameter_count": "16.8B",
"parameters_raw": 16801974272,
"min_ram_gb": 9.4,
"recommended_ram_gb": 15.6,
"min_vram_gb": 8.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "bailing_moe",
"hf_downloads": 388,
"hf_likes": 78,
"release_date": "2025-02-28",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 2336524543
},
{
"name": "nvidia/Qwen3-32B-NVFP4",
"provider": "nvidia",
"parameter_count": "17.2B",
"parameters_raw": 17159312384,
"min_ram_gb": 9.6,
"recommended_ram_gb": 16.0,
"min_vram_gb": 8.8,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 26285,
"hf_likes": 11,
"release_date": "2025-09-09",
"_discovered": true
},
{
"name": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-NVFP4",
"provider": "nvidia",
"parameter_count": "18.2B",
"parameters_raw": 18237772608,
"min_ram_gb": 10.2,
"recommended_ram_gb": 17.0,
"min_vram_gb": 9.3,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron_h",
"hf_downloads": 490404,
"hf_likes": 105,
"release_date": "2025-12-20",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.5-Air-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "18.6B",
"parameters_raw": 18626406504,
"min_ram_gb": 10.4,
"recommended_ram_gb": 17.3,
"min_vram_gb": 9.5,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 260177,
"hf_likes": 27,
"release_date": "2025-07-29",
"_discovered": true,
"format": "awq"
},
{
"name": "QuantTrio/GLM-4.5-Air-GPTQ-Int4-Int8Mix",
"provider": "quanttrio",
"parameter_count": "19.8B",
"parameters_raw": 19809102592,
"min_ram_gb": 11.1,
"recommended_ram_gb": 18.4,
"min_vram_gb": 10.1,
"quantization": "GPTQ-Int4",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 24759,
"hf_likes": 10,
"release_date": "2025-07-30",
"_discovered": true,
"format": "gptq"
},
{
"name": "internlm/internlm2-chat-20b",
"provider": "internlm",
"parameter_count": "19.9B",
"parameters_raw": 19861149696,
"min_ram_gb": 11.1,
"recommended_ram_gb": 18.5,
"min_vram_gb": 10.2,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "internlm2",
"hf_downloads": 20010,
"hf_likes": 88,
"release_date": "2024-01-10",
"_discovered": true
},
{
"name": "openai/gpt-oss-20b",
"provider": "openai",
"parameter_count": "21B",
"parameters_raw": 21000000000,
"min_ram_gb": 16.0,
"recommended_ram_gb": 24.0,
"min_vram_gb": 16.0,
"quantization": "BF16",
"context_length": 131072,
"use_case": "Chat, reasoning, tool use",
"is_moe": true,
"num_experts": 32,
"active_experts": 4,
"active_parameters": 3600000000,
"release_date": "2025-08-08",
"pipeline_tag": "text-generation",
"architecture": "gpt_oss",
"hf_downloads": 7259974,
"hf_likes": 4470,
"gguf_sources": [
{
"repo": "unsloth/gpt-oss-20b-GGUF",
"provider": "unsloth"
},
{
"repo": "ggml-org/gpt-oss-20b-GGUF",
"provider": "ggml-org"
},
{
"repo": "lmstudio-community/gpt-oss-20b-GGUF",
"provider": "lmstudio-community"
}
],
"capabilities": [
"tool_use"
]
},
{
"name": "RedHatAI/gpt-oss-20b",
"provider": "redhatai",
"parameter_count": "21.5B",
"parameters_raw": 21511953984,
"min_ram_gb": 12.0,
"recommended_ram_gb": 20.0,
"min_vram_gb": 11.0,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_oss",
"hf_downloads": 20506,
"hf_likes": 5,
"release_date": "2025-09-04",
"is_moe": true,
"num_experts": 32,
"active_experts": 4,
"active_parameters": 3630142231,
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/gpt-oss-20b-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "lmstudio-community/ERNIE-4.5-21B-A3B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "21.8B",
"parameters_raw": 21825436160,
"min_ram_gb": 12.2,
"recommended_ram_gb": 20.3,
"min_vram_gb": 11.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "ernie4_5_moe",
"hf_downloads": 24749,
"hf_likes": 1,
"release_date": "2025-07-09",
"_discovered": true
},
{
"name": "lmstudio-community/ERNIE-4.5-21B-A3B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "21.8B",
"parameters_raw": 21825436160,
"min_ram_gb": 12.2,
"recommended_ram_gb": 20.3,
"min_vram_gb": 11.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "ernie4_5_moe",
"hf_downloads": 24612,
"hf_likes": 1,
"release_date": "2025-07-10",
"_discovered": true
},
{
"name": "lmstudio-community/ERNIE-4.5-21B-A3B-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "21.8B",
"parameters_raw": 21825436160,
"min_ram_gb": 12.2,
"recommended_ram_gb": 20.3,
"min_vram_gb": 11.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "ernie4_5_moe",
"hf_downloads": 24573,
"hf_likes": 1,
"release_date": "2025-07-10",
"_discovered": true
},
{
"name": "solidrust/Codestral-22B-v0.1-hf-AWQ",
"provider": "solidrust",
"parameter_count": "22.2B",
"parameters_raw": 22247282688,
"min_ram_gb": 12.4,
"recommended_ram_gb": 20.7,
"min_vram_gb": 11.4,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 84893,
"hf_likes": 2,
"release_date": "2024-05-30",
"_discovered": true,
"format": "awq"
},
{
"name": "stelterlab/Mistral-Small-24B-Instruct-2501-AWQ",
"provider": "stelterlab",
"parameter_count": "23.6B",
"parameters_raw": 23572403200,
"min_ram_gb": 13.2,
"recommended_ram_gb": 22.0,
"min_vram_gb": 12.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 266172,
"hf_likes": 26,
"release_date": "2025-01-30",
"_discovered": true,
"format": "awq"
},
{
"name": "lmstudio-community/Devstral-Small-2507-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "23.6B",
"parameters_raw": 23572403200,
"min_ram_gb": 13.2,
"recommended_ram_gb": 22.0,
"min_vram_gb": 12.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 19891,
"hf_likes": 2,
"release_date": "2025-07-09",
"_discovered": true
},
{
"name": "lmstudio-community/LFM2-24B-A2B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "23.8B",
"parameters_raw": 23843659008,
"min_ram_gb": 13.3,
"recommended_ram_gb": 22.2,
"min_vram_gb": 12.2,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 207367,
"hf_likes": 1,
"release_date": "2026-02-23",
"is_moe": true,
"num_experts": 64,
"active_experts": 4,
"active_parameters": 2607900202,
"_discovered": true
},
{
"name": "lmstudio-community/LFM2-24B-A2B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "23.8B",
"parameters_raw": 23843659008,
"min_ram_gb": 13.3,
"recommended_ram_gb": 22.2,
"min_vram_gb": 12.2,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 205544,
"hf_likes": 2,
"release_date": "2026-02-23",
"is_moe": true,
"num_experts": 64,
"active_experts": 4,
"active_parameters": 2607900202,
"_discovered": true
},
{
"name": "lmstudio-community/LFM2-24B-A2B-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "23.8B",
"parameters_raw": 23843659008,
"min_ram_gb": 13.3,
"recommended_ram_gb": 22.2,
"min_vram_gb": 12.2,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 204884,
"hf_likes": 1,
"release_date": "2026-02-23",
"is_moe": true,
"num_experts": 64,
"active_experts": 4,
"active_parameters": 2607900202,
"_discovered": true
},
{
"name": "lmstudio-community/LFM2-24B-A2B-MLX-5bit",
"provider": "lmstudio-community",
"parameter_count": "23.8B",
"parameters_raw": 23843659008,
"min_ram_gb": 13.3,
"recommended_ram_gb": 22.2,
"min_vram_gb": 12.2,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 204308,
"hf_likes": 1,
"release_date": "2026-02-23",
"is_moe": true,
"num_experts": 64,
"active_experts": 4,
"active_parameters": 2607900202,
"_discovered": true
},
{
"name": "LiquidAI/LFM2-24B-A2B",
"provider": "Liquid AI",
"parameter_count": "23.8B",
"parameters_raw": 23843661440,
"min_ram_gb": 13.3,
"recommended_ram_gb": 22.2,
"min_vram_gb": 12.2,
"quantization": "Q4_K_M",
"context_length": 128000,
"use_case": "Agentic tasks, RAG, summarization",
"pipeline_tag": "text-generation",
"architecture": "lfm2",
"is_moe": true,
"num_experts": 32,
"active_experts": 4,
"active_parameters": 2300000000,
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-11-28"
},
{
"name": "mistralai/Mistral-Small-24B-Instruct-2501",
"provider": "Mistral AI",
"parameter_count": "24B",
"parameters_raw": 24000000000,
"min_ram_gb": 13.4,
"recommended_ram_gb": 22.4,
"min_vram_gb": 12.3,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "unsloth/Mistral-Small-24B-Instruct-2501-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Mistral-Small-24B-Instruct-2501-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "google/gemma-2-27b-it",
"provider": "Google",
"parameter_count": "27.2B",
"parameters_raw": 27227128320,
"min_ram_gb": 15.2,
"recommended_ram_gb": 25.4,
"min_vram_gb": 13.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma2",
"hf_downloads": 409260,
"hf_likes": 560,
"release_date": "2024-06-24",
"gguf_sources": [
{
"repo": "bartowski/gemma-2-27b-it-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "google/gemma-3-27b-it",
"provider": "Google",
"parameter_count": "27.4B",
"parameters_raw": 27432406640,
"min_ram_gb": 15.3,
"recommended_ram_gb": 25.5,
"min_vram_gb": 14.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose",
"capabilities": [
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "gemma3",
"hf_downloads": 1520563,
"hf_likes": 1905,
"release_date": "2025-03-01",
"gguf_sources": [
{
"repo": "unsloth/gemma-3-27b-it-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3.5-27B",
"provider": "Alibaba",
"parameter_count": "27.8B",
"parameters_raw": 27781427952,
"min_ram_gb": 15.5,
"recommended_ram_gb": 25.9,
"min_vram_gb": 14.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 406808,
"hf_likes": 565,
"release_date": "2026-02-24",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-27B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "lmstudio-community/GLM-4.7-Flash-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "29.9B",
"parameters_raw": 29943393920,
"min_ram_gb": 16.7,
"recommended_ram_gb": 27.9,
"min_vram_gb": 15.3,
"quantization": "Q4_K_M",
"context_length": 202752,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe_lite",
"hf_downloads": 1001623,
"hf_likes": 9,
"release_date": "2026-01-19",
"_discovered": true
},
{
"name": "lmstudio-community/GLM-4.7-Flash-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "29.9B",
"parameters_raw": 29943393920,
"min_ram_gb": 16.7,
"recommended_ram_gb": 27.9,
"min_vram_gb": 15.3,
"quantization": "Q4_K_M",
"context_length": 202752,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe_lite",
"hf_downloads": 991211,
"hf_likes": 8,
"release_date": "2026-01-19",
"_discovered": true
},
{
"name": "Qwen/Qwen3-30B-A3B-GPTQ-Int4",
"provider": "Alibaba",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "GPTQ-Int4",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 226311,
"hf_likes": 47,
"release_date": "2025-05-05",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true,
"format": "gptq"
},
{
"name": "lmstudio-community/Qwen3-Coder-30B-A3B-Instruct-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 191895,
"hf_likes": 14,
"release_date": "2025-07-31",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-Coder-30B-A3B-Instruct-MLX-5bit",
"provider": "lmstudio-community",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 185814,
"hf_likes": 4,
"release_date": "2025-08-01",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-Coder-30B-A3B-Instruct-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 181127,
"hf_likes": 12,
"release_date": "2025-07-31",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-Coder-30B-A3B-Instruct-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 179804,
"hf_likes": 4,
"release_date": "2025-07-31",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "Qwen/Qwen3-30B-A3B-Base",
"provider": "Alibaba",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 83458,
"hf_likes": 69,
"release_date": "2025-04-28",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "typhoon-ai/typhoon2.5-qwen3-30b-a3b",
"provider": "typhoon-ai",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 53587,
"hf_likes": 1,
"release_date": "2025-09-23",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ",
"provider": "quanttrio",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 46035,
"hf_likes": 6,
"release_date": "2025-08-01",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true,
"format": "awq"
},
{
"name": "lmstudio-community/Qwen3-30B-A3B-Instruct-2507-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 45854,
"hf_likes": 6,
"release_date": "2025-07-29",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-30B-A3B-Instruct-2507-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 44199,
"hf_likes": 4,
"release_date": "2025-07-29",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-30B-A3B-Instruct-2507-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 43483,
"hf_likes": 0,
"release_date": "2025-07-29",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B",
"provider": "alibaba-nlp",
"parameter_count": "30.5B",
"parameters_raw": 30532122624,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 26559,
"hf_likes": 802,
"release_date": "2025-09-16",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339450907,
"_discovered": true
},
{
"name": "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8",
"provider": "Alibaba",
"parameter_count": "30.5B",
"parameters_raw": 30533947392,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 957458,
"hf_likes": 115,
"release_date": "2025-07-28",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339650489,
"_discovered": true
},
{
"name": "Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8",
"provider": "Alibaba",
"parameter_count": "30.5B",
"parameters_raw": 30533947392,
"min_ram_gb": 17.1,
"recommended_ram_gb": 28.4,
"min_vram_gb": 15.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 265519,
"hf_likes": 164,
"release_date": "2025-07-31",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3339650489,
"_discovered": true
},
{
"name": "QuantTrio/Qwen3-VL-30B-A3B-Instruct-AWQ",
"provider": "quanttrio",
"parameter_count": "31.1B",
"parameters_raw": 31070754032,
"min_ram_gb": 17.4,
"recommended_ram_gb": 28.9,
"min_vram_gb": 15.9,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_vl_moe",
"hf_downloads": 301353,
"hf_likes": 40,
"release_date": "2025-10-04",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 2475950709,
"_discovered": true,
"format": "awq"
},
{
"name": "QuantTrio/GLM-4.7-Flash-AWQ",
"provider": "quanttrio",
"parameter_count": "31.2B",
"parameters_raw": 31221488576,
"min_ram_gb": 17.4,
"recommended_ram_gb": 29.1,
"min_vram_gb": 16.0,
"quantization": "AWQ-4bit",
"context_length": 202752,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe_lite",
"hf_downloads": 103703,
"hf_likes": 7,
"release_date": "2026-01-21",
"_discovered": true,
"format": "awq"
},
{
"name": "lmstudio-community/NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "31.6B",
"parameters_raw": 31577935872,
"min_ram_gb": 17.6,
"recommended_ram_gb": 29.4,
"min_vram_gb": 16.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 195432,
"hf_likes": 2,
"release_date": "2025-12-16",
"_discovered": true
},
{
"name": "lmstudio-community/NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "31.6B",
"parameters_raw": 31577935872,
"min_ram_gb": 17.6,
"recommended_ram_gb": 29.4,
"min_vram_gb": 16.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 190541,
"hf_likes": 3,
"release_date": "2025-12-16",
"_discovered": true
},
{
"name": "lmstudio-community/NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "31.6B",
"parameters_raw": 31577935872,
"min_ram_gb": 17.6,
"recommended_ram_gb": 29.4,
"min_vram_gb": 16.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 188175,
"hf_likes": 0,
"release_date": "2025-12-16",
"_discovered": true
},
{
"name": "lmstudio-community/NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-5bit",
"provider": "lmstudio-community",
"parameter_count": "31.6B",
"parameters_raw": 31577935872,
"min_ram_gb": 17.6,
"recommended_ram_gb": 29.4,
"min_vram_gb": 16.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 188130,
"hf_likes": 0,
"release_date": "2025-12-16",
"_discovered": true
},
{
"name": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16",
"provider": "nvidia",
"parameter_count": "31.6B",
"parameters_raw": 31577937344,
"min_ram_gb": 17.6,
"recommended_ram_gb": 29.4,
"min_vram_gb": 16.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron_h",
"hf_downloads": 1025721,
"hf_likes": 648,
"release_date": "2025-12-04"
},
{
"name": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-Base-BF16",
"provider": "nvidia",
"parameter_count": "31.6B",
"parameters_raw": 31577937344,
"min_ram_gb": 17.6,
"recommended_ram_gb": 29.4,
"min_vram_gb": 16.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 65364,
"hf_likes": 109,
"release_date": "2025-12-03",
"_discovered": true
},
{
"name": "OpenResearcher/OpenResearcher-30B-A3B",
"provider": "openresearcher",
"parameter_count": "31.6B",
"parameters_raw": 31577937344,
"min_ram_gb": 17.6,
"recommended_ram_gb": 29.4,
"min_vram_gb": 16.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron_h",
"hf_downloads": 23630,
"hf_likes": 59,
"release_date": "2026-02-03",
"_discovered": true
},
{
"name": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-FP8",
"provider": "nvidia",
"parameter_count": "31.6B",
"parameters_raw": 31577946256,
"min_ram_gb": 17.6,
"recommended_ram_gb": 29.4,
"min_vram_gb": 16.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron_h",
"hf_downloads": 1412797,
"hf_likes": 289,
"release_date": "2025-12-06",
"_discovered": true
},
{
"name": "LGAI-EXAONE/EXAONE-4.0-32B",
"provider": "LG AI",
"parameter_count": "32B",
"parameters_raw": 32000000000,
"min_ram_gb": 17.9,
"recommended_ram_gb": 29.8,
"min_vram_gb": 16.4,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Hybrid reasoning, multilingual",
"pipeline_tag": "text-generation",
"architecture": "exaone",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-07-15"
},
{
"name": "LGAI-EXAONE/EXAONE-4.0.1-32B",
"provider": "lgai-exaone",
"parameter_count": "32.0B",
"parameters_raw": 32003216384,
"min_ram_gb": 17.9,
"recommended_ram_gb": 29.8,
"min_vram_gb": 16.4,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "exaone4",
"hf_downloads": 186516,
"hf_likes": 24,
"release_date": "2025-07-29",
"_discovered": true
},
{
"name": "LGAI-EXAONE/EXAONE-4.0-32B-FP8",
"provider": "lgai-exaone",
"parameter_count": "32.0B",
"parameters_raw": 32005105664,
"min_ram_gb": 17.9,
"recommended_ram_gb": 29.8,
"min_vram_gb": 16.4,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "exaone4",
"hf_downloads": 20430,
"hf_likes": 17,
"release_date": "2025-07-11",
"_discovered": true
},
{
"name": "allenai/OLMo-2-0325-32B-Instruct",
"provider": "allenai",
"parameter_count": "32.2B",
"parameters_raw": 32234279936,
"min_ram_gb": 18.0,
"recommended_ram_gb": 30.0,
"min_vram_gb": 16.5,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo2",
"hf_downloads": 2979,
"hf_likes": 148,
"release_date": "2025-03-12",
"gguf_sources": [
{
"repo": "unsloth/OLMo-2-0325-32B-Instruct-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen2.5-32B-Instruct",
"provider": "Alibaba",
"parameter_count": "32.5B",
"parameters_raw": 32510000000,
"min_ram_gb": 18.2,
"recommended_ram_gb": 30.3,
"min_vram_gb": 16.7,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-32B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen1.5-32B-Chat",
"provider": "Alibaba",
"parameter_count": "32.5B",
"parameters_raw": 32512218112,
"min_ram_gb": 18.2,
"recommended_ram_gb": 30.3,
"min_vram_gb": 16.7,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 25041,
"hf_likes": 109,
"release_date": "2024-04-03",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen1.5-32B-Chat-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "nn-tech/MetalGPT-1",
"provider": "nn-tech",
"parameter_count": "32.8B",
"parameters_raw": 32759593984,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 20663,
"hf_likes": 38,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "Qwen/Qwen3-32B-AWQ",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32762123264,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "AWQ-4bit",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 552811,
"hf_likes": 129,
"release_date": "2025-05-01",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2.5-Coder-32B-Instruct",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 858975,
"hf_likes": 2000,
"release_date": "2024-11-06",
"gguf_sources": [
{
"repo": "unsloth/Qwen2.5-Coder-32B-Instruct-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Qwen2.5-Coder-32B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
"provider": "DeepSeek",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 873156,
"hf_likes": 1525,
"release_date": "2025-01-20",
"gguf_sources": [
{
"repo": "unsloth/DeepSeek-R1-Distill-Qwen-32B-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/DeepSeek-R1-Distill-Qwen-32B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-32B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1643600,
"hf_likes": 94,
"release_date": "2024-09-17",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2.5-32B",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1453252,
"hf_likes": 173,
"release_date": "2024-09-15",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 973260,
"hf_likes": 33,
"release_date": "2024-11-09",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/QwQ-32B-AWQ",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "AWQ-4bit",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 280279,
"hf_likes": 133,
"release_date": "2025-03-05",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2.5-32B-Instruct-GPTQ-Int4",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "GPTQ-Int4",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 191251,
"hf_likes": 40,
"release_date": "2024-09-17",
"_discovered": true,
"format": "gptq"
},
{
"name": "baichuan-inc/Baichuan-M2-32B",
"provider": "baichuan-inc",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 152016,
"hf_likes": 118,
"release_date": "2025-08-10",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-32B-Instruct-GPTQ-Int8",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "GPTQ-Int8",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 105034,
"hf_likes": 14,
"release_date": "2024-09-17",
"_discovered": true,
"format": "gptq"
},
{
"name": "Qwen/Qwen2.5-Coder-32B",
"provider": "Alibaba",
"parameter_count": "32.8B",
"parameters_raw": 32763876352,
"min_ram_gb": 18.3,
"recommended_ram_gb": 30.5,
"min_vram_gb": 16.8,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 43109,
"hf_likes": 142,
"release_date": "2024-11-08",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-Coder-32B-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "meta-llama/CodeLlama-34b-Instruct-hf",
"provider": "Meta",
"parameter_count": "33.7B",
"parameters_raw": 33743970304,
"min_ram_gb": 18.9,
"recommended_ram_gb": 31.4,
"min_vram_gb": 17.3,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 950,
"hf_likes": 19,
"release_date": "2024-03-14"
},
{
"name": "01-ai/Yi-34B-Chat",
"provider": "01.ai",
"parameter_count": "34.4B",
"parameters_raw": 34386780160,
"min_ram_gb": 19.2,
"recommended_ram_gb": 32.0,
"min_vram_gb": 17.6,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Multilingual, Chinese/English chat",
"pipeline_tag": "text-generation",
"architecture": "yi",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "dphn/dolphin-2.9.1-yi-1.5-34b",
"provider": "dphn",
"parameter_count": "34.4B",
"parameters_raw": 34388917248,
"min_ram_gb": 19.2,
"recommended_ram_gb": 32.0,
"min_vram_gb": 17.6,
"quantization": "Q4_K_M",
"context_length": 8192,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 4650971,
"hf_likes": 56,
"release_date": "2024-05-18",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/dolphin-2.9.1-yi-1.5-34b-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "CohereForAI/c4ai-command-r-v01",
"provider": "Cohere",
"parameter_count": "35B",
"parameters_raw": 35000000000,
"min_ram_gb": 19.5,
"recommended_ram_gb": 32.6,
"min_vram_gb": 17.9,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "RAG, tool use, agents",
"pipeline_tag": "text-generation",
"architecture": "cohere",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "bartowski/c4ai-command-r-v01-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen3.5-35B-A3B",
"provider": "Alibaba",
"parameter_count": "36.0B",
"parameters_raw": 35951822704,
"min_ram_gb": 20.1,
"recommended_ram_gb": 33.5,
"min_vram_gb": 18.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 769032,
"hf_likes": 905,
"release_date": "2026-02-24",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 3000000000,
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-35B-A3B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "lmstudio-community/Seed-OSS-36B-Instruct-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "36.2B",
"parameters_raw": 36151104512,
"min_ram_gb": 20.2,
"recommended_ram_gb": 33.7,
"min_vram_gb": 18.5,
"quantization": "Q4_K_M",
"context_length": 524288,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "seed_oss",
"hf_downloads": 46944,
"hf_likes": 2,
"release_date": "2025-08-26",
"_discovered": true
},
{
"name": "lmstudio-community/Seed-OSS-36B-Instruct-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "36.2B",
"parameters_raw": 36151104512,
"min_ram_gb": 20.2,
"recommended_ram_gb": 33.7,
"min_vram_gb": 18.5,
"quantization": "Q4_K_M",
"context_length": 524288,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "seed_oss",
"hf_downloads": 45348,
"hf_likes": 0,
"release_date": "2025-08-26",
"_discovered": true
},
{
"name": "lmstudio-community/Seed-OSS-36B-Instruct-MLX-5bit",
"provider": "lmstudio-community",
"parameter_count": "36.2B",
"parameters_raw": 36151104512,
"min_ram_gb": 20.2,
"recommended_ram_gb": 33.7,
"min_vram_gb": 18.5,
"quantization": "Q4_K_M",
"context_length": 524288,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "seed_oss",
"hf_downloads": 45061,
"hf_likes": 1,
"release_date": "2025-08-26",
"_discovered": true
},
{
"name": "lmstudio-community/Seed-OSS-36B-Instruct-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "36.2B",
"parameters_raw": 36151104512,
"min_ram_gb": 20.2,
"recommended_ram_gb": 33.7,
"min_vram_gb": 18.5,
"quantization": "Q4_K_M",
"context_length": 524288,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "seed_oss",
"hf_downloads": 44971,
"hf_likes": 0,
"release_date": "2025-08-26",
"_discovered": true
},
{
"name": "cyankiwi/MiniMax-M2.1-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "36.8B",
"parameters_raw": 36811839984,
"min_ram_gb": 20.6,
"recommended_ram_gb": 34.3,
"min_vram_gb": 18.9,
"quantization": "AWQ-4bit",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 36114,
"hf_likes": 16,
"release_date": "2025-12-27",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 2933443495,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/MiniMax-M2.5-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "36.8B",
"parameters_raw": 36811839984,
"min_ram_gb": 20.6,
"recommended_ram_gb": 34.3,
"min_vram_gb": 18.9,
"quantization": "AWQ-4bit",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 24338,
"hf_likes": 6,
"release_date": "2026-02-15",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 2933443495,
"_discovered": true,
"format": "awq"
},
{
"name": "mratsim/MiniMax-M2.5-BF16-INT4-AWQ",
"provider": "mratsim",
"parameter_count": "39.1B",
"parameters_raw": 39115692032,
"min_ram_gb": 21.9,
"recommended_ram_gb": 36.4,
"min_vram_gb": 20.0,
"quantization": "AWQ-4bit",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 46268,
"hf_likes": 29,
"release_date": "2026-02-14",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 3117031705,
"_discovered": true,
"format": "awq"
},
{
"name": "tiiuae/falcon-40b-instruct",
"provider": "TII",
"parameter_count": "40.0B",
"parameters_raw": 40000000000,
"min_ram_gb": 22.4,
"recommended_ram_gb": 37.3,
"min_vram_gb": 20.5,
"quantization": "Q4_K_M",
"context_length": 2048,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "falcon",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "mistralai/Mixtral-8x7B-Instruct-v0.1",
"provider": "Mistral AI",
"parameter_count": "46.7B",
"parameters_raw": 46702792704,
"min_ram_gb": 26.1,
"recommended_ram_gb": 43.5,
"min_vram_gb": 23.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "unknown",
"architecture": "mixtral",
"hf_downloads": 787218,
"hf_likes": 4641,
"release_date": "2023-12-10",
"is_moe": true,
"num_experts": 8,
"active_experts": 2,
"active_parameters": 12900000000
},
{
"name": "Salesforce/xLAM-8x7b-r",
"provider": "salesforce",
"parameter_count": "46.7B",
"parameters_raw": 46702792704,
"min_ram_gb": 26.1,
"recommended_ram_gb": 43.5,
"min_vram_gb": 23.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mixtral",
"hf_downloads": 25430,
"hf_likes": 15,
"release_date": "2024-08-28",
"is_moe": true,
"num_experts": 8,
"active_experts": 2,
"active_parameters": 13427052901,
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/xLAM-8x7b-r-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
"provider": "NousResearch",
"parameter_count": "46.7B",
"parameters_raw": 46702809088,
"min_ram_gb": 26.1,
"recommended_ram_gb": 43.5,
"min_vram_gb": 23.9,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "mixtral",
"hf_downloads": 9050,
"hf_likes": 453,
"release_date": "2024-01-11",
"is_moe": true,
"num_experts": 8,
"active_experts": 2,
"active_parameters": 12900000000
},
{
"name": "moonshotai/Kimi-Linear-48B-A3B-Instruct",
"provider": "moonshotai",
"parameter_count": "49.1B",
"parameters_raw": 49122681728,
"min_ram_gb": 27.4,
"recommended_ram_gb": 45.7,
"min_vram_gb": 25.2,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "kimi_linear",
"hf_downloads": 35486,
"hf_likes": 546,
"release_date": "2025-10-30",
"_discovered": true
},
{
"name": "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5",
"provider": "nvidia",
"parameter_count": "49.9B",
"parameters_raw": 49867145216,
"min_ram_gb": 27.9,
"recommended_ram_gb": 46.4,
"min_vram_gb": 25.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron-nas",
"hf_downloads": 105079,
"hf_likes": 226,
"release_date": "2025-07-25",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/Llama-3_3-Nemotron-Super-49B-v1_5-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "nvidia/Llama-3_3-Nemotron-Super-49B-v1",
"provider": "nvidia",
"parameter_count": "49.9B",
"parameters_raw": 49867145216,
"min_ram_gb": 27.9,
"recommended_ram_gb": 46.4,
"min_vram_gb": 25.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron-nas",
"hf_downloads": 23805,
"hf_likes": 320,
"release_date": "2025-03-16",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/Llama-3_3-Nemotron-Super-49B-v1-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "txn545/Qwen3.5-122B-A10B-NVFP4",
"provider": "txn545",
"parameter_count": "64.4B",
"parameters_raw": 64354266864,
"min_ram_gb": 36.0,
"recommended_ram_gb": 59.9,
"min_vram_gb": 33.0,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_5_moe",
"hf_downloads": 37707,
"hf_likes": 6,
"release_date": "2026-02-24",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 5128230639,
"_discovered": true
},
{
"name": "meta-llama/Llama-3.1-70B-Instruct",
"provider": "Meta",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 801189,
"hf_likes": 894,
"release_date": "2024-07-16"
},
{
"name": "meta-llama/Llama-3.3-70B-Instruct",
"provider": "Meta",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null,
"gguf_sources": [
{
"repo": "unsloth/Llama-3.3-70B-Instruct-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/Llama-3.3-70B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "casperhansen/llama-3.3-70b-instruct-awq",
"provider": "casperhansen",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 674865,
"hf_likes": 39,
"release_date": "2024-12-06",
"_discovered": true,
"format": "awq"
},
{
"name": "kosbu/Llama-3.3-70B-Instruct-AWQ",
"provider": "kosbu",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 505688,
"hf_likes": 10,
"release_date": "2024-12-06",
"_discovered": true,
"format": "awq"
},
{
"name": "ibnzterrell/Meta-Llama-3.3-70B-Instruct-AWQ-INT4",
"provider": "ibnzterrell",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 138353,
"hf_likes": 30,
"release_date": "2024-12-07",
"_discovered": true,
"format": "awq"
},
{
"name": "RedHatAI/Meta-Llama-3.1-70B-Instruct-quantized.w4a16",
"provider": "redhatai",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 116205,
"hf_likes": 32,
"release_date": "2024-07-31",
"_discovered": true
},
{
"name": "meta-llama/Llama-3.1-70B",
"provider": "Meta",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 75498,
"hf_likes": 408,
"release_date": "2024-07-14",
"_discovered": true
},
{
"name": "meta-llama/Meta-Llama-3-70B-Instruct",
"provider": "Meta",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 61023,
"hf_likes": 1506,
"release_date": "2024-04-17",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Meta-Llama-3-70B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "tokyotech-llm/Llama-3.1-Swallow-70B-Instruct-v0.3",
"provider": "tokyotech-llm",
"parameter_count": "70.6B",
"parameters_raw": 70553706496,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 35321,
"hf_likes": 14,
"release_date": "2024-12-25",
"_discovered": true
},
{
"name": "RedHatAI/Meta-Llama-3.1-70B-Instruct-FP8",
"provider": "redhatai",
"parameter_count": "70.6B",
"parameters_raw": 70553707616,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 39962,
"hf_likes": 50,
"release_date": "2024-07-23",
"_discovered": true
},
{
"name": "RedHatAI/Llama-3.3-70B-Instruct-FP8-dynamic",
"provider": "redhatai",
"parameter_count": "70.6B",
"parameters_raw": 70560423936,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 42062,
"hf_likes": 14,
"release_date": "2024-12-11",
"_discovered": true
},
{
"name": "RedHatAI/DeepSeek-R1-Distill-Llama-70B-FP8-dynamic",
"provider": "redhatai",
"parameter_count": "70.6B",
"parameters_raw": 70560423936,
"min_ram_gb": 39.4,
"recommended_ram_gb": 65.7,
"min_vram_gb": 36.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 26238,
"hf_likes": 10,
"release_date": "2025-02-01",
"_discovered": true
},
{
"name": "LLM360/K2-Think-V2",
"provider": "llm360",
"parameter_count": "72.6B",
"parameters_raw": 72550195200,
"min_ram_gb": 40.5,
"recommended_ram_gb": 67.6,
"min_vram_gb": 37.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 53839,
"hf_likes": 23,
"release_date": "2026-01-08",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-72B-Instruct",
"provider": "Alibaba",
"parameter_count": "72.7B",
"parameters_raw": 72706203648,
"min_ram_gb": 40.6,
"recommended_ram_gb": 67.7,
"min_vram_gb": 37.2,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 558153,
"hf_likes": 916,
"release_date": "2024-09-16",
"gguf_sources": [
{
"repo": "bartowski/Qwen2.5-72B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2.5-72B",
"provider": "Alibaba",
"parameter_count": "72.7B",
"parameters_raw": 72706203648,
"min_ram_gb": 40.6,
"recommended_ram_gb": 67.7,
"min_vram_gb": 37.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 45193,
"hf_likes": 89,
"release_date": "2024-09-15",
"_discovered": true
},
{
"name": "Qwen/Qwen2-72B-Instruct",
"provider": "Alibaba",
"parameter_count": "72.7B",
"parameters_raw": 72706203648,
"min_ram_gb": 40.6,
"recommended_ram_gb": 67.7,
"min_vram_gb": 37.2,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 40930,
"hf_likes": 719,
"release_date": "2024-05-28",
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/Qwen2-72B-Instruct-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "Qwen/Qwen2-72B",
"provider": "Alibaba",
"parameter_count": "72.7B",
"parameters_raw": 72706203648,
"min_ram_gb": 40.6,
"recommended_ram_gb": 67.7,
"min_vram_gb": 37.2,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 34455,
"hf_likes": 200,
"release_date": "2024-05-22",
"_discovered": true
},
{
"name": "huihui-ai/Qwen2.5-72B-Instruct-abliterated",
"provider": "huihui-ai",
"parameter_count": "72.7B",
"parameters_raw": 72706203648,
"min_ram_gb": 40.6,
"recommended_ram_gb": 67.7,
"min_vram_gb": 37.2,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 20754,
"hf_likes": 35,
"release_date": "2024-10-26",
"_discovered": true
},
{
"name": "Qwen/Qwen2.5-72B-Instruct-AWQ",
"provider": "Alibaba",
"parameter_count": "73.0B",
"parameters_raw": 72957861888,
"min_ram_gb": 40.8,
"recommended_ram_gb": 67.9,
"min_vram_gb": 37.4,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 922364,
"hf_likes": 75,
"release_date": "2024-09-17",
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen2.5-72B-Instruct-GPTQ-Int8",
"provider": "Alibaba",
"parameter_count": "73.0B",
"parameters_raw": 72957861888,
"min_ram_gb": 40.8,
"recommended_ram_gb": 67.9,
"min_vram_gb": 37.4,
"quantization": "GPTQ-Int8",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 42593,
"hf_likes": 28,
"release_date": "2024-09-17",
"_discovered": true,
"format": "gptq"
},
{
"name": "NexVeridian/Qwen3-Coder-Next-8bit",
"provider": "nexveridian",
"parameter_count": "79.7B",
"parameters_raw": 79674388992,
"min_ram_gb": 44.5,
"recommended_ram_gb": 74.2,
"min_vram_gb": 40.8,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 300258,
"hf_likes": 0,
"release_date": "2026-02-03",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 5462052829,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-Next-80B-A3B-Instruct-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "79.7B",
"parameters_raw": 79674388992,
"min_ram_gb": 44.5,
"recommended_ram_gb": 74.2,
"min_vram_gb": 40.8,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 48644,
"hf_likes": 7,
"release_date": "2025-09-15",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 5462052829,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-Next-80B-A3B-Instruct-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "79.7B",
"parameters_raw": 79674388992,
"min_ram_gb": 44.5,
"recommended_ram_gb": 74.2,
"min_vram_gb": 40.8,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 48355,
"hf_likes": 2,
"release_date": "2025-09-15",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 5462052829,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-Next-80B-A3B-Instruct-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "79.7B",
"parameters_raw": 79674388992,
"min_ram_gb": 44.5,
"recommended_ram_gb": 74.2,
"min_vram_gb": 40.8,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 47109,
"hf_likes": 0,
"release_date": "2025-09-15",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 5462052829,
"_discovered": true
},
{
"name": "lmstudio-community/Qwen3-Next-80B-A3B-Instruct-MLX-5bit",
"provider": "lmstudio-community",
"parameter_count": "79.7B",
"parameters_raw": 79674388992,
"min_ram_gb": 44.5,
"recommended_ram_gb": 74.2,
"min_vram_gb": 40.8,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 47029,
"hf_likes": 0,
"release_date": "2025-09-15",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 5462052829,
"_discovered": true
},
{
"name": "Qwen/Qwen3-Coder-Next",
"provider": "Alibaba",
"parameter_count": "80B",
"parameters_raw": 80000000000,
"min_ram_gb": 44.8,
"recommended_ram_gb": 74.6,
"min_vram_gb": 41.0,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation, agentic coding",
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"is_moe": true,
"num_experts": 64,
"active_experts": 4,
"active_parameters": 3000000000,
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2026-01-30",
"gguf_sources": [
{
"repo": "unsloth/Qwen3-Coder-Next-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3-Coder-Next-FP8",
"provider": "Alibaba",
"parameter_count": "79.7B",
"parameters_raw": 79679212800,
"min_ram_gb": 44.5,
"recommended_ram_gb": 74.2,
"min_vram_gb": 40.8,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 398505,
"hf_likes": 100,
"release_date": "2026-02-01",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 5462383530,
"_discovered": true
},
{
"name": "Qwen/Qwen3-Next-80B-A3B-Instruct",
"provider": "Alibaba",
"parameter_count": "81.3B",
"parameters_raw": 81324862720,
"min_ram_gb": 45.4,
"recommended_ram_gb": 75.7,
"min_vram_gb": 41.7,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 1224711,
"hf_likes": 945,
"release_date": "2025-09-09",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 5575200546,
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/Qwen3-Next-80B-A3B-Instruct-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3-Next-80B-A3B-Instruct-FP8",
"provider": "Alibaba",
"parameter_count": "81.3B",
"parameters_raw": 81329784384,
"min_ram_gb": 45.4,
"recommended_ram_gb": 75.7,
"min_vram_gb": 41.7,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 148887,
"hf_likes": 82,
"release_date": "2025-09-22",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 5575537949,
"_discovered": true
},
{
"name": "Qwen/Qwen1.5-110B-Chat-AWQ",
"provider": "Alibaba",
"parameter_count": "111.2B",
"parameters_raw": 111209914368,
"min_ram_gb": 62.1,
"recommended_ram_gb": 103.6,
"min_vram_gb": 57.0,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 320397,
"hf_likes": 9,
"release_date": "2024-04-27",
"_discovered": true,
"format": "awq"
},
{
"name": "lmstudio-community/gpt-oss-120b-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "116.8B",
"parameters_raw": 116829154368,
"min_ram_gb": 65.3,
"recommended_ram_gb": 108.8,
"min_vram_gb": 59.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_oss",
"hf_downloads": 61730,
"hf_likes": 12,
"release_date": "2025-08-05",
"is_moe": true,
"num_experts": 128,
"active_experts": 4,
"active_parameters": 9309823238,
"_discovered": true
},
{
"name": "axolotl-ai-co/gpt-oss-120b-dequantized",
"provider": "axolotl-ai-co",
"parameter_count": "116.8B",
"parameters_raw": 116829156672,
"min_ram_gb": 65.3,
"recommended_ram_gb": 108.8,
"min_vram_gb": 59.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gpt_oss",
"hf_downloads": 34254,
"hf_likes": 0,
"release_date": "2025-08-07",
"is_moe": true,
"num_experts": 128,
"active_experts": 4,
"active_parameters": 9309823421,
"_discovered": true
},
{
"name": "openai/gpt-oss-120b",
"provider": "openai",
"parameter_count": "117B",
"parameters_raw": 117000000000,
"min_ram_gb": 80.0,
"recommended_ram_gb": 96.0,
"min_vram_gb": 80.0,
"quantization": "BF16",
"context_length": 131072,
"use_case": "Chat, reasoning, tool use",
"is_moe": true,
"num_experts": 128,
"active_experts": 4,
"active_parameters": 5100000000,
"release_date": "2025-08-08",
"pipeline_tag": "text-generation",
"architecture": "gpt_oss",
"hf_downloads": 4628743,
"hf_likes": 4600,
"gguf_sources": [
{
"repo": "ggml-org/gpt-oss-120b-GGUF",
"provider": "ggml-org"
},
{
"repo": "unsloth/gpt-oss-120b-GGUF",
"provider": "unsloth"
}
],
"capabilities": [
"tool_use"
]
},
{
"name": "Qwen/Qwen3.5-122B-A10B",
"provider": "Alibaba",
"parameter_count": "125.1B",
"parameters_raw": 125086497008,
"min_ram_gb": 69.9,
"recommended_ram_gb": 116.5,
"min_vram_gb": 64.1,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 171055,
"hf_likes": 389,
"release_date": "2026-02-24",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 10000000000,
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-122B-A10B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "mistralai/Mixtral-8x22B-Instruct-v0.1",
"provider": "Mistral AI",
"parameter_count": "140.6B",
"parameters_raw": 140630071296,
"min_ram_gb": 78.6,
"recommended_ram_gb": 131.0,
"min_vram_gb": 72.0,
"quantization": "Q4_K_M",
"context_length": 65536,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "unknown",
"architecture": "mixtral",
"hf_downloads": 15022,
"hf_likes": 746,
"release_date": "2024-04-16",
"is_moe": true,
"num_experts": 8,
"active_experts": 2,
"active_parameters": 39100000000
},
{
"name": "MaziyarPanahi/Mixtral-8x22B-Instruct-v0.1-AWQ",
"provider": "maziyarpanahi",
"parameter_count": "140.6B",
"parameters_raw": 140630071296,
"min_ram_gb": 78.6,
"recommended_ram_gb": 131.0,
"min_vram_gb": 72.0,
"quantization": "AWQ-4bit",
"context_length": 65536,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mixtral",
"hf_downloads": 40221,
"hf_likes": 13,
"release_date": "2024-04-18",
"is_moe": true,
"num_experts": 8,
"active_experts": 2,
"active_parameters": 40431145496,
"_discovered": true,
"format": "awq"
},
{
"name": "rednote-hilab/dots.llm1.inst",
"provider": "rednote-hilab",
"parameter_count": "142.8B",
"parameters_raw": 142774381696,
"min_ram_gb": 79.8,
"recommended_ram_gb": 133.0,
"min_vram_gb": 73.1,
"quantization": "Q4_K_M",
"context_length": 32768,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "dots1",
"hf_downloads": 5040,
"hf_likes": 175,
"release_date": "2025-05-14",
"gguf_sources": [
{
"repo": "unsloth/dots.llm1.inst-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "bigscience/bloom",
"provider": "bigscience",
"parameter_count": "176.2B",
"parameters_raw": 176247271424,
"min_ram_gb": 98.5,
"recommended_ram_gb": 164.1,
"min_vram_gb": 90.3,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "bloom",
"hf_downloads": 4896,
"hf_likes": 4986,
"release_date": "2022-05-19"
},
{
"name": "tiiuae/falcon-180B-chat",
"provider": "TII",
"parameter_count": "179.5B",
"parameters_raw": 179522565120,
"min_ram_gb": 100.3,
"recommended_ram_gb": 167.2,
"min_vram_gb": 92.0,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "falcon",
"hf_downloads": 65,
"hf_likes": 545,
"release_date": "2023-09-04"
},
{
"name": "stepfun-ai/Step-3.5-Flash",
"provider": "stepfun-ai",
"parameter_count": "199.4B",
"parameters_raw": 199384301376,
"min_ram_gb": 111.4,
"recommended_ram_gb": 185.7,
"min_vram_gb": 102.1,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "step3p5",
"hf_downloads": 327178,
"hf_likes": 674,
"release_date": "2026-02-01",
"_discovered": true
},
{
"name": "lmstudio-community/MiniMax-M2.5-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "228.7B",
"parameters_raw": 228689748992,
"min_ram_gb": 127.8,
"recommended_ram_gb": 213.0,
"min_vram_gb": 117.1,
"quantization": "Q4_K_M",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 112426,
"hf_likes": 1,
"release_date": "2026-02-13",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 18223714369,
"_discovered": true
},
{
"name": "lmstudio-community/MiniMax-M2.5-MLX-4bit",
"provider": "lmstudio-community",
"parameter_count": "228.7B",
"parameters_raw": 228689748992,
"min_ram_gb": 127.8,
"recommended_ram_gb": 213.0,
"min_vram_gb": 117.1,
"quantization": "Q4_K_M",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 105419,
"hf_likes": 0,
"release_date": "2026-02-13",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 18223714369,
"_discovered": true
},
{
"name": "lmstudio-community/MiniMax-M2.5-MLX-6bit",
"provider": "lmstudio-community",
"parameter_count": "228.7B",
"parameters_raw": 228689748992,
"min_ram_gb": 127.8,
"recommended_ram_gb": 213.0,
"min_vram_gb": 117.1,
"quantization": "Q4_K_M",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 103821,
"hf_likes": 0,
"release_date": "2026-02-13",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 18223714369,
"_discovered": true
},
{
"name": "lmstudio-community/MiniMax-M2-MLX-8bit",
"provider": "lmstudio-community",
"parameter_count": "228.7B",
"parameters_raw": 228689748992,
"min_ram_gb": 127.8,
"recommended_ram_gb": 213.0,
"min_vram_gb": 117.1,
"quantization": "Q4_K_M",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax",
"hf_downloads": 19959,
"hf_likes": 0,
"release_date": "2025-10-29",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 18223714369,
"_discovered": true
},
{
"name": "QuantTrio/MiniMax-M2-AWQ",
"provider": "quanttrio",
"parameter_count": "228.7B",
"parameters_raw": 228689764864,
"min_ram_gb": 127.8,
"recommended_ram_gb": 213.0,
"min_vram_gb": 117.1,
"quantization": "AWQ-4bit",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mixtral",
"hf_downloads": 586558,
"hf_likes": 8,
"release_date": "2025-10-28",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 18223715635,
"_discovered": true,
"format": "awq"
},
{
"name": "QuantTrio/MiniMax-M2.5-AWQ",
"provider": "quanttrio",
"parameter_count": "228.7B",
"parameters_raw": 228689764864,
"min_ram_gb": 127.8,
"recommended_ram_gb": 213.0,
"min_vram_gb": 117.1,
"quantization": "AWQ-4bit",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 45340,
"hf_likes": 10,
"release_date": "2026-02-15",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 18223715635,
"_discovered": true,
"format": "awq"
},
{
"name": "MiniMaxAI/MiniMax-M2.5",
"provider": "MiniMaxAI",
"parameter_count": "228.7B",
"parameters_raw": 228700000000,
"min_ram_gb": 240.0,
"recommended_ram_gb": 280.0,
"min_vram_gb": 240.0,
"quantization": "FP8",
"context_length": 196608,
"use_case": "Chat, reasoning, tool use",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 13600000000,
"release_date": "2025-06-01",
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 526151,
"hf_likes": 1252,
"gguf_sources": [],
"capabilities": [
"tool_use"
]
},
{
"name": "MiniMaxAI/MiniMax-M2",
"provider": "minimaxai",
"parameter_count": "228.7B",
"parameters_raw": 228703644928,
"min_ram_gb": 127.8,
"recommended_ram_gb": 213.0,
"min_vram_gb": 117.1,
"quantization": "Q4_K_M",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 275243,
"hf_likes": 1485,
"release_date": "2025-10-22",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 18224821702,
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/MiniMax-M2-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "MiniMaxAI/MiniMax-M2.1",
"provider": "minimaxai",
"parameter_count": "228.7B",
"parameters_raw": 228703644928,
"min_ram_gb": 127.8,
"recommended_ram_gb": 213.0,
"min_vram_gb": 117.1,
"quantization": "Q4_K_M",
"context_length": 196608,
"use_case": "Lightweight, edge deployment",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 72189,
"hf_likes": 1257,
"release_date": "2025-12-20",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 18224821702,
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/MiniMax-M2.1-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3-235B-A22B",
"provider": "Alibaba",
"parameter_count": "235.1B",
"parameters_raw": 235093634560,
"min_ram_gb": 131.4,
"recommended_ram_gb": 218.9,
"min_vram_gb": 120.4,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 684371,
"hf_likes": 1077,
"release_date": "2025-04-27",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 22000000000,
"gguf_sources": [
{
"repo": "unsloth/Qwen3-235B-A22B-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "Qwen/Qwen3-235B-A22B-Instruct-2507-FP8",
"provider": "Alibaba",
"parameter_count": "235.1B",
"parameters_raw": 235107904512,
"min_ram_gb": 131.4,
"recommended_ram_gb": 219.0,
"min_vram_gb": 120.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 802366,
"hf_likes": 146,
"release_date": "2025-07-21",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 25714927049,
"_discovered": true
},
{
"name": "Qwen/Qwen3-235B-A22B-Thinking-2507-FP8",
"provider": "Alibaba",
"parameter_count": "235.1B",
"parameters_raw": 235107904512,
"min_ram_gb": 131.4,
"recommended_ram_gb": 219.0,
"min_vram_gb": 120.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 77936,
"hf_likes": 83,
"release_date": "2025-07-25",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 25714927049,
"_discovered": true
},
{
"name": "Qwen/Qwen3-235B-A22B-FP8",
"provider": "Alibaba",
"parameter_count": "235.1B",
"parameters_raw": 235107904512,
"min_ram_gb": 131.4,
"recommended_ram_gb": 219.0,
"min_vram_gb": 120.4,
"quantization": "Q4_K_M",
"context_length": 40960,
"use_case": "General purpose text generation",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 32322,
"hf_likes": 90,
"release_date": "2025-04-28",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 25714927049,
"_discovered": true
},
{
"name": "casperhansen/deepseek-coder-v2-instruct-awq",
"provider": "casperhansen",
"parameter_count": "235.7B",
"parameters_raw": 235741434880,
"min_ram_gb": 131.7,
"recommended_ram_gb": 219.6,
"min_vram_gb": 120.8,
"quantization": "AWQ-4bit",
"context_length": 163840,
"use_case": "Code generation and completion",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v2",
"hf_downloads": 155456,
"hf_likes": 11,
"release_date": "2024-07-03",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 32782793288,
"_discovered": true,
"format": "awq"
},
{
"name": "deepseek-ai/DeepSeek-V2.5",
"provider": "DeepSeek",
"parameter_count": "235.7B",
"parameters_raw": 235741434880,
"min_ram_gb": 131.7,
"recommended_ram_gb": 219.6,
"min_vram_gb": 120.8,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v2",
"hf_downloads": 84805,
"hf_likes": 733,
"release_date": "2024-09-05",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 32782793288,
"_discovered": true,
"gguf_sources": [
{
"repo": "bartowski/DeepSeek-V2.5-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "RedHatAI/DeepSeek-V2.5-1210-FP8",
"provider": "redhatai",
"parameter_count": "235.7B",
"parameters_raw": 235741492480,
"min_ram_gb": 131.7,
"recommended_ram_gb": 219.6,
"min_vram_gb": 120.8,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v2",
"hf_downloads": 54313,
"hf_likes": 4,
"release_date": "2025-01-04",
"is_moe": true,
"num_experts": 64,
"active_experts": 6,
"active_parameters": 32782801298,
"_discovered": true
},
{
"name": "LGAI-EXAONE/K-EXAONE-236B-A23B",
"provider": "lgai-exaone",
"parameter_count": "237.1B",
"parameters_raw": 237099669632,
"min_ram_gb": 132.5,
"recommended_ram_gb": 220.8,
"min_vram_gb": 121.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "exaone_moe",
"hf_downloads": 23695,
"hf_likes": 549,
"release_date": "2025-12-26",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 25932776361,
"_discovered": true
},
{
"name": "baidu/ERNIE-4.5-300B-A47B-Paddle",
"provider": "baidu",
"parameter_count": "300.5B",
"parameters_raw": 300474051776,
"min_ram_gb": 167.9,
"recommended_ram_gb": 279.8,
"min_vram_gb": 153.9,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "ernie4_5_moe",
"hf_downloads": 332,
"hf_likes": 12,
"release_date": "2025-06-28"
},
{
"name": "XiaomiMiMo/MiMo-V2-Flash",
"provider": "xiaomimimo",
"parameter_count": "309.8B",
"parameters_raw": 309785318400,
"min_ram_gb": 173.1,
"recommended_ram_gb": 288.5,
"min_vram_gb": 158.7,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mimo_v2_flash",
"hf_downloads": 536830,
"hf_likes": 636,
"release_date": "2025-12-16",
"gguf_sources": [
{
"repo": "unsloth/MiMo-V2-Flash-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "zai-org/GLM-4.6",
"provider": "zai-org",
"parameter_count": "356.8B",
"parameters_raw": 356785898816,
"min_ram_gb": 199.4,
"recommended_ram_gb": 332.3,
"min_vram_gb": 182.8,
"quantization": "Q4_K_M",
"context_length": 202752,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 81982,
"hf_likes": 1204,
"release_date": "2025-09-29",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/GLM-4.6-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "zai-org/GLM-4.5",
"provider": "zai-org",
"parameter_count": "358.3B",
"parameters_raw": 358337791296,
"min_ram_gb": 200.2,
"recommended_ram_gb": 333.7,
"min_vram_gb": 183.6,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 42566,
"hf_likes": 1396,
"release_date": "2025-07-20",
"_discovered": true,
"gguf_sources": [
{
"repo": "unsloth/GLM-4.5-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "nvidia/DeepSeek-R1-0528-NVFP4-v2",
"provider": "nvidia",
"parameter_count": "393.6B",
"parameters_raw": 393632819968,
"min_ram_gb": 220.0,
"recommended_ram_gb": 366.6,
"min_vram_gb": 201.6,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 142525,
"hf_likes": 16,
"release_date": "2025-07-21",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 31367615334,
"_discovered": true
},
{
"name": "nvidia/DeepSeek-V3.1-NVFP4",
"provider": "nvidia",
"parameter_count": "393.6B",
"parameters_raw": 393632819968,
"min_ram_gb": 220.0,
"recommended_ram_gb": 366.6,
"min_vram_gb": 201.6,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 37723,
"hf_likes": 13,
"release_date": "2025-11-21",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 31367615334,
"_discovered": true
},
{
"name": "nvidia/DeepSeek-V3.2-NVFP4",
"provider": "nvidia",
"parameter_count": "394.5B",
"parameters_raw": 394498304256,
"min_ram_gb": 220.4,
"recommended_ram_gb": 367.4,
"min_vram_gb": 202.1,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v32",
"hf_downloads": 21598,
"hf_likes": 7,
"release_date": "2025-12-30",
"_discovered": true
},
{
"name": "nvidia/DeepSeek-V3-0324-NVFP4",
"provider": "nvidia",
"parameter_count": "396.8B",
"parameters_raw": 396767013632,
"min_ram_gb": 221.7,
"recommended_ram_gb": 369.5,
"min_vram_gb": 203.2,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 84851,
"hf_likes": 14,
"release_date": "2025-05-03",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 31617371393,
"_discovered": true
},
{
"name": "nvidia/DeepSeek-R1-NVFP4",
"provider": "nvidia",
"parameter_count": "396.8B",
"parameters_raw": 396767013632,
"min_ram_gb": 221.7,
"recommended_ram_gb": 369.5,
"min_vram_gb": 203.2,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 43986,
"hf_likes": 271,
"release_date": "2025-02-21",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 31617371393,
"_discovered": true
},
{
"name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
"provider": "Meta",
"parameter_count": "401.6B",
"parameters_raw": 401583781376,
"min_ram_gb": 224.4,
"recommended_ram_gb": 374.0,
"min_vram_gb": 205.7,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "llama4",
"hf_downloads": 6341,
"hf_likes": 466,
"release_date": "2025-04-01",
"is_moe": true,
"num_experts": 16,
"active_experts": 1,
"active_parameters": 17000000000
},
{
"name": "Qwen/Qwen3.5-397B-A17B",
"provider": "Alibaba",
"parameter_count": "403.4B",
"parameters_raw": 403397928944,
"min_ram_gb": 225.4,
"recommended_ram_gb": 375.7,
"min_vram_gb": 206.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision",
"tool_use"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 1291825,
"hf_likes": 1214,
"release_date": "2026-02-16",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 17000000000
},
{
"name": "meta-llama/Llama-3.1-405B-Instruct",
"provider": "Meta",
"parameter_count": "405.9B",
"parameters_raw": 405853388800,
"min_ram_gb": 226.8,
"recommended_ram_gb": 378.0,
"min_vram_gb": 207.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 173410,
"hf_likes": 592,
"release_date": "2024-07-16"
},
{
"name": "meta-llama/Llama-3.1-405B-Instruct-FP8",
"provider": "Meta",
"parameter_count": "405.9B",
"parameters_raw": 405868625920,
"min_ram_gb": 226.8,
"recommended_ram_gb": 378.0,
"min_vram_gb": 207.9,
"quantization": "Q4_K_M",
"context_length": 4096,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 22040,
"hf_likes": 193,
"release_date": "2024-07-20",
"_discovered": true
},
{
"name": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
"provider": "Alibaba",
"parameter_count": "480.2B",
"parameters_raw": 480154875392,
"min_ram_gb": 268.3,
"recommended_ram_gb": 447.2,
"min_vram_gb": 245.9,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Code generation and completion",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 75486,
"hf_likes": 1304,
"release_date": "2025-07-22",
"is_moe": true,
"num_experts": 160,
"active_experts": 8,
"active_parameters": 35000000000
},
{
"name": "meituan-longcat/LongCat-Flash-Chat",
"provider": "meituan-longcat",
"parameter_count": "561.9B",
"parameters_raw": 561862880256,
"min_ram_gb": 314.0,
"recommended_ram_gb": 523.3,
"min_vram_gb": 287.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "unknown",
"hf_downloads": 30116,
"hf_likes": 526,
"release_date": "2025-08-29",
"_discovered": true
},
{
"name": "deepseek-ai/DeepSeek-R1",
"provider": "DeepSeek",
"parameter_count": "684.5B",
"parameters_raw": 684531386000,
"min_ram_gb": 382.5,
"recommended_ram_gb": 637.5,
"min_vram_gb": 350.6,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 1026085,
"hf_likes": 13108,
"release_date": "2025-01-20",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 37000000000,
"gguf_sources": [
{
"repo": "unsloth/DeepSeek-R1-GGUF",
"provider": "unsloth"
},
{
"repo": "bartowski/DeepSeek-R1-GGUF",
"provider": "bartowski"
}
]
},
{
"name": "deepseek-ai/DeepSeek-R1-0528",
"provider": "DeepSeek",
"parameter_count": "684.5B",
"parameters_raw": 684531386000,
"min_ram_gb": 382.5,
"recommended_ram_gb": 637.5,
"min_vram_gb": 350.6,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "Advanced reasoning, chain-of-thought",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 1050237,
"hf_likes": 2403,
"release_date": "2025-05-28",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 54548594820,
"_discovered": true
},
{
"name": "deepseek-ai/DeepSeek-V3-0324",
"provider": "DeepSeek",
"parameter_count": "684.5B",
"parameters_raw": 684531386000,
"min_ram_gb": 382.5,
"recommended_ram_gb": 637.5,
"min_vram_gb": 350.6,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 270362,
"hf_likes": 3088,
"release_date": "2025-03-24",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 54548594820,
"_discovered": true
},
{
"name": "deepseek-ai/DeepSeek-V3",
"provider": "DeepSeek",
"parameter_count": "685B",
"parameters_raw": 685000000000,
"min_ram_gb": 382.8,
"recommended_ram_gb": 638.0,
"min_vram_gb": 351.3,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "State-of-the-art, MoE architecture",
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 37000000000,
"hf_downloads": 0,
"hf_likes": 0,
"release_date": null
},
{
"name": "deepseek-ai/DeepSeek-V3.2-Speciale",
"provider": "DeepSeek",
"parameter_count": "685B",
"parameters_raw": 685000000000,
"min_ram_gb": 383.2,
"recommended_ram_gb": 638.7,
"min_vram_gb": 351.3,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Advanced reasoning, chain-of-thought",
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 37000000000,
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-12-01"
},
{
"name": "QuantTrio/DeepSeek-V3.2-AWQ",
"provider": "quanttrio",
"parameter_count": "685.0B",
"parameters_raw": 685011996928,
"min_ram_gb": 382.8,
"recommended_ram_gb": 638.0,
"min_vram_gb": 350.9,
"quantization": "AWQ-4bit",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v32",
"hf_downloads": 103286,
"hf_likes": 11,
"release_date": "2025-12-03",
"_discovered": true,
"format": "awq"
},
{
"name": "deepseek-ai/DeepSeek-V3.2",
"provider": "DeepSeek",
"parameter_count": "685.4B",
"parameters_raw": 685396921376,
"min_ram_gb": 383.0,
"recommended_ram_gb": 638.3,
"min_vram_gb": 351.1,
"quantization": "Q4_K_M",
"context_length": 163840,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v32",
"hf_downloads": 362520,
"hf_likes": 1280,
"release_date": "2025-12-01"
},
{
"name": "zai-org/GLM-5",
"provider": "zai-org",
"parameter_count": "753.9B",
"parameters_raw": 753864139008,
"min_ram_gb": 421.3,
"recommended_ram_gb": 702.1,
"min_vram_gb": 386.1,
"quantization": "Q4_K_M",
"context_length": 202752,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm_moe_dsa",
"hf_downloads": 205187,
"hf_likes": 1698,
"release_date": "2026-02-11"
},
{
"name": "moonshotai/Kimi-K2-Instruct",
"provider": "moonshotai",
"parameter_count": "1026.5B",
"parameters_raw": 1026470731056,
"min_ram_gb": 573.6,
"recommended_ram_gb": 956.0,
"min_vram_gb": 525.8,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "kimi_k2",
"hf_downloads": 151155,
"hf_likes": 2324,
"release_date": "2025-07-11"
},
{
"name": "moonshotai/Kimi-K2-Instruct-0905",
"provider": "moonshotai",
"parameter_count": "1026.5B",
"parameters_raw": 1026470735448,
"min_ram_gb": 573.6,
"recommended_ram_gb": 956.0,
"min_vram_gb": 525.8,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "kimi_k2",
"hf_downloads": 28801,
"hf_likes": 683,
"release_date": "2025-09-03",
"_discovered": true
},
{
"name": "moonshotai/Kimi-K2.5",
"provider": "moonshotai",
"parameter_count": "1058.6B",
"parameters_raw": 1058589420528,
"min_ram_gb": 591.5,
"recommended_ram_gb": 985.9,
"min_vram_gb": 542.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose",
"capabilities": [
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "kimi_k25",
"hf_downloads": 1899549,
"hf_likes": 2220,
"release_date": "2026-01-01",
"gguf_sources": [
{
"repo": "unsloth/Kimi-K2.5-GGUF",
"provider": "unsloth"
}
]
},
{
"name": "QuantTrio/Qwen3.5-27B-AWQ",
"provider": "QuantTrio",
"parameter_count": "27.3B",
"parameters_raw": 27300000000,
"min_ram_gb": 14.2,
"recommended_ram_gb": 18.4,
"min_vram_gb": 14.2,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3.5-35B-A3B-AWQ",
"provider": "QuantTrio",
"parameter_count": "35.2B",
"parameters_raw": 35200000000,
"min_ram_gb": 18.1,
"recommended_ram_gb": 23.5,
"min_vram_gb": 18.1,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3.5-122B-A10B-AWQ",
"provider": "QuantTrio",
"parameter_count": "125.1B",
"parameters_raw": 125100000000,
"min_ram_gb": 63.0,
"recommended_ram_gb": 82.0,
"min_vram_gb": 63.0,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 10000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3.5-9B-AWQ",
"provider": "QuantTrio",
"parameter_count": "9.4B",
"parameters_raw": 9400000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 6.8,
"min_vram_gb": 5.2,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/GLM-4.5-Air-AWQ-FP16Mix",
"provider": "QuantTrio",
"parameter_count": "9.4B",
"parameters_raw": 9400000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 6.8,
"min_vram_gb": 5.2,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/GLM-4.5-AWQ",
"provider": "QuantTrio",
"parameter_count": "31.2B",
"parameters_raw": 31200000000,
"min_ram_gb": 16.1,
"recommended_ram_gb": 20.9,
"min_vram_gb": 16.1,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/GLM-4.5V-AWQ",
"provider": "QuantTrio",
"parameter_count": "31.2B",
"parameters_raw": 31200000000,
"min_ram_gb": 16.1,
"recommended_ram_gb": 20.9,
"min_vram_gb": 16.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/KAT-V1-40B-AWQ",
"provider": "QuantTrio",
"parameter_count": "40.0B",
"parameters_raw": 40000000000,
"min_ram_gb": 20.5,
"recommended_ram_gb": 26.7,
"min_vram_gb": 20.5,
"quantization": "AWQ-4bit",
"context_length": 65536,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/DeepSeek-V3.1-AWQ",
"provider": "QuantTrio",
"parameter_count": "685.0B",
"parameters_raw": 685000000000,
"min_ram_gb": 343.0,
"recommended_ram_gb": 445.9,
"min_vram_gb": 343.0,
"quantization": "AWQ-4bit",
"context_length": 163840,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 37000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/DeepSeek-V3.1-AWQ-Fp16Mix",
"provider": "QuantTrio",
"parameter_count": "685.0B",
"parameters_raw": 685000000000,
"min_ram_gb": 343.0,
"recommended_ram_gb": 445.9,
"min_vram_gb": 343.0,
"quantization": "AWQ-4bit",
"context_length": 163840,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 37000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/DeepSeek-V3.1-AWQ-Lite",
"provider": "QuantTrio",
"parameter_count": "685.0B",
"parameters_raw": 685000000000,
"min_ram_gb": 343.0,
"recommended_ram_gb": 445.9,
"min_vram_gb": 343.0,
"quantization": "AWQ-4bit",
"context_length": 163840,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 37000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/DeepSeek-V3.2-Exp-AWQ",
"provider": "QuantTrio",
"parameter_count": "486.0B",
"parameters_raw": 486000000000,
"min_ram_gb": 243.5,
"recommended_ram_gb": 316.6,
"min_vram_gb": 243.5,
"quantization": "AWQ-4bit",
"context_length": 163840,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 37000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/DeepSeek-V3.2-Exp-AWQ-Lite",
"provider": "QuantTrio",
"parameter_count": "486.0B",
"parameters_raw": 486000000000,
"min_ram_gb": 243.5,
"recommended_ram_gb": 316.6,
"min_vram_gb": 243.5,
"quantization": "AWQ-4bit",
"context_length": 163840,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 37000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/GLM-4.6-AWQ",
"provider": "QuantTrio",
"parameter_count": "355.0B",
"parameters_raw": 355000000000,
"min_ram_gb": 178.0,
"recommended_ram_gb": 231.4,
"min_vram_gb": 178.0,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 32000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/MiniMax-M2-REAP-162B-A10B-AWQ",
"provider": "QuantTrio",
"parameter_count": "162.0B",
"parameters_raw": 162000000000,
"min_ram_gb": 81.5,
"recommended_ram_gb": 106.0,
"min_vram_gb": 81.5,
"quantization": "AWQ-4bit",
"context_length": 1048576,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 10000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/DeepSeek-V3.2-Speciale-AWQ",
"provider": "QuantTrio",
"parameter_count": "685.0B",
"parameters_raw": 685000000000,
"min_ram_gb": 343.0,
"recommended_ram_gb": 445.9,
"min_vram_gb": 343.0,
"quantization": "AWQ-4bit",
"context_length": 163840,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 37000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/GLM-4.7-AWQ",
"provider": "QuantTrio",
"parameter_count": "355.0B",
"parameters_raw": 355000000000,
"min_ram_gb": 178.0,
"recommended_ram_gb": 231.4,
"min_vram_gb": 178.0,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 32000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/MiniMax-M2.1-AWQ",
"provider": "QuantTrio",
"parameter_count": "228.7B",
"parameters_raw": 228700000000,
"min_ram_gb": 114.8,
"recommended_ram_gb": 149.3,
"min_vram_gb": 114.8,
"quantization": "AWQ-4bit",
"context_length": 1048576,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 10000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Step3-VL-10B-AWQ",
"provider": "QuantTrio",
"parameter_count": "10.0B",
"parameters_raw": 10000000000,
"min_ram_gb": 5.5,
"recommended_ram_gb": 7.2,
"min_vram_gb": 5.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3.5-397B-A17B-AWQ",
"provider": "QuantTrio",
"parameter_count": "403.4B",
"parameters_raw": 403400000000,
"min_ram_gb": 202.2,
"recommended_ram_gb": 262.9,
"min_vram_gb": 202.2,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 17000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/GLM-5-AWQ",
"provider": "QuantTrio",
"parameter_count": "753.9B",
"parameters_raw": 753900000000,
"min_ram_gb": 377.4,
"recommended_ram_gb": 490.7,
"min_vram_gb": 377.4,
"quantization": "AWQ-4bit",
"context_length": 202752,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 35000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3.5-4B-AWQ",
"provider": "QuantTrio",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.5,
"recommended_ram_gb": 3.2,
"min_vram_gb": 2.5,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3.5-2B-AWQ",
"provider": "QuantTrio",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.5,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.5,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/sarvam-30b-AWQ",
"provider": "QuantTrio",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Chat, multilingual",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/sarvam-105b-AWQ",
"provider": "QuantTrio",
"parameter_count": "105.0B",
"parameters_raw": 105000000000,
"min_ram_gb": 36.8,
"recommended_ram_gb": 73.7,
"min_vram_gb": 61.4,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Chat, multilingual",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3500000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3.5-35B-A3B-FP8",
"provider": "Qwen",
"parameter_count": "35.2B",
"parameters_raw": 35200000000,
"min_ram_gb": 35.7,
"recommended_ram_gb": 46.4,
"min_vram_gb": 35.7,
"quantization": "FP8",
"context_length": 131072,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3.5-27B-FP8",
"provider": "Qwen",
"parameter_count": "27.3B",
"parameters_raw": 27300000000,
"min_ram_gb": 27.8,
"recommended_ram_gb": 36.1,
"min_vram_gb": 27.8,
"quantization": "FP8",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3.5-397B-A17B-FP8",
"provider": "Qwen",
"parameter_count": "403.4B",
"parameters_raw": 403400000000,
"min_ram_gb": 403.9,
"recommended_ram_gb": 525.1,
"min_vram_gb": 403.9,
"quantization": "FP8",
"context_length": 262144,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 17000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3.5-122B-A10B-FP8",
"provider": "Qwen",
"parameter_count": "125.1B",
"parameters_raw": 125100000000,
"min_ram_gb": 125.6,
"recommended_ram_gb": 163.3,
"min_vram_gb": 125.6,
"quantization": "FP8",
"context_length": 131072,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 10000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-30B-A3B-FP8",
"provider": "Qwen",
"parameter_count": "30.5B",
"parameters_raw": 30500000000,
"min_ram_gb": 31.0,
"recommended_ram_gb": 40.3,
"min_vram_gb": 31.0,
"quantization": "FP8",
"context_length": 131072,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-32B-FP8",
"provider": "Qwen",
"parameter_count": "32.8B",
"parameters_raw": 32800000000,
"min_ram_gb": 33.3,
"recommended_ram_gb": 43.3,
"min_vram_gb": 33.3,
"quantization": "FP8",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-14B-FP8",
"provider": "Qwen",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 14.5,
"recommended_ram_gb": 18.9,
"min_vram_gb": 14.5,
"quantization": "FP8",
"context_length": 131072,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-VL-32B-Instruct-AWQ",
"provider": "QuantTrio",
"parameter_count": "32.8B",
"parameters_raw": 32800000000,
"min_ram_gb": 16.9,
"recommended_ram_gb": 22.0,
"min_vram_gb": 16.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-235B-A22B-Instruct-2507-AWQ",
"provider": "QuantTrio",
"parameter_count": "234.6B",
"parameters_raw": 234600000000,
"min_ram_gb": 117.8,
"recommended_ram_gb": 153.1,
"min_vram_gb": 117.8,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 22000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/GLM-4.1V-9B-Thinking-AWQ",
"provider": "QuantTrio",
"parameter_count": "9.4B",
"parameters_raw": 9400000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 6.8,
"min_vram_gb": 5.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision, reasoning",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-Coder-480B-A35B-Instruct-AWQ",
"provider": "QuantTrio",
"parameter_count": "480.2B",
"parameters_raw": 480200000000,
"min_ram_gb": 240.6,
"recommended_ram_gb": 312.8,
"min_vram_gb": 240.6,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Coding",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 35000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-235B-A22B-Thinking-2507-AWQ",
"provider": "QuantTrio",
"parameter_count": "234.6B",
"parameters_raw": 234600000000,
"min_ram_gb": 117.8,
"recommended_ram_gb": 153.1,
"min_vram_gb": 117.8,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Reasoning",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 22000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-30B-A3B-Thinking-2507-AWQ-BF16Mix",
"provider": "QuantTrio",
"parameter_count": "30.5B",
"parameters_raw": 30500000000,
"min_ram_gb": 15.8,
"recommended_ram_gb": 20.5,
"min_vram_gb": 15.8,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Reasoning",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-30B-A3B-Thinking-2507-AWQ",
"provider": "QuantTrio",
"parameter_count": "30.5B",
"parameters_raw": 30500000000,
"min_ram_gb": 15.8,
"recommended_ram_gb": 20.5,
"min_vram_gb": 15.8,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "Reasoning",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Seed-OSS-36B-Instruct-AWQ",
"provider": "QuantTrio",
"parameter_count": "36.0B",
"parameters_raw": 36000000000,
"min_ram_gb": 18.5,
"recommended_ram_gb": 24.1,
"min_vram_gb": 18.5,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "General",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-VL-235B-A22B-Instruct-AWQ",
"provider": "QuantTrio",
"parameter_count": "234.6B",
"parameters_raw": 234600000000,
"min_ram_gb": 117.8,
"recommended_ram_gb": 153.1,
"min_vram_gb": 117.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 22000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-VL-235B-A22B-Thinking-AWQ",
"provider": "QuantTrio",
"parameter_count": "234.6B",
"parameters_raw": 234600000000,
"min_ram_gb": 117.8,
"recommended_ram_gb": 153.1,
"min_vram_gb": 117.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision, reasoning",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 22000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-VL-30B-A3B-Thinking-AWQ",
"provider": "QuantTrio",
"parameter_count": "31.1B",
"parameters_raw": 31100000000,
"min_ram_gb": 16.1,
"recommended_ram_gb": 20.9,
"min_vram_gb": 16.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision, reasoning",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3-VL-32B-Thinking-AWQ",
"provider": "QuantTrio",
"parameter_count": "32.8B",
"parameters_raw": 32800000000,
"min_ram_gb": 16.9,
"recommended_ram_gb": 22.0,
"min_vram_gb": 16.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Multimodal, vision, reasoning",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-VL-8B-Instruct-FP8",
"provider": "Qwen",
"parameter_count": "8.2B",
"parameters_raw": 8200000000,
"min_ram_gb": 8.7,
"recommended_ram_gb": 11.3,
"min_vram_gb": 8.7,
"quantization": "FP8",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-VL-32B-Instruct-FP8",
"provider": "Qwen",
"parameter_count": "32.8B",
"parameters_raw": 32800000000,
"min_ram_gb": 33.3,
"recommended_ram_gb": 43.3,
"min_vram_gb": 33.3,
"quantization": "FP8",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-VL-30B-A3B-Instruct-FP8",
"provider": "Qwen",
"parameter_count": "31.1B",
"parameters_raw": 31100000000,
"min_ram_gb": 31.6,
"recommended_ram_gb": 41.1,
"min_vram_gb": 31.6,
"quantization": "FP8",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-4B-Thinking-2507-FP8",
"provider": "Qwen",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 4.5,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.5,
"quantization": "FP8",
"context_length": 32768,
"use_case": "Reasoning",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8",
"provider": "Qwen",
"parameter_count": "234.6B",
"parameters_raw": 234600000000,
"min_ram_gb": 235.1,
"recommended_ram_gb": 305.6,
"min_vram_gb": 235.1,
"quantization": "FP8",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 22000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
"provider": "Qwen",
"parameter_count": "480.2B",
"parameters_raw": 480200000000,
"min_ram_gb": 480.7,
"recommended_ram_gb": 624.9,
"min_vram_gb": 480.7,
"quantization": "FP8",
"context_length": 262144,
"use_case": "Coding",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 35000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-30B-A3B-Thinking-2507-FP8",
"provider": "Qwen",
"parameter_count": "30.5B",
"parameters_raw": 30500000000,
"min_ram_gb": 31.0,
"recommended_ram_gb": 40.3,
"min_vram_gb": 31.0,
"quantization": "FP8",
"context_length": 131072,
"use_case": "Reasoning",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-VL-30B-A3B-Thinking-FP8",
"provider": "Qwen",
"parameter_count": "31.1B",
"parameters_raw": 31100000000,
"min_ram_gb": 31.6,
"recommended_ram_gb": 41.1,
"min_vram_gb": 31.6,
"quantization": "FP8",
"context_length": 32768,
"use_case": "Multimodal, vision, reasoning",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3-VL-2B-Instruct-FP8",
"provider": "Qwen",
"parameter_count": "2.7B",
"parameters_raw": 2700000000,
"min_ram_gb": 3.2,
"recommended_ram_gb": 4.2,
"min_vram_gb": 3.2,
"quantization": "FP8",
"context_length": 32768,
"use_case": "Multimodal, vision",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"release_date": "2025-07-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "zai-org/GLM-4.7-Flash",
"provider": "zai-org",
"parameter_count": "31.2B",
"parameters_raw": 31221488576,
"min_ram_gb": 17.4,
"recommended_ram_gb": 29.1,
"min_vram_gb": 16.0,
"quantization": "Q4_K_M",
"context_length": 202752,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe_lite",
"hf_downloads": 1709725,
"hf_likes": 1617,
"release_date": "2026-01-29",
"is_moe": true,
"num_experts": 64,
"active_experts": 4,
"active_parameters": 3000000000,
"_discovered": true,
"gguf_sources": []
},
{
"name": "cyankiwi/Qwen3.5-35B-A3B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "35.0B",
"parameters_raw": 35000000000,
"min_ram_gb": 19.6,
"recommended_ram_gb": 32.6,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 651639,
"hf_likes": 30,
"release_date": "2026-02-25",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-VL-4B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.2,
"recommended_ram_gb": 3.7,
"min_vram_gb": 2.0,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 583536,
"hf_likes": 6,
"release_date": "2025-10-14",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-Coder-Next-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "79.7B",
"parameters_raw": 79674391296,
"min_ram_gb": 44.5,
"recommended_ram_gb": 74.2,
"min_vram_gb": 40.8,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Coding",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 248200,
"hf_likes": 18,
"release_date": "2026-02-04",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-9B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 5.5,
"recommended_ram_gb": 9.2,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 183369,
"hf_likes": 13,
"release_date": "2026-03-02",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-27B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "27.0B",
"parameters_raw": 27000000000,
"min_ram_gb": 15.1,
"recommended_ram_gb": 25.1,
"min_vram_gb": 13.8,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 149004,
"hf_likes": 19,
"release_date": "2026-02-25",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-122B-A10B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "122.0B",
"parameters_raw": 122000000000,
"min_ram_gb": 71.9,
"recommended_ram_gb": 119.9,
"min_vram_gb": 66.0,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 137640,
"hf_likes": 22,
"release_date": "2026-02-25",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 10000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-VL-8B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 4.5,
"recommended_ram_gb": 7.5,
"min_vram_gb": 4.1,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 90955,
"hf_likes": 13,
"release_date": "2025-10-14",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-27B-AWQ-BF16-INT8",
"provider": "cyankiwi",
"parameter_count": "27.0B",
"parameters_raw": 27000000000,
"min_ram_gb": 7.8,
"recommended_ram_gb": 13.1,
"min_vram_gb": 7.2,
"quantization": "AWQ-8bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 82325,
"hf_likes": 8,
"release_date": "2026-02-24",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-Omni-30B-A3B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 16.8,
"recommended_ram_gb": 27.9,
"min_vram_gb": 15.4,
"quantization": "AWQ-4bit",
"context_length": 65536,
"use_case": "Multimodal, any-to-any",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "qwen3_omni_moe",
"hf_downloads": 68670,
"hf_likes": 45,
"release_date": "2025-09-28",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-30B-A3B-Instruct-2507-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 5.1,
"recommended_ram_gb": 8.4,
"min_vram_gb": 4.6,
"quantization": "AWQ-8bit",
"context_length": 262144,
"use_case": "Instruction following, chat",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 44772,
"hf_likes": 2,
"release_date": "2025-08-08",
"is_moe": true,
"num_experts": 128,
"active_experts": 8,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-27B-AWQ-BF16-INT4",
"provider": "cyankiwi",
"parameter_count": "27.0B",
"parameters_raw": 27000000000,
"min_ram_gb": 15.1,
"recommended_ram_gb": 25.1,
"min_vram_gb": 13.8,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 42645,
"hf_likes": 30,
"release_date": "2026-02-24",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-4B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.7,
"recommended_ram_gb": 4.4,
"min_vram_gb": 2.4,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 35275,
"hf_likes": 7,
"release_date": "2026-03-02",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Devstral-2-123B-Instruct-2512-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "123.0B",
"parameters_raw": 123000000000,
"min_ram_gb": 68.7,
"recommended_ram_gb": 114.6,
"min_vram_gb": 63.0,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Coding",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "ministral3",
"hf_downloads": 31584,
"hf_likes": 15,
"release_date": "2025-12-11",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-35B-A3B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "35.0B",
"parameters_raw": 35000000000,
"min_ram_gb": 6.7,
"recommended_ram_gb": 11.2,
"min_vram_gb": 6.2,
"quantization": "AWQ-8bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 21278,
"hf_likes": 7,
"release_date": "2026-02-25",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/InternVL3_5-38B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "38.0B",
"parameters_raw": 38000000000,
"min_ram_gb": 21.2,
"recommended_ram_gb": 35.4,
"min_vram_gb": 19.5,
"quantization": "AWQ-4bit",
"context_length": 40960,
"use_case": "Multimodal, vision",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "internvl_chat",
"hf_downloads": 20665,
"hf_likes": 1,
"release_date": "2025-08-29",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3-VL-4B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.2,
"recommended_ram_gb": 3.7,
"min_vram_gb": 2.0,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, reasoning",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 17082,
"hf_likes": 1,
"release_date": "2025-10-14",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-4B-AWQ-BF16-INT4",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.6,
"recommended_ram_gb": 4.4,
"min_vram_gb": 2.4,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 14400,
"hf_likes": 1,
"release_date": "2026-03-02",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/Qwen3.5-2B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.2,
"min_vram_gb": 1.2,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Multimodal, vision, chat",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 14333,
"hf_likes": 1,
"release_date": "2026-03-02",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/LFM2-24B-A2B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "24.0B",
"parameters_raw": 24000000000,
"min_ram_gb": 13.4,
"recommended_ram_gb": 22.4,
"min_vram_gb": 12.3,
"quantization": "AWQ-4bit",
"context_length": 128000,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 13987,
"hf_likes": 1,
"release_date": "2026-02-25",
"is_moe": true,
"num_experts": 64,
"active_experts": 4,
"active_parameters": 2000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/OmniCoder-9B-AWQ-BF16-INT4",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 5.3,
"recommended_ram_gb": 8.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Coding, reasoning",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_5",
"hf_downloads": 12121,
"hf_likes": 0,
"release_date": "2026-03-14",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/GLM-4.7-Flash-REAP-23B-A3B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "23.0B",
"parameters_raw": 23000000000,
"min_ram_gb": 12.9,
"recommended_ram_gb": 21.4,
"min_vram_gb": 11.8,
"quantization": "AWQ-4bit",
"context_length": 202752,
"use_case": "General purpose text generation",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe_lite",
"hf_downloads": 10101,
"hf_likes": 2,
"release_date": "2026-01-25",
"is_moe": true,
"num_experts": 49,
"active_experts": 4,
"active_parameters": 3000000000,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/OmniCoder-9B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 5.4,
"recommended_ram_gb": 9.0,
"min_vram_gb": 4.9,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "Coding, reasoning",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_5",
"hf_downloads": 9212,
"hf_likes": 2,
"release_date": "2026-03-14",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "Qwen/Qwen3.6-27B",
"provider": "Qwen",
"parameter_count": "27.8B",
"parameters_raw": 27781427952,
"min_ram_gb": 16.6,
"recommended_ram_gb": 21.6,
"min_vram_gb": 16.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, coding",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"architecture": "qwen3",
"pipeline_tag": "text-generation",
"release_date": "2026-04-01",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.6-27B-GGUF",
"provider": "unsloth",
"file": "Qwen3.6-27B-Q4_K_M.gguf"
}
],
"capabilities": []
},
{
"name": "Qwen/Qwen3.6-27B-FP8",
"provider": "Qwen",
"parameter_count": "27.8B",
"parameters_raw": 27781427952,
"min_ram_gb": 28.3,
"recommended_ram_gb": 36.8,
"min_vram_gb": 28.3,
"quantization": "FP8",
"context_length": 262144,
"use_case": "General purpose, coding",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"architecture": "qwen3",
"pipeline_tag": "text-generation",
"release_date": "2026-04-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3.6-27B-AWQ",
"provider": "QuantTrio",
"parameter_count": "27.8B",
"parameters_raw": 27781427952,
"min_ram_gb": 14.4,
"recommended_ram_gb": 18.7,
"min_vram_gb": 14.4,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "General purpose, coding",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"architecture": "qwen3",
"pipeline_tag": "text-generation",
"release_date": "2026-04-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "Qwen/Qwen3.6-35B-A3B",
"provider": "Qwen",
"parameter_count": "36.0B",
"parameters_raw": 35951822704,
"min_ram_gb": 21.4,
"recommended_ram_gb": 27.8,
"min_vram_gb": 21.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose (MoE)",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"architecture": "qwen3_moe",
"pipeline_tag": "text-generation",
"release_date": "2026-04-01",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.6-35B-A3B-GGUF",
"provider": "unsloth",
"file": "Qwen3.6-35B-A3B-UD-Q4_K_M.gguf"
}
],
"capabilities": []
},
{
"name": "Qwen/Qwen3.6-35B-A3B-FP8",
"provider": "Qwen",
"parameter_count": "36.0B",
"parameters_raw": 35951822704,
"min_ram_gb": 36.5,
"recommended_ram_gb": 47.5,
"min_vram_gb": 36.5,
"quantization": "FP8",
"context_length": 262144,
"use_case": "General purpose (MoE)",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"architecture": "qwen3_moe",
"pipeline_tag": "text-generation",
"release_date": "2026-04-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "QuantTrio/Qwen3.6-35B-A3B-AWQ",
"provider": "QuantTrio",
"parameter_count": "36.0B",
"parameters_raw": 35951822704,
"min_ram_gb": 18.5,
"recommended_ram_gb": 24.1,
"min_vram_gb": 18.5,
"quantization": "AWQ-4bit",
"context_length": 262144,
"use_case": "General purpose (MoE)",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"architecture": "qwen3_moe",
"pipeline_tag": "text-generation",
"release_date": "2026-04-01",
"gguf_sources": [],
"capabilities": []
},
{
"name": "deepseek-ai/DeepSeek-V4-Flash",
"provider": "DeepSeek",
"parameter_count": "158B",
"parameters_raw": 158000000000,
"min_ram_gb": 165.0,
"recommended_ram_gb": 205.0,
"min_vram_gb": 165.0,
"quantization": "FP8",
"context_length": 1000000,
"use_case": "General purpose, reasoning (MoE)",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 13000000000,
"architecture": "deepseek_v4",
"pipeline_tag": "text-generation",
"release_date": "2026-04-22",
"gguf_sources": [
{
"repo": "unsloth/DeepSeek-V4-Flash",
"provider": "unsloth"
}
],
"capabilities": []
},
{
"name": "deepseek-ai/DeepSeek-V4-Pro",
"provider": "DeepSeek",
"parameter_count": "1600B",
"parameters_raw": 1600000000000,
"min_ram_gb": 928.5,
"recommended_ram_gb": 1207.0,
"min_vram_gb": 928.5,
"quantization": "Q4_K_M",
"context_length": 1000000,
"use_case": "Frontier reasoning (MoE)",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 49000000000,
"architecture": "deepseek_v4",
"pipeline_tag": "text-generation",
"release_date": "2026-04-22",
"gguf_sources": [],
"capabilities": []
},
{
"name": "google/gemma-4-E2B-it",
"provider": "Google",
"parameter_count": "5.1B",
"parameters_raw": 5123178051,
"min_ram_gb": 3.5,
"recommended_ram_gb": 4.5,
"min_vram_gb": 3.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "On-device, multimodal",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"architecture": "gemma4",
"pipeline_tag": "image-text-to-text",
"release_date": "2026-04-01",
"gguf_sources": [
{
"repo": "unsloth/gemma-4-E2B-it-GGUF",
"provider": "unsloth"
}
],
"capabilities": [
"vision"
]
},
{
"name": "google/gemma-4-E4B-it",
"provider": "Google",
"parameter_count": "8.0B",
"parameters_raw": 7996156490,
"min_ram_gb": 5.1,
"recommended_ram_gb": 6.6,
"min_vram_gb": 5.1,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "On-device, multimodal",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"architecture": "gemma4",
"pipeline_tag": "image-text-to-text",
"release_date": "2026-04-01",
"gguf_sources": [
{
"repo": "unsloth/gemma-4-E4B-it-GGUF",
"provider": "unsloth"
}
],
"capabilities": [
"vision"
]
},
{
"name": "google/gemma-4-31B-it",
"provider": "Google",
"parameter_count": "32.7B",
"parameters_raw": 32682372656,
"min_ram_gb": 19.5,
"recommended_ram_gb": 25.4,
"min_vram_gb": 19.5,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "General purpose, multimodal",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"architecture": "gemma4",
"pipeline_tag": "image-text-to-text",
"release_date": "2026-04-01",
"gguf_sources": [
{
"repo": "unsloth/gemma-4-31B-it-GGUF",
"provider": "unsloth"
}
],
"capabilities": [
"vision"
]
},
{
"name": "google/gemma-4-26B-A4B-it",
"provider": "Google",
"parameter_count": "26.5B",
"parameters_raw": 26544131376,
"min_ram_gb": 15.9,
"recommended_ram_gb": 20.7,
"min_vram_gb": 15.9,
"quantization": "Q4_K_M",
"context_length": 131072,
"use_case": "High-throughput, multimodal (MoE)",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 4000000000,
"architecture": "gemma4",
"pipeline_tag": "image-text-to-text",
"release_date": "2026-04-01",
"gguf_sources": [
{
"repo": "unsloth/gemma-4-26B-A4B-it-GGUF",
"provider": "unsloth"
}
],
"capabilities": [
"vision"
]
},
{
"name": "cyankiwi/gemma-4-31B-it-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "31.0B",
"parameters_raw": 31000000000,
"min_ram_gb": 16.8,
"recommended_ram_gb": 21.8,
"min_vram_gb": 16.8,
"quantization": "AWQ-4bit",
"context_length": 131072,
"use_case": "General purpose, multimodal",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"architecture": "gemma4",
"pipeline_tag": "image-text-to-text",
"release_date": "2026-04-01",
"gguf_sources": [],
"capabilities": [
"vision"
]
},
{
"name": "cyankiwi/Qwen3.6-27B-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "27.0B",
"parameters_raw": 27000000000,
"min_ram_gb": 9.7,
"recommended_ram_gb": 19.4,
"min_vram_gb": 16.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 1370875,
"hf_likes": 66,
"release_date": "2026-04-22",
"_discovered": true
},
{
"name": "cyankiwi/gemma-4-26B-A4B-it-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "26.0B",
"parameters_raw": 26000000000,
"min_ram_gb": 9.4,
"recommended_ram_gb": 18.7,
"min_vram_gb": 15.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "gemma4",
"hf_downloads": 4146360,
"hf_likes": 71,
"release_date": "2026-04-03",
"_discovered": true,
"is_moe": true,
"active_parameters": 4000000000
},
{
"name": "cyankiwi/Qwen3.6-35B-A3B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "35.0B",
"parameters_raw": 35000000000,
"min_ram_gb": 12.5,
"recommended_ram_gb": 25.0,
"min_vram_gb": 20.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 881182,
"hf_likes": 67,
"release_date": "2026-04-16",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3.6-27B-AWQ-BF16-INT4",
"provider": "cyankiwi",
"parameter_count": "27.0B",
"parameters_raw": 27000000000,
"min_ram_gb": 9.7,
"recommended_ram_gb": 19.4,
"min_vram_gb": 16.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 285756,
"hf_likes": 30,
"release_date": "2026-04-22",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.6-27B-AWQ-BF16-INT8",
"provider": "cyankiwi",
"parameter_count": "27.0B",
"parameters_raw": 27000000000,
"min_ram_gb": 18.1,
"recommended_ram_gb": 36.2,
"min_vram_gb": 30.2,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 4433,
"hf_likes": 5,
"release_date": "2026-05-06",
"_discovered": true
},
{
"name": "cyankiwi/MiniMax-M2.7-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "228.7B",
"parameters_raw": 228700000000,
"min_ram_gb": 79.9,
"recommended_ram_gb": 159.7,
"min_vram_gb": 133.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 266548,
"hf_likes": 32,
"release_date": "2026-04-13",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-30B-A3B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl_moe",
"hf_downloads": 31781,
"hf_likes": 10,
"release_date": "2025-10-06",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/MiMo-V2-Flash-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "50.9B",
"parameters_raw": 50919007194,
"min_ram_gb": 18.0,
"recommended_ram_gb": 36.0,
"min_vram_gb": 30.0,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "custom_code",
"hf_downloads": 1650,
"hf_likes": 9,
"release_date": "2025-12-18",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.7-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "59.1B",
"parameters_raw": 59092091016,
"min_ram_gb": 20.9,
"recommended_ram_gb": 41.8,
"min_vram_gb": 34.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 251,
"hf_likes": 5,
"release_date": "2025-12-24",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.7-REAP-218B-A32B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "218.0B",
"parameters_raw": 218000000000,
"min_ram_gb": 76.1,
"recommended_ram_gb": 152.3,
"min_vram_gb": 126.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 29,
"hf_likes": 10,
"release_date": "2026-01-16",
"_discovered": true,
"is_moe": true,
"active_parameters": 32000000000
},
{
"name": "cyankiwi/GLM-4.7-REAP-268B-A32B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "268.0B",
"parameters_raw": 268000000000,
"min_ram_gb": 93.5,
"recommended_ram_gb": 187.1,
"min_vram_gb": 155.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 16,
"hf_likes": 6,
"release_date": "2026-01-26",
"_discovered": true,
"is_moe": true,
"active_parameters": 32000000000
},
{
"name": "cyankiwi/MiniMax-M2.1-REAP-139B-A10B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "139.0B",
"parameters_raw": 139000000000,
"min_ram_gb": 48.7,
"recommended_ram_gb": 97.3,
"min_vram_gb": 81.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 2,
"hf_likes": 1,
"release_date": "2026-02-03",
"_discovered": true,
"is_moe": true,
"active_parameters": 10000000000
},
{
"name": "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "120.0B",
"parameters_raw": 120000000000,
"min_ram_gb": 42.1,
"recommended_ram_gb": 84.1,
"min_vram_gb": 70.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron_h",
"hf_downloads": 1185,
"hf_likes": 6,
"release_date": "2026-03-16",
"_discovered": true,
"is_moe": true,
"active_parameters": 12000000000
},
{
"name": "cyankiwi/Mistral-Small-4-119B-2603-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "119.0B",
"parameters_raw": 119000000000,
"min_ram_gb": 41.7,
"recommended_ram_gb": 83.4,
"min_vram_gb": 69.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 2022,
"hf_likes": 7,
"release_date": "2026-03-18",
"_discovered": true
},
{
"name": "cyankiwi/gemma-4-31B-it-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "31.0B",
"parameters_raw": 31000000000,
"min_ram_gb": 20.8,
"recommended_ram_gb": 41.5,
"min_vram_gb": 34.6,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "gemma4",
"hf_downloads": 61491,
"hf_likes": 16,
"release_date": "2026-04-02",
"_discovered": true
},
{
"name": "cyankiwi/Nemotron-Cascade-2-30B-A3B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nvidia",
"hf_downloads": 219,
"hf_likes": 2,
"release_date": "2026-04-08",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Laguna-XS.2-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "33.4B",
"parameters_raw": 33442617088,
"min_ram_gb": 11.9,
"recommended_ram_gb": 23.9,
"min_vram_gb": 19.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "laguna",
"hf_downloads": 4344,
"hf_likes": 1,
"release_date": "2026-05-02",
"_discovered": true
},
{
"name": "cyankiwi/gemma-4-E2B-it-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "gemma4",
"hf_downloads": 15565,
"hf_likes": 3,
"release_date": "2026-05-03",
"_discovered": true
},
{
"name": "cyankiwi/Mistral-Medium-3.5-128B-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "128.0B",
"parameters_raw": 128000000000,
"min_ram_gb": 44.8,
"recommended_ram_gb": 89.6,
"min_vram_gb": 74.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 17040,
"hf_likes": 2,
"release_date": "2026-05-04",
"_discovered": true
},
{
"name": "cyankiwi/Devstral-Small-2507-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "23.6B",
"parameters_raw": 23572403200,
"min_ram_gb": 8.5,
"recommended_ram_gb": 17.0,
"min_vram_gb": 14.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 1340,
"hf_likes": 9,
"release_date": "2025-07-12",
"_discovered": true
},
{
"name": "cyankiwi/KAT-V1-40B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "40.0B",
"parameters_raw": 40000000000,
"min_ram_gb": 14.2,
"recommended_ram_gb": 28.4,
"min_vram_gb": 23.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 2,
"hf_likes": 2,
"release_date": "2025-07-24",
"_discovered": true
},
{
"name": "cyankiwi/Magistral-Small-2507-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "23.6B",
"parameters_raw": 23572403200,
"min_ram_gb": 8.5,
"recommended_ram_gb": 17.0,
"min_vram_gb": 14.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral",
"hf_downloads": 25,
"hf_likes": 0,
"release_date": "2025-07-25",
"_discovered": true
},
{
"name": "cyankiwi/Llama-3_3-Nemotron-Super-49B-v1_5-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "49.0B",
"parameters_raw": 49000000000,
"min_ram_gb": 17.3,
"recommended_ram_gb": 34.7,
"min_vram_gb": 28.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nemotron_nas",
"hf_downloads": 311,
"hf_likes": 3,
"release_date": "2025-07-27",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-30B-A3B-Thinking-2507-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 73546,
"hf_likes": 15,
"release_date": "2025-07-30",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-4B-Instruct-2507-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 1.7,
"recommended_ram_gb": 3.4,
"min_vram_gb": 2.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 142168,
"hf_likes": 7,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-4B-Thinking-2507-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 1.7,
"recommended_ram_gb": 3.4,
"min_vram_gb": 2.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 671,
"hf_likes": 5,
"release_date": "2025-08-06",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-4B-Thinking-2507-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 60,
"hf_likes": 4,
"release_date": "2025-08-08",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-4B-Instruct-2507-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1539,
"hf_likes": 1,
"release_date": "2025-08-08",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-Coder-30B-A3B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 573,
"hf_likes": 2,
"release_date": "2025-08-08",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-30B-A3B-Thinking-2507-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 88,
"hf_likes": 2,
"release_date": "2025-08-08",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/GLM-4.5-Air-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "31.7B",
"parameters_raw": 31696906344,
"min_ram_gb": 21.2,
"recommended_ram_gb": 42.5,
"min_vram_gb": 35.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 67,
"hf_likes": 2,
"release_date": "2025-08-08",
"_discovered": true
},
{
"name": "cyankiwi/Jan-v1-4B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 3,
"hf_likes": 1,
"release_date": "2025-08-12",
"_discovered": true
},
{
"name": "cyankiwi/Jan-v1-4B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 1.7,
"recommended_ram_gb": 3.4,
"min_vram_gb": 2.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 2,
"release_date": "2025-08-12",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.5V-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "19.5B",
"parameters_raw": 19485088360,
"min_ram_gb": 7.1,
"recommended_ram_gb": 14.2,
"min_vram_gb": 11.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "glm4v_moe",
"hf_downloads": 664,
"hf_likes": 4,
"release_date": "2025-08-13",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.5V-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.6B",
"parameters_raw": 32555588200,
"min_ram_gb": 21.8,
"recommended_ram_gb": 43.6,
"min_vram_gb": 36.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "glm4v_moe",
"hf_downloads": 54,
"hf_likes": 3,
"release_date": "2025-08-13",
"_discovered": true
},
{
"name": "cyankiwi/Kimi-Dev-72B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "72.0B",
"parameters_raw": 72000000000,
"min_ram_gb": 25.4,
"recommended_ram_gb": 50.8,
"min_vram_gb": 42.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 881,
"hf_likes": 3,
"release_date": "2025-08-19",
"_discovered": true
},
{
"name": "cyankiwi/Kimi-Dev-72B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "72.0B",
"parameters_raw": 72000000000,
"min_ram_gb": 47.8,
"recommended_ram_gb": 95.6,
"min_vram_gb": 79.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 729,
"hf_likes": 1,
"release_date": "2025-08-19",
"_discovered": true
},
{
"name": "cyankiwi/Seed-OSS-36B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "36.0B",
"parameters_raw": 36000000000,
"min_ram_gb": 24.1,
"recommended_ram_gb": 48.1,
"min_vram_gb": 40.1,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "seed_oss",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2025-08-23",
"_discovered": true
},
{
"name": "cyankiwi/Seed-OSS-36B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "36.0B",
"parameters_raw": 36000000000,
"min_ram_gb": 12.8,
"recommended_ram_gb": 25.7,
"min_vram_gb": 21.4,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "seed_oss",
"hf_downloads": 43,
"hf_likes": 0,
"release_date": "2025-08-23",
"_discovered": true
},
{
"name": "cyankiwi/command-a-reasoning-08-2025-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "23.2B",
"parameters_raw": 23153357696,
"min_ram_gb": 8.3,
"recommended_ram_gb": 16.7,
"min_vram_gb": 13.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "cohere2",
"hf_downloads": 206,
"hf_likes": 3,
"release_date": "2025-08-23",
"_discovered": true
},
{
"name": "cyankiwi/command-a-reasoning-08-2025-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "36.6B",
"parameters_raw": 36642239360,
"min_ram_gb": 24.5,
"recommended_ram_gb": 49.0,
"min_vram_gb": 40.8,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "cohere2",
"hf_downloads": 5,
"hf_likes": 0,
"release_date": "2025-08-24",
"_discovered": true
},
{
"name": "cyankiwi/Hermes-4-70B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "70.0B",
"parameters_raw": 70000000000,
"min_ram_gb": 24.7,
"recommended_ram_gb": 49.3,
"min_vram_gb": 41.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 45819,
"hf_likes": 6,
"release_date": "2025-08-27",
"_discovered": true
},
{
"name": "cyankiwi/Hermes-4-70B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "70.0B",
"parameters_raw": 70000000000,
"min_ram_gb": 46.5,
"recommended_ram_gb": 93.0,
"min_vram_gb": 77.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 1,
"hf_likes": 1,
"release_date": "2025-08-27",
"_discovered": true
},
{
"name": "cyankiwi/InternVL3_5-8B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "internvl_chat",
"hf_downloads": 923,
"hf_likes": 1,
"release_date": "2025-08-29",
"_discovered": true
},
{
"name": "cyankiwi/InternVL3_5-14B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 10.3,
"min_vram_gb": 8.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "internvl_chat",
"hf_downloads": 829,
"hf_likes": 4,
"release_date": "2025-08-29",
"_discovered": true
},
{
"name": "cyankiwi/InternVL3_5-38B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "38.0B",
"parameters_raw": 38000000000,
"min_ram_gb": 25.4,
"recommended_ram_gb": 50.8,
"min_vram_gb": 42.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "internvl_chat",
"hf_downloads": 782,
"hf_likes": 0,
"release_date": "2025-08-30",
"_discovered": true
},
{
"name": "cyankiwi/InternVL3_5-14B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 9.5,
"recommended_ram_gb": 19.1,
"min_vram_gb": 15.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "internvl_chat",
"hf_downloads": 27,
"hf_likes": 2,
"release_date": "2025-08-30",
"_discovered": true
},
{
"name": "cyankiwi/InternVL3_5-8B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "internvl_chat",
"hf_downloads": 27783,
"hf_likes": 1,
"release_date": "2025-08-30",
"_discovered": true
},
{
"name": "cyankiwi/NVIDIA-Nemotron-Nano-9B-v2-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 3.4,
"recommended_ram_gb": 6.8,
"min_vram_gb": 5.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nvidia",
"hf_downloads": 75,
"hf_likes": 3,
"release_date": "2025-08-31",
"_discovered": true
},
{
"name": "cyankiwi/NVIDIA-Nemotron-Nano-12B-v2-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "12.0B",
"parameters_raw": 12000000000,
"min_ram_gb": 4.5,
"recommended_ram_gb": 9.0,
"min_vram_gb": 7.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nvidia",
"hf_downloads": 1114,
"hf_likes": 4,
"release_date": "2025-08-31",
"_discovered": true
},
{
"name": "cyankiwi/NVIDIA-Nemotron-Nano-12B-v2-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "12.0B",
"parameters_raw": 12000000000,
"min_ram_gb": 8.2,
"recommended_ram_gb": 16.4,
"min_vram_gb": 13.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nvidia",
"hf_downloads": 1030,
"hf_likes": 1,
"release_date": "2025-08-31",
"_discovered": true
},
{
"name": "cyankiwi/NVIDIA-Nemotron-Nano-9B-v2-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 6.2,
"recommended_ram_gb": 12.5,
"min_vram_gb": 10.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nvidia",
"hf_downloads": 33,
"hf_likes": 0,
"release_date": "2025-08-31",
"_discovered": true
},
{
"name": "cyankiwi/Hermes-4-14B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 10.3,
"min_vram_gb": 8.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 6866,
"hf_likes": 4,
"release_date": "2025-09-03",
"_discovered": true
},
{
"name": "cyankiwi/Hermes-4-14B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 9.5,
"recommended_ram_gb": 19.1,
"min_vram_gb": 15.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2025-09-03",
"_discovered": true
},
{
"name": "cyankiwi/ERNIE-4.5-21B-A3B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "21.0B",
"parameters_raw": 21000000000,
"min_ram_gb": 14.2,
"recommended_ram_gb": 28.3,
"min_vram_gb": 23.6,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "ernie4_5_moe",
"hf_downloads": 10,
"hf_likes": 4,
"release_date": "2025-09-09",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/ERNIE-4.5-21B-A3B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "21.0B",
"parameters_raw": 21000000000,
"min_ram_gb": 7.6,
"recommended_ram_gb": 15.2,
"min_vram_gb": 12.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "ernie4_5_moe",
"hf_downloads": 89,
"hf_likes": 4,
"release_date": "2025-09-09",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Jan-v1-2509-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "1.3B",
"parameters_raw": 1345814520,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 4,
"hf_likes": 1,
"release_date": "2025-09-09",
"_discovered": true
},
{
"name": "cyankiwi/Tongyi-DeepResearch-30B-A3B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 358,
"hf_likes": 4,
"release_date": "2025-09-17",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Tongyi-DeepResearch-30B-A3B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 11,
"hf_likes": 4,
"release_date": "2025-09-17",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Magistral-Small-2509-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "5.3B",
"parameters_raw": 5254958640,
"min_ram_gb": 2.1,
"recommended_ram_gb": 4.2,
"min_vram_gb": 3.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 271,
"hf_likes": 3,
"release_date": "2025-09-20",
"_discovered": true
},
{
"name": "cyankiwi/Magistral-Small-2509-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8033685040,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 0,
"hf_likes": 1,
"release_date": "2025-09-20",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-Next-80B-A3B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "80.0B",
"parameters_raw": 80000000000,
"min_ram_gb": 53.1,
"recommended_ram_gb": 106.2,
"min_vram_gb": 88.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 80,
"hf_likes": 5,
"release_date": "2025-09-23",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-Next-80B-A3B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "80.0B",
"parameters_raw": 80000000000,
"min_ram_gb": 53.1,
"recommended_ram_gb": 106.2,
"min_vram_gb": 88.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 74,
"hf_likes": 4,
"release_date": "2025-09-23",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/KAT-Dev-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "6.4B",
"parameters_raw": 6432380800,
"min_ram_gb": 2.5,
"recommended_ram_gb": 5.0,
"min_vram_gb": 4.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-09-28",
"_discovered": true
},
{
"name": "cyankiwi/KAT-Dev-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "10.3B",
"parameters_raw": 10333083520,
"min_ram_gb": 7.1,
"recommended_ram_gb": 14.3,
"min_vram_gb": 11.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2025-09-28",
"_discovered": true
},
{
"name": "cyankiwi/cwm-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "6.4B",
"parameters_raw": 6421224320,
"min_ram_gb": 2.5,
"recommended_ram_gb": 5.0,
"min_vram_gb": 4.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 7,
"hf_likes": 1,
"release_date": "2025-09-28",
"_discovered": true
},
{
"name": "cyankiwi/cwm-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "10.3B",
"parameters_raw": 10296761216,
"min_ram_gb": 7.1,
"recommended_ram_gb": 14.2,
"min_vram_gb": 11.8,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2025-09-28",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-Omni-30B-A3B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "qwen3_omni_moe",
"hf_downloads": 7136,
"hf_likes": 8,
"release_date": "2025-09-28",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-Omni-30B-A3B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "qwen3_omni_moe",
"hf_downloads": 486,
"hf_likes": 1,
"release_date": "2025-09-29",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-Omni-30B-A3B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "qwen3_omni_moe",
"hf_downloads": 2081,
"hf_likes": 7,
"release_date": "2025-09-29",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-Omni-30B-A3B-Captioner-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "qwen3_omni_moe",
"hf_downloads": 660,
"hf_likes": 7,
"release_date": "2025-10-01",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-Omni-30B-A3B-Captioner-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "qwen3_omni_moe",
"hf_downloads": 12,
"hf_likes": 0,
"release_date": "2025-10-01",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Apriel-1.5-15b-Thinker-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "15.0B",
"parameters_raw": 15000000000,
"min_ram_gb": 5.5,
"recommended_ram_gb": 11.0,
"min_vram_gb": 9.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llava",
"hf_downloads": 5,
"hf_likes": 2,
"release_date": "2025-10-02",
"_discovered": true
},
{
"name": "cyankiwi/Apriel-1.5-15b-Thinker-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "15.0B",
"parameters_raw": 15000000000,
"min_ram_gb": 10.2,
"recommended_ram_gb": 20.4,
"min_vram_gb": 17.0,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llava",
"hf_downloads": 0,
"hf_likes": 1,
"release_date": "2025-10-02",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-30B-A3B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl_moe",
"hf_downloads": 19000,
"hf_likes": 5,
"release_date": "2025-10-06",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-VL-30B-A3B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl_moe",
"hf_downloads": 205,
"hf_likes": 3,
"release_date": "2025-10-07",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-VL-30B-A3B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl_moe",
"hf_downloads": 16,
"hf_likes": 4,
"release_date": "2025-10-07",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/granite-4.0-h-micro-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "0.9B",
"parameters_raw": 878516304,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.0,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granitemoehybrid",
"hf_downloads": 44,
"hf_likes": 0,
"release_date": "2025-10-08",
"_discovered": true
},
{
"name": "cyankiwi/granite-4.0-h-micro-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "1.3B",
"parameters_raw": 1251612752,
"min_ram_gb": 1.1,
"recommended_ram_gb": 2.3,
"min_vram_gb": 1.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granitemoehybrid",
"hf_downloads": 52,
"hf_likes": 0,
"release_date": "2025-10-08",
"_discovered": true
},
{
"name": "cyankiwi/KAT-Dev-72B-Exp-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "72.0B",
"parameters_raw": 72000000000,
"min_ram_gb": 25.4,
"recommended_ram_gb": 50.8,
"min_vram_gb": 42.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1,
"hf_likes": 2,
"release_date": "2025-10-11",
"_discovered": true
},
{
"name": "cyankiwi/granite-4.0-h-tiny-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "2.8B",
"parameters_raw": 2752073520,
"min_ram_gb": 2.1,
"recommended_ram_gb": 4.2,
"min_vram_gb": 3.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granitemoehybrid",
"hf_downloads": 326,
"hf_likes": 0,
"release_date": "2025-10-13",
"_discovered": true
},
{
"name": "cyankiwi/granite-4.0-h-small-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "9.7B",
"parameters_raw": 9686022896,
"min_ram_gb": 3.7,
"recommended_ram_gb": 7.3,
"min_vram_gb": 6.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granitemoehybrid",
"hf_downloads": 78,
"hf_likes": 1,
"release_date": "2025-10-13",
"_discovered": true
},
{
"name": "cyankiwi/granite-4.0-h-small-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "13.1B",
"parameters_raw": 13083409136,
"min_ram_gb": 8.9,
"recommended_ram_gb": 17.9,
"min_vram_gb": 14.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granitemoehybrid",
"hf_downloads": 1,
"hf_likes": 1,
"release_date": "2025-10-13",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-8B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 2351,
"hf_likes": 4,
"release_date": "2025-10-14",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-8B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 847,
"hf_likes": 2,
"release_date": "2025-10-14",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-8B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 67,
"hf_likes": 4,
"release_date": "2025-10-14",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-4B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 199,
"hf_likes": 3,
"release_date": "2025-10-14",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-4B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 9,
"hf_likes": 0,
"release_date": "2025-10-14",
"_discovered": true
},
{
"name": "cyankiwi/LFM2-8B-A1B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 34,
"hf_likes": 1,
"release_date": "2025-10-20",
"_discovered": true,
"is_moe": true,
"active_parameters": 1000000000
},
{
"name": "cyankiwi/LFM2-8B-A1B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 8,
"hf_likes": 0,
"release_date": "2025-10-20",
"_discovered": true,
"is_moe": true,
"active_parameters": 1000000000
},
{
"name": "cyankiwi/Qwen3-VL-32B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 11.5,
"recommended_ram_gb": 22.9,
"min_vram_gb": 19.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 6631,
"hf_likes": 5,
"release_date": "2025-10-21",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-32B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 11.5,
"recommended_ram_gb": 22.9,
"min_vram_gb": 19.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 112,
"hf_likes": 2,
"release_date": "2025-10-21",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-32B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 21.4,
"recommended_ram_gb": 42.8,
"min_vram_gb": 35.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 502,
"hf_likes": 1,
"release_date": "2025-10-22",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-32B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 21.4,
"recommended_ram_gb": 42.8,
"min_vram_gb": 35.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 898,
"hf_likes": 3,
"release_date": "2025-10-22",
"_discovered": true
},
{
"name": "cyankiwi/JanusCoder-14B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 10.3,
"min_vram_gb": 8.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-10-29",
"_discovered": true
},
{
"name": "cyankiwi/JanusCoder-14B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 9.5,
"recommended_ram_gb": 19.1,
"min_vram_gb": 15.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-10-29",
"_discovered": true
},
{
"name": "cyankiwi/JanusCoder-8B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-10-29",
"_discovered": true
},
{
"name": "cyankiwi/JanusCoder-8B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-10-29",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-Nemotron-32B-RLBFF-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 11.5,
"recommended_ram_gb": 22.9,
"min_vram_gb": 19.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2025-10-30",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-Nemotron-32B-RLBFF-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 21.4,
"recommended_ram_gb": 42.8,
"min_vram_gb": 35.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2025-10-30",
"_discovered": true
},
{
"name": "cyankiwi/Kimi-Linear-48B-A3B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "48.0B",
"parameters_raw": 48000000000,
"min_ram_gb": 17.0,
"recommended_ram_gb": 34.0,
"min_vram_gb": 28.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "kimi_linear",
"hf_downloads": 1653,
"hf_likes": 18,
"release_date": "2025-10-30",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Kimi-Linear-48B-A3B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "48.0B",
"parameters_raw": 48000000000,
"min_ram_gb": 32.0,
"recommended_ram_gb": 64.0,
"min_vram_gb": 53.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "kimi_linear",
"hf_downloads": 45,
"hf_likes": 4,
"release_date": "2025-10-31",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/MiniMax-M2-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "36.8B",
"parameters_raw": 36811839984,
"min_ram_gb": 13.1,
"recommended_ram_gb": 26.3,
"min_vram_gb": 21.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 69,
"hf_likes": 4,
"release_date": "2025-11-10",
"_discovered": true
},
{
"name": "cyankiwi/ERNIE-4.5-VL-28B-A3B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "28.0B",
"parameters_raw": 28000000000,
"min_ram_gb": 10.0,
"recommended_ram_gb": 20.0,
"min_vram_gb": 16.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "ernie4_5_moe_vl",
"hf_downloads": 24,
"hf_likes": 12,
"release_date": "2025-11-13",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/ERNIE-4.5-VL-28B-A3B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "28.0B",
"parameters_raw": 28000000000,
"min_ram_gb": 18.8,
"recommended_ram_gb": 37.6,
"min_vram_gb": 31.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "ernie4_5_moe_vl",
"hf_downloads": 21,
"hf_likes": 3,
"release_date": "2025-11-13",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/MiniMax-M2-REAP-162B-A10B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "162.0B",
"parameters_raw": 162000000000,
"min_ram_gb": 56.7,
"recommended_ram_gb": 113.4,
"min_vram_gb": 94.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 55,
"hf_likes": 4,
"release_date": "2025-11-18",
"_discovered": true,
"is_moe": true,
"active_parameters": 10000000000
},
{
"name": "cyankiwi/MiroThinker-v1.0-72B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "72.0B",
"parameters_raw": 72000000000,
"min_ram_gb": 25.4,
"recommended_ram_gb": 50.8,
"min_vram_gb": 42.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 5,
"hf_likes": 4,
"release_date": "2025-11-18",
"_discovered": true
},
{
"name": "cyankiwi/MiroThinker-v1.0-30B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 35,
"hf_likes": 2,
"release_date": "2025-11-18",
"_discovered": true
},
{
"name": "cyankiwi/MiroThinker-v1.0-30B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 16,
"hf_likes": 0,
"release_date": "2025-11-19",
"_discovered": true
},
{
"name": "cyankiwi/MiroThinker-v1.0-72B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "72.0B",
"parameters_raw": 72000000000,
"min_ram_gb": 47.8,
"recommended_ram_gb": 95.6,
"min_vram_gb": 79.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-11-19",
"_discovered": true
},
{
"name": "cyankiwi/Jan-v2-VL-high-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "2.9B",
"parameters_raw": 2906632936,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.6,
"min_vram_gb": 2.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 3,
"hf_likes": 2,
"release_date": "2025-11-20",
"_discovered": true
},
{
"name": "cyankiwi/Jan-v2-VL-high-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "3.8B",
"parameters_raw": 3774853864,
"min_ram_gb": 2.8,
"recommended_ram_gb": 5.6,
"min_vram_gb": 4.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 6,
"hf_likes": 1,
"release_date": "2025-11-20",
"_discovered": true
},
{
"name": "cyankiwi/Olmo-3-32B-Think-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 11.5,
"recommended_ram_gb": 22.9,
"min_vram_gb": 19.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 172,
"hf_likes": 2,
"release_date": "2025-11-20",
"_discovered": true
},
{
"name": "cyankiwi/Olmo-3-32B-Think-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 21.4,
"recommended_ram_gb": 42.8,
"min_vram_gb": 35.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-11-20",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.5-Air-Derestricted-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "18.6B",
"parameters_raw": 18626406504,
"min_ram_gb": 6.8,
"recommended_ram_gb": 13.6,
"min_vram_gb": 11.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 650,
"hf_likes": 3,
"release_date": "2025-11-28",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.5-Air-Derestricted-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "31.7B",
"parameters_raw": 31696906344,
"min_ram_gb": 21.2,
"recommended_ram_gb": 42.5,
"min_vram_gb": 35.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 21,
"hf_likes": 1,
"release_date": "2025-11-28",
"_discovered": true
},
{
"name": "cyankiwi/INTELLECT-3-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "18.6B",
"parameters_raw": 18626406504,
"min_ram_gb": 6.8,
"recommended_ram_gb": 13.6,
"min_vram_gb": 11.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 27,
"hf_likes": 3,
"release_date": "2025-11-29",
"_discovered": true
},
{
"name": "cyankiwi/INTELLECT-3-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "31.7B",
"parameters_raw": 31696906344,
"min_ram_gb": 21.2,
"recommended_ram_gb": 42.5,
"min_vram_gb": 35.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 14,
"hf_likes": 2,
"release_date": "2025-11-29",
"_discovered": true
},
{
"name": "cyankiwi/Nemotron-Orchestrator-8B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 437,
"hf_likes": 3,
"release_date": "2025-12-03",
"_discovered": true
},
{
"name": "cyankiwi/Nemotron-Orchestrator-8B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 28296,
"hf_likes": 4,
"release_date": "2025-12-03",
"_discovered": true
},
{
"name": "cyankiwi/Trinity-Mini-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "5.0B",
"parameters_raw": 5049586220,
"min_ram_gb": 2.0,
"recommended_ram_gb": 4.1,
"min_vram_gb": 3.4,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "afmoe",
"hf_downloads": 16,
"hf_likes": 0,
"release_date": "2025-12-03",
"_discovered": true
},
{
"name": "cyankiwi/Trinity-Mini-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.2B",
"parameters_raw": 8171721260,
"min_ram_gb": 5.7,
"recommended_ram_gb": 11.4,
"min_vram_gb": 9.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "afmoe",
"hf_downloads": 54,
"hf_likes": 1,
"release_date": "2025-12-03",
"_discovered": true
},
{
"name": "cyankiwi/Hermes-4.3-36B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "36.0B",
"parameters_raw": 36000000000,
"min_ram_gb": 24.1,
"recommended_ram_gb": 48.1,
"min_vram_gb": 40.1,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "seed_oss",
"hf_downloads": 96,
"hf_likes": 0,
"release_date": "2025-12-03",
"_discovered": true
},
{
"name": "cyankiwi/Hermes-4.3-36B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "36.0B",
"parameters_raw": 36000000000,
"min_ram_gb": 12.8,
"recommended_ram_gb": 25.7,
"min_vram_gb": 21.4,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "seed_oss",
"hf_downloads": 1560,
"hf_likes": 1,
"release_date": "2025-12-03",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-8B-Instruct-2512-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 44802,
"hf_likes": 2,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-8B-Instruct-2512-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 222,
"hf_likes": 1,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-8B-Reasoning-2512-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 201,
"hf_likes": 0,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-8B-Reasoning-2512-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 91,
"hf_likes": 1,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-14B-Instruct-2512-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 10.3,
"min_vram_gb": 8.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 11586,
"hf_likes": 6,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-14B-Instruct-2512-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 9.5,
"recommended_ram_gb": 19.1,
"min_vram_gb": 15.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 73,
"hf_likes": 0,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-14B-Reasoning-2512-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 10.3,
"min_vram_gb": 8.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 136375,
"hf_likes": 1,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-14B-Reasoning-2512-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 9.5,
"recommended_ram_gb": 19.1,
"min_vram_gb": 15.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 193,
"hf_likes": 0,
"release_date": "2025-12-04",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-3B-Instruct-2512-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "3.0B",
"parameters_raw": 3000000000,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.6,
"min_vram_gb": 2.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 429,
"hf_likes": 0,
"release_date": "2025-12-05",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-3B-Instruct-2512-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "3.0B",
"parameters_raw": 3000000000,
"min_ram_gb": 2.3,
"recommended_ram_gb": 4.6,
"min_vram_gb": 3.8,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 80,
"hf_likes": 1,
"release_date": "2025-12-05",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-3B-Reasoning-2512-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "3.0B",
"parameters_raw": 3000000000,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.6,
"min_vram_gb": 2.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 44,
"hf_likes": 0,
"release_date": "2025-12-05",
"_discovered": true
},
{
"name": "cyankiwi/Ministral-3-3B-Reasoning-2512-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "3.0B",
"parameters_raw": 3000000000,
"min_ram_gb": 2.3,
"recommended_ram_gb": 4.6,
"min_vram_gb": 3.8,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 41,
"hf_likes": 0,
"release_date": "2025-12-05",
"_discovered": true
},
{
"name": "cyankiwi/rnj-1-instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "2.3B",
"parameters_raw": 2267558336,
"min_ram_gb": 1.1,
"recommended_ram_gb": 2.2,
"min_vram_gb": 1.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma3_text",
"hf_downloads": 3,
"hf_likes": 2,
"release_date": "2025-12-06",
"_discovered": true
},
{
"name": "cyankiwi/rnj-1-instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "3.2B",
"parameters_raw": 3240636864,
"min_ram_gb": 2.5,
"recommended_ram_gb": 4.9,
"min_vram_gb": 4.1,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "gemma3_text",
"hf_downloads": 10,
"hf_likes": 1,
"release_date": "2025-12-06",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.6V-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "19.5B",
"parameters_raw": 19485088360,
"min_ram_gb": 7.1,
"recommended_ram_gb": 14.2,
"min_vram_gb": 11.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "glm4v_moe",
"hf_downloads": 1412,
"hf_likes": 12,
"release_date": "2025-12-08",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.6V-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.6B",
"parameters_raw": 32555588200,
"min_ram_gb": 21.8,
"recommended_ram_gb": 43.6,
"min_vram_gb": 36.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "glm4v_moe",
"hf_downloads": 22,
"hf_likes": 1,
"release_date": "2025-12-08",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.6V-Flash-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "3.4B",
"parameters_raw": 3409531872,
"min_ram_gb": 1.5,
"recommended_ram_gb": 3.0,
"min_vram_gb": 2.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "glm4v",
"hf_downloads": 1157,
"hf_likes": 2,
"release_date": "2025-12-08",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.6V-Flash-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "4.4B",
"parameters_raw": 4429272032,
"min_ram_gb": 3.2,
"recommended_ram_gb": 6.5,
"min_vram_gb": 5.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "glm4v",
"hf_downloads": 1062,
"hf_likes": 0,
"release_date": "2025-12-08",
"_discovered": true
},
{
"name": "cyankiwi/Devstral-Small-2-24B-Instruct-2512-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "24.0B",
"parameters_raw": 24000000000,
"min_ram_gb": 8.6,
"recommended_ram_gb": 17.3,
"min_vram_gb": 14.4,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "mistral3",
"hf_downloads": 114314,
"hf_likes": 11,
"release_date": "2025-12-10",
"_discovered": true
},
{
"name": "cyankiwi/Apriel-1.6-15b-Thinker-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "15.0B",
"parameters_raw": 15000000000,
"min_ram_gb": 5.5,
"recommended_ram_gb": 11.0,
"min_vram_gb": 9.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "llava",
"hf_downloads": 130,
"hf_likes": 2,
"release_date": "2025-12-10",
"_discovered": true
},
{
"name": "cyankiwi/Apriel-1.6-15b-Thinker-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "15.0B",
"parameters_raw": 15000000000,
"min_ram_gb": 10.2,
"recommended_ram_gb": 20.4,
"min_vram_gb": 17.0,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "llava",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-12-11",
"_discovered": true
},
{
"name": "cyankiwi/Olmo-3.1-32B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 11.5,
"recommended_ram_gb": 22.9,
"min_vram_gb": 19.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 470,
"hf_likes": 1,
"release_date": "2025-12-14",
"_discovered": true
},
{
"name": "cyankiwi/Olmo-3.1-32B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 21.4,
"recommended_ram_gb": 42.8,
"min_vram_gb": 35.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2025-12-14",
"_discovered": true
},
{
"name": "cyankiwi/Olmo-3.1-32B-Think-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 11.5,
"recommended_ram_gb": 22.9,
"min_vram_gb": 19.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 66,
"hf_likes": 0,
"release_date": "2025-12-14",
"_discovered": true
},
{
"name": "cyankiwi/Olmo-3.1-32B-Think-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.0B",
"parameters_raw": 32000000000,
"min_ram_gb": 21.4,
"recommended_ram_gb": 42.8,
"min_vram_gb": 35.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "olmo3",
"hf_downloads": 11,
"hf_likes": 0,
"release_date": "2025-12-14",
"_discovered": true
},
{
"name": "cyankiwi/Nemotron-Cascade-14B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 10.3,
"min_vram_gb": 8.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 22,
"hf_likes": 1,
"release_date": "2025-12-18",
"_discovered": true
},
{
"name": "cyankiwi/Nemotron-Cascade-14B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 9.5,
"recommended_ram_gb": 19.1,
"min_vram_gb": 15.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 4,
"hf_likes": 0,
"release_date": "2025-12-18",
"_discovered": true
},
{
"name": "cyankiwi/Nemotron-Cascade-8B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2025-12-18",
"_discovered": true
},
{
"name": "cyankiwi/Nemotron-Cascade-8B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 4,
"hf_likes": 0,
"release_date": "2025-12-18",
"_discovered": true
},
{
"name": "cyankiwi/QwenLong-L1.5-30B-A3B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 58,
"hf_likes": 2,
"release_date": "2025-12-18",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Nemotron-Cascade-8B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 78,
"hf_likes": 1,
"release_date": "2025-12-18",
"_discovered": true
},
{
"name": "cyankiwi/Nemotron-Cascade-8B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 5.6,
"recommended_ram_gb": 11.2,
"min_vram_gb": 9.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 1,
"release_date": "2025-12-18",
"_discovered": true
},
{
"name": "cyankiwi/nomos-1-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "5.3B",
"parameters_raw": 5306567040,
"min_ram_gb": 2.2,
"recommended_ram_gb": 4.3,
"min_vram_gb": 3.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 5,
"hf_likes": 1,
"release_date": "2025-12-23",
"_discovered": true
},
{
"name": "cyankiwi/nomos-1-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9043691904,
"min_ram_gb": 6.2,
"recommended_ram_gb": 12.5,
"min_vram_gb": 10.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2025-12-23",
"_discovered": true
},
{
"name": "cyankiwi/Solar-Open-100B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "100.0B",
"parameters_raw": 100000000000,
"min_ram_gb": 35.1,
"recommended_ram_gb": 70.2,
"min_vram_gb": 58.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "solar_open",
"hf_downloads": 393,
"hf_likes": 1,
"release_date": "2026-01-01",
"_discovered": true
},
{
"name": "cyankiwi/Solar-Open-100B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "100.0B",
"parameters_raw": 100000000000,
"min_ram_gb": 66.3,
"recommended_ram_gb": 132.6,
"min_vram_gb": 110.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "solar_open",
"hf_downloads": 17,
"hf_likes": 2,
"release_date": "2026-01-01",
"_discovered": true
},
{
"name": "cyankiwi/IQuest-Coder-V1-40B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "40.0B",
"parameters_raw": 40000000000,
"min_ram_gb": 14.2,
"recommended_ram_gb": 28.4,
"min_vram_gb": 23.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "iquestcoder",
"hf_downloads": 33,
"hf_likes": 2,
"release_date": "2026-01-02",
"_discovered": true
},
{
"name": "cyankiwi/IQuest-Coder-V1-40B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "40.0B",
"parameters_raw": 40000000000,
"min_ram_gb": 26.7,
"recommended_ram_gb": 53.4,
"min_vram_gb": 44.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "iquestcoder",
"hf_downloads": 14,
"hf_likes": 5,
"release_date": "2026-01-02",
"_discovered": true
},
{
"name": "cyankiwi/QwenLong-L1.5-30B-A3B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 1,
"hf_likes": 1,
"release_date": "2026-01-03",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/bu-30b-a3b-preview-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl_moe",
"hf_downloads": 880,
"hf_likes": 0,
"release_date": "2026-01-05",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/bu-30b-a3b-preview-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl_moe",
"hf_downloads": 3,
"hf_likes": 0,
"release_date": "2026-01-05",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/MiroThinker-v1.5-30B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 6,
"hf_likes": 2,
"release_date": "2026-01-06",
"_discovered": true
},
{
"name": "cyankiwi/MiroThinker-v1.5-235B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "235.0B",
"parameters_raw": 235000000000,
"min_ram_gb": 82.1,
"recommended_ram_gb": 164.2,
"min_vram_gb": 136.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 7,
"hf_likes": 3,
"release_date": "2026-01-06",
"_discovered": true
},
{
"name": "cyankiwi/MiroThinker-v1.5-235B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "235.0B",
"parameters_raw": 235000000000,
"min_ram_gb": 155.4,
"recommended_ram_gb": 310.8,
"min_vram_gb": 259.0,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2026-01-06",
"_discovered": true
},
{
"name": "cyankiwi/NousCoder-14B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 5.2,
"recommended_ram_gb": 10.3,
"min_vram_gb": 8.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 3,
"hf_likes": 0,
"release_date": "2026-01-08",
"_discovered": true
},
{
"name": "cyankiwi/NousCoder-14B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "14.0B",
"parameters_raw": 14000000000,
"min_ram_gb": 9.5,
"recommended_ram_gb": 19.1,
"min_vram_gb": 15.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2026-01-08",
"_discovered": true
},
{
"name": "cyankiwi/AI21-Jamba2-Mini-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "13.5B",
"parameters_raw": 13519598976,
"min_ram_gb": 5.0,
"recommended_ram_gb": 10.0,
"min_vram_gb": 8.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "jamba",
"hf_downloads": 4,
"hf_likes": 0,
"release_date": "2026-01-09",
"_discovered": true
},
{
"name": "cyankiwi/AI21-Jamba2-Mini-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "19.2B",
"parameters_raw": 19156743552,
"min_ram_gb": 13.0,
"recommended_ram_gb": 25.9,
"min_vram_gb": 21.6,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "jamba",
"hf_downloads": 5,
"hf_likes": 1,
"release_date": "2026-01-09",
"_discovered": true
},
{
"name": "cyankiwi/IQuest-Coder-V1-40B-Loop-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "40.0B",
"parameters_raw": 40000000000,
"min_ram_gb": 14.2,
"recommended_ram_gb": 28.4,
"min_vram_gb": 23.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "iquestloopcoder",
"hf_downloads": 613,
"hf_likes": 4,
"release_date": "2026-01-10",
"_discovered": true
},
{
"name": "cyankiwi/IQuest-Coder-V1-40B-Loop-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "40.0B",
"parameters_raw": 40000000000,
"min_ram_gb": 26.7,
"recommended_ram_gb": 53.4,
"min_vram_gb": 44.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "iquestloopcoder",
"hf_downloads": 3,
"hf_likes": 0,
"release_date": "2026-01-10",
"_discovered": true
},
{
"name": "cyankiwi/Baichuan-M3-235B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "235.0B",
"parameters_raw": 235000000000,
"min_ram_gb": 82.1,
"recommended_ram_gb": 164.2,
"min_vram_gb": 136.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 5,
"hf_likes": 2,
"release_date": "2026-01-13",
"_discovered": true
},
{
"name": "cyankiwi/DASD-30B-A3B-Thinking-Preview-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2026-01-18",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/DASD-30B-A3B-Thinking-Preview-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 4,
"hf_likes": 1,
"release_date": "2026-01-18",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/AgentCPM-Explore-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "1.3B",
"parameters_raw": 1345814520,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 103,
"hf_likes": 1,
"release_date": "2026-01-18",
"_discovered": true
},
{
"name": "cyankiwi/AgentCPM-Explore-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "1.8B",
"parameters_raw": 1799979000,
"min_ram_gb": 1.5,
"recommended_ram_gb": 3.0,
"min_vram_gb": 2.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 5,
"hf_likes": 0,
"release_date": "2026-01-18",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.7-Flash-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "32.1B",
"parameters_raw": 32140559382,
"min_ram_gb": 21.5,
"recommended_ram_gb": 43.1,
"min_vram_gb": 35.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe_lite",
"hf_downloads": 225,
"hf_likes": 17,
"release_date": "2026-01-19",
"_discovered": true
},
{
"name": "cyankiwi/DASD-4B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 1.7,
"recommended_ram_gb": 3.4,
"min_vram_gb": 2.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 4,
"hf_likes": 1,
"release_date": "2026-01-20",
"_discovered": true
},
{
"name": "cyankiwi/DASD-4B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 3,
"hf_likes": 0,
"release_date": "2026-01-20",
"_discovered": true
},
{
"name": "cyankiwi/Step3-VL-10B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "10.0B",
"parameters_raw": 10000000000,
"min_ram_gb": 3.8,
"recommended_ram_gb": 7.6,
"min_vram_gb": 6.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "step_robotics",
"hf_downloads": 255,
"hf_likes": 0,
"release_date": "2026-01-23",
"_discovered": true
},
{
"name": "cyankiwi/Step3-VL-10B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "10.0B",
"parameters_raw": 10000000000,
"min_ram_gb": 6.9,
"recommended_ram_gb": 13.8,
"min_vram_gb": 11.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "step_robotics",
"hf_downloads": 33,
"hf_likes": 1,
"release_date": "2026-01-23",
"_discovered": true
},
{
"name": "cyankiwi/GLM-4.7-Flash-REAP-23B-A3B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "23.0B",
"parameters_raw": 23000000000,
"min_ram_gb": 15.5,
"recommended_ram_gb": 31.0,
"min_vram_gb": 25.8,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe_lite",
"hf_downloads": 53,
"hf_likes": 3,
"release_date": "2026-01-25",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/AgentCPM-Report-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "1.8B",
"parameters_raw": 1786843584,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minicpm",
"hf_downloads": 6,
"hf_likes": 1,
"release_date": "2026-01-26",
"_discovered": true
},
{
"name": "cyankiwi/AgentCPM-Report-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "2.7B",
"parameters_raw": 2734756288,
"min_ram_gb": 2.1,
"recommended_ram_gb": 4.2,
"min_vram_gb": 3.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minicpm",
"hf_downloads": 4,
"hf_likes": 1,
"release_date": "2026-01-26",
"_discovered": true
},
{
"name": "cyankiwi/MiniMax-M2.1-REAP-172B-A10B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "172.0B",
"parameters_raw": 172000000000,
"min_ram_gb": 60.2,
"recommended_ram_gb": 120.4,
"min_vram_gb": 100.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 28,
"hf_likes": 0,
"release_date": "2026-02-03",
"_discovered": true,
"is_moe": true,
"active_parameters": 10000000000
},
{
"name": "cyankiwi/Qwen3-VL-2B-Instruct-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 32348,
"hf_likes": 1,
"release_date": "2026-02-05",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-2B-Instruct-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.6,
"recommended_ram_gb": 3.2,
"min_vram_gb": 2.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 83,
"hf_likes": 0,
"release_date": "2026-02-05",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-2B-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 438,
"hf_likes": 0,
"release_date": "2026-02-05",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-VL-2B-Thinking-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.6,
"recommended_ram_gb": 3.2,
"min_vram_gb": 2.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_vl",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2026-02-05",
"_discovered": true
},
{
"name": "cyankiwi/MiniCPM-SALA-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 1988798976,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minicpm_sala",
"hf_downloads": 48,
"hf_likes": 1,
"release_date": "2026-02-15",
"_discovered": true
},
{
"name": "cyankiwi/MiniCPM-SALA-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "3.1B",
"parameters_raw": 3098192384,
"min_ram_gb": 2.3,
"recommended_ram_gb": 4.7,
"min_vram_gb": 3.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minicpm_sala",
"hf_downloads": 200,
"hf_likes": 0,
"release_date": "2026-02-15",
"_discovered": true
},
{
"name": "cyankiwi/Nanbeige4.1-3B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "3.0B",
"parameters_raw": 3000000000,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.6,
"min_vram_gb": 2.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 271,
"hf_likes": 1,
"release_date": "2026-02-15",
"_discovered": true
},
{
"name": "cyankiwi/VulnLLM-R-7B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "7.0B",
"parameters_raw": 7000000000,
"min_ram_gb": 2.8,
"recommended_ram_gb": 5.5,
"min_vram_gb": 4.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 1,
"hf_likes": 0,
"release_date": "2026-02-18",
"_discovered": true
},
{
"name": "cyankiwi/VulnLLM-R-7B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "7.0B",
"parameters_raw": 7000000000,
"min_ram_gb": 4.9,
"recommended_ram_gb": 9.8,
"min_vram_gb": 8.2,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen2",
"hf_downloads": 7,
"hf_likes": 1,
"release_date": "2026-02-18",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-397B-A17B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "397.0B",
"parameters_raw": 397000000000,
"min_ram_gb": 138.5,
"recommended_ram_gb": 277.0,
"min_vram_gb": 230.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 1389,
"hf_likes": 2,
"release_date": "2026-02-18",
"_discovered": true,
"is_moe": true,
"active_parameters": 17000000000
},
{
"name": "cyankiwi/INTELLECT-3.1-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "18.6B",
"parameters_raw": 18626406504,
"min_ram_gb": 6.8,
"recommended_ram_gb": 13.6,
"min_vram_gb": 11.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 13,
"hf_likes": 0,
"release_date": "2026-02-18",
"_discovered": true
},
{
"name": "cyankiwi/JoyAI-LLM-Flash-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "8.3B",
"parameters_raw": 8326243206,
"min_ram_gb": 3.2,
"recommended_ram_gb": 6.4,
"min_vram_gb": 5.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 2,
"hf_likes": 3,
"release_date": "2026-02-18",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3-Coder-Next-REAM-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "79.7B",
"parameters_raw": 79674391296,
"min_ram_gb": 22.3,
"recommended_ram_gb": 44.6,
"min_vram_gb": 40.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "Coding",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 695,
"hf_likes": 10,
"release_date": "2026-02-19",
"is_moe": true,
"num_experts": 512,
"active_experts": 10,
"active_parameters": null,
"_discovered": true,
"format": "awq"
},
{
"name": "cyankiwi/INTELLECT-3.1-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "31.7B",
"parameters_raw": 31696906344,
"min_ram_gb": 21.2,
"recommended_ram_gb": 42.5,
"min_vram_gb": 35.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm4_moe",
"hf_downloads": 4,
"hf_likes": 0,
"release_date": "2026-02-20",
"_discovered": true
},
{
"name": "cyankiwi/JoyAI-LLM-Flash-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "14.3B",
"parameters_raw": 14343480198,
"min_ram_gb": 9.8,
"recommended_ram_gb": 19.6,
"min_vram_gb": 16.3,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "deepseek_v3",
"hf_downloads": 0,
"hf_likes": 0,
"release_date": "2026-02-20",
"_discovered": true
},
{
"name": "cyankiwi/Ovis2.6-30B-A3B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "ovis2_6_moe",
"hf_downloads": 65,
"hf_likes": 0,
"release_date": "2026-02-20",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Ovis2.6-30B-A3B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "ovis2_6_moe",
"hf_downloads": 241,
"hf_likes": 1,
"release_date": "2026-02-20",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Qwen3-Coder-Next-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "24.1B",
"parameters_raw": 24108399360,
"min_ram_gb": 16.2,
"recommended_ram_gb": 32.4,
"min_vram_gb": 27.0,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 826,
"hf_likes": 5,
"release_date": "2026-02-20",
"_discovered": true
},
{
"name": "cyankiwi/MiniMax-M2.5-REAP-139B-A10B-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "139.0B",
"parameters_raw": 139000000000,
"min_ram_gb": 48.7,
"recommended_ram_gb": 97.3,
"min_vram_gb": 81.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 121866,
"hf_likes": 13,
"release_date": "2026-02-25",
"_discovered": true,
"is_moe": true,
"active_parameters": 10000000000
},
{
"name": "cyankiwi/LFM2-24B-A2B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "24.0B",
"parameters_raw": 24000000000,
"min_ram_gb": 16.1,
"recommended_ram_gb": 32.3,
"min_vram_gb": 26.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "lfm2_moe",
"hf_downloads": 52,
"hf_likes": 0,
"release_date": "2026-02-25",
"_discovered": true,
"is_moe": true,
"active_parameters": 2000000000
},
{
"name": "cyankiwi/Qwen3.5-122B-A10B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "122.0B",
"parameters_raw": 122000000000,
"min_ram_gb": 80.8,
"recommended_ram_gb": 161.6,
"min_vram_gb": 134.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 4323,
"hf_likes": 4,
"release_date": "2026-03-01",
"_discovered": true,
"is_moe": true,
"active_parameters": 10000000000
},
{
"name": "cyankiwi/Jan-code-4b-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 1.7,
"recommended_ram_gb": 3.4,
"min_vram_gb": 2.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 9,
"hf_likes": 0,
"release_date": "2026-03-02",
"_discovered": true
},
{
"name": "cyankiwi/Jan-code-4b-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3",
"hf_downloads": 10,
"hf_likes": 2,
"release_date": "2026-03-02",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-9B-AWQ-BF16-INT4",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 3.4,
"recommended_ram_gb": 6.8,
"min_vram_gb": 5.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 8058,
"hf_likes": 7,
"release_date": "2026-03-02",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-2B-AWQ-BF16-INT4",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 1.7,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 210,
"hf_likes": 1,
"release_date": "2026-03-02",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-2B-AWQ-BF16-INT8",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.6,
"recommended_ram_gb": 3.2,
"min_vram_gb": 2.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 828,
"hf_likes": 1,
"release_date": "2026-03-02",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-4B-AWQ-BF16-INT8",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 4421,
"hf_likes": 3,
"release_date": "2026-03-02",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-9B-AWQ-BF16-INT8",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 6.2,
"recommended_ram_gb": 12.5,
"min_vram_gb": 10.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 20406,
"hf_likes": 0,
"release_date": "2026-03-02",
"_discovered": true
},
{
"name": "cyankiwi/GLM-5-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "766.9B",
"parameters_raw": 766947340782,
"min_ram_gb": 267.2,
"recommended_ram_gb": 534.4,
"min_vram_gb": 445.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm_moe_dsa",
"hf_downloads": 2,
"hf_likes": 0,
"release_date": "2026-03-06",
"_discovered": true
},
{
"name": "cyankiwi/SVD-Qwen3-Coder-Next-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "14.4B",
"parameters_raw": 14444722944,
"min_ram_gb": 5.3,
"recommended_ram_gb": 10.7,
"min_vram_gb": 8.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_next",
"hf_downloads": 30,
"hf_likes": 2,
"release_date": "2026-03-09",
"_discovered": true
},
{
"name": "cyankiwi/OmniCoder-9B-AWQ-BF16-INT8",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 6.2,
"recommended_ram_gb": 12.5,
"min_vram_gb": 10.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_5",
"hf_downloads": 132,
"hf_likes": 1,
"release_date": "2026-03-14",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-27B-AWQ-INT8-INT4",
"provider": "cyankiwi",
"parameter_count": "27.0B",
"parameters_raw": 27000000000,
"min_ram_gb": 18.1,
"recommended_ram_gb": 36.2,
"min_vram_gb": 30.2,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 531,
"hf_likes": 2,
"release_date": "2026-03-29",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-9B-AWQ-INT8-INT4",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9000000000,
"min_ram_gb": 6.2,
"recommended_ram_gb": 12.5,
"min_vram_gb": 10.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 3925,
"hf_likes": 2,
"release_date": "2026-03-29",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-4B-AWQ-INT8-INT4",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 20289,
"hf_likes": 2,
"release_date": "2026-03-29",
"_discovered": true
},
{
"name": "cyankiwi/Qwen3.5-2B-AWQ-INT8-INT4",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.6,
"recommended_ram_gb": 3.2,
"min_vram_gb": 2.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 397,
"hf_likes": 1,
"release_date": "2026-03-29",
"_discovered": true
},
{
"name": "cyankiwi/MiroThinker-1.7-mini-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "5.3B",
"parameters_raw": 5306567040,
"min_ram_gb": 2.2,
"recommended_ram_gb": 4.3,
"min_vram_gb": 3.6,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 44,
"hf_likes": 1,
"release_date": "2026-04-01",
"_discovered": true
},
{
"name": "cyankiwi/MiroThinker-1.7-mini-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "9.0B",
"parameters_raw": 9043691904,
"min_ram_gb": 6.2,
"recommended_ram_gb": 12.5,
"min_vram_gb": 10.4,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "qwen3_moe",
"hf_downloads": 3,
"hf_likes": 0,
"release_date": "2026-04-01",
"_discovered": true
},
{
"name": "cyankiwi/gemma-4-26B-A4B-it-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "26.0B",
"parameters_raw": 26000000000,
"min_ram_gb": 17.5,
"recommended_ram_gb": 34.9,
"min_vram_gb": 29.1,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "gemma4",
"hf_downloads": 291580,
"hf_likes": 8,
"release_date": "2026-04-03",
"_discovered": true,
"is_moe": true,
"active_parameters": 4000000000
},
{
"name": "cyankiwi/Nemotron-Cascade-2-30B-A3B-AWQ-8bit",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 20.1,
"recommended_ram_gb": 40.2,
"min_vram_gb": 33.5,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "nvidia",
"hf_downloads": 111,
"hf_likes": 1,
"release_date": "2026-04-08",
"_discovered": true,
"is_moe": true,
"active_parameters": 3000000000
},
{
"name": "cyankiwi/Trinity-Large-Thinking-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "65.5B",
"parameters_raw": 65542882332,
"min_ram_gb": 23.1,
"recommended_ram_gb": 46.2,
"min_vram_gb": 38.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "afmoe",
"hf_downloads": 175,
"hf_likes": 2,
"release_date": "2026-04-08",
"_discovered": true
},
{
"name": "cyankiwi/GLM-5.1-AWQ-4bit",
"provider": "cyankiwi",
"parameter_count": "766.9B",
"parameters_raw": 766909554882,
"min_ram_gb": 267.2,
"recommended_ram_gb": 534.4,
"min_vram_gb": 445.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "glm_moe_dsa",
"hf_downloads": 8512,
"hf_likes": 11,
"release_date": "2026-04-10",
"_discovered": true
},
{
"name": "cyankiwi/granite-4.1-8b-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granite",
"hf_downloads": 1920,
"hf_likes": 1,
"release_date": "2026-05-01",
"_discovered": true
},
{
"name": "cyankiwi/granite-4.1-30b-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "30.0B",
"parameters_raw": 30000000000,
"min_ram_gb": 10.7,
"recommended_ram_gb": 21.5,
"min_vram_gb": 17.9,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granite",
"hf_downloads": 1318,
"hf_likes": 1,
"release_date": "2026-05-03",
"_discovered": true
},
{
"name": "cyankiwi/gemma-4-E4B-it-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 1.7,
"recommended_ram_gb": 3.4,
"min_vram_gb": 2.8,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "gemma4",
"hf_downloads": 188508,
"hf_likes": 2,
"release_date": "2026-05-03",
"_discovered": true
},
{
"name": "cyankiwi/GRM-2.6-Plus-AWQ-BF16-INT4",
"provider": "cyankiwi",
"parameter_count": "29.0B",
"parameters_raw": 28979098878,
"min_ram_gb": 10.4,
"recommended_ram_gb": 20.8,
"min_vram_gb": 17.3,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 237,
"hf_likes": 1,
"release_date": "2026-05-04",
"_discovered": true
},
{
"name": "cyankiwi/GRM-2.6-Plus-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "29.3B",
"parameters_raw": 29325129246,
"min_ram_gb": 10.5,
"recommended_ram_gb": 21.0,
"min_vram_gb": 17.5,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 1528,
"hf_likes": 0,
"release_date": "2026-05-04",
"_discovered": true
},
{
"name": "cyankiwi/granite-4.1-3b-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "3.0B",
"parameters_raw": 3000000000,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.6,
"min_vram_gb": 2.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "granite",
"hf_downloads": 143,
"hf_likes": 0,
"release_date": "2026-05-05",
"_discovered": true
},
{
"name": "cyankiwi/gemma-4-E4B-it-AWQ-INT8",
"provider": "cyankiwi",
"parameter_count": "4.0B",
"parameters_raw": 4000000000,
"min_ram_gb": 2.9,
"recommended_ram_gb": 5.9,
"min_vram_gb": 4.9,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "gemma4",
"hf_downloads": 9631,
"hf_likes": 0,
"release_date": "2026-05-06",
"_discovered": true
},
{
"name": "cyankiwi/gemma-4-E2B-it-AWQ-INT8",
"provider": "cyankiwi",
"parameter_count": "2.0B",
"parameters_raw": 2000000000,
"min_ram_gb": 1.6,
"recommended_ram_gb": 3.2,
"min_vram_gb": 2.7,
"quantization": "AWQ-8bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "any-to-any",
"architecture": "gemma4",
"hf_downloads": 242,
"hf_likes": 0,
"release_date": "2026-05-06",
"_discovered": true
},
{
"name": "cyankiwi/Llama-3.3-70B-Instruct-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "70.0B",
"parameters_raw": 70000000000,
"min_ram_gb": 24.7,
"recommended_ram_gb": 49.3,
"min_vram_gb": 41.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 33,
"hf_likes": 0,
"release_date": "2026-05-07",
"_discovered": true
},
{
"name": "cyankiwi/Llama-3.1-8B-Instruct-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "8.0B",
"parameters_raw": 8000000000,
"min_ram_gb": 3.1,
"recommended_ram_gb": 6.1,
"min_vram_gb": 5.1,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 149,
"hf_likes": 0,
"release_date": "2026-05-12",
"_discovered": true
},
{
"name": "cyankiwi/Llama-3.2-3B-Instruct-AWQ-INT4",
"provider": "cyankiwi",
"parameter_count": "3.0B",
"parameters_raw": 3000000000,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.6,
"min_vram_gb": 2.2,
"quantization": "AWQ-4bit",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "llama",
"hf_downloads": 425,
"hf_likes": 0,
"release_date": "2026-05-12",
"_discovered": true
},
{
"name": "MiniMaxAI/MiniMax-M2.7",
"provider": "MiniMaxAI",
"parameter_count": "228.7B",
"parameters_raw": 228700000000,
"min_ram_gb": 240.0,
"recommended_ram_gb": 280.0,
"min_vram_gb": 240.0,
"quantization": "FP8",
"context_length": 196608,
"use_case": "Chat, reasoning, tool use",
"capabilities": [
"tool_use"
],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 534825,
"hf_likes": 1134,
"release_date": "2026-04-09",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 13600000000
},
{
"name": "bullerwins/MiniMax-M2.7-REAP-172B-fp8",
"provider": "bullerwins",
"parameter_count": "172B",
"parameters_raw": 172000000000,
"min_ram_gb": 113.8,
"recommended_ram_gb": 227.6,
"min_vram_gb": 189.7,
"quantization": "FP8",
"context_length": 32768,
"use_case": "General purpose",
"capabilities": [],
"pipeline_tag": "text-generation",
"architecture": "minimax_m2",
"hf_downloads": 9,
"hf_likes": 0,
"release_date": "2026-04-19",
"_discovered": true
},
{
"name": "Qwen/Qwen3.6-27B-MTP",
"provider": "Qwen",
"parameter_count": "27.8B",
"parameters_raw": 27781427952,
"min_ram_gb": 16.6,
"recommended_ram_gb": 21.6,
"min_vram_gb": 16.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, coding, MTP",
"is_moe": false,
"num_experts": null,
"active_experts": null,
"active_parameters": null,
"architecture": "qwen3",
"pipeline_tag": "text-generation",
"release_date": "2026-04-01",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.6-27B-MTP-GGUF",
"provider": "unsloth"
}
],
"capabilities": [
"mtp"
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.6-35B-A3B-MTP",
"provider": "Qwen",
"parameter_count": "36.0B",
"parameters_raw": 35951822704,
"min_ram_gb": 21.4,
"recommended_ram_gb": 27.8,
"min_vram_gb": 21.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose (MoE), MTP",
"is_moe": true,
"num_experts": null,
"active_experts": null,
"active_parameters": 3000000000,
"architecture": "qwen3_moe",
"pipeline_tag": "text-generation",
"release_date": "2026-04-01",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.6-35B-A3B-MTP-GGUF",
"provider": "unsloth"
}
],
"capabilities": [
"mtp"
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-0.8B-MTP",
"provider": "Qwen",
"parameter_count": "873M",
"parameters_raw": 873438784,
"min_ram_gb": 1.0,
"recommended_ram_gb": 2.0,
"min_vram_gb": 0.5,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, MTP",
"capabilities": [
"mtp",
"tool_use",
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 93448,
"hf_likes": 208,
"release_date": "2026-02-28",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-0.8B-MTP-GGUF",
"provider": "unsloth"
}
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-2B-MTP",
"provider": "Qwen",
"parameter_count": "2.3B",
"parameters_raw": 2274069824,
"min_ram_gb": 1.3,
"recommended_ram_gb": 2.1,
"min_vram_gb": 1.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, MTP",
"capabilities": [
"mtp",
"tool_use",
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 46974,
"hf_likes": 115,
"release_date": "2026-02-28",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-2B-MTP-GGUF",
"provider": "unsloth"
}
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-4B-MTP",
"provider": "Qwen",
"parameter_count": "4.7B",
"parameters_raw": 4659865088,
"min_ram_gb": 2.6,
"recommended_ram_gb": 4.3,
"min_vram_gb": 2.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, MTP",
"capabilities": [
"mtp",
"tool_use",
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 99087,
"hf_likes": 202,
"release_date": "2026-02-27",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-4B-MTP-GGUF",
"provider": "unsloth"
}
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-9B-MTP",
"provider": "Qwen",
"parameter_count": "9.7B",
"parameters_raw": 9653104368,
"min_ram_gb": 5.4,
"recommended_ram_gb": 9.0,
"min_vram_gb": 4.9,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, MTP",
"capabilities": [
"mtp",
"tool_use",
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 172298,
"hf_likes": 345,
"release_date": "2026-02-27",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-9B-MTP-GGUF",
"provider": "unsloth"
}
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-27B-MTP",
"provider": "Qwen",
"parameter_count": "27.8B",
"parameters_raw": 27781427952,
"min_ram_gb": 15.5,
"recommended_ram_gb": 25.9,
"min_vram_gb": 14.2,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, MTP",
"capabilities": [
"mtp",
"tool_use",
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5",
"hf_downloads": 406808,
"hf_likes": 565,
"release_date": "2026-02-24",
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-27B-MTP-GGUF",
"provider": "unsloth"
}
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-35B-A3B-MTP",
"provider": "Qwen",
"parameter_count": "36.0B",
"parameters_raw": 35951822704,
"min_ram_gb": 20.1,
"recommended_ram_gb": 33.5,
"min_vram_gb": 18.4,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, MTP",
"capabilities": [
"mtp",
"tool_use",
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 769032,
"hf_likes": 905,
"release_date": "2026-02-24",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 3000000000,
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-35B-A3B-MTP-GGUF",
"provider": "unsloth"
}
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-122B-A10B-MTP",
"provider": "Qwen",
"parameter_count": "125.1B",
"parameters_raw": 125086497008,
"min_ram_gb": 69.9,
"recommended_ram_gb": 116.5,
"min_vram_gb": 64.1,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, MTP",
"capabilities": [
"mtp",
"tool_use",
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 171055,
"hf_likes": 389,
"release_date": "2026-02-24",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 10000000000,
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-122B-A10B-MTP-GGUF",
"provider": "unsloth"
}
],
"_discovered": true
},
{
"name": "Qwen/Qwen3.5-397B-A17B-MTP",
"provider": "Qwen",
"parameter_count": "403.4B",
"parameters_raw": 403397928944,
"min_ram_gb": 225.4,
"recommended_ram_gb": 375.7,
"min_vram_gb": 206.6,
"quantization": "Q4_K_M",
"context_length": 262144,
"use_case": "General purpose, MTP",
"capabilities": [
"mtp",
"tool_use",
"vision"
],
"pipeline_tag": "image-text-to-text",
"architecture": "qwen3_5_moe",
"hf_downloads": 1291825,
"hf_likes": 1214,
"release_date": "2026-02-16",
"is_moe": true,
"num_experts": 256,
"active_experts": 8,
"active_parameters": 17000000000,
"gguf_sources": [
{
"repo": "unsloth/Qwen3.5-397B-A17B-MTP-GGUF",
"provider": "unsloth"
}
],
"_discovered": true
}
]