[ { "name": "echarlaix/tiny-random-PhiForCausalLM", "provider": "echarlaix", "parameter_count": "80K", "parameters_raw": 80074, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 512, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi", "hf_downloads": 24984, "hf_likes": 0, "release_date": "2024-03-29", "_discovered": true }, { "name": "peft-internal-testing/tiny-random-GPT2LMHeadModel", "provider": "peft-internal-testing", "parameter_count": "83K", "parameters_raw": 83161, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 512, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt2", "hf_downloads": 37534, "hf_likes": 0, "release_date": "2025-11-17", "_discovered": true }, { "name": "peft-internal-testing/tiny-random-gpt2", "provider": "peft-internal-testing", "parameter_count": "112K", "parameters_raw": 111968, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 512, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt2", "hf_downloads": 28458, "hf_likes": 0, "release_date": "2025-11-17", "_discovered": true }, { "name": "peft-internal-testing/tiny-random-GPTJForCausalLM", "provider": "peft-internal-testing", "parameter_count": "129K", "parameters_raw": 129184, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 512, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gptj", "hf_downloads": 38953, "hf_likes": 0, "release_date": "2025-11-17", "_discovered": true }, { "name": "allenai/Olmo-3-7B-Instruct", "provider": "allenai", "parameter_count": "528K", "parameters_raw": 528384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 101787, "hf_likes": 118, "release_date": "2025-11-19", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/Olmo-3-7B-Instruct-GGUF", "provider": "unsloth" } ] }, { "name": "allenai/Olmo-3-7B-Think", "provider": "allenai", "parameter_count": "528K", "parameters_raw": 528384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 44414, "hf_likes": 88, "release_date": "2025-11-18", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/Olmo-3-7B-Think-GGUF", "provider": "unsloth" } ] }, { "name": "allenai/Olmo-3-7B-Think-DPO", "provider": "allenai", "parameter_count": "528K", "parameters_raw": 528384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 21555, "hf_likes": 7, "release_date": "2025-11-18", "_discovered": true }, { "name": "MaxJeblick/llama2-0b-unit-test", "provider": "maxjeblick", "parameter_count": "771K", "parameters_raw": 770940, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 1024, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 48409, "hf_likes": 2, "release_date": "2023-10-25", "_discovered": true }, { "name": "peft-internal-testing/tiny-random-OPTForCausalLM", "provider": "peft-internal-testing", "parameter_count": "812K", "parameters_raw": 812404, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 100, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "opt", "hf_downloads": 388627, "hf_likes": 0, "release_date": "2025-11-13", "_discovered": true }, { "name": "hmellor/tiny-random-LlamaForCausalLM", "provider": "hmellor", "parameter_count": "1M", "parameters_raw": 1062992, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 1295572, "hf_likes": 0, "release_date": "2025-04-29", "_discovered": true }, { "name": "peft-internal-testing/tiny-dummy-qwen2", "provider": "peft-internal-testing", "parameter_count": "1M", "parameters_raw": 1217480, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 102441, "hf_likes": 0, "release_date": "2024-07-04", "_discovered": true }, { "name": "SimpleStories/SimpleStories-1.25M", "provider": "simplestories", "parameter_count": "1M", "parameters_raw": 1245824, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 512, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 86406, "hf_likes": 1, "release_date": "2025-04-22", "_discovered": true }, { "name": "optimum-intel-internal-testing/tiny-random-Phi3ForCausalLM", "provider": "optimum-intel-internal-testing", "parameter_count": "2M", "parameters_raw": 2072736, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 22058, "hf_likes": 0, "release_date": "2025-10-21", "_discovered": true }, { "name": "llamafactory/tiny-random-qwen3", "provider": "llamafactory", "parameter_count": "2M", "parameters_raw": 2439264, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Lightweight, edge deployment", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 47369, "hf_likes": 0, "release_date": "2026-01-06", "_discovered": true }, { "name": "tiny-random/qwen3-next-moe", "provider": "tiny-random", "parameter_count": "3M", "parameters_raw": 2839160, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Lightweight, edge deployment", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 27920, "hf_likes": 4, "release_date": "2025-09-12", "is_moe": true, "num_experts": 32, "active_experts": 10, "active_parameters": 984828, "_discovered": true }, { "name": "llamafactory/tiny-random-Llama-3", "provider": "llamafactory", "parameter_count": "4M", "parameters_raw": 4112464, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 950276, "hf_likes": 3, "release_date": "2024-06-07", "_discovered": true }, { "name": "Maykeye/TinyLLama-v0", "provider": "maykeye", "parameter_count": "5M", "parameters_raw": 4621392, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 32384, "hf_likes": 43, "release_date": "2023-07-08", "_discovered": true }, { "name": "optimum-intel-internal-testing/tiny-random-gpt-oss-mxfp4", "provider": "optimum-intel-internal-testing", "parameter_count": "7M", "parameters_raw": 6865444, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_oss", "hf_downloads": 27904, "hf_likes": 0, "release_date": "2025-10-21", "is_moe": true, "num_experts": 32, "active_experts": 4, "active_parameters": 1158540, "_discovered": true }, { "name": "hmellor/tiny-random-Gemma2ForCausalLM", "provider": "hmellor", "parameter_count": "8M", "parameters_raw": 8438816, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma2", "hf_downloads": 339841, "hf_likes": 0, "release_date": "2025-04-29", "_discovered": true }, { "name": "michaelbenayoun/llama-2-tiny-4kv-heads-4layers-random", "provider": "michaelbenayoun", "parameter_count": "9M", "parameters_raw": 8537216, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 52387, "hf_likes": 0, "release_date": "2024-03-28", "_discovered": true }, { "name": "tiiuae/falcon-mamba-tiny-dev", "provider": "TII", "parameter_count": "9M", "parameters_raw": 8765056, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "falcon_mamba", "hf_downloads": 21730, "hf_likes": 2, "release_date": "2024-10-13", "_discovered": true }, { "name": "arnir0/Tiny-LLM", "provider": "arnir0", "parameter_count": "13M", "parameters_raw": 12988992, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 1024, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 54600, "hf_likes": 45, "release_date": "2024-11-03", "_discovered": true }, { "name": "EleutherAI/pythia-14m", "provider": "eleutherai", "parameter_count": "14M", "parameters_raw": 14067712, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 33322, "hf_likes": 0, "release_date": "2026-02-24", "_discovered": true }, { "name": "hmellor/tiny-random-BambaForCausalLM", "provider": "hmellor", "parameter_count": "33M", "parameters_raw": 33110760, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "bamba", "hf_downloads": 173798, "hf_likes": 0, "release_date": "2025-04-29", "_discovered": true }, { "name": "erwanf/gpt2-mini", "provider": "erwanf", "parameter_count": "39M", "parameters_raw": 38604288, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 512, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt2", "hf_downloads": 391187, "hf_likes": 2, "release_date": "2024-06-23", "_discovered": true }, { "name": "EleutherAI/pythia-14m-deduped", "provider": "eleutherai", "parameter_count": "39M", "parameters_raw": 39233560, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 69404, "hf_likes": 28, "release_date": "2023-07-19", "_discovered": true }, { "name": "hyper-accel/tiny-random-llama", "provider": "hyper-accel", "parameter_count": "73M", "parameters_raw": 73271808, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 44649, "hf_likes": 0, "release_date": "2025-02-10", "_discovered": true }, { "name": "RedHatAI/SmolLM-135M-Instruct-quantized.w8a16", "provider": "redhatai", "parameter_count": "83M", "parameters_raw": 83356260, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 20835, "hf_likes": 0, "release_date": "2024-08-22", "_discovered": true }, { "name": "tiiuae/Falcon-H1-Tiny-90M-Instruct", "provider": "TII", "parameter_count": "91M", "parameters_raw": 91131072, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "falcon_h1", "hf_downloads": 301062, "hf_likes": 33, "release_date": "2026-01-12", "_discovered": true }, { "name": "EleutherAI/pythia-70m-deduped", "provider": "eleutherai", "parameter_count": "96M", "parameters_raw": 95592496, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 613928, "hf_likes": 27, "release_date": "2023-02-13", "_discovered": true }, { "name": "gratefulasi/lumeleto", "provider": "gratefulasi", "parameter_count": "124M", "parameters_raw": 124439808, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 1024, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt2", "hf_downloads": 47679, "hf_likes": 1, "release_date": "2025-04-24", "_discovered": true }, { "name": "peft-internal-testing/opt-125m", "provider": "peft-internal-testing", "parameter_count": "125M", "parameters_raw": 125239296, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "opt", "hf_downloads": 232784, "hf_likes": 0, "release_date": "2025-11-19", "_discovered": true }, { "name": "state-spaces/mamba-130m-hf", "provider": "state-spaces", "parameter_count": "129M", "parameters_raw": 129135360, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mamba", "hf_downloads": 161407, "hf_likes": 68, "release_date": "2024-03-06", "_discovered": true }, { "name": "HuggingFaceTB/SmolLM2-135M", "provider": "huggingfacetb", "parameter_count": "135M", "parameters_raw": 134515008, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 954486, "hf_likes": 168, "release_date": "2024-10-31", "_discovered": true }, { "name": "HuggingFaceTB/SmolLM2-135M-Instruct", "provider": "huggingfacetb", "parameter_count": "135M", "parameters_raw": 134515008, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 603656, "hf_likes": 295, "release_date": "2024-10-31", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/SmolLM2-135M-Instruct-GGUF", "provider": "unsloth" }, { "repo": "bartowski/SmolLM2-135M-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "HuggingFaceTB/SmolLM-135M-Instruct", "provider": "huggingfacetb", "parameter_count": "135M", "parameters_raw": 134515008, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 359214, "hf_likes": 133, "release_date": "2024-07-15", "_discovered": true }, { "name": "HuggingFaceTB/SmolLM-135M", "provider": "huggingfacetb", "parameter_count": "135M", "parameters_raw": 134515008, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 156129, "hf_likes": 249, "release_date": "2024-07-14", "_discovered": true }, { "name": "nomic-ai/nomic-embed-text-v1.5", "provider": "Nomic", "parameter_count": "137M", "parameters_raw": 137000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "F16", "context_length": 8192, "use_case": "Text embeddings for RAG", "pipeline_tag": "feature-extraction", "architecture": "nomic_bert", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "EleutherAI/gpt-neo-125m", "provider": "eleutherai", "parameter_count": "150M", "parameters_raw": 150364416, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neo", "hf_downloads": 100060, "hf_likes": 227, "release_date": "2022-03-02", "_discovered": true }, { "name": "JackFram/llama-160m", "provider": "jackfram", "parameter_count": "162M", "parameters_raw": 162417792, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 46025, "hf_likes": 36, "release_date": "2023-05-26", "_discovered": true }, { "name": "microsoft/DialoGPT-small", "provider": "Microsoft", "parameter_count": "176M", "parameters_raw": 175620096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 1024, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt2", "hf_downloads": 58248, "hf_likes": 143, "release_date": "2022-03-02", "_discovered": true }, { "name": "lmstudio-community/LFM2.5-1.2B-Instruct-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "183M", "parameters_raw": 182975232, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 441394, "hf_likes": 1, "release_date": "2026-01-07", "_discovered": true }, { "name": "rinna/japanese-gpt-neox-small", "provider": "rinna", "parameter_count": "204M", "parameters_raw": 203611008, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 457560, "hf_likes": 15, "release_date": "2022-08-31", "_discovered": true }, { "name": "EleutherAI/pythia-160m-deduped", "provider": "eleutherai", "parameter_count": "213M", "parameters_raw": 212654688, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 82245, "hf_likes": 3, "release_date": "2023-02-08", "_discovered": true }, { "name": "Vamsi/T5_Paraphrase_Paws", "provider": "vamsi", "parameter_count": "223M", "parameters_raw": 222903936, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 512, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "t5", "hf_downloads": 83813, "hf_likes": 40, "release_date": "2022-03-02", "_discovered": true }, { "name": "TitanML/tiny-mixtral", "provider": "titanml", "parameter_count": "247M", "parameters_raw": 246961152, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mixtral", "hf_downloads": 100054, "hf_likes": 2, "release_date": "2024-04-24", "is_moe": true, "num_experts": 8, "active_experts": 2, "active_parameters": 71001329, "_discovered": true }, { "name": "lmstudio-community/LFM2.5-1.2B-Instruct-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "256M", "parameters_raw": 256113408, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 441834, "hf_likes": 4, "release_date": "2026-01-07", "_discovered": true }, { "name": "lmstudio-community/Qwen3-1.7B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "269M", "parameters_raw": 268944384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 25290, "hf_likes": 0, "release_date": "2025-04-28", "_discovered": true }, { "name": "google/t5gemma-s-s-prefixlm", "provider": "Google", "parameter_count": "313M", "parameters_raw": 312517632, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "t5gemma", "hf_downloads": 41131, "hf_likes": 2, "release_date": "2025-06-19", "_discovered": true }, { "name": "lmstudio-community/LFM2.5-1.2B-Instruct-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "329M", "parameters_raw": 329251584, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 449901, "hf_likes": 2, "release_date": "2026-01-07", "_discovered": true }, { "name": "lmstudio-community/LFM2-1.2B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "329M", "parameters_raw": 329251584, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 26421, "hf_likes": 4, "release_date": "2025-07-14", "_discovered": true }, { "name": "LiquidAI/LFM2-ColBERT-350M", "provider": "Liquid AI", "parameter_count": "353M", "parameters_raw": 353322752, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Semantic search, sentence similarity", "pipeline_tag": "sentence-similarity", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2-350M", "provider": "liquidai", "parameter_count": "354M", "parameters_raw": 354483968, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 41124, "hf_likes": 235, "release_date": "2025-07-10", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/LFM2-350M-GGUF", "provider": "unsloth" } ] }, { "name": "HuggingFaceTB/SmolLM2-360M", "provider": "huggingfacetb", "parameter_count": "362M", "parameters_raw": 361821120, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 36444, "hf_likes": 87, "release_date": "2024-10-31", "_discovered": true }, { "name": "LiquidAI/LFM2-350M-Extract", "provider": "Liquid AI", "parameter_count": "354M", "parameters_raw": 354483968, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Data extraction, structured output", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2-350M-Math", "provider": "Liquid AI", "parameter_count": "354M", "parameters_raw": 354483968, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Math reasoning, chain-of-thought", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2-350M-ENJP-MT", "provider": "Liquid AI", "parameter_count": "354M", "parameters_raw": 354483968, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "English-Japanese translation", "pipeline_tag": "translation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2-350M-PII-Extract-JP", "provider": "Liquid AI", "parameter_count": "354M", "parameters_raw": 354483968, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "PII extraction, Japanese", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2-350M-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "354M", "parameters_raw": 354483968, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "mlx-8bit", "context_length": 128000, "use_case": "Lightweight, edge deployment", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2-350M-MLX-bf16", "provider": "lmstudio-community", "parameter_count": "354M", "parameters_raw": 354483968, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.7, "quantization": "BF16", "context_length": 128000, "use_case": "Lightweight, edge deployment", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "HuggingFaceTB/SmolLM-360M-Instruct", "provider": "huggingfacetb", "parameter_count": "362M", "parameters_raw": 361821120, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 26935, "hf_likes": 83, "release_date": "2024-07-15", "_discovered": true }, { "name": "openbmb/MiniCPM4-0.5B", "provider": "openbmb", "parameter_count": "434M", "parameters_raw": 433873920, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 28889, "hf_likes": 77, "release_date": "2025-06-05", "_discovered": true }, { "name": "LiquidAI/LFM2-VL-450M", "provider": "Liquid AI", "parameter_count": "451M", "parameters_raw": 450822656, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Multimodal, vision and text", "pipeline_tag": "image-text-to-text", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/Qwen3-1.7B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "484M", "parameters_raw": 484000768, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 28313, "hf_likes": 1, "release_date": "2025-04-28", "_discovered": true }, { "name": "Qwen/Qwen2.5-0.5B-Instruct", "provider": "Alibaba", "parameter_count": "494M", "parameters_raw": 494032768, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 6992099, "hf_likes": 470, "release_date": "2024-09-16", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-0.5B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-Coder-0.5B-Instruct", "provider": "Alibaba", "parameter_count": "494M", "parameters_raw": 494032768, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1408034, "hf_likes": 65, "release_date": "2024-11-06", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/Qwen2.5-Coder-0.5B-Instruct-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Qwen2.5-Coder-0.5B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-0.5B", "provider": "Alibaba", "parameter_count": "494M", "parameters_raw": 494032768, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1200041, "hf_likes": 378, "release_date": "2024-09-15", "_discovered": true }, { "name": "Qwen/Qwen2-0.5B-Instruct", "provider": "Alibaba", "parameter_count": "494M", "parameters_raw": 494032768, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 259334, "hf_likes": 200, "release_date": "2024-06-03", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2-0.5B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Gensyn/Qwen2.5-0.5B-Instruct", "provider": "gensyn", "parameter_count": "494M", "parameters_raw": 494032768, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 106514, "hf_likes": 33, "release_date": "2025-03-28", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-0.5B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-Coder-0.5B", "provider": "Alibaba", "parameter_count": "494M", "parameters_raw": 494032768, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 64868, "hf_likes": 44, "release_date": "2024-11-08", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-Coder-0.5B-GGUF", "provider": "bartowski" } ] }, { "name": "EleutherAI/pythia-410m", "provider": "eleutherai", "parameter_count": "506M", "parameters_raw": 505997504, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 88847, "hf_likes": 36, "release_date": "2023-02-13", "_discovered": true }, { "name": "EleutherAI/pythia-410m-deduped", "provider": "eleutherai", "parameter_count": "506M", "parameters_raw": 505997504, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 32196, "hf_likes": 20, "release_date": "2023-02-13", "_discovered": true }, { "name": "h2oai/h2o-danube3-500m-chat", "provider": "h2oai", "parameter_count": "514M", "parameters_raw": 513590784, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 31122, "hf_likes": 39, "release_date": "2024-07-04", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/h2o-danube3-500m-chat-GGUF", "provider": "bartowski" } ] }, { "name": "tiiuae/Falcon-H1-0.5B-Base", "provider": "TII", "parameter_count": "521M", "parameters_raw": 521411104, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "falcon_h1", "hf_downloads": 25562, "hf_likes": 16, "release_date": "2025-05-01", "_discovered": true }, { "name": "RedHatAI/Qwen3-30B-A3B-Instruct-2507-speculator.eagle3", "provider": "redhatai", "parameter_count": "522M", "parameters_raw": 522152832, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 115085, "hf_likes": 1, "release_date": "2025-12-12", "_discovered": true }, { "name": "z-lab/Qwen3-4B-DFlash-b16", "provider": "z-lab", "parameter_count": "537M", "parameters_raw": 537427200, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 25679, "hf_likes": 22, "release_date": "2026-01-04", "_discovered": true }, { "name": "bigscience/bloomz-560m", "provider": "bigscience", "parameter_count": "559M", "parameters_raw": 559214592, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "bloom", "hf_downloads": 1303926, "hf_likes": 137, "release_date": "2022-10-08", "_discovered": true }, { "name": "bigscience/bloom-560m", "provider": "bigscience", "parameter_count": "559M", "parameters_raw": 559214592, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "bloom", "hf_downloads": 134778, "hf_likes": 371, "release_date": "2022-05-19", "_discovered": true }, { "name": "Qwen/Qwen3-4B-MLX-4bit", "provider": "Alibaba", "parameter_count": "566M", "parameters_raw": 565828096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 74343, "hf_likes": 26, "release_date": "2025-05-23", "_discovered": true }, { "name": "google/t5gemma-b-b-ul2", "provider": "Google", "parameter_count": "591M", "parameters_raw": 591490560, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "t5gemma", "hf_downloads": 39788, "hf_likes": 2, "release_date": "2025-06-19", "_discovered": true }, { "name": "google/t5gemma-b-b-prefixlm", "provider": "Google", "parameter_count": "591M", "parameters_raw": 591490560, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "pipeline_tag": "text-generation", "architecture": "t5gemma", "hf_downloads": 1187971, "hf_likes": 13, "release_date": "2025-06-19", "_discovered": true }, { "name": "lmstudio-community/Phi-4-mini-reasoning-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "600M", "parameters_raw": 599546880, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 43404, "hf_likes": 3, "release_date": "2025-05-01", "_discovered": true }, { "name": "Qwen/Qwen1.5-0.5B-Chat", "provider": "Alibaba", "parameter_count": "620M", "parameters_raw": 619570176, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 87380, "hf_likes": 92, "release_date": "2024-01-31", "_discovered": true }, { "name": "Qwen/Qwen1.5-0.5B", "provider": "Alibaba", "parameter_count": "620M", "parameters_raw": 619570176, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 26651, "hf_likes": 173, "release_date": "2024-01-22", "_discovered": true }, { "name": "lmstudio-community/Qwen3-4B-Thinking-2507-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "629M", "parameters_raw": 628676096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 95794, "hf_likes": 10, "release_date": "2025-08-06", "_discovered": true }, { "name": "lmstudio-community/Qwen3-4B-Instruct-2507-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "629M", "parameters_raw": 628676096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 66279, "hf_likes": 3, "release_date": "2025-08-06", "_discovered": true }, { "name": "lmstudio-community/Qwen3-4B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "629M", "parameters_raw": 628676096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 21982, "hf_likes": 1, "release_date": "2025-04-28", "_discovered": true }, { "name": "LiquidAI/LFM2-700M", "provider": "Liquid AI", "parameter_count": "742M", "parameters_raw": 742489344, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Lightweight, edge deployment", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2-700M-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "742M", "parameters_raw": 742489344, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "mlx-8bit", "context_length": 128000, "use_case": "Lightweight, edge deployment", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2-700M-MLX-bf16", "provider": "lmstudio-community", "parameter_count": "742M", "parameters_raw": 742489344, "min_ram_gb": 1.7, "recommended_ram_gb": 2.8, "min_vram_gb": 1.5, "quantization": "BF16", "context_length": 128000, "use_case": "Lightweight, edge deployment", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "Qwen/Qwen3-0.6B", "provider": "Alibaba", "parameter_count": "752M", "parameters_raw": 751632384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 11310453, "hf_likes": 1120, "release_date": "2025-04-27", "gguf_sources": [ { "repo": "unsloth/Qwen3-0.6B-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3Guard-Gen-0.6B", "provider": "Alibaba", "parameter_count": "752M", "parameters_raw": 751632384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 146728, "hf_likes": 62, "release_date": "2025-09-23", "_discovered": true }, { "name": "Qwen/Qwen3-0.6B-FP8", "provider": "Alibaba", "parameter_count": "752M", "parameters_raw": 751659264, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1648717, "hf_likes": 57, "release_date": "2025-04-28", "_discovered": true }, { "name": "lmstudio-community/Qwen3-4B-Instruct-2507-MLX-5bit", "provider": "lmstudio-community", "parameter_count": "754M", "parameters_raw": 754372096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 62740, "hf_likes": 0, "release_date": "2025-08-06", "_discovered": true }, { "name": "h2oai/h2ovl-mississippi-800m", "provider": "h2oai", "parameter_count": "826M", "parameters_raw": 826295808, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "h2ovl_chat", "hf_downloads": 1014882, "hf_likes": 39, "release_date": "2024-10-16", "_discovered": true }, { "name": "Qwen/Qwen3.5-0.8B", "provider": "Alibaba", "parameter_count": "873M", "parameters_raw": 873438784, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 93448, "hf_likes": 208, "release_date": "2026-02-28", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-0.8B-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3.5-0.8B-Base", "provider": "Alibaba", "parameter_count": "873M", "parameters_raw": 873438784, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 4680, "hf_likes": 37, "release_date": "2026-02-28" }, { "name": "lmstudio-community/Qwen3-4B-Thinking-2507-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "880M", "parameters_raw": 880068096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 91703, "hf_likes": 2, "release_date": "2025-08-06", "_discovered": true }, { "name": "lmstudio-community/Qwen3-4B-Instruct-2507-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "880M", "parameters_raw": 880068096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 62883, "hf_likes": 0, "release_date": "2025-08-06", "_discovered": true }, { "name": "Joaoffg/ELM", "provider": "joaoffg", "parameter_count": "903M", "parameters_raw": 902891520, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 339775, "hf_likes": 2, "release_date": "2024-05-29", "_discovered": true }, { "name": "RedHatAI/Qwen3-8B-speculator.eagle3", "provider": "redhatai", "parameter_count": "1.0B", "parameters_raw": 1022037632, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 76636, "hf_likes": 2, "release_date": "2025-09-19", "_discovered": true }, { "name": "EleutherAI/pythia-1b", "provider": "eleutherai", "parameter_count": "1.1B", "parameters_raw": 1078891008, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 27818, "hf_likes": 43, "release_date": "2023-03-10", "_discovered": true }, { "name": "TinyLlama/TinyLlama-1.1B-Chat-v1.0", "provider": "Community", "parameter_count": "1.1B", "parameters_raw": 1100048384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 1870099, "hf_likes": 1538, "release_date": "2023-12-30" }, { "name": "nm-testing/tinyllama-oneshot-w8w8-test-static-shape-change", "provider": "nm-testing", "parameter_count": "1.1B", "parameters_raw": 1100048692, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 31348, "hf_likes": 0, "release_date": "2024-06-12", "_discovered": true }, { "name": "bigcode/gpt_bigcode-santacoder", "provider": "BigCode", "parameter_count": "1.1B", "parameters_raw": 1124886528, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_bigcode", "hf_downloads": 49973, "hf_likes": 26, "release_date": "2023-04-06", "_discovered": true }, { "name": "lmstudio-community/Qwen3-4B-Thinking-2507-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "1.1B", "parameters_raw": 1131460096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 93477, "hf_likes": 7, "release_date": "2025-08-06", "_discovered": true }, { "name": "lmstudio-community/Qwen3-4B-Instruct-2507-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "1.1B", "parameters_raw": 1131460096, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 63832, "hf_likes": 1, "release_date": "2025-08-06", "_discovered": true }, { "name": "LiquidAI/LFM2.5-1.2B-Instruct", "provider": "liquidai", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 116655, "hf_likes": 516, "release_date": "2026-01-06", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/LFM2.5-1.2B-Instruct-GGUF", "provider": "unsloth" } ] }, { "name": "lmstudio-community/LFM2-1.2B-MLX-bf16", "provider": "lmstudio-community", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 26071, "hf_likes": 6, "release_date": "2025-07-14", "_discovered": true }, { "name": "LiquidAI/LFM2-1.2B", "provider": "Liquid AI", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2.5-1.2B-Base", "provider": "Liquid AI", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2.5-1.2B-Thinking", "provider": "Liquid AI", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Advanced reasoning, chain-of-thought", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2.5-1.2B-JP", "provider": "Liquid AI", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Japanese language, multilingual chat", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2-1.2B-Tool", "provider": "Liquid AI", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Tool calling, function calling", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2-1.2B-RAG", "provider": "Liquid AI", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Retrieval-augmented generation", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2-1.2B-Extract", "provider": "Liquid AI", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Data extraction, structured output", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2.5-1.2B-Thinking-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 1.3, "recommended_ram_gb": 2.2, "min_vram_gb": 1.2, "quantization": "mlx-8bit", "context_length": 128000, "use_case": "Advanced reasoning, chain-of-thought", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2.5-1.2B-Thinking-MLX-bf16", "provider": "lmstudio-community", "parameter_count": "1.2B", "parameters_raw": 1170340608, "min_ram_gb": 2.6, "recommended_ram_gb": 4.4, "min_vram_gb": 2.4, "quantization": "BF16", "context_length": 128000, "use_case": "Advanced reasoning, chain-of-thought", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "allenai/OLMo-1B-hf", "provider": "allenai", "parameter_count": "1.2B", "parameters_raw": 1176764416, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo", "hf_downloads": 23538, "hf_likes": 26, "release_date": "2024-04-12", "_discovered": true }, { "name": "Zyphra/Zamba2-1.2B-instruct", "provider": "zyphra", "parameter_count": "1.2B", "parameters_raw": 1215064704, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "zamba2", "hf_downloads": 72584, "hf_likes": 30, "release_date": "2024-09-19", "_discovered": true }, { "name": "meta-llama/Llama-3.2-1B", "provider": "Meta", "parameter_count": "1.2B", "parameters_raw": 1235814400, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 1453836, "hf_likes": 2306, "release_date": "2024-09-18" }, { "name": "hmellor/Ilama-3.2-1B", "provider": "hmellor", "parameter_count": "1.2B", "parameters_raw": 1235814400, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "ilama", "hf_downloads": 89998, "hf_likes": 0, "release_date": "2025-07-22", "_discovered": true }, { "name": "warshanks/Jan-nano-AWQ", "provider": "warshanks", "parameter_count": "1.3B", "parameters_raw": 1264206840, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.6, "quantization": "AWQ-4bit", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 99084, "hf_likes": 3, "release_date": "2025-07-12", "_discovered": true, "format": "awq" }, { "name": "LGAI-EXAONE/EXAONE-4.0-1.2B", "provider": "lgai-exaone", "parameter_count": "1.3B", "parameters_raw": 1279391488, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.7, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "exaone4", "hf_downloads": 100975, "hf_likes": 172, "release_date": "2025-07-11" }, { "name": "lmstudio-community/DeepSeek-R1-0528-Qwen3-8B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "1.3B", "parameters_raw": 1280062464, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.7, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 348365, "hf_likes": 7, "release_date": "2025-05-29", "_discovered": true }, { "name": "lmstudio-community/Qwen3-8B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "1.3B", "parameters_raw": 1280062464, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.7, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 39201, "hf_likes": 2, "release_date": "2025-04-28", "_discovered": true }, { "name": "pfnet/plamo-2-1b", "provider": "pfnet", "parameter_count": "1.3B", "parameters_raw": 1291441920, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.7, "quantization": "Q4_K_M", "context_length": 10485760, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "plamo2", "hf_downloads": 63725, "hf_likes": 38, "release_date": "2025-02-05", "_discovered": true }, { "name": "EleutherAI/gpt-neo-1.3B", "provider": "eleutherai", "parameter_count": "1.4B", "parameters_raw": 1365907456, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.7, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neo", "hf_downloads": 48440, "hf_likes": 324, "release_date": "2022-03-02", "_discovered": true }, { "name": "microsoft/phi-1_5", "provider": "Microsoft", "parameter_count": "1.4B", "parameters_raw": 1418270720, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.7, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi", "hf_downloads": 152337, "hf_likes": 1355, "release_date": "2023-09-10", "_discovered": true }, { "name": "starvector/starvector-1b-im2svg", "provider": "starvector", "parameter_count": "1.4B", "parameters_raw": 1434095620, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.7, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "starvector", "hf_downloads": 38196, "hf_likes": 184, "release_date": "2025-01-11", "_discovered": true }, { "name": "allenai/OLMo-2-0425-1B", "provider": "allenai", "parameter_count": "1.5B", "parameters_raw": 1484916736, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo2", "hf_downloads": 533223, "hf_likes": 70, "release_date": "2025-04-17", "_discovered": true }, { "name": "allenai/OLMo-2-0425-1B-Instruct", "provider": "allenai", "parameter_count": "1.5B", "parameters_raw": 1484916736, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo2", "hf_downloads": 38389, "hf_likes": 56, "release_date": "2025-04-29", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/OLMo-2-0425-1B-Instruct-GGUF", "provider": "unsloth" } ] }, { "name": "RedHatAI/Llama-3.2-1B-Instruct-FP8", "provider": "redhatai", "parameter_count": "1.5B", "parameters_raw": 1498482912, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 814349, "hf_likes": 3, "release_date": "2024-09-26", "_discovered": true }, { "name": "RedHatAI/Llama-3.2-1B-Instruct-FP8-dynamic", "provider": "redhatai", "parameter_count": "1.5B", "parameters_raw": 1498859520, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 1823969, "hf_likes": 3, "release_date": "2024-09-25", "_discovered": true }, { "name": "LiquidAI/LFM2-Audio-1.5B", "provider": "Liquid AI", "parameter_count": "1.5B", "parameters_raw": 1500000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Speech-to-speech, ASR, TTS", "pipeline_tag": "audio-to-audio", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2.5-Audio-1.5B", "provider": "Liquid AI", "parameter_count": "1.5B", "parameters_raw": 1500000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Speech-to-speech, ASR, TTS", "pipeline_tag": "audio-to-audio", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "EleutherAI/pythia-1.4b", "provider": "eleutherai", "parameter_count": "1.5B", "parameters_raw": 1515311488, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 27804, "hf_likes": 26, "release_date": "2023-02-09", "_discovered": true }, { "name": "Qwen/Qwen2.5-Coder-1.5B-Instruct", "provider": "Alibaba", "parameter_count": "1.5B", "parameters_raw": 1543714304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1789513, "hf_likes": 107, "release_date": "2024-09-18", "gguf_sources": [ { "repo": "unsloth/Qwen2.5-Coder-1.5B-Instruct-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Qwen2.5-Coder-1.5B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-1.5B-Instruct", "provider": "Alibaba", "parameter_count": "1.5B", "parameters_raw": 1543714304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 7037921, "hf_likes": 627, "release_date": "2024-09-17", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-1.5B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2-1.5B-Instruct", "provider": "Alibaba", "parameter_count": "1.5B", "parameters_raw": 1543714304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 3508972, "hf_likes": 161, "release_date": "2024-06-03", "_discovered": true }, { "name": "Qwen/Qwen2.5-Math-1.5B", "provider": "Alibaba", "parameter_count": "1.5B", "parameters_raw": 1543714304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1064952, "hf_likes": 102, "release_date": "2024-09-16", "_discovered": true }, { "name": "Qwen/Qwen2.5-1.5B", "provider": "Alibaba", "parameter_count": "1.5B", "parameters_raw": 1543714304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 431369, "hf_likes": 166, "release_date": "2024-09-15", "_discovered": true }, { "name": "Qwen/Qwen2-1.5B", "provider": "Alibaba", "parameter_count": "1.5B", "parameters_raw": 1543714304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 114016, "hf_likes": 99, "release_date": "2024-05-31", "_discovered": true }, { "name": "Qwen/Qwen2.5-Math-1.5B-Instruct", "provider": "Alibaba", "parameter_count": "1.5B", "parameters_raw": 1543714304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 80310, "hf_likes": 54, "release_date": "2024-09-16", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-Math-1.5B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "RedHatAI/Qwen2-1.5B-Instruct-FP8", "provider": "redhatai", "parameter_count": "1.5B", "parameters_raw": 1543714304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 24030, "hf_likes": 0, "release_date": "2024-06-14", "_discovered": true }, { "name": "KiteFishAI/Minnow-Math-1.5B", "provider": "kitefishai", "parameter_count": "1.6B", "parameters_raw": 1633781760, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 147620, "hf_likes": 1, "release_date": "2026-02-12", "_discovered": true }, { "name": "LiquidAI/LFM2-VL-1.6B", "provider": "Liquid AI", "parameter_count": "1.6B", "parameters_raw": 1584804000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Multimodal, vision and text", "pipeline_tag": "image-text-to-text", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2.5-VL-1.6B", "provider": "Liquid AI", "parameter_count": "1.6B", "parameters_raw": 1596625904, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Multimodal, vision and text", "pipeline_tag": "image-text-to-text", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2.5-VL-1.6B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "1.6B", "parameters_raw": 1596625904, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "mlx-4bit", "context_length": 32768, "use_case": "Multimodal, vision and text", "pipeline_tag": "image-text-to-text", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2.5-VL-1.6B-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "1.6B", "parameters_raw": 1596625904, "min_ram_gb": 1.3, "recommended_ram_gb": 2.2, "min_vram_gb": 1.2, "quantization": "mlx-6bit", "context_length": 32768, "use_case": "Multimodal, vision and text", "pipeline_tag": "image-text-to-text", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "lmstudio-community/LFM2.5-VL-1.6B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "1.6B", "parameters_raw": 1596625904, "min_ram_gb": 1.8, "recommended_ram_gb": 3.0, "min_vram_gb": 1.6, "quantization": "mlx-8bit", "context_length": 32768, "use_case": "Multimodal, vision and text", "pipeline_tag": "image-text-to-text", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "stabilityai/stablelm-2-1_6b-chat", "provider": "Stability AI", "parameter_count": "1.6B", "parameters_raw": 1644515328, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.8, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "stablelm", "hf_downloads": 955, "hf_likes": 34, "release_date": "2024-04-08" }, { "name": "HuggingFaceTB/SmolLM-1.7B", "provider": "huggingfacetb", "parameter_count": "1.7B", "parameters_raw": 1711376384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 63387, "hf_likes": 180, "release_date": "2024-07-14", "_discovered": true }, { "name": "HuggingFaceTB/SmolLM2-1.7B", "provider": "huggingfacetb", "parameter_count": "1.7B", "parameters_raw": 1711376384, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 25638, "hf_likes": 144, "release_date": "2024-10-30", "_discovered": true }, { "name": "cyankiwi/Nanbeige4.1-3B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "3.0B", "parameters_raw": 3000000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "AWQ-8bit", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 49220, "hf_likes": 2, "release_date": "2026-02-15", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen3-1.7B-Base", "provider": "Alibaba", "parameter_count": "1.7B", "parameters_raw": 1720574976, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 295900, "hf_likes": 64, "release_date": "2025-04-28", "_discovered": true }, { "name": "lmstudio-community/Qwen3-1.7B-MLX-bf16", "provider": "lmstudio-community", "parameter_count": "1.7B", "parameters_raw": 1720574976, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 24714, "hf_likes": 2, "release_date": "2025-04-28", "_discovered": true }, { "name": "bigscience/bloom-1b7", "provider": "bigscience", "parameter_count": "1.7B", "parameters_raw": 1722408960, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "bloom", "hf_downloads": 38813, "hf_likes": 122, "release_date": "2022-05-19", "_discovered": true }, { "name": "Qwen/Qwen2.5-1.5B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "1.8B", "parameters_raw": 1777088000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 727989, "hf_likes": 6, "release_date": "2024-09-17", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2.5-Coder-1.5B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "1.8B", "parameters_raw": 1777088000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 164152, "hf_likes": 4, "release_date": "2024-09-20", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2-1.5B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "1.8B", "parameters_raw": 1777088000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 24850, "hf_likes": 9, "release_date": "2024-06-06", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2-1.5B-Instruct-GPTQ-Int4", "provider": "Alibaba", "parameter_count": "1.8B", "parameters_raw": 1777675776, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "GPTQ-Int4", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 24724, "hf_likes": 5, "release_date": "2024-06-06", "_discovered": true, "format": "gptq" }, { "name": "RedHatAI/Qwen2.5-1.5B-quantized.w8a8", "provider": "redhatai", "parameter_count": "1.8B", "parameters_raw": 1777733120, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1091974, "hf_likes": 2, "release_date": "2024-10-09", "_discovered": true }, { "name": "Qwen/Qwen1.5-1.8B-Chat", "provider": "Alibaba", "parameter_count": "1.8B", "parameters_raw": 1836828672, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 72445, "hf_likes": 73, "release_date": "2024-01-30", "_discovered": true }, { "name": "jonathanli/induction-vl2-mdl-fswd7-20000-720p-proj-256-var", "provider": "jonathanli", "parameter_count": "1.9B", "parameters_raw": 1940015872, "min_ram_gb": 1.1, "recommended_ram_gb": 2.0, "min_vram_gb": 1.0, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "induction_vl2", "hf_downloads": 24886, "hf_likes": 0, "release_date": "2026-02-01", "_discovered": true }, { "name": "cyankiwi/granite-4.0-h-tiny-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 1997098800, "min_ram_gb": 1.1, "recommended_ram_gb": 2.0, "min_vram_gb": 1.0, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granitemoehybrid", "hf_downloads": 63040, "hf_likes": 2, "release_date": "2025-10-13", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 277721550, "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen3-1.7B-FP8", "provider": "Alibaba", "parameter_count": "2.0B", "parameters_raw": 2031825920, "min_ram_gb": 1.1, "recommended_ram_gb": 2.0, "min_vram_gb": 1.0, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 47050, "hf_likes": 35, "release_date": "2025-04-28", "_discovered": true }, { "name": "h2oai/h2ovl-mississippi-2b", "provider": "h2oai", "parameter_count": "2.2B", "parameters_raw": 2152317440, "min_ram_gb": 1.2, "recommended_ram_gb": 2.0, "min_vram_gb": 1.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "h2ovl_chat", "hf_downloads": 1007240, "hf_likes": 42, "release_date": "2024-10-15", "_discovered": true }, { "name": "warshanks/Qwen3-8B-abliterated-AWQ", "provider": "warshanks", "parameter_count": "8.2B", "parameters_raw": 8190735872, "min_ram_gb": 3.2, "recommended_ram_gb": 6.4, "min_vram_gb": 5.3, "quantization": "AWQ-4bit", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 25559, "hf_likes": 0, "release_date": "2025-07-27", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen3.5-2B", "provider": "Alibaba", "parameter_count": "2.3B", "parameters_raw": 2274069824, "min_ram_gb": 1.3, "recommended_ram_gb": 2.1, "min_vram_gb": 1.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 46974, "hf_likes": 115, "release_date": "2026-02-28", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-2B-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3.5-2B-Base", "provider": "Alibaba", "parameter_count": "2.3B", "parameters_raw": 2274069824, "min_ram_gb": 1.3, "recommended_ram_gb": 2.1, "min_vram_gb": 1.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 3336, "hf_likes": 33, "release_date": "2026-02-28" }, { "name": "lmstudio-community/Phi-4-reasoning-plus-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "2.3B", "parameters_raw": 2290897920, "min_ram_gb": 1.3, "recommended_ram_gb": 2.1, "min_vram_gb": 1.2, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 28622, "hf_likes": 1, "release_date": "2025-05-01", "_discovered": true }, { "name": "lmstudio-community/DeepSeek-R1-0528-Qwen3-8B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "2.3B", "parameters_raw": 2303865856, "min_ram_gb": 1.3, "recommended_ram_gb": 2.1, "min_vram_gb": 1.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 333300, "hf_likes": 13, "release_date": "2025-05-29", "_discovered": true }, { "name": "lmstudio-community/Qwen3-8B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "2.3B", "parameters_raw": 2303865856, "min_ram_gb": 1.3, "recommended_ram_gb": 2.1, "min_vram_gb": 1.2, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 37222, "hf_likes": 2, "release_date": "2025-04-28", "_discovered": true }, { "name": "lmstudio-community/Qwen3-14B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "2.3B", "parameters_raw": 2307906560, "min_ram_gb": 1.3, "recommended_ram_gb": 2.1, "min_vram_gb": 1.2, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 46163, "hf_likes": 5, "release_date": "2025-04-28", "_discovered": true }, { "name": "lmstudio-community/Qwen2.5-Coder-14B-Instruct-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "2.3B", "parameters_raw": 2308527104, "min_ram_gb": 1.3, "recommended_ram_gb": 2.1, "min_vram_gb": 1.2, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 92774, "hf_likes": 2, "release_date": "2024-11-11", "_discovered": true }, { "name": "google/gemma-1.1-2b-it", "provider": "Google", "parameter_count": "2.5B", "parameters_raw": 2506172416, "min_ram_gb": 1.4, "recommended_ram_gb": 2.3, "min_vram_gb": 1.3, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma", "hf_downloads": 66616, "hf_likes": 171, "release_date": "2024-03-26", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/gemma-1.1-2b-it-GGUF", "provider": "bartowski" } ] }, { "name": "LiquidAI/LFM2-2.6B", "provider": "liquidai", "parameter_count": "2.6B", "parameters_raw": 2569272320, "min_ram_gb": 1.4, "recommended_ram_gb": 2.4, "min_vram_gb": 1.3, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 25773, "hf_likes": 180, "release_date": "2025-09-22", "_discovered": true }, { "name": "LiquidAI/LFM2-2.6B-Exp", "provider": "Liquid AI", "parameter_count": "2.6B", "parameters_raw": 2569272320, "min_ram_gb": 1.4, "recommended_ram_gb": 2.4, "min_vram_gb": 1.3, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Instruction following, math, knowledge", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "LiquidAI/LFM2-2.6B-Transcript", "provider": "Liquid AI", "parameter_count": "2.6B", "parameters_raw": 2569272320, "min_ram_gb": 1.4, "recommended_ram_gb": 2.4, "min_vram_gb": 1.3, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Meeting transcription, summarization", "pipeline_tag": "text-generation", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "google/gemma-2-2b-it", "provider": "Google", "parameter_count": "2.6B", "parameters_raw": 2614341376, "min_ram_gb": 1.5, "recommended_ram_gb": 2.4, "min_vram_gb": 1.3, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Lightweight, edge deployment", "pipeline_tag": "text-generation", "architecture": "gemma2", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "bartowski/gemma-2-2b-it-GGUF", "provider": "bartowski" } ] }, { "name": "Efficient-Large-Model/gemma-2-2b-it", "provider": "efficient-large-model", "parameter_count": "2.6B", "parameters_raw": 2614341888, "min_ram_gb": 1.5, "recommended_ram_gb": 2.4, "min_vram_gb": 1.3, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma2", "hf_downloads": 50419, "hf_likes": 3, "release_date": "2024-12-12", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/gemma-2-2b-it-GGUF", "provider": "bartowski" } ] }, { "name": "EleutherAI/gpt-neo-2.7B", "provider": "eleutherai", "parameter_count": "2.7B", "parameters_raw": 2718416384, "min_ram_gb": 1.5, "recommended_ram_gb": 2.5, "min_vram_gb": 1.4, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neo", "hf_downloads": 23217, "hf_likes": 501, "release_date": "2022-03-02", "_discovered": true }, { "name": "microsoft/phi-2", "provider": "Microsoft", "parameter_count": "2.8B", "parameters_raw": 2779683840, "min_ram_gb": 1.6, "recommended_ram_gb": 2.6, "min_vram_gb": 1.4, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi", "hf_downloads": 1651432, "hf_likes": 3429, "release_date": "2023-12-13", "_discovered": true }, { "name": "stabilityai/stablelm-3b-4e1t", "provider": "Stability AI", "parameter_count": "2.8B", "parameters_raw": 2795443200, "min_ram_gb": 1.6, "recommended_ram_gb": 2.6, "min_vram_gb": 1.4, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "stablelm", "hf_downloads": 24407, "hf_likes": 312, "release_date": "2023-09-29", "_discovered": true }, { "name": "HuggingFaceTB/SmolLM3-3B", "provider": "HuggingFace", "parameter_count": "3B", "parameters_raw": 3000000000, "min_ram_gb": 1.7, "recommended_ram_gb": 2.8, "min_vram_gb": 1.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Lightweight, multilingual reasoning", "pipeline_tag": "text-generation", "architecture": "smollm", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-07-08", "gguf_sources": [ { "repo": "unsloth/SmolLM3-3B-GGUF", "provider": "unsloth" } ] }, { "name": "LiquidAI/LFM2-VL-3B", "provider": "Liquid AI", "parameter_count": "3.0B", "parameters_raw": 2998975216, "min_ram_gb": 1.7, "recommended_ram_gb": 2.8, "min_vram_gb": 1.5, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Multimodal, vision and text", "pipeline_tag": "image-text-to-text", "architecture": "lfm2", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "bigscience/bloom-3b", "provider": "bigscience", "parameter_count": "3.0B", "parameters_raw": 3002557440, "min_ram_gb": 1.7, "recommended_ram_gb": 2.8, "min_vram_gb": 1.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "bloom", "hf_downloads": 30567, "hf_likes": 94, "release_date": "2022-05-19", "_discovered": true }, { "name": "bigcode/starcoder2-3b", "provider": "BigCode", "parameter_count": "3.0B", "parameters_raw": 3030371328, "min_ram_gb": 1.7, "recommended_ram_gb": 2.8, "min_vram_gb": 1.6, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "starcoder2", "hf_downloads": 97310, "hf_likes": 216, "release_date": "2023-11-29", "_discovered": true }, { "name": "TechxGenus/gemma-1.1-2b-it-GPTQ", "provider": "techxgenus", "parameter_count": "3.0B", "parameters_raw": 3031170048, "min_ram_gb": 1.7, "recommended_ram_gb": 2.8, "min_vram_gb": 1.6, "quantization": "GPTQ-Int4", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma", "hf_downloads": 20793, "hf_likes": 1, "release_date": "2024-04-07", "_discovered": true, "format": "gptq" }, { "name": "Qwen/Qwen2.5-3B-Instruct", "provider": "Alibaba", "parameter_count": "3.1B", "parameters_raw": 3085938688, "min_ram_gb": 1.7, "recommended_ram_gb": 2.9, "min_vram_gb": 1.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 6598470, "hf_likes": 409, "release_date": "2024-09-17", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-3B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-3B", "provider": "Alibaba", "parameter_count": "3.1B", "parameters_raw": 3085938688, "min_ram_gb": 1.7, "recommended_ram_gb": 2.9, "min_vram_gb": 1.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 297679, "hf_likes": 172, "release_date": "2024-09-15", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-3B-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-Coder-3B-Instruct", "provider": "Alibaba", "parameter_count": "3.1B", "parameters_raw": 3085938688, "min_ram_gb": 1.7, "recommended_ram_gb": 2.9, "min_vram_gb": 1.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 126989, "hf_likes": 96, "release_date": "2024-11-06", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/Qwen2.5-Coder-3B-Instruct-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Qwen2.5-Coder-3B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Salesforce/xLAM-2-3b-fc-r", "provider": "salesforce", "parameter_count": "3.1B", "parameters_raw": 3085938688, "min_ram_gb": 1.7, "recommended_ram_gb": 2.9, "min_vram_gb": 1.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 44516, "hf_likes": 16, "release_date": "2025-03-27", "_discovered": true }, { "name": "Qwen/Qwen2.5-Coder-3B", "provider": "Alibaba", "parameter_count": "3.1B", "parameters_raw": 3085938688, "min_ram_gb": 1.7, "recommended_ram_gb": 2.9, "min_vram_gb": 1.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 42540, "hf_likes": 40, "release_date": "2024-11-08", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-Coder-3B-GGUF", "provider": "bartowski" } ] }, { "name": "meta-llama/Llama-3.2-3B", "provider": "Meta", "parameter_count": "3.2B", "parameters_raw": 3212749824, "min_ram_gb": 1.8, "recommended_ram_gb": 3.0, "min_vram_gb": 1.6, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 1409393, "hf_likes": 702, "release_date": "2024-09-18" }, { "name": "ibm-research/PowerMoE-3b", "provider": "ibm-research", "parameter_count": "3.4B", "parameters_raw": 3374286336, "min_ram_gb": 1.9, "recommended_ram_gb": 3.1, "min_vram_gb": 1.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granitemoe", "hf_downloads": 399266, "hf_likes": 17, "release_date": "2024-08-14", "is_moe": true, "num_experts": 40, "active_experts": 8, "active_parameters": 809828716, "_discovered": true }, { "name": "Qwen/Qwen2.5-3B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "3.4B", "parameters_raw": 3397103616, "min_ram_gb": 1.9, "recommended_ram_gb": 3.2, "min_vram_gb": 1.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 38262, "hf_likes": 16, "release_date": "2024-09-17", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2.5-Coder-3B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "3.4B", "parameters_raw": 3397103616, "min_ram_gb": 1.9, "recommended_ram_gb": 3.2, "min_vram_gb": 1.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 21964, "hf_likes": 5, "release_date": "2024-11-09", "_discovered": true, "format": "awq" }, { "name": "ibm-granite/granite-3b-code-base-2k", "provider": "ibm-granite", "parameter_count": "3.5B", "parameters_raw": 3482503680, "min_ram_gb": 1.9, "recommended_ram_gb": 3.2, "min_vram_gb": 1.8, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 73193, "hf_likes": 37, "release_date": "2024-04-23", "_discovered": true }, { "name": "ibm-research/PowerLM-3b", "provider": "ibm-research", "parameter_count": "3.5B", "parameters_raw": 3512017152, "min_ram_gb": 2.0, "recommended_ram_gb": 3.3, "min_vram_gb": 1.8, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granite", "hf_downloads": 30013, "hf_likes": 20, "release_date": "2024-08-14", "_discovered": true }, { "name": "Qwen/Qwen2.5-VL-3B-Instruct", "provider": "Alibaba", "parameter_count": "3.8B", "parameters_raw": 3754622976, "min_ram_gb": 2.1, "recommended_ram_gb": 3.5, "min_vram_gb": 1.9, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Instruction following, chat", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen2_5_vl", "hf_downloads": 2621650, "hf_likes": 623, "release_date": "2025-01-26", "gguf_sources": [ { "repo": "unsloth/Qwen2.5-VL-3B-Instruct-GGUF", "provider": "unsloth" } ] }, { "name": "microsoft/Phi-tiny-MoE-instruct", "provider": "Microsoft", "parameter_count": "3.8B", "parameters_raw": 3755220288, "min_ram_gb": 2.1, "recommended_ram_gb": 3.5, "min_vram_gb": 1.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phimoe", "hf_downloads": 310211, "hf_likes": 31, "release_date": "2025-06-23", "is_moe": true, "num_experts": 16, "active_experts": 2, "active_parameters": 633693422, "_discovered": true }, { "name": "llm-jp/llm-jp-3-3.7b-instruct", "provider": "llm-jp", "parameter_count": "3.8B", "parameters_raw": 3782913024, "min_ram_gb": 2.1, "recommended_ram_gb": 3.5, "min_vram_gb": 1.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 810462, "hf_likes": 13, "release_date": "2024-09-23", "_discovered": true }, { "name": "microsoft/Phi-4-mini-reasoning", "provider": "Microsoft", "parameter_count": "3.8B", "parameters_raw": 3800000000, "min_ram_gb": 2.1, "recommended_ram_gb": 3.5, "min_vram_gb": 1.9, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Lightweight reasoning", "pipeline_tag": "text-generation", "architecture": "phi4", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-04-01", "gguf_sources": [ { "repo": "unsloth/Phi-4-mini-reasoning-GGUF", "provider": "unsloth" } ] }, { "name": "microsoft/phi-3-mini-4k-instruct", "provider": "Microsoft", "parameter_count": "3.8B", "parameters_raw": 3821000000, "min_ram_gb": 2.1, "recommended_ram_gb": 3.6, "min_vram_gb": 2.0, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Lightweight, edge deployment", "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "bartowski/phi-3-mini-4k-instruct-GGUF", "provider": "bartowski" } ] }, { "name": "microsoft/Phi-3.5-mini-instruct", "provider": "Microsoft", "parameter_count": "3.8B", "parameters_raw": 3821000000, "min_ram_gb": 2.1, "recommended_ram_gb": 3.6, "min_vram_gb": 2.0, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Lightweight, long context", "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "bartowski/Phi-3.5-mini-instruct-GGUF", "provider": "bartowski" } ] }, { "name": "zstanjj/HTML-Pruner-Phi-3.8B", "provider": "zstanjj", "parameter_count": "3.8B", "parameters_raw": 3821079552, "min_ram_gb": 2.1, "recommended_ram_gb": 3.6, "min_vram_gb": 2.0, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 88805, "hf_likes": 18, "release_date": "2024-10-16", "_discovered": true }, { "name": "Sreenington/Phi-3-mini-4k-instruct-AWQ", "provider": "sreenington", "parameter_count": "3.8B", "parameters_raw": 3821079552, "min_ram_gb": 2.1, "recommended_ram_gb": 3.6, "min_vram_gb": 2.0, "quantization": "AWQ-4bit", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 40949, "hf_likes": 5, "release_date": "2024-05-05", "_discovered": true, "format": "awq" }, { "name": "numind/NuExtract-1.5", "provider": "numind", "parameter_count": "3.8B", "parameters_raw": 3821079552, "min_ram_gb": 2.1, "recommended_ram_gb": 3.6, "min_vram_gb": 2.0, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 31247, "hf_likes": 243, "release_date": "2024-09-26", "_discovered": true }, { "name": "kaitchup/Phi-3-mini-4k-instruct-gptq-4bit", "provider": "kaitchup", "parameter_count": "3.8B", "parameters_raw": 3822095360, "min_ram_gb": 2.1, "recommended_ram_gb": 3.6, "min_vram_gb": 2.0, "quantization": "GPTQ-Int4", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 881144, "hf_likes": 2, "release_date": "2024-04-25", "_discovered": true, "format": "gptq" }, { "name": "Nanbeige/Nanbeige4.1-3B", "provider": "nanbeige", "parameter_count": "3.9B", "parameters_raw": 3933637120, "min_ram_gb": 2.2, "recommended_ram_gb": 3.7, "min_vram_gb": 2.0, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 417673, "hf_likes": 941, "release_date": "2026-02-10", "_discovered": true }, { "name": "google/gemma-3n-E2B-it", "provider": "Google", "parameter_count": "4B", "parameters_raw": 4000000000, "min_ram_gb": 2.2, "recommended_ram_gb": 3.7, "min_vram_gb": 2.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Multimodal, on-device (effective 2B)", "pipeline_tag": "image-text-to-text", "architecture": "gemma3n", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-06-25", "gguf_sources": [ { "repo": "unsloth/gemma-3n-E2B-it-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3-4B-Base", "provider": "Alibaba", "parameter_count": "4.0B", "parameters_raw": 4022468096, "min_ram_gb": 2.2, "recommended_ram_gb": 3.7, "min_vram_gb": 2.1, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 548989, "hf_likes": 81, "release_date": "2025-04-28", "_discovered": true }, { "name": "Qwen/Qwen3-4B-AWQ", "provider": "Alibaba", "parameter_count": "4.0B", "parameters_raw": 4022468096, "min_ram_gb": 2.2, "recommended_ram_gb": 3.7, "min_vram_gb": 2.1, "quantization": "AWQ-4bit", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 344398, "hf_likes": 25, "release_date": "2025-05-05", "_discovered": true, "format": "awq" }, { "name": "typhoon-ai/typhoon2.5-qwen3-4b", "provider": "typhoon-ai", "parameter_count": "4.0B", "parameters_raw": 4022468096, "min_ram_gb": 2.2, "recommended_ram_gb": 3.7, "min_vram_gb": 2.1, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 51135, "hf_likes": 2, "release_date": "2025-09-23", "_discovered": true, "gguf_sources": [ { "repo": "typhoon-ai/typhoon2.5-qwen3-4b-gguf", "file": "typhoon2.5-qwen3-4b-q4_k_m.gguf", "quant": "Q4_K_M" } ] }, { "name": "JunHowie/Qwen3-4B-Instruct-2507-GPTQ-Int4", "provider": "junhowie", "parameter_count": "4.0B", "parameters_raw": 4022468096, "min_ram_gb": 2.2, "recommended_ram_gb": 3.7, "min_vram_gb": 2.1, "quantization": "GPTQ-Int4", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 36817, "hf_likes": 2, "release_date": "2025-09-01", "_discovered": true, "format": "gptq" }, { "name": "TIGER-Lab/VLM2Vec-Full", "provider": "tiger-lab", "parameter_count": "4.1B", "parameters_raw": 4146621440, "min_ram_gb": 2.3, "recommended_ram_gb": 3.9, "min_vram_gb": 2.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi3_v", "hf_downloads": 64160, "hf_likes": 28, "release_date": "2024-10-08", "_discovered": true }, { "name": "lmstudio-community/Qwen3-14B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "4.2B", "parameters_raw": 4153891840, "min_ram_gb": 2.3, "recommended_ram_gb": 3.9, "min_vram_gb": 2.1, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 42084, "hf_likes": 1, "release_date": "2025-04-28", "_discovered": true }, { "name": "lmstudio-community/Qwen2.5-Coder-14B-Instruct-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "4.2B", "parameters_raw": 4154676224, "min_ram_gb": 2.3, "recommended_ram_gb": 3.9, "min_vram_gb": 2.1, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 82050, "hf_likes": 1, "release_date": "2024-11-11", "_discovered": true }, { "name": "Qwen/Qwen3-4B-SafeRL", "provider": "Alibaba", "parameter_count": "4.4B", "parameters_raw": 4411424256, "min_ram_gb": 2.5, "recommended_ram_gb": 4.1, "min_vram_gb": 2.3, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 53732, "hf_likes": 41, "release_date": "2025-09-30", "_discovered": true }, { "name": "Qwen/Qwen3-4B-Instruct-2507-FP8", "provider": "Alibaba", "parameter_count": "4.4B", "parameters_raw": 4411646016, "min_ram_gb": 2.5, "recommended_ram_gb": 4.1, "min_vram_gb": 2.3, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 507765, "hf_likes": 69, "release_date": "2025-08-06", "_discovered": true }, { "name": "Qwen/Qwen3-4B-FP8", "provider": "Alibaba", "parameter_count": "4.4B", "parameters_raw": 4411646016, "min_ram_gb": 2.5, "recommended_ram_gb": 4.1, "min_vram_gb": 2.3, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 250469, "hf_likes": 38, "release_date": "2025-04-28", "_discovered": true }, { "name": "nvidia/Nemotron-H-4B-Base-8K", "provider": "nvidia", "parameter_count": "4.5B", "parameters_raw": 4489223040, "min_ram_gb": 2.5, "recommended_ram_gb": 4.2, "min_vram_gb": 2.3, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 40602, "hf_likes": 5, "release_date": "2025-03-20", "_discovered": true }, { "name": "nvidia/Nemotron-H-4B-Instruct-128K", "provider": "nvidia", "parameter_count": "4.5B", "parameters_raw": 4489223040, "min_ram_gb": 2.5, "recommended_ram_gb": 4.2, "min_vram_gb": 2.3, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 38647, "hf_likes": 8, "release_date": "2025-04-15", "_discovered": true }, { "name": "stelterlab/Qwen3-Coder-30B-A3B-Instruct-AWQ", "provider": "stelterlab", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 10.9, "recommended_ram_gb": 21.8, "min_vram_gb": 18.2, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 63349, "hf_likes": 4, "release_date": "2025-07-31", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3300000000, "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen3.5-4B", "provider": "Alibaba", "parameter_count": "4.7B", "parameters_raw": 4659865088, "min_ram_gb": 2.6, "recommended_ram_gb": 4.3, "min_vram_gb": 2.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 99087, "hf_likes": 202, "release_date": "2026-02-27", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-4B-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3.5-4B-Base", "provider": "Alibaba", "parameter_count": "4.7B", "parameters_raw": 4659865088, "min_ram_gb": 2.6, "recommended_ram_gb": 4.3, "min_vram_gb": 2.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 3593, "hf_likes": 38, "release_date": "2026-02-27" }, { "name": "nvidia/Qwen3-8B-NVFP4", "provider": "nvidia", "parameter_count": "4.7B", "parameters_raw": 4717851648, "min_ram_gb": 2.6, "recommended_ram_gb": 4.4, "min_vram_gb": 2.4, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 32743, "hf_likes": 14, "release_date": "2025-09-09", "_discovered": true }, { "name": "speakleash/Bielik-4.5B-v3.0-Instruct", "provider": "speakleash", "parameter_count": "4.8B", "parameters_raw": 4757260288, "min_ram_gb": 2.7, "recommended_ram_gb": 4.4, "min_vram_gb": 2.4, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 43008, "hf_likes": 27, "release_date": "2025-04-18", "_discovered": true }, { "name": "XLabs-AI/xflux_text_encoders", "provider": "xlabs-ai", "parameter_count": "4.8B", "parameters_raw": 4762310656, "min_ram_gb": 2.7, "recommended_ram_gb": 4.4, "min_vram_gb": 2.4, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "t5", "hf_downloads": 162123, "hf_likes": 21, "release_date": "2024-08-11", "_discovered": true }, { "name": "stelterlab/NVIDIA-Nemotron-3-Nano-30B-A3B-AWQ", "provider": "stelterlab", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 10.9, "recommended_ram_gb": 21.8, "min_vram_gb": 18.2, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 38947, "hf_likes": 4, "release_date": "2026-01-31", "_discovered": true, "format": "awq", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3300000000 }, { "name": "lmstudio-community/Qwen3-32B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "5.1B", "parameters_raw": 5119652864, "min_ram_gb": 2.9, "recommended_ram_gb": 4.8, "min_vram_gb": 2.6, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 26287, "hf_likes": 4, "release_date": "2025-04-28", "_discovered": true }, { "name": "lmstudio-community/Qwen2.5-Coder-32B-Instruct-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "5.1B", "parameters_raw": 5120300032, "min_ram_gb": 2.9, "recommended_ram_gb": 4.8, "min_vram_gb": 2.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 44413, "hf_likes": 6, "release_date": "2024-11-11", "_discovered": true }, { "name": "lmstudio-community/QwQ-32B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "5.1B", "parameters_raw": 5120300032, "min_ram_gb": 2.9, "recommended_ram_gb": 4.8, "min_vram_gb": 2.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 32595, "hf_likes": 0, "release_date": "2025-03-05", "_discovered": true }, { "name": "cyankiwi/Qwen3-Coder-30B-A3B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 3.0, "recommended_ram_gb": 4.9, "min_vram_gb": 2.7, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 135548, "hf_likes": 40, "release_date": "2025-08-01", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-30B-A3B-Instruct-2507-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 3.0, "recommended_ram_gb": 4.9, "min_vram_gb": 2.7, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 85989, "hf_likes": 30, "release_date": "2025-07-29", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/MiroThinker-v1.5-30B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 3.0, "recommended_ram_gb": 4.9, "min_vram_gb": 2.7, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 20465, "hf_likes": 3, "release_date": "2026-01-06", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 580405768, "_discovered": true, "format": "awq" }, { "name": "01-ai/Yi-6B-Chat", "provider": "01.ai", "parameter_count": "6.1B", "parameters_raw": 6061035520, "min_ram_gb": 3.4, "recommended_ram_gb": 5.6, "min_vram_gb": 3.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 15481, "hf_likes": 70, "release_date": "2023-11-22" }, { "name": "arcee-ai/Trinity-Nano-Preview", "provider": "arcee-ai", "parameter_count": "6.1B", "parameters_raw": 6120003328, "min_ram_gb": 3.4, "recommended_ram_gb": 5.7, "min_vram_gb": 3.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "afmoe", "hf_downloads": 22294, "hf_likes": 67, "release_date": "2025-12-01", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 669375358, "_discovered": true }, { "name": "cyankiwi/GLM-4.7-Flash-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "6.4B", "parameters_raw": 6407095318, "min_ram_gb": 3.6, "recommended_ram_gb": 6.0, "min_vram_gb": 3.3, "quantization": "AWQ-4bit", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe_lite", "hf_downloads": 217691, "hf_likes": 46, "release_date": "2026-01-19", "_discovered": true, "format": "awq" }, { "name": "lmsys/vicuna-7b-v1.5", "provider": "LMSYS", "parameter_count": "7.0B", "parameters_raw": 6738415616, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.4, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "tartuNLP/Llammas-base-p1-GPT-4o-human-error-mix-paragraph-GEC", "provider": "tartunlp", "parameter_count": "6.7B", "parameters_raw": 6738415616, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 36045, "hf_likes": 0, "release_date": "2025-02-11", "_discovered": true }, { "name": "meta-llama/Llama-2-7b-hf", "provider": "Meta", "parameter_count": "6.7B", "parameters_raw": 6738417664, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 617643, "hf_likes": 2272, "release_date": "2023-07-13", "_discovered": true }, { "name": "huggyllama/llama-7b", "provider": "huggyllama", "parameter_count": "6.7B", "parameters_raw": 6738417664, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 103505, "hf_likes": 354, "release_date": "2023-04-03", "_discovered": true }, { "name": "NousResearch/Llama-2-7b-hf", "provider": "NousResearch", "parameter_count": "6.7B", "parameters_raw": 6738417664, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 81336, "hf_likes": 171, "release_date": "2023-07-18", "_discovered": true }, { "name": "NousResearch/Llama-2-7b-chat-hf", "provider": "NousResearch", "parameter_count": "6.7B", "parameters_raw": 6738417664, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 20573, "hf_likes": 194, "release_date": "2023-07-18", "_discovered": true }, { "name": "meta-llama/CodeLlama-7b-Instruct-hf", "provider": "Meta", "parameter_count": "6.7B", "parameters_raw": 6738546688, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 5404, "hf_likes": 59, "release_date": "2024-03-13" }, { "name": "codellama/CodeLlama-7b-Instruct-hf", "provider": "codellama", "parameter_count": "6.7B", "parameters_raw": 6738546688, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 65896, "hf_likes": 254, "release_date": "2023-08-24", "_discovered": true }, { "name": "codellama/CodeLlama-7b-hf", "provider": "codellama", "parameter_count": "6.7B", "parameters_raw": 6738546688, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 54518, "hf_likes": 375, "release_date": "2023-08-24", "_discovered": true }, { "name": "deepseek-ai/deepseek-coder-6.7b-instruct", "provider": "DeepSeek", "parameter_count": "6.7B", "parameters_raw": 6740512768, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 97176, "hf_likes": 478, "release_date": "2023-10-29", "_discovered": true }, { "name": "deepseek-ai/DeepSeek-V4-Flash", "provider": "deepseek-ai", "parameter_count": "284B", "parameters_raw": 284000000000, "active_parameters": 13000000000, "is_moe": true, "min_ram_gb": 200.0, "recommended_ram_gb": 320.0, "min_vram_gb": 156.0, "quantization": "FP4-MoE-Mixed", "context_length": 1000000, "use_case": "General-purpose reasoning, long-context", "capabilities": [ "long_context", "reasoning", "moe" ], "pipeline_tag": "text-generation", "architecture": "deepseek_v4_moe", "hf_downloads": 3542202, "hf_likes": 0, "release_date": "2026-05-15" }, { "name": "deepseek-ai/DeepSeek-V4-Flash-Base", "provider": "deepseek-ai", "parameter_count": "284B", "parameters_raw": 284000000000, "active_parameters": 13000000000, "is_moe": true, "min_ram_gb": 290.0, "recommended_ram_gb": 460.0, "min_vram_gb": 284.0, "quantization": "FP8-Mixed", "context_length": 1000000, "use_case": "Base pretrained \u2014 fine-tuning starting point", "capabilities": [ "long_context", "moe" ], "pipeline_tag": "text-generation", "architecture": "deepseek_v4_moe", "hf_downloads": 0, "hf_likes": 0, "release_date": "2026-05-15" }, { "name": "deepseek-ai/DeepSeek-V4-Pro", "provider": "deepseek-ai", "parameter_count": "1.6T", "parameters_raw": 1600000000000, "active_parameters": 49000000000, "is_moe": true, "min_ram_gb": 1100.0, "recommended_ram_gb": 1800.0, "min_vram_gb": 880.0, "quantization": "FP4-MoE-Mixed", "context_length": 1000000, "use_case": "Flagship reasoning, long-context", "capabilities": [ "long_context", "reasoning", "moe" ], "pipeline_tag": "text-generation", "architecture": "deepseek_v4_moe", "hf_downloads": 0, "hf_likes": 0, "release_date": "2026-05-15" }, { "name": "deepseek-ai/DeepSeek-V4-Pro-Base", "provider": "deepseek-ai", "parameter_count": "1.6T", "parameters_raw": 1600000000000, "active_parameters": 49000000000, "is_moe": true, "min_ram_gb": 1700.0, "recommended_ram_gb": 2600.0, "min_vram_gb": 1600.0, "quantization": "FP8-Mixed", "context_length": 1000000, "use_case": "Base pretrained \u2014 fine-tuning starting point", "capabilities": [ "long_context", "moe" ], "pipeline_tag": "text-generation", "architecture": "deepseek_v4_moe", "hf_downloads": 0, "hf_likes": 0, "release_date": "2026-05-15" }, { "name": "deepseek-ai/deepseek-coder-6.7b-base", "provider": "DeepSeek", "parameter_count": "6.7B", "parameters_raw": 6740512768, "min_ram_gb": 3.8, "recommended_ram_gb": 6.3, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 28134, "hf_likes": 122, "release_date": "2023-10-23", "_discovered": true }, { "name": "allenai/OLMoE-1B-7B-0125", "provider": "allenai", "parameter_count": "6.9B", "parameters_raw": 6919161856, "min_ram_gb": 3.9, "recommended_ram_gb": 6.4, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmoe", "hf_downloads": 42434, "hf_likes": 35, "release_date": "2025-01-21", "is_moe": true, "num_experts": 64, "active_experts": 8, "active_parameters": 1167608556, "_discovered": true }, { "name": "allenai/OLMoE-1B-7B-0125-Instruct", "provider": "allenai", "parameter_count": "6.9B", "parameters_raw": 6919161856, "min_ram_gb": 3.9, "recommended_ram_gb": 6.4, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmoe", "hf_downloads": 35624, "hf_likes": 58, "release_date": "2025-01-27", "is_moe": true, "num_experts": 64, "active_experts": 8, "active_parameters": 1167608556, "_discovered": true }, { "name": "EleutherAI/pythia-6.9b", "provider": "eleutherai", "parameter_count": "7.0B", "parameters_raw": 6991520256, "min_ram_gb": 3.9, "recommended_ram_gb": 6.5, "min_vram_gb": 3.6, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 20516, "hf_likes": 59, "release_date": "2023-02-14", "_discovered": true }, { "name": "openchat/openchat-3.5-0106", "provider": "OpenChat", "parameter_count": "7.0B", "parameters_raw": 7000000000, "min_ram_gb": 3.9, "recommended_ram_gb": 6.5, "min_vram_gb": 3.6, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "XiaomiMiMo/MiMo-7B-RL", "provider": "Xiaomi", "parameter_count": "7.0B", "parameters_raw": 7000000000, "min_ram_gb": 3.9, "recommended_ram_gb": 6.5, "min_vram_gb": 3.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Advanced reasoning, math and code", "pipeline_tag": "text-generation", "architecture": "mimo", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-05-01" }, { "name": "microsoft/Orca-2-7b", "provider": "Microsoft", "parameter_count": "7.0B", "parameters_raw": 7016400896, "min_ram_gb": 3.9, "recommended_ram_gb": 6.5, "min_vram_gb": 3.6, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Reasoning, step-by-step solutions", "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "omni-research/Tarsier-7b", "provider": "omni-research", "parameter_count": "7.1B", "parameters_raw": 7063427072, "min_ram_gb": 3.9, "recommended_ram_gb": 6.6, "min_vram_gb": 3.6, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llava", "hf_downloads": 49581, "hf_likes": 25, "release_date": "2024-07-04", "_discovered": true }, { "name": "bigcode/starcoder2-7b", "provider": "BigCode", "parameter_count": "7.2B", "parameters_raw": 7173923840, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "starcoder2", "hf_downloads": 19199, "hf_likes": 208, "release_date": "2024-02-20" }, { "name": "tiiuae/falcon-7b-instruct", "provider": "TII", "parameter_count": "7.2B", "parameters_raw": 7217189760, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "falcon", "hf_downloads": 47656, "hf_likes": 1031, "release_date": "2023-04-25" }, { "name": "HuggingFaceH4/zephyr-7b-beta", "provider": "HuggingFace", "parameter_count": "7.2B", "parameters_raw": 7241732096, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 107437, "hf_likes": 1834, "release_date": "2023-10-26" }, { "name": "mistralai/Mistral-7B-Instruct-v0.2", "provider": "Mistral AI", "parameter_count": "7.2B", "parameters_raw": 7241732096, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 2920309, "hf_likes": 3088, "release_date": "2023-12-11", "_discovered": true }, { "name": "speakleash/Bielik-7B-Instruct-v0.1", "provider": "speakleash", "parameter_count": "7.2B", "parameters_raw": 7241732096, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 101914, "hf_likes": 63, "release_date": "2024-03-30", "_discovered": true }, { "name": "prometheus-eval/prometheus-7b-v2.0", "provider": "prometheus-eval", "parameter_count": "7.2B", "parameters_raw": 7241732096, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 54661, "hf_likes": 100, "release_date": "2024-02-13", "_discovered": true }, { "name": "Salesforce/xLAM-7b-r", "provider": "salesforce", "parameter_count": "7.2B", "parameters_raw": 7241732096, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 38045, "hf_likes": 32, "release_date": "2024-08-28", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/xLAM-7b-r-GGUF", "provider": "bartowski" } ] }, { "name": "Intel/neural-chat-7b-v3-3", "provider": "intel", "parameter_count": "7.2B", "parameters_raw": 7241732096, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 27068, "hf_likes": 80, "release_date": "2023-12-09", "_discovered": true }, { "name": "Featherless-Chat-Models/Mistral-7B-Instruct-v0.2", "provider": "featherless-chat-models", "parameter_count": "7.2B", "parameters_raw": 7241732096, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 26186, "hf_likes": 0, "release_date": "2025-05-08", "_discovered": true }, { "name": "augmxnt/shisa-gamma-7b-v1", "provider": "augmxnt", "parameter_count": "7.2B", "parameters_raw": 7241732096, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 20213, "hf_likes": 18, "release_date": "2023-12-23", "_discovered": true }, { "name": "dphn/dolphin-2.6-mistral-7b", "provider": "dphn", "parameter_count": "7.2B", "parameters_raw": 7241740288, "min_ram_gb": 4.0, "recommended_ram_gb": 6.7, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 60305, "hf_likes": 105, "release_date": "2023-12-27", "_discovered": true }, { "name": "mistralai/Mistral-7B-Instruct-v0.3", "provider": "Mistral AI", "parameter_count": "7.2B", "parameters_raw": 7248023552, "min_ram_gb": 4.1, "recommended_ram_gb": 6.8, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "unknown", "architecture": "mistral", "hf_downloads": 1540743, "hf_likes": 2447, "release_date": "2024-05-22", "gguf_sources": [ { "repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "provider": "bartowski" } ] }, { "name": "allenai/wildguard", "provider": "allenai", "parameter_count": "7.2B", "parameters_raw": 7248031744, "min_ram_gb": 4.1, "recommended_ram_gb": 6.8, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 23686, "hf_likes": 38, "release_date": "2024-06-15", "_discovered": true }, { "name": "dphn/dolphin-2.9.3-mistral-7B-32k", "provider": "dphn", "parameter_count": "7.2B", "parameters_raw": 7248039936, "min_ram_gb": 4.1, "recommended_ram_gb": 6.8, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 79357, "hf_likes": 57, "release_date": "2024-06-25", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/dolphin-2.9.3-mistral-7B-32k-GGUF", "provider": "bartowski" } ] }, { "name": "thesven/Mistral-7B-Instruct-v0.3-GPTQ", "provider": "thesven", "parameter_count": "7.2B", "parameters_raw": 7249399808, "min_ram_gb": 4.1, "recommended_ram_gb": 6.8, "min_vram_gb": 3.7, "quantization": "GPTQ-Int4", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 35763, "hf_likes": 1, "release_date": "2024-05-22", "_discovered": true, "format": "gptq" }, { "name": "allenai/Olmo-3-7B-Instruct-SFT", "provider": "allenai", "parameter_count": "7.3B", "parameters_raw": 7298011136, "min_ram_gb": 4.1, "recommended_ram_gb": 6.8, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 134834, "hf_likes": 4, "release_date": "2025-11-17", "_discovered": true }, { "name": "allenai/Olmo-3-1025-7B", "provider": "allenai", "parameter_count": "7.3B", "parameters_raw": 7298011136, "min_ram_gb": 4.1, "recommended_ram_gb": 6.8, "min_vram_gb": 3.7, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 71128, "hf_likes": 54, "release_date": "2025-09-12", "_discovered": true }, { "name": "TechxGenus/starcoder2-7b-GPTQ", "provider": "techxgenus", "parameter_count": "7.4B", "parameters_raw": 7400416256, "min_ram_gb": 4.1, "recommended_ram_gb": 6.9, "min_vram_gb": 3.8, "quantization": "GPTQ-Int4", "context_length": 16384, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "starcoder2", "hf_downloads": 36955, "hf_likes": 2, "release_date": "2024-03-22", "_discovered": true, "format": "gptq" }, { "name": "tiiuae/Falcon3-7B-Instruct", "provider": "TII", "parameter_count": "7.5B", "parameters_raw": 7455550464, "min_ram_gb": 4.2, "recommended_ram_gb": 6.9, "min_vram_gb": 3.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 18394, "hf_likes": 76, "release_date": "2024-11-29", "gguf_sources": [ { "repo": "bartowski/Falcon3-7B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-7B-Instruct", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 20736120, "hf_likes": 1108, "release_date": "2024-09-16", "gguf_sources": [ { "repo": "bartowski/Qwen2.5-7B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-Coder-7B-Instruct", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1575000, "hf_likes": 659, "release_date": "2024-09-17", "gguf_sources": [ { "repo": "unsloth/Qwen2.5-Coder-7B-Instruct-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Qwen2.5-Coder-7B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "provider": "DeepSeek", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 743941, "hf_likes": 797, "release_date": "2025-01-20", "gguf_sources": [ { "repo": "unsloth/DeepSeek-R1-Distill-Qwen-7B-GGUF", "provider": "unsloth" }, { "repo": "bartowski/DeepSeek-R1-Distill-Qwen-7B-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-7B", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 2029944, "hf_likes": 266, "release_date": "2024-09-15", "_discovered": true }, { "name": "Qwen/Qwen2.5-Coder-7B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1107387, "hf_likes": 19, "release_date": "2024-09-20", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2.5-Coder-7B-Instruct-GPTQ-Int4", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "GPTQ-Int4", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1066717, "hf_likes": 13, "release_date": "2024-09-20", "_discovered": true, "format": "gptq" }, { "name": "Qwen/Qwen2.5-Math-7B-Instruct", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 318106, "hf_likes": 89, "release_date": "2024-09-19", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-Math-7B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2-7B-Instruct", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 310355, "hf_likes": 683, "release_date": "2024-06-04", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2-7B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-Coder-7B", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 240132, "hf_likes": 137, "release_date": "2024-09-16", "_discovered": true }, { "name": "Qwen/Qwen2.5-7B-Instruct-GPTQ-Int4", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "GPTQ-Int4", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 158122, "hf_likes": 29, "release_date": "2024-09-17", "_discovered": true, "format": "gptq" }, { "name": "Dream-org/Dream-v0-Instruct-7B", "provider": "dream-org", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "Dream", "hf_downloads": 73949, "hf_likes": 154, "release_date": "2025-04-03", "_discovered": true }, { "name": "Qwen/Qwen2-7B", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 70734, "hf_likes": 170, "release_date": "2024-06-04", "_discovered": true }, { "name": "Qwen/Qwen2.5-Math-7B", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 68238, "hf_likes": 106, "release_date": "2024-09-16", "_discovered": true }, { "name": "DeepHat/DeepHat-V1-7B", "provider": "deephat", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 63374, "hf_likes": 111, "release_date": "2025-04-25", "_discovered": true }, { "name": "Qwen/Qwen2.5-7B-Instruct-1M", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 1010000, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 46699, "hf_likes": 366, "release_date": "2025-01-23", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-7B-Instruct-1M-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-7B-Instruct-GPTQ-Int8", "provider": "Alibaba", "parameter_count": "7.6B", "parameters_raw": 7615616512, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "GPTQ-Int8", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 30708, "hf_likes": 18, "release_date": "2024-09-17", "_discovered": true, "format": "gptq" }, { "name": "microsoft/Phi-mini-MoE-instruct", "provider": "Microsoft", "parameter_count": "7.6B", "parameters_raw": 7647632704, "min_ram_gb": 4.3, "recommended_ram_gb": 7.1, "min_vram_gb": 3.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phimoe", "hf_downloads": 69775, "hf_likes": 30, "release_date": "2025-06-23", "is_moe": true, "num_experts": 16, "active_experts": 2, "active_parameters": 1290538017, "_discovered": true }, { "name": "Qwen/Qwen-7B-Chat", "provider": "Alibaba", "parameter_count": "7.7B", "parameters_raw": 7721324544, "min_ram_gb": 4.3, "recommended_ram_gb": 7.2, "min_vram_gb": 4.0, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen", "hf_downloads": 195550, "hf_likes": 787, "release_date": "2023-08-03", "_discovered": true }, { "name": "Qwen/Qwen-7B", "provider": "Alibaba", "parameter_count": "7.7B", "parameters_raw": 7721324544, "min_ram_gb": 4.3, "recommended_ram_gb": 7.2, "min_vram_gb": 4.0, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen", "hf_downloads": 189346, "hf_likes": 396, "release_date": "2023-08-03", "_discovered": true }, { "name": "Qwen/Qwen1.5-7B", "provider": "Alibaba", "parameter_count": "7.7B", "parameters_raw": 7721324544, "min_ram_gb": 4.3, "recommended_ram_gb": 7.2, "min_vram_gb": 4.0, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 75458, "hf_likes": 56, "release_date": "2024-01-22", "_discovered": true }, { "name": "BSC-LT/salamandra-7b-instruct", "provider": "bsc-lt", "parameter_count": "7.8B", "parameters_raw": 7768117248, "min_ram_gb": 4.3, "recommended_ram_gb": 7.2, "min_vram_gb": 4.0, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 31017, "hf_likes": 75, "release_date": "2024-09-30", "_discovered": true }, { "name": "kmhf/hf-moshiko", "provider": "kmhf", "parameter_count": "7.8B", "parameters_raw": 7783880545, "min_ram_gb": 4.3, "recommended_ram_gb": 7.2, "min_vram_gb": 4.0, "quantization": "Q4_K_M", "context_length": 3000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "moshi", "hf_downloads": 123900, "hf_likes": 0, "release_date": "2024-09-27", "_discovered": true }, { "name": "XiaomiMiMo/MiMo-7B-Base", "provider": "xiaomimimo", "parameter_count": "7.8B", "parameters_raw": 7833409536, "min_ram_gb": 4.4, "recommended_ram_gb": 7.3, "min_vram_gb": 4.0, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mimo", "hf_downloads": 93937, "hf_likes": 124, "release_date": "2025-04-29", "_discovered": true }, { "name": "google/gemma-3n-E4B-it", "provider": "Google", "parameter_count": "8B", "parameters_raw": 8000000000, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Multimodal, on-device (effective 4B)", "pipeline_tag": "image-text-to-text", "architecture": "gemma3n", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-06-25", "gguf_sources": [ { "repo": "unsloth/gemma-3n-E4B-it-GGUF", "provider": "unsloth" } ] }, { "name": "mistralai/Ministral-8B-Instruct-2410", "provider": "Mistral AI", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "bartowski/Ministral-8B-Instruct-2410-GGUF", "provider": "bartowski" } ] }, { "name": "meta-llama/Meta-Llama-3-8B", "provider": "Meta", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 2463959, "hf_likes": 6473, "release_date": "2024-04-17", "_discovered": true }, { "name": "meta-llama/Meta-Llama-3-8B-Instruct", "provider": "Meta", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 1353966, "hf_likes": 4391, "release_date": "2024-04-17", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Meta-Llama-3-8B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "NousResearch/Hermes-3-Llama-3.1-8B", "provider": "NousResearch", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 635984, "hf_likes": 391, "release_date": "2024-07-28", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Hermes-3-Llama-3.1-8B-GGUF", "provider": "bartowski" } ] }, { "name": "IlyaGusev/saiga_llama3_8b", "provider": "ilyagusev", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 399621, "hf_likes": 137, "release_date": "2024-04-18", "_discovered": true }, { "name": "NousResearch/Meta-Llama-3.1-8B-Instruct", "provider": "NousResearch", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 207258, "hf_likes": 39, "release_date": "2024-07-24", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "meta-llama/Llama-Guard-3-8B", "provider": "Meta", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 163719, "hf_likes": 272, "release_date": "2024-07-22", "_discovered": true }, { "name": "nvidia/Llama-3.1-8B-Instruct-FP8", "provider": "nvidia", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 93876, "hf_likes": 32, "release_date": "2024-08-29", "_discovered": true }, { "name": "PatronusAI/Llama-3-Patronus-Lynx-8B-Instruct-v1.1", "provider": "patronusai", "parameter_count": "8.0B", "parameters_raw": 8030261248, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 20626, "hf_likes": 10, "release_date": "2024-07-24", "_discovered": true }, { "name": "RedHatAI/Meta-Llama-3.1-8B-Instruct-FP8", "provider": "redhatai", "parameter_count": "8.0B", "parameters_raw": 8030261696, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 684729, "hf_likes": 44, "release_date": "2024-07-23", "_discovered": true }, { "name": "RedHatAI/Meta-Llama-3.1-8B-FP8", "provider": "redhatai", "parameter_count": "8.0B", "parameters_raw": 8030261696, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 200501, "hf_likes": 10, "release_date": "2024-07-31", "_discovered": true }, { "name": "fdtn-ai/Foundation-Sec-1.1-8B-Instruct", "provider": "fdtn-ai", "parameter_count": "8.0B", "parameters_raw": 8030326784, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 53389, "hf_likes": 13, "release_date": "2025-11-18", "_discovered": true }, { "name": "lmms-lab/llava-onevision-qwen2-7b-ov", "provider": "lmms-lab", "parameter_count": "8.0B", "parameters_raw": 8030348832, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "vision" ], "pipeline_tag": "text-generation", "architecture": "llava", "hf_downloads": 133340, "hf_likes": 62, "release_date": "2024-06-29", "_discovered": true }, { "name": "RedHatAI/Meta-Llama-3.1-8B-Instruct-quantized.w4a16", "provider": "redhatai", "parameter_count": "8.0B", "parameters_raw": 8031637504, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 36809, "hf_likes": 30, "release_date": "2024-07-26", "_discovered": true }, { "name": "hugging-quants/Meta-Llama-3.1-8B-Instruct-GPTQ-INT4", "provider": "hugging-quants", "parameter_count": "8.0B", "parameters_raw": 8031637504, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "GPTQ-Int4", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 27054, "hf_likes": 41, "release_date": "2024-07-24", "_discovered": true, "format": "gptq" }, { "name": "RedHatAI/Meta-Llama-3.1-8B-Instruct-FP8-dynamic", "provider": "redhatai", "parameter_count": "8.0B", "parameters_raw": 8031637504, "min_ram_gb": 4.5, "recommended_ram_gb": 7.5, "min_vram_gb": 4.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 21204, "hf_likes": 9, "release_date": "2024-07-23", "_discovered": true }, { "name": "ibm-granite/granite-3.3-8b-instruct", "provider": "ibm-granite", "parameter_count": "8.2B", "parameters_raw": 8170864640, "min_ram_gb": 4.6, "recommended_ram_gb": 7.6, "min_vram_gb": 4.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granite", "hf_downloads": 65699, "hf_likes": 153, "release_date": "2025-04-09", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/granite-3.3-8b-instruct-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3-8B-Base", "provider": "Alibaba", "parameter_count": "8.2B", "parameters_raw": 8190735360, "min_ram_gb": 4.6, "recommended_ram_gb": 7.6, "min_vram_gb": 4.2, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 790734, "hf_likes": 87, "release_date": "2025-04-28", "_discovered": true }, { "name": "Qwen/Qwen3-8B-AWQ", "provider": "Alibaba", "parameter_count": "8.2B", "parameters_raw": 8190735360, "min_ram_gb": 4.6, "recommended_ram_gb": 7.6, "min_vram_gb": 4.2, "quantization": "AWQ-4bit", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 327827, "hf_likes": 37, "release_date": "2025-05-03", "_discovered": true, "format": "awq" }, { "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", "provider": "DeepSeek", "parameter_count": "8.2B", "parameters_raw": 8190735360, "min_ram_gb": 4.6, "recommended_ram_gb": 7.6, "min_vram_gb": 4.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 148562, "hf_likes": 1040, "release_date": "2025-05-29", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF", "provider": "unsloth" } ] }, { "name": "huihui-ai/Huihui-Qwen3-8B-abliterated-v2", "provider": "huihui-ai", "parameter_count": "8.2B", "parameters_raw": 8190735360, "min_ram_gb": 4.6, "recommended_ram_gb": 7.6, "min_vram_gb": 4.2, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 32025, "hf_likes": 34, "release_date": "2025-06-18", "_discovered": true }, { "name": "Qwen/Qwen3-8B-FP8", "provider": "Alibaba", "parameter_count": "8.2B", "parameters_raw": 8191159296, "min_ram_gb": 4.6, "recommended_ram_gb": 7.6, "min_vram_gb": 4.2, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 196191, "hf_likes": 57, "release_date": "2025-04-28", "_discovered": true }, { "name": "nytopop/Qwen3-8B.w8a8", "provider": "nytopop", "parameter_count": "8.2B", "parameters_raw": 8192136192, "min_ram_gb": 4.6, "recommended_ram_gb": 7.6, "min_vram_gb": 4.2, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 33985, "hf_likes": 1, "release_date": "2025-04-29", "_discovered": true }, { "name": "Qwen/Qwen2.5-VL-7B-Instruct", "provider": "Alibaba", "parameter_count": "8.3B", "parameters_raw": 8292166656, "min_ram_gb": 4.6, "recommended_ram_gb": 7.7, "min_vram_gb": 4.2, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Instruction following, chat", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen2_5_vl", "hf_downloads": 4008802, "hf_likes": 1462, "release_date": "2025-01-26", "gguf_sources": [ { "repo": "unsloth/Qwen2.5-VL-7B-Instruct-GGUF", "provider": "unsloth" } ] }, { "name": "LiquidAI/LFM2-8B-A1B", "provider": "liquidai", "parameter_count": "8.3B", "parameters_raw": 8339929856, "min_ram_gb": 4.7, "recommended_ram_gb": 7.8, "min_vram_gb": 4.3, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 47242, "hf_likes": 328, "release_date": "2025-10-07", "is_moe": true, "num_experts": 32, "active_experts": 4, "active_parameters": 1407363160, "_discovered": true, "gguf_sources": [ { "repo": "unsloth/LFM2-8B-A1B-GGUF", "provider": "unsloth" } ] }, { "name": "nvidia/Mistral-NeMo-Minitron-8B-Instruct", "provider": "nvidia", "parameter_count": "8.4B", "parameters_raw": 8414105600, "min_ram_gb": 4.7, "recommended_ram_gb": 7.8, "min_vram_gb": 4.3, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 55809, "hf_likes": 82, "release_date": "2024-10-02", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Mistral-NeMo-Minitron-8B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "01-ai/Yi-1.5-9B-Chat", "provider": "01.ai", "parameter_count": "8.8B", "parameters_raw": 8829407232, "min_ram_gb": 4.9, "recommended_ram_gb": 8.2, "min_vram_gb": 4.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 19975, "hf_likes": 148, "release_date": "2024-05-10", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Yi-1.5-9B-Chat-GGUF", "provider": "bartowski" } ] }, { "name": "nvidia/NVIDIA-Nemotron-Nano-9B-v2-Base", "provider": "nvidia", "parameter_count": "8.9B", "parameters_raw": 8888227328, "min_ram_gb": 5.0, "recommended_ram_gb": 8.3, "min_vram_gb": 4.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 165722, "hf_likes": 43, "release_date": "2025-08-14", "_discovered": true }, { "name": "nvidia/NVIDIA-Nemotron-Nano-9B-v2-Japanese", "provider": "nvidia", "parameter_count": "8.9B", "parameters_raw": 8888227328, "min_ram_gb": 5.0, "recommended_ram_gb": 8.3, "min_vram_gb": 4.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron_h", "hf_downloads": 24028, "hf_likes": 121, "release_date": "2026-02-04", "_discovered": true }, { "name": "nvidia/NVIDIA-Nemotron-Nano-9B-v2-FP8", "provider": "nvidia", "parameter_count": "8.9B", "parameters_raw": 8888227432, "min_ram_gb": 5.0, "recommended_ram_gb": 8.3, "min_vram_gb": 4.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron_h", "hf_downloads": 70791, "hf_likes": 7, "release_date": "2025-09-22", "_discovered": true }, { "name": "nvidia/NVIDIA-Nemotron-Nano-9B-v2", "provider": "NVIDIA", "parameter_count": "9B", "parameters_raw": 9000000000, "min_ram_gb": 5.0, "recommended_ram_gb": 8.4, "min_vram_gb": 4.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Hybrid Mamba2, reasoning", "pipeline_tag": "text-generation", "architecture": "nemotron", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-06-01" }, { "name": "lmstudio-community/Qwen3-32B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "9.2B", "parameters_raw": 9214833664, "min_ram_gb": 5.1, "recommended_ram_gb": 8.6, "min_vram_gb": 4.7, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 24718, "hf_likes": 2, "release_date": "2025-04-28", "_discovered": true }, { "name": "lmstudio-community/Qwen2.5-Coder-32B-Instruct-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "9.2B", "parameters_raw": 9215644672, "min_ram_gb": 5.1, "recommended_ram_gb": 8.6, "min_vram_gb": 4.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 41754, "hf_likes": 3, "release_date": "2024-11-11", "_discovered": true }, { "name": "lmstudio-community/QwQ-32B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "9.2B", "parameters_raw": 9215644672, "min_ram_gb": 5.1, "recommended_ram_gb": 8.6, "min_vram_gb": 4.7, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 32269, "hf_likes": 0, "release_date": "2025-03-05", "_discovered": true }, { "name": "google/gemma-2-9b-it", "provider": "Google", "parameter_count": "9.2B", "parameters_raw": 9241705984, "min_ram_gb": 5.2, "recommended_ram_gb": 8.6, "min_vram_gb": 4.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma2", "hf_downloads": 180627, "hf_likes": 775, "release_date": "2024-06-24", "gguf_sources": [ { "repo": "bartowski/gemma-2-9b-it-GGUF", "provider": "bartowski" } ] }, { "name": "zai-org/glm-4-9b-chat-hf", "provider": "zai-org", "parameter_count": "9.4B", "parameters_raw": 9399951360, "min_ram_gb": 5.3, "recommended_ram_gb": 8.8, "min_vram_gb": 4.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm", "hf_downloads": 22553, "hf_likes": 24, "release_date": "2024-10-23", "_discovered": true }, { "name": "THUDM/glm-4-9b-chat", "provider": "thudm", "parameter_count": "9.4B", "parameters_raw": 9399951392, "min_ram_gb": 5.3, "recommended_ram_gb": 8.8, "min_vram_gb": 4.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "unknown", "architecture": "chatglm", "hf_downloads": 190092, "hf_likes": 702, "release_date": "2024-06-04", "gguf_sources": [ { "repo": "bartowski/glm-4-9b-chat-GGUF", "provider": "bartowski" } ] }, { "name": "zai-org/glm-4-9b", "provider": "zai-org", "parameter_count": "9.4B", "parameters_raw": 9399951392, "min_ram_gb": 5.3, "recommended_ram_gb": 8.8, "min_vram_gb": 4.8, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "chatglm", "hf_downloads": 23550, "hf_likes": 143, "release_date": "2024-06-04", "_discovered": true }, { "name": "Qwen/Qwen3.5-9B", "provider": "Alibaba", "parameter_count": "9.7B", "parameters_raw": 9653104368, "min_ram_gb": 5.4, "recommended_ram_gb": 9.0, "min_vram_gb": 4.9, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 172298, "hf_likes": 345, "release_date": "2026-02-27", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-9B-GGUF", "provider": "unsloth", "file": "Qwen3.5-9B-Q4_K_M.gguf" } ] }, { "name": "Qwen/Qwen3.5-9B-Base", "provider": "Alibaba", "parameter_count": "9.7B", "parameters_raw": 9653104368, "min_ram_gb": 5.4, "recommended_ram_gb": 9.0, "min_vram_gb": 4.9, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 5324, "hf_likes": 38, "release_date": "2026-02-26" }, { "name": "solidrust/gemma-2-9b-it-AWQ", "provider": "solidrust", "parameter_count": "10.2B", "parameters_raw": 10159209984, "min_ram_gb": 5.7, "recommended_ram_gb": 9.5, "min_vram_gb": 5.2, "quantization": "AWQ-4bit", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma2", "hf_downloads": 32664, "hf_likes": 2, "release_date": "2024-09-03", "_discovered": true, "format": "awq" }, { "name": "meta-llama/Llama-3.2-11B-Vision-Instruct", "provider": "Meta", "parameter_count": "11.0B", "parameters_raw": 10665463808, "min_ram_gb": 6.0, "recommended_ram_gb": 9.9, "min_vram_gb": 5.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Multimodal, vision and text", "pipeline_tag": "image-text-to-text", "architecture": "llama", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "upstage/SOLAR-10.7B-Instruct-v1.0", "provider": "Upstage", "parameter_count": "10.7B", "parameters_raw": 10700000000, "min_ram_gb": 6.0, "recommended_ram_gb": 10.0, "min_vram_gb": 5.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "High-performance instruction following", "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "naver-hyperclovax/HyperCLOVAX-SEED-Omni-8B", "provider": "naver-hyperclovax", "parameter_count": "10.7B", "parameters_raw": 10741664520, "min_ram_gb": 6.0, "recommended_ram_gb": 10.0, "min_vram_gb": 5.5, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "vlm", "hf_downloads": 102546, "hf_likes": 181, "release_date": "2025-12-23", "_discovered": true }, { "name": "speakleash/Bielik-11B-v3.0-Instruct", "provider": "speakleash", "parameter_count": "11.2B", "parameters_raw": 11168796672, "min_ram_gb": 6.2, "recommended_ram_gb": 10.4, "min_vram_gb": 5.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 232376, "hf_likes": 55, "release_date": "2025-11-07", "_discovered": true }, { "name": "cjvt/GaMS3-12B-Instruct", "provider": "cjvt", "parameter_count": "11.8B", "parameters_raw": 11766034176, "min_ram_gb": 6.6, "recommended_ram_gb": 11.0, "min_vram_gb": 6.0, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma3_text", "hf_downloads": 26653, "hf_likes": 1, "release_date": "2025-12-04", "_discovered": true }, { "name": "EleutherAI/pythia-12b", "provider": "eleutherai", "parameter_count": "12.0B", "parameters_raw": 11997067840, "min_ram_gb": 6.7, "recommended_ram_gb": 11.2, "min_vram_gb": 6.1, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_neox", "hf_downloads": 43453, "hf_likes": 144, "release_date": "2023-02-28", "_discovered": true }, { "name": "google/gemma-3-12b-it", "provider": "Google", "parameter_count": "12B", "parameters_raw": 12000000000, "min_ram_gb": 6.7, "recommended_ram_gb": 11.2, "min_vram_gb": 6.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Multimodal, vision and text", "pipeline_tag": "text-generation", "architecture": "gemma3", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "unsloth/gemma-3-12b-it-GGUF", "provider": "unsloth" } ] }, { "name": "mistralai/Mistral-Nemo-Instruct-2407", "provider": "Mistral AI", "parameter_count": "12.2B", "parameters_raw": 12247076864, "min_ram_gb": 6.8, "recommended_ram_gb": 11.4, "min_vram_gb": 6.3, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "unsloth/Mistral-Nemo-Instruct-2407-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Mistral-Nemo-Instruct-2407-GGUF", "provider": "bartowski" } ] }, { "name": "casperhansen/mistral-nemo-instruct-2407-awq", "provider": "casperhansen", "parameter_count": "12.2B", "parameters_raw": 12247782400, "min_ram_gb": 6.8, "recommended_ram_gb": 11.4, "min_vram_gb": 6.3, "quantization": "AWQ-4bit", "context_length": 1024000, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 189490, "hf_likes": 12, "release_date": "2024-07-23", "_discovered": true, "format": "awq" }, { "name": "m8than/Mistral-Nemo-Instruct-2407-lenient-chatfix", "provider": "m8than", "parameter_count": "12.2B", "parameters_raw": 12247782400, "min_ram_gb": 6.8, "recommended_ram_gb": 11.4, "min_vram_gb": 6.3, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 25879, "hf_likes": 0, "release_date": "2025-05-06", "_discovered": true }, { "name": "mixtao/MixTAO-7Bx2-MoE-v8.1", "provider": "mixtao", "parameter_count": "12.9B", "parameters_raw": 12879138816, "min_ram_gb": 7.2, "recommended_ram_gb": 12.0, "min_vram_gb": 6.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mixtral", "hf_downloads": 20213, "hf_likes": 55, "release_date": "2024-02-26", "is_moe": true, "num_experts": 2, "active_experts": 2, "active_parameters": 12879138816, "_discovered": true }, { "name": "microsoft/Orca-2-13b", "provider": "Microsoft", "parameter_count": "13.0B", "parameters_raw": 13015864320, "min_ram_gb": 7.3, "recommended_ram_gb": 12.1, "min_vram_gb": 6.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Reasoning, step-by-step solutions", "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "lmsys/vicuna-13b-v1.5", "provider": "LMSYS", "parameter_count": "13.0B", "parameters_raw": 13015864320, "min_ram_gb": 7.3, "recommended_ram_gb": 12.1, "min_vram_gb": 6.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "WizardLMTeam/WizardLM-13B-V1.2", "provider": "WizardLM", "parameter_count": "13.0B", "parameters_raw": 13015864320, "min_ram_gb": 7.3, "recommended_ram_gb": 12.1, "min_vram_gb": 6.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "cais/HarmBench-Llama-2-13b-cls", "provider": "cais", "parameter_count": "13.0B", "parameters_raw": 13015864320, "min_ram_gb": 7.3, "recommended_ram_gb": 12.1, "min_vram_gb": 6.7, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 30370, "hf_likes": 27, "release_date": "2024-02-03", "_discovered": true }, { "name": "meta-llama/CodeLlama-13b-Instruct-hf", "provider": "Meta", "parameter_count": "13.0B", "parameters_raw": 13016028160, "min_ram_gb": 7.3, "recommended_ram_gb": 12.1, "min_vram_gb": 6.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 6450, "hf_likes": 27, "release_date": "2024-03-13" }, { "name": "microsoft/phi-4", "provider": "Microsoft", "parameter_count": "14B", "parameters_raw": 14000000000, "min_ram_gb": 7.8, "recommended_ram_gb": 13.0, "min_vram_gb": 7.2, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Reasoning, STEM, code generation", "pipeline_tag": "text-generation", "architecture": "phi", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "unsloth/phi-4-GGUF", "provider": "unsloth" }, { "repo": "bartowski/phi-4-GGUF", "provider": "bartowski" } ] }, { "name": "microsoft/Phi-3-medium-14b-instruct", "provider": "Microsoft", "parameter_count": "14B", "parameters_raw": 14000000000, "min_ram_gb": 7.8, "recommended_ram_gb": 13.0, "min_vram_gb": 7.2, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Balanced performance and size", "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "microsoft/Phi-4-reasoning", "provider": "Microsoft", "parameter_count": "14B", "parameters_raw": 14000000000, "min_ram_gb": 7.8, "recommended_ram_gb": 13.0, "min_vram_gb": 7.2, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Advanced reasoning, math and code", "pipeline_tag": "text-generation", "architecture": "phi4", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-04-01", "gguf_sources": [ { "repo": "unsloth/Phi-4-reasoning-GGUF", "provider": "unsloth" } ] }, { "name": "microsoft/Phi-4-multimodal-instruct", "provider": "Microsoft", "parameter_count": "14B", "parameters_raw": 14000000000, "min_ram_gb": 7.8, "recommended_ram_gb": 13.0, "min_vram_gb": 7.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Multimodal, vision and audio", "pipeline_tag": "image-text-to-text", "architecture": "phi4", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-04-01" }, { "name": "Qwen/Qwen-14B-Chat-Int4", "provider": "Alibaba", "parameter_count": "14.2B", "parameters_raw": 14168796160, "min_ram_gb": 7.9, "recommended_ram_gb": 13.2, "min_vram_gb": 7.3, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen", "hf_downloads": 45732, "hf_likes": 100, "release_date": "2023-09-24", "_discovered": true }, { "name": "Qwen/Qwen1.5-MoE-A2.7B", "provider": "Alibaba", "parameter_count": "14.3B", "parameters_raw": 14315784192, "min_ram_gb": 8.0, "recommended_ram_gb": 13.3, "min_vram_gb": 7.3, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2_moe", "hf_downloads": 59931, "hf_likes": 220, "release_date": "2024-02-29", "is_moe": true, "num_experts": 60, "active_experts": 4, "active_parameters": 1622455541, "_discovered": true }, { "name": "bullpoint/Qwen3-Coder-Next-AWQ-4bit", "provider": "bullpoint", "parameter_count": "14.4B", "parameters_raw": 14444722944, "min_ram_gb": 8.1, "recommended_ram_gb": 13.5, "min_vram_gb": 7.4, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 1226868, "hf_likes": 14, "release_date": "2026-02-03", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 990253467, "_discovered": true, "format": "awq" }, { "name": "stelterlab/phi-4-AWQ", "provider": "stelterlab", "parameter_count": "14.7B", "parameters_raw": 14659507200, "min_ram_gb": 8.2, "recommended_ram_gb": 13.7, "min_vram_gb": 7.5, "quantization": "AWQ-4bit", "context_length": 16384, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "phi3", "hf_downloads": 55064, "hf_likes": 4, "release_date": "2025-01-11", "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-Next-80B-A3B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "80.0B", "parameters_raw": 80000000000, "min_ram_gb": 8.2, "recommended_ram_gb": 13.7, "min_vram_gb": 7.5, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 192744, "hf_likes": 61, "release_date": "2025-09-12", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-Next-80B-A3B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "80.0B", "parameters_raw": 80000000000, "min_ram_gb": 8.2, "recommended_ram_gb": 13.7, "min_vram_gb": 7.5, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 168561, "hf_likes": 22, "release_date": "2025-09-12", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen3-14B-AWQ", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14768307200, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "AWQ-4bit", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 258163, "hf_likes": 57, "release_date": "2025-05-01", "_discovered": true, "format": "awq" }, { "name": "OpenPipe/Qwen3-14B-Instruct", "provider": "openpipe", "parameter_count": "14.8B", "parameters_raw": 14768307200, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 207053, "hf_likes": 12, "release_date": "2025-10-10", "_discovered": true }, { "name": "Goekdeniz-Guelmez/Josiefied-Qwen3-14B-abliterated-v3", "provider": "goekdeniz-guelmez", "parameter_count": "14.8B", "parameters_raw": 14768307200, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 55059, "hf_likes": 24, "release_date": "2025-05-12", "_discovered": true }, { "name": "Qwen/Qwen3-14B-Base", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14768307200, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 50835, "hf_likes": 49, "release_date": "2025-04-28", "_discovered": true }, { "name": "Qwen/Qwen2.5-14B-Instruct", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770000000, "min_ram_gb": 8.2, "recommended_ram_gb": 13.7, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-14B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen3-14B", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770000000, "min_ram_gb": 8.2, "recommended_ram_gb": 13.7, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "unsloth/Qwen3-14B-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen2.5-Coder-14B-Instruct", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 491583, "hf_likes": 142, "release_date": "2024-11-06", "gguf_sources": [ { "repo": "unsloth/Qwen2.5-Coder-14B-Instruct-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Qwen2.5-Coder-14B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-14B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1077036, "hf_likes": 27, "release_date": "2024-09-17", "_discovered": true, "format": "awq" }, { "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "provider": "DeepSeek", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 761474, "hf_likes": 608, "release_date": "2025-01-20", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/DeepSeek-R1-Distill-Qwen-14B-GGUF", "provider": "unsloth" }, { "repo": "bartowski/DeepSeek-R1-Distill-Qwen-14B-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-Coder-14B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 168345, "hf_likes": 16, "release_date": "2024-11-09", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2.5-14B", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 100307, "hf_likes": 144, "release_date": "2024-09-15", "_discovered": true }, { "name": "Qwen/Qwen2.5-14B-Instruct-GPTQ-Int4", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "GPTQ-Int4", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 93325, "hf_likes": 26, "release_date": "2024-09-17", "_discovered": true, "format": "gptq" }, { "name": "Qwen/Qwen2.5-14B-Instruct-1M", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 1010000, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 54355, "hf_likes": 334, "release_date": "2025-01-23", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-14B-Instruct-1M-GGUF", "provider": "bartowski" } ] }, { "name": "OpenDFM/ChemDFM-R-14B", "provider": "opendfm", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 41195, "hf_likes": 6, "release_date": "2025-10-26", "_discovered": true }, { "name": "Qwen/Qwen2.5-14B-Instruct-GPTQ-Int8", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "GPTQ-Int8", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 37961, "hf_likes": 21, "release_date": "2024-09-17", "_discovered": true, "format": "gptq" }, { "name": "Qwen/Qwen2.5-Coder-14B", "provider": "Alibaba", "parameter_count": "14.8B", "parameters_raw": 14770033664, "min_ram_gb": 8.3, "recommended_ram_gb": 13.8, "min_vram_gb": 7.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 27181, "hf_likes": 66, "release_date": "2024-11-08", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-Coder-14B-GGUF", "provider": "bartowski" } ] }, { "name": "WizardLMTeam/WizardCoder-15B-V1.0", "provider": "WizardLM", "parameter_count": "15.5B", "parameters_raw": 15515334656, "min_ram_gb": 8.7, "recommended_ram_gb": 14.5, "min_vram_gb": 7.9, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Code generation and completion", "pipeline_tag": "text-generation", "architecture": "starcoder", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "nvidia/Qwen3-30B-A3B-NVFP4", "provider": "nvidia", "parameter_count": "15.6B", "parameters_raw": 15583623168, "min_ram_gb": 8.7, "recommended_ram_gb": 14.5, "min_vram_gb": 8.0, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 63897, "hf_likes": 24, "release_date": "2025-07-08", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 1704458782, "_discovered": true }, { "name": "NVFP4/Qwen3-Coder-30B-A3B-Instruct-FP4", "provider": "nvfp4", "parameter_count": "15.6B", "parameters_raw": 15583623168, "min_ram_gb": 8.7, "recommended_ram_gb": 14.5, "min_vram_gb": 8.0, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 25920, "hf_likes": 11, "release_date": "2025-08-05", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 1704458782, "_discovered": true }, { "name": "bigcode/starcoder2-15b", "provider": "BigCode", "parameter_count": "15.7B", "parameters_raw": 15700000000, "min_ram_gb": 8.8, "recommended_ram_gb": 14.6, "min_vram_gb": 8.0, "quantization": "Q4_K_M", "context_length": 16384, "use_case": "Code generation and completion", "pipeline_tag": "text-generation", "architecture": "starcoder2", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct", "provider": "DeepSeek", "parameter_count": "16B", "parameters_raw": 15700000000, "min_ram_gb": 8.8, "recommended_ram_gb": 14.6, "min_vram_gb": 8.0, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Code generation and completion", "pipeline_tag": "text-generation", "architecture": "deepseek_v2", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 2400000000, "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "bartowski/DeepSeek-Coder-V2-Lite-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "deepseek-ai/DeepSeek-V2-Lite-Chat", "provider": "DeepSeek", "parameter_count": "15.7B", "parameters_raw": 15706484224, "min_ram_gb": 8.8, "recommended_ram_gb": 14.6, "min_vram_gb": 8.0, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v2", "hf_downloads": 330400, "hf_likes": 134, "release_date": "2024-05-15", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 2184182961, "_discovered": true }, { "name": "deepseek-ai/DeepSeek-V2-Lite", "provider": "DeepSeek", "parameter_count": "15.7B", "parameters_raw": 15706484224, "min_ram_gb": 8.8, "recommended_ram_gb": 14.6, "min_vram_gb": 8.0, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v2", "hf_downloads": 194737, "hf_likes": 167, "release_date": "2024-05-15", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 2184182961, "_discovered": true }, { "name": "RedHatAI/DeepSeek-Coder-V2-Lite-Instruct-FP8", "provider": "redhatai", "parameter_count": "15.7B", "parameters_raw": 15706484224, "min_ram_gb": 8.8, "recommended_ram_gb": 14.6, "min_vram_gb": 8.0, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v2", "hf_downloads": 53780, "hf_likes": 9, "release_date": "2024-07-17", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 2184182961, "_discovered": true }, { "name": "moonshotai/Moonlight-16B-A3B", "provider": "moonshotai", "parameter_count": "16.0B", "parameters_raw": 15960111936, "min_ram_gb": 8.9, "recommended_ram_gb": 14.9, "min_vram_gb": 8.2, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 45835, "hf_likes": 108, "release_date": "2025-02-22", "is_moe": true, "num_experts": 256, "active_experts": 6, "active_parameters": 1153367458, "_discovered": true }, { "name": "moonshotai/Moonlight-16B-A3B-Instruct", "provider": "moonshotai", "parameter_count": "16.0B", "parameters_raw": 15960111936, "min_ram_gb": 8.9, "recommended_ram_gb": 14.9, "min_vram_gb": 8.2, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 38514, "hf_likes": 192, "release_date": "2025-02-22", "is_moe": true, "num_experts": 256, "active_experts": 6, "active_parameters": 1153367458, "_discovered": true }, { "name": "inclusionAI/LLaDA2.1-mini", "provider": "inclusionai", "parameter_count": "16.3B", "parameters_raw": 16255643392, "min_ram_gb": 9.1, "recommended_ram_gb": 15.1, "min_vram_gb": 8.3, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llada2_moe", "hf_downloads": 21824, "hf_likes": 94, "release_date": "2026-02-09", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 1295371577, "_discovered": true }, { "name": "deepseek-ai/deepseek-moe-16b-base", "provider": "DeepSeek", "parameter_count": "16.4B", "parameters_raw": 16375728128, "min_ram_gb": 9.2, "recommended_ram_gb": 15.3, "min_vram_gb": 8.4, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek", "hf_downloads": 22326, "hf_likes": 139, "release_date": "2024-01-08", "_discovered": true }, { "name": "inclusionAI/Ling-lite", "provider": "inclusionai", "parameter_count": "16.8B", "parameters_raw": 16801974272, "min_ram_gb": 9.4, "recommended_ram_gb": 15.6, "min_vram_gb": 8.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "bailing_moe", "hf_downloads": 388, "hf_likes": 78, "release_date": "2025-02-28", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 2336524543 }, { "name": "nvidia/Qwen3-32B-NVFP4", "provider": "nvidia", "parameter_count": "17.2B", "parameters_raw": 17159312384, "min_ram_gb": 9.6, "recommended_ram_gb": 16.0, "min_vram_gb": 8.8, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 26285, "hf_likes": 11, "release_date": "2025-09-09", "_discovered": true }, { "name": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-NVFP4", "provider": "nvidia", "parameter_count": "18.2B", "parameters_raw": 18237772608, "min_ram_gb": 10.2, "recommended_ram_gb": 17.0, "min_vram_gb": 9.3, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron_h", "hf_downloads": 490404, "hf_likes": 105, "release_date": "2025-12-20", "_discovered": true }, { "name": "cyankiwi/GLM-4.5-Air-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "18.6B", "parameters_raw": 18626406504, "min_ram_gb": 10.4, "recommended_ram_gb": 17.3, "min_vram_gb": 9.5, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 260177, "hf_likes": 27, "release_date": "2025-07-29", "_discovered": true, "format": "awq" }, { "name": "QuantTrio/GLM-4.5-Air-GPTQ-Int4-Int8Mix", "provider": "quanttrio", "parameter_count": "19.8B", "parameters_raw": 19809102592, "min_ram_gb": 11.1, "recommended_ram_gb": 18.4, "min_vram_gb": 10.1, "quantization": "GPTQ-Int4", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 24759, "hf_likes": 10, "release_date": "2025-07-30", "_discovered": true, "format": "gptq" }, { "name": "internlm/internlm2-chat-20b", "provider": "internlm", "parameter_count": "19.9B", "parameters_raw": 19861149696, "min_ram_gb": 11.1, "recommended_ram_gb": 18.5, "min_vram_gb": 10.2, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "internlm2", "hf_downloads": 20010, "hf_likes": 88, "release_date": "2024-01-10", "_discovered": true }, { "name": "openai/gpt-oss-20b", "provider": "openai", "parameter_count": "21B", "parameters_raw": 21000000000, "min_ram_gb": 16.0, "recommended_ram_gb": 24.0, "min_vram_gb": 16.0, "quantization": "BF16", "context_length": 131072, "use_case": "Chat, reasoning, tool use", "is_moe": true, "num_experts": 32, "active_experts": 4, "active_parameters": 3600000000, "release_date": "2025-08-08", "pipeline_tag": "text-generation", "architecture": "gpt_oss", "hf_downloads": 7259974, "hf_likes": 4470, "gguf_sources": [ { "repo": "unsloth/gpt-oss-20b-GGUF", "provider": "unsloth" }, { "repo": "ggml-org/gpt-oss-20b-GGUF", "provider": "ggml-org" }, { "repo": "lmstudio-community/gpt-oss-20b-GGUF", "provider": "lmstudio-community" } ], "capabilities": [ "tool_use" ] }, { "name": "RedHatAI/gpt-oss-20b", "provider": "redhatai", "parameter_count": "21.5B", "parameters_raw": 21511953984, "min_ram_gb": 12.0, "recommended_ram_gb": 20.0, "min_vram_gb": 11.0, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_oss", "hf_downloads": 20506, "hf_likes": 5, "release_date": "2025-09-04", "is_moe": true, "num_experts": 32, "active_experts": 4, "active_parameters": 3630142231, "_discovered": true, "gguf_sources": [ { "repo": "unsloth/gpt-oss-20b-GGUF", "provider": "unsloth" } ] }, { "name": "lmstudio-community/ERNIE-4.5-21B-A3B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "21.8B", "parameters_raw": 21825436160, "min_ram_gb": 12.2, "recommended_ram_gb": 20.3, "min_vram_gb": 11.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "ernie4_5_moe", "hf_downloads": 24749, "hf_likes": 1, "release_date": "2025-07-09", "_discovered": true }, { "name": "lmstudio-community/ERNIE-4.5-21B-A3B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "21.8B", "parameters_raw": 21825436160, "min_ram_gb": 12.2, "recommended_ram_gb": 20.3, "min_vram_gb": 11.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "ernie4_5_moe", "hf_downloads": 24612, "hf_likes": 1, "release_date": "2025-07-10", "_discovered": true }, { "name": "lmstudio-community/ERNIE-4.5-21B-A3B-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "21.8B", "parameters_raw": 21825436160, "min_ram_gb": 12.2, "recommended_ram_gb": 20.3, "min_vram_gb": 11.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "ernie4_5_moe", "hf_downloads": 24573, "hf_likes": 1, "release_date": "2025-07-10", "_discovered": true }, { "name": "solidrust/Codestral-22B-v0.1-hf-AWQ", "provider": "solidrust", "parameter_count": "22.2B", "parameters_raw": 22247282688, "min_ram_gb": 12.4, "recommended_ram_gb": 20.7, "min_vram_gb": 11.4, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 84893, "hf_likes": 2, "release_date": "2024-05-30", "_discovered": true, "format": "awq" }, { "name": "stelterlab/Mistral-Small-24B-Instruct-2501-AWQ", "provider": "stelterlab", "parameter_count": "23.6B", "parameters_raw": 23572403200, "min_ram_gb": 13.2, "recommended_ram_gb": 22.0, "min_vram_gb": 12.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 266172, "hf_likes": 26, "release_date": "2025-01-30", "_discovered": true, "format": "awq" }, { "name": "lmstudio-community/Devstral-Small-2507-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "23.6B", "parameters_raw": 23572403200, "min_ram_gb": 13.2, "recommended_ram_gb": 22.0, "min_vram_gb": 12.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 19891, "hf_likes": 2, "release_date": "2025-07-09", "_discovered": true }, { "name": "lmstudio-community/LFM2-24B-A2B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "23.8B", "parameters_raw": 23843659008, "min_ram_gb": 13.3, "recommended_ram_gb": 22.2, "min_vram_gb": 12.2, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 207367, "hf_likes": 1, "release_date": "2026-02-23", "is_moe": true, "num_experts": 64, "active_experts": 4, "active_parameters": 2607900202, "_discovered": true }, { "name": "lmstudio-community/LFM2-24B-A2B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "23.8B", "parameters_raw": 23843659008, "min_ram_gb": 13.3, "recommended_ram_gb": 22.2, "min_vram_gb": 12.2, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 205544, "hf_likes": 2, "release_date": "2026-02-23", "is_moe": true, "num_experts": 64, "active_experts": 4, "active_parameters": 2607900202, "_discovered": true }, { "name": "lmstudio-community/LFM2-24B-A2B-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "23.8B", "parameters_raw": 23843659008, "min_ram_gb": 13.3, "recommended_ram_gb": 22.2, "min_vram_gb": 12.2, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 204884, "hf_likes": 1, "release_date": "2026-02-23", "is_moe": true, "num_experts": 64, "active_experts": 4, "active_parameters": 2607900202, "_discovered": true }, { "name": "lmstudio-community/LFM2-24B-A2B-MLX-5bit", "provider": "lmstudio-community", "parameter_count": "23.8B", "parameters_raw": 23843659008, "min_ram_gb": 13.3, "recommended_ram_gb": 22.2, "min_vram_gb": 12.2, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 204308, "hf_likes": 1, "release_date": "2026-02-23", "is_moe": true, "num_experts": 64, "active_experts": 4, "active_parameters": 2607900202, "_discovered": true }, { "name": "LiquidAI/LFM2-24B-A2B", "provider": "Liquid AI", "parameter_count": "23.8B", "parameters_raw": 23843661440, "min_ram_gb": 13.3, "recommended_ram_gb": 22.2, "min_vram_gb": 12.2, "quantization": "Q4_K_M", "context_length": 128000, "use_case": "Agentic tasks, RAG, summarization", "pipeline_tag": "text-generation", "architecture": "lfm2", "is_moe": true, "num_experts": 32, "active_experts": 4, "active_parameters": 2300000000, "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-11-28" }, { "name": "mistralai/Mistral-Small-24B-Instruct-2501", "provider": "Mistral AI", "parameter_count": "24B", "parameters_raw": 24000000000, "min_ram_gb": 13.4, "recommended_ram_gb": 22.4, "min_vram_gb": 12.3, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "unsloth/Mistral-Small-24B-Instruct-2501-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Mistral-Small-24B-Instruct-2501-GGUF", "provider": "bartowski" } ] }, { "name": "google/gemma-2-27b-it", "provider": "Google", "parameter_count": "27.2B", "parameters_raw": 27227128320, "min_ram_gb": 15.2, "recommended_ram_gb": 25.4, "min_vram_gb": 13.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma2", "hf_downloads": 409260, "hf_likes": 560, "release_date": "2024-06-24", "gguf_sources": [ { "repo": "bartowski/gemma-2-27b-it-GGUF", "provider": "bartowski" } ] }, { "name": "google/gemma-3-27b-it", "provider": "Google", "parameter_count": "27.4B", "parameters_raw": 27432406640, "min_ram_gb": 15.3, "recommended_ram_gb": 25.5, "min_vram_gb": 14.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose", "capabilities": [ "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "gemma3", "hf_downloads": 1520563, "hf_likes": 1905, "release_date": "2025-03-01", "gguf_sources": [ { "repo": "unsloth/gemma-3-27b-it-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3.5-27B", "provider": "Alibaba", "parameter_count": "27.8B", "parameters_raw": 27781427952, "min_ram_gb": 15.5, "recommended_ram_gb": 25.9, "min_vram_gb": 14.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 406808, "hf_likes": 565, "release_date": "2026-02-24", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-27B-GGUF", "provider": "unsloth" } ] }, { "name": "lmstudio-community/GLM-4.7-Flash-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "29.9B", "parameters_raw": 29943393920, "min_ram_gb": 16.7, "recommended_ram_gb": 27.9, "min_vram_gb": 15.3, "quantization": "Q4_K_M", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe_lite", "hf_downloads": 1001623, "hf_likes": 9, "release_date": "2026-01-19", "_discovered": true }, { "name": "lmstudio-community/GLM-4.7-Flash-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "29.9B", "parameters_raw": 29943393920, "min_ram_gb": 16.7, "recommended_ram_gb": 27.9, "min_vram_gb": 15.3, "quantization": "Q4_K_M", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe_lite", "hf_downloads": 991211, "hf_likes": 8, "release_date": "2026-01-19", "_discovered": true }, { "name": "Qwen/Qwen3-30B-A3B-GPTQ-Int4", "provider": "Alibaba", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "GPTQ-Int4", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 226311, "hf_likes": 47, "release_date": "2025-05-05", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true, "format": "gptq" }, { "name": "lmstudio-community/Qwen3-Coder-30B-A3B-Instruct-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 191895, "hf_likes": 14, "release_date": "2025-07-31", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "lmstudio-community/Qwen3-Coder-30B-A3B-Instruct-MLX-5bit", "provider": "lmstudio-community", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 185814, "hf_likes": 4, "release_date": "2025-08-01", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "lmstudio-community/Qwen3-Coder-30B-A3B-Instruct-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 181127, "hf_likes": 12, "release_date": "2025-07-31", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "lmstudio-community/Qwen3-Coder-30B-A3B-Instruct-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 179804, "hf_likes": 4, "release_date": "2025-07-31", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "Qwen/Qwen3-30B-A3B-Base", "provider": "Alibaba", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 83458, "hf_likes": 69, "release_date": "2025-04-28", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "typhoon-ai/typhoon2.5-qwen3-30b-a3b", "provider": "typhoon-ai", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 53587, "hf_likes": 1, "release_date": "2025-09-23", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true, "gguf_sources": [ { "repo": "typhoon-ai/typhoon2.5-qwen3-30b-a3b-gguf", "file": "typhoon2.5-qwen3-30b-a3b-q4_k_m.gguf", "quant": "Q4_K_M" } ] }, { "name": "QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ", "provider": "quanttrio", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 46035, "hf_likes": 6, "release_date": "2025-08-01", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true, "format": "awq" }, { "name": "lmstudio-community/Qwen3-30B-A3B-Instruct-2507-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 45854, "hf_likes": 6, "release_date": "2025-07-29", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "lmstudio-community/Qwen3-30B-A3B-Instruct-2507-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 44199, "hf_likes": 4, "release_date": "2025-07-29", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "lmstudio-community/Qwen3-30B-A3B-Instruct-2507-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 43483, "hf_likes": 0, "release_date": "2025-07-29", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", "provider": "alibaba-nlp", "parameter_count": "30.5B", "parameters_raw": 30532122624, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 26559, "hf_likes": 802, "release_date": "2025-09-16", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339450907, "_discovered": true }, { "name": "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", "provider": "Alibaba", "parameter_count": "30.5B", "parameters_raw": 30533947392, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 957458, "hf_likes": 115, "release_date": "2025-07-28", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339650489, "_discovered": true }, { "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8", "provider": "Alibaba", "parameter_count": "30.5B", "parameters_raw": 30533947392, "min_ram_gb": 17.1, "recommended_ram_gb": 28.4, "min_vram_gb": 15.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 265519, "hf_likes": 164, "release_date": "2025-07-31", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3339650489, "_discovered": true }, { "name": "QuantTrio/Qwen3-VL-30B-A3B-Instruct-AWQ", "provider": "quanttrio", "parameter_count": "31.1B", "parameters_raw": 31070754032, "min_ram_gb": 17.4, "recommended_ram_gb": 28.9, "min_vram_gb": 15.9, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_vl_moe", "hf_downloads": 301353, "hf_likes": 40, "release_date": "2025-10-04", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 2475950709, "_discovered": true, "format": "awq" }, { "name": "QuantTrio/GLM-4.7-Flash-AWQ", "provider": "quanttrio", "parameter_count": "31.2B", "parameters_raw": 31221488576, "min_ram_gb": 17.4, "recommended_ram_gb": 29.1, "min_vram_gb": 16.0, "quantization": "AWQ-4bit", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe_lite", "hf_downloads": 103703, "hf_likes": 7, "release_date": "2026-01-21", "_discovered": true, "format": "awq" }, { "name": "lmstudio-community/NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "31.6B", "parameters_raw": 31577935872, "min_ram_gb": 17.6, "recommended_ram_gb": 29.4, "min_vram_gb": 16.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 195432, "hf_likes": 2, "release_date": "2025-12-16", "_discovered": true }, { "name": "lmstudio-community/NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "31.6B", "parameters_raw": 31577935872, "min_ram_gb": 17.6, "recommended_ram_gb": 29.4, "min_vram_gb": 16.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 190541, "hf_likes": 3, "release_date": "2025-12-16", "_discovered": true }, { "name": "lmstudio-community/NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "31.6B", "parameters_raw": 31577935872, "min_ram_gb": 17.6, "recommended_ram_gb": 29.4, "min_vram_gb": 16.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 188175, "hf_likes": 0, "release_date": "2025-12-16", "_discovered": true }, { "name": "lmstudio-community/NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-5bit", "provider": "lmstudio-community", "parameter_count": "31.6B", "parameters_raw": 31577935872, "min_ram_gb": 17.6, "recommended_ram_gb": 29.4, "min_vram_gb": 16.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 188130, "hf_likes": 0, "release_date": "2025-12-16", "_discovered": true }, { "name": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16", "provider": "nvidia", "parameter_count": "31.6B", "parameters_raw": 31577937344, "min_ram_gb": 17.6, "recommended_ram_gb": 29.4, "min_vram_gb": 16.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron_h", "hf_downloads": 1025721, "hf_likes": 648, "release_date": "2025-12-04" }, { "name": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-Base-BF16", "provider": "nvidia", "parameter_count": "31.6B", "parameters_raw": 31577937344, "min_ram_gb": 17.6, "recommended_ram_gb": 29.4, "min_vram_gb": 16.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 65364, "hf_likes": 109, "release_date": "2025-12-03", "_discovered": true }, { "name": "OpenResearcher/OpenResearcher-30B-A3B", "provider": "openresearcher", "parameter_count": "31.6B", "parameters_raw": 31577937344, "min_ram_gb": 17.6, "recommended_ram_gb": 29.4, "min_vram_gb": 16.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron_h", "hf_downloads": 23630, "hf_likes": 59, "release_date": "2026-02-03", "_discovered": true }, { "name": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-FP8", "provider": "nvidia", "parameter_count": "31.6B", "parameters_raw": 31577946256, "min_ram_gb": 17.6, "recommended_ram_gb": 29.4, "min_vram_gb": 16.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron_h", "hf_downloads": 1412797, "hf_likes": 289, "release_date": "2025-12-06", "_discovered": true }, { "name": "LGAI-EXAONE/EXAONE-4.0-32B", "provider": "LG AI", "parameter_count": "32B", "parameters_raw": 32000000000, "min_ram_gb": 17.9, "recommended_ram_gb": 29.8, "min_vram_gb": 16.4, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Hybrid reasoning, multilingual", "pipeline_tag": "text-generation", "architecture": "exaone", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-07-15" }, { "name": "LGAI-EXAONE/EXAONE-4.0.1-32B", "provider": "lgai-exaone", "parameter_count": "32.0B", "parameters_raw": 32003216384, "min_ram_gb": 17.9, "recommended_ram_gb": 29.8, "min_vram_gb": 16.4, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "exaone4", "hf_downloads": 186516, "hf_likes": 24, "release_date": "2025-07-29", "_discovered": true }, { "name": "LGAI-EXAONE/EXAONE-4.0-32B-FP8", "provider": "lgai-exaone", "parameter_count": "32.0B", "parameters_raw": 32005105664, "min_ram_gb": 17.9, "recommended_ram_gb": 29.8, "min_vram_gb": 16.4, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "exaone4", "hf_downloads": 20430, "hf_likes": 17, "release_date": "2025-07-11", "_discovered": true }, { "name": "allenai/OLMo-2-0325-32B-Instruct", "provider": "allenai", "parameter_count": "32.2B", "parameters_raw": 32234279936, "min_ram_gb": 18.0, "recommended_ram_gb": 30.0, "min_vram_gb": 16.5, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo2", "hf_downloads": 2979, "hf_likes": 148, "release_date": "2025-03-12", "gguf_sources": [ { "repo": "unsloth/OLMo-2-0325-32B-Instruct-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen2.5-32B-Instruct", "provider": "Alibaba", "parameter_count": "32.5B", "parameters_raw": 32510000000, "min_ram_gb": 18.2, "recommended_ram_gb": 30.3, "min_vram_gb": 16.7, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-32B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen1.5-32B-Chat", "provider": "Alibaba", "parameter_count": "32.5B", "parameters_raw": 32512218112, "min_ram_gb": 18.2, "recommended_ram_gb": 30.3, "min_vram_gb": 16.7, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 25041, "hf_likes": 109, "release_date": "2024-04-03", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen1.5-32B-Chat-GGUF", "provider": "bartowski" } ] }, { "name": "nn-tech/MetalGPT-1", "provider": "nn-tech", "parameter_count": "32.8B", "parameters_raw": 32759593984, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 20663, "hf_likes": 38, "release_date": "2025-12-04", "_discovered": true }, { "name": "Qwen/Qwen3-32B-AWQ", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32762123264, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "AWQ-4bit", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 552811, "hf_likes": 129, "release_date": "2025-05-01", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2.5-Coder-32B-Instruct", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 858975, "hf_likes": 2000, "release_date": "2024-11-06", "gguf_sources": [ { "repo": "unsloth/Qwen2.5-Coder-32B-Instruct-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Qwen2.5-Coder-32B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "provider": "DeepSeek", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 873156, "hf_likes": 1525, "release_date": "2025-01-20", "gguf_sources": [ { "repo": "unsloth/DeepSeek-R1-Distill-Qwen-32B-GGUF", "provider": "unsloth" }, { "repo": "bartowski/DeepSeek-R1-Distill-Qwen-32B-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-32B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1643600, "hf_likes": 94, "release_date": "2024-09-17", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2.5-32B", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1453252, "hf_likes": 173, "release_date": "2024-09-15", "_discovered": true }, { "name": "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 973260, "hf_likes": 33, "release_date": "2024-11-09", "_discovered": true, "format": "awq" }, { "name": "Qwen/QwQ-32B-AWQ", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "AWQ-4bit", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 280279, "hf_likes": 133, "release_date": "2025-03-05", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2.5-32B-Instruct-GPTQ-Int4", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "GPTQ-Int4", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 191251, "hf_likes": 40, "release_date": "2024-09-17", "_discovered": true, "format": "gptq" }, { "name": "baichuan-inc/Baichuan-M2-32B", "provider": "baichuan-inc", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 152016, "hf_likes": 118, "release_date": "2025-08-10", "_discovered": true }, { "name": "Qwen/Qwen2.5-32B-Instruct-GPTQ-Int8", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "GPTQ-Int8", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 105034, "hf_likes": 14, "release_date": "2024-09-17", "_discovered": true, "format": "gptq" }, { "name": "Qwen/Qwen2.5-Coder-32B", "provider": "Alibaba", "parameter_count": "32.8B", "parameters_raw": 32763876352, "min_ram_gb": 18.3, "recommended_ram_gb": 30.5, "min_vram_gb": 16.8, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 43109, "hf_likes": 142, "release_date": "2024-11-08", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2.5-Coder-32B-GGUF", "provider": "bartowski" } ] }, { "name": "meta-llama/CodeLlama-34b-Instruct-hf", "provider": "Meta", "parameter_count": "33.7B", "parameters_raw": 33743970304, "min_ram_gb": 18.9, "recommended_ram_gb": 31.4, "min_vram_gb": 17.3, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 950, "hf_likes": 19, "release_date": "2024-03-14" }, { "name": "01-ai/Yi-34B-Chat", "provider": "01.ai", "parameter_count": "34.4B", "parameters_raw": 34386780160, "min_ram_gb": 19.2, "recommended_ram_gb": 32.0, "min_vram_gb": 17.6, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Multilingual, Chinese/English chat", "pipeline_tag": "text-generation", "architecture": "yi", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "dphn/dolphin-2.9.1-yi-1.5-34b", "provider": "dphn", "parameter_count": "34.4B", "parameters_raw": 34388917248, "min_ram_gb": 19.2, "recommended_ram_gb": 32.0, "min_vram_gb": 17.6, "quantization": "Q4_K_M", "context_length": 8192, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 4650971, "hf_likes": 56, "release_date": "2024-05-18", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/dolphin-2.9.1-yi-1.5-34b-GGUF", "provider": "bartowski" } ] }, { "name": "CohereForAI/c4ai-command-r-v01", "provider": "Cohere", "parameter_count": "35B", "parameters_raw": 35000000000, "min_ram_gb": 19.5, "recommended_ram_gb": 32.6, "min_vram_gb": 17.9, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "RAG, tool use, agents", "pipeline_tag": "text-generation", "architecture": "cohere", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "bartowski/c4ai-command-r-v01-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen3.5-35B-A3B", "provider": "Alibaba", "parameter_count": "36.0B", "parameters_raw": 35951822704, "min_ram_gb": 20.1, "recommended_ram_gb": 33.5, "min_vram_gb": 18.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 769032, "hf_likes": 905, "release_date": "2026-02-24", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 3000000000, "gguf_sources": [ { "repo": "unsloth/Qwen3.5-35B-A3B-GGUF", "provider": "unsloth" } ] }, { "name": "lmstudio-community/Seed-OSS-36B-Instruct-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "36.2B", "parameters_raw": 36151104512, "min_ram_gb": 20.2, "recommended_ram_gb": 33.7, "min_vram_gb": 18.5, "quantization": "Q4_K_M", "context_length": 524288, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "seed_oss", "hf_downloads": 46944, "hf_likes": 2, "release_date": "2025-08-26", "_discovered": true }, { "name": "lmstudio-community/Seed-OSS-36B-Instruct-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "36.2B", "parameters_raw": 36151104512, "min_ram_gb": 20.2, "recommended_ram_gb": 33.7, "min_vram_gb": 18.5, "quantization": "Q4_K_M", "context_length": 524288, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "seed_oss", "hf_downloads": 45348, "hf_likes": 0, "release_date": "2025-08-26", "_discovered": true }, { "name": "lmstudio-community/Seed-OSS-36B-Instruct-MLX-5bit", "provider": "lmstudio-community", "parameter_count": "36.2B", "parameters_raw": 36151104512, "min_ram_gb": 20.2, "recommended_ram_gb": 33.7, "min_vram_gb": 18.5, "quantization": "Q4_K_M", "context_length": 524288, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "seed_oss", "hf_downloads": 45061, "hf_likes": 1, "release_date": "2025-08-26", "_discovered": true }, { "name": "lmstudio-community/Seed-OSS-36B-Instruct-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "36.2B", "parameters_raw": 36151104512, "min_ram_gb": 20.2, "recommended_ram_gb": 33.7, "min_vram_gb": 18.5, "quantization": "Q4_K_M", "context_length": 524288, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "seed_oss", "hf_downloads": 44971, "hf_likes": 0, "release_date": "2025-08-26", "_discovered": true }, { "name": "cyankiwi/MiniMax-M2.1-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "36.8B", "parameters_raw": 36811839984, "min_ram_gb": 20.6, "recommended_ram_gb": 34.3, "min_vram_gb": 18.9, "quantization": "AWQ-4bit", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 36114, "hf_likes": 16, "release_date": "2025-12-27", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 2933443495, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/MiniMax-M2.5-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "36.8B", "parameters_raw": 36811839984, "min_ram_gb": 20.6, "recommended_ram_gb": 34.3, "min_vram_gb": 18.9, "quantization": "AWQ-4bit", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 24338, "hf_likes": 6, "release_date": "2026-02-15", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 2933443495, "_discovered": true, "format": "awq" }, { "name": "mratsim/MiniMax-M2.5-BF16-INT4-AWQ", "provider": "mratsim", "parameter_count": "39.1B", "parameters_raw": 39115692032, "min_ram_gb": 21.9, "recommended_ram_gb": 36.4, "min_vram_gb": 20.0, "quantization": "AWQ-4bit", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 46268, "hf_likes": 29, "release_date": "2026-02-14", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 3117031705, "_discovered": true, "format": "awq" }, { "name": "tiiuae/falcon-40b-instruct", "provider": "TII", "parameter_count": "40.0B", "parameters_raw": 40000000000, "min_ram_gb": 22.4, "recommended_ram_gb": 37.3, "min_vram_gb": 20.5, "quantization": "Q4_K_M", "context_length": 2048, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "falcon", "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "mistralai/Mixtral-8x7B-Instruct-v0.1", "provider": "Mistral AI", "parameter_count": "46.7B", "parameters_raw": 46702792704, "min_ram_gb": 26.1, "recommended_ram_gb": 43.5, "min_vram_gb": 23.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "unknown", "architecture": "mixtral", "hf_downloads": 787218, "hf_likes": 4641, "release_date": "2023-12-10", "is_moe": true, "num_experts": 8, "active_experts": 2, "active_parameters": 12900000000 }, { "name": "Salesforce/xLAM-8x7b-r", "provider": "salesforce", "parameter_count": "46.7B", "parameters_raw": 46702792704, "min_ram_gb": 26.1, "recommended_ram_gb": 43.5, "min_vram_gb": 23.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mixtral", "hf_downloads": 25430, "hf_likes": 15, "release_date": "2024-08-28", "is_moe": true, "num_experts": 8, "active_experts": 2, "active_parameters": 13427052901, "_discovered": true, "gguf_sources": [ { "repo": "bartowski/xLAM-8x7b-r-GGUF", "provider": "bartowski" } ] }, { "name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO", "provider": "NousResearch", "parameter_count": "46.7B", "parameters_raw": 46702809088, "min_ram_gb": 26.1, "recommended_ram_gb": 43.5, "min_vram_gb": 23.9, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "mixtral", "hf_downloads": 9050, "hf_likes": 453, "release_date": "2024-01-11", "is_moe": true, "num_experts": 8, "active_experts": 2, "active_parameters": 12900000000 }, { "name": "moonshotai/Kimi-Linear-48B-A3B-Instruct", "provider": "moonshotai", "parameter_count": "49.1B", "parameters_raw": 49122681728, "min_ram_gb": 27.4, "recommended_ram_gb": 45.7, "min_vram_gb": 25.2, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "kimi_linear", "hf_downloads": 35486, "hf_likes": 546, "release_date": "2025-10-30", "_discovered": true }, { "name": "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5", "provider": "nvidia", "parameter_count": "49.9B", "parameters_raw": 49867145216, "min_ram_gb": 27.9, "recommended_ram_gb": 46.4, "min_vram_gb": 25.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron-nas", "hf_downloads": 105079, "hf_likes": 226, "release_date": "2025-07-25", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/Llama-3_3-Nemotron-Super-49B-v1_5-GGUF", "provider": "unsloth" } ] }, { "name": "nvidia/Llama-3_3-Nemotron-Super-49B-v1", "provider": "nvidia", "parameter_count": "49.9B", "parameters_raw": 49867145216, "min_ram_gb": 27.9, "recommended_ram_gb": 46.4, "min_vram_gb": 25.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron-nas", "hf_downloads": 23805, "hf_likes": 320, "release_date": "2025-03-16", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/Llama-3_3-Nemotron-Super-49B-v1-GGUF", "provider": "unsloth" } ] }, { "name": "txn545/Qwen3.5-122B-A10B-NVFP4", "provider": "txn545", "parameter_count": "64.4B", "parameters_raw": 64354266864, "min_ram_gb": 36.0, "recommended_ram_gb": 59.9, "min_vram_gb": 33.0, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_5_moe", "hf_downloads": 37707, "hf_likes": 6, "release_date": "2026-02-24", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 5128230639, "_discovered": true }, { "name": "meta-llama/Llama-3.1-70B-Instruct", "provider": "Meta", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 801189, "hf_likes": 894, "release_date": "2024-07-16" }, { "name": "meta-llama/Llama-3.3-70B-Instruct", "provider": "Meta", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 0, "hf_likes": 0, "release_date": null, "gguf_sources": [ { "repo": "unsloth/Llama-3.3-70B-Instruct-GGUF", "provider": "unsloth" }, { "repo": "bartowski/Llama-3.3-70B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "casperhansen/llama-3.3-70b-instruct-awq", "provider": "casperhansen", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 674865, "hf_likes": 39, "release_date": "2024-12-06", "_discovered": true, "format": "awq" }, { "name": "kosbu/Llama-3.3-70B-Instruct-AWQ", "provider": "kosbu", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 505688, "hf_likes": 10, "release_date": "2024-12-06", "_discovered": true, "format": "awq" }, { "name": "ibnzterrell/Meta-Llama-3.3-70B-Instruct-AWQ-INT4", "provider": "ibnzterrell", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 138353, "hf_likes": 30, "release_date": "2024-12-07", "_discovered": true, "format": "awq" }, { "name": "RedHatAI/Meta-Llama-3.1-70B-Instruct-quantized.w4a16", "provider": "redhatai", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 116205, "hf_likes": 32, "release_date": "2024-07-31", "_discovered": true }, { "name": "meta-llama/Llama-3.1-70B", "provider": "Meta", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 75498, "hf_likes": 408, "release_date": "2024-07-14", "_discovered": true }, { "name": "meta-llama/Meta-Llama-3-70B-Instruct", "provider": "Meta", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 61023, "hf_likes": 1506, "release_date": "2024-04-17", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Meta-Llama-3-70B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "tokyotech-llm/Llama-3.1-Swallow-70B-Instruct-v0.3", "provider": "tokyotech-llm", "parameter_count": "70.6B", "parameters_raw": 70553706496, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 35321, "hf_likes": 14, "release_date": "2024-12-25", "_discovered": true }, { "name": "RedHatAI/Meta-Llama-3.1-70B-Instruct-FP8", "provider": "redhatai", "parameter_count": "70.6B", "parameters_raw": 70553707616, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 39962, "hf_likes": 50, "release_date": "2024-07-23", "_discovered": true }, { "name": "RedHatAI/Llama-3.3-70B-Instruct-FP8-dynamic", "provider": "redhatai", "parameter_count": "70.6B", "parameters_raw": 70560423936, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 42062, "hf_likes": 14, "release_date": "2024-12-11", "_discovered": true }, { "name": "RedHatAI/DeepSeek-R1-Distill-Llama-70B-FP8-dynamic", "provider": "redhatai", "parameter_count": "70.6B", "parameters_raw": 70560423936, "min_ram_gb": 39.4, "recommended_ram_gb": 65.7, "min_vram_gb": 36.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 26238, "hf_likes": 10, "release_date": "2025-02-01", "_discovered": true }, { "name": "LLM360/K2-Think-V2", "provider": "llm360", "parameter_count": "72.6B", "parameters_raw": 72550195200, "min_ram_gb": 40.5, "recommended_ram_gb": 67.6, "min_vram_gb": 37.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 53839, "hf_likes": 23, "release_date": "2026-01-08", "_discovered": true }, { "name": "Qwen/Qwen2.5-72B-Instruct", "provider": "Alibaba", "parameter_count": "72.7B", "parameters_raw": 72706203648, "min_ram_gb": 40.6, "recommended_ram_gb": 67.7, "min_vram_gb": 37.2, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 558153, "hf_likes": 916, "release_date": "2024-09-16", "gguf_sources": [ { "repo": "bartowski/Qwen2.5-72B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2.5-72B", "provider": "Alibaba", "parameter_count": "72.7B", "parameters_raw": 72706203648, "min_ram_gb": 40.6, "recommended_ram_gb": 67.7, "min_vram_gb": 37.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 45193, "hf_likes": 89, "release_date": "2024-09-15", "_discovered": true }, { "name": "Qwen/Qwen2-72B-Instruct", "provider": "Alibaba", "parameter_count": "72.7B", "parameters_raw": 72706203648, "min_ram_gb": 40.6, "recommended_ram_gb": 67.7, "min_vram_gb": 37.2, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 40930, "hf_likes": 719, "release_date": "2024-05-28", "_discovered": true, "gguf_sources": [ { "repo": "bartowski/Qwen2-72B-Instruct-GGUF", "provider": "bartowski" } ] }, { "name": "Qwen/Qwen2-72B", "provider": "Alibaba", "parameter_count": "72.7B", "parameters_raw": 72706203648, "min_ram_gb": 40.6, "recommended_ram_gb": 67.7, "min_vram_gb": 37.2, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 34455, "hf_likes": 200, "release_date": "2024-05-22", "_discovered": true }, { "name": "huihui-ai/Qwen2.5-72B-Instruct-abliterated", "provider": "huihui-ai", "parameter_count": "72.7B", "parameters_raw": 72706203648, "min_ram_gb": 40.6, "recommended_ram_gb": 67.7, "min_vram_gb": 37.2, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 20754, "hf_likes": 35, "release_date": "2024-10-26", "_discovered": true }, { "name": "Qwen/Qwen2.5-72B-Instruct-AWQ", "provider": "Alibaba", "parameter_count": "73.0B", "parameters_raw": 72957861888, "min_ram_gb": 40.8, "recommended_ram_gb": 67.9, "min_vram_gb": 37.4, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 922364, "hf_likes": 75, "release_date": "2024-09-17", "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen2.5-72B-Instruct-GPTQ-Int8", "provider": "Alibaba", "parameter_count": "73.0B", "parameters_raw": 72957861888, "min_ram_gb": 40.8, "recommended_ram_gb": 67.9, "min_vram_gb": 37.4, "quantization": "GPTQ-Int8", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 42593, "hf_likes": 28, "release_date": "2024-09-17", "_discovered": true, "format": "gptq" }, { "name": "NexVeridian/Qwen3-Coder-Next-8bit", "provider": "nexveridian", "parameter_count": "79.7B", "parameters_raw": 79674388992, "min_ram_gb": 44.5, "recommended_ram_gb": 74.2, "min_vram_gb": 40.8, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 300258, "hf_likes": 0, "release_date": "2026-02-03", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 5462052829, "_discovered": true }, { "name": "lmstudio-community/Qwen3-Next-80B-A3B-Instruct-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "79.7B", "parameters_raw": 79674388992, "min_ram_gb": 44.5, "recommended_ram_gb": 74.2, "min_vram_gb": 40.8, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 48644, "hf_likes": 7, "release_date": "2025-09-15", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 5462052829, "_discovered": true }, { "name": "lmstudio-community/Qwen3-Next-80B-A3B-Instruct-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "79.7B", "parameters_raw": 79674388992, "min_ram_gb": 44.5, "recommended_ram_gb": 74.2, "min_vram_gb": 40.8, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 48355, "hf_likes": 2, "release_date": "2025-09-15", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 5462052829, "_discovered": true }, { "name": "lmstudio-community/Qwen3-Next-80B-A3B-Instruct-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "79.7B", "parameters_raw": 79674388992, "min_ram_gb": 44.5, "recommended_ram_gb": 74.2, "min_vram_gb": 40.8, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 47109, "hf_likes": 0, "release_date": "2025-09-15", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 5462052829, "_discovered": true }, { "name": "lmstudio-community/Qwen3-Next-80B-A3B-Instruct-MLX-5bit", "provider": "lmstudio-community", "parameter_count": "79.7B", "parameters_raw": 79674388992, "min_ram_gb": 44.5, "recommended_ram_gb": 74.2, "min_vram_gb": 40.8, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 47029, "hf_likes": 0, "release_date": "2025-09-15", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 5462052829, "_discovered": true }, { "name": "Qwen/Qwen3-Coder-Next", "provider": "Alibaba", "parameter_count": "80B", "parameters_raw": 80000000000, "min_ram_gb": 44.8, "recommended_ram_gb": 74.6, "min_vram_gb": 41.0, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation, agentic coding", "pipeline_tag": "text-generation", "architecture": "qwen3_next", "is_moe": true, "num_experts": 64, "active_experts": 4, "active_parameters": 3000000000, "hf_downloads": 0, "hf_likes": 0, "release_date": "2026-01-30", "gguf_sources": [ { "repo": "unsloth/Qwen3-Coder-Next-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3-Coder-Next-FP8", "provider": "Alibaba", "parameter_count": "79.7B", "parameters_raw": 79679212800, "min_ram_gb": 44.5, "recommended_ram_gb": 74.2, "min_vram_gb": 40.8, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 398505, "hf_likes": 100, "release_date": "2026-02-01", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 5462383530, "_discovered": true }, { "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "provider": "Alibaba", "parameter_count": "81.3B", "parameters_raw": 81324862720, "min_ram_gb": 45.4, "recommended_ram_gb": 75.7, "min_vram_gb": 41.7, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 1224711, "hf_likes": 945, "release_date": "2025-09-09", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 5575200546, "_discovered": true, "gguf_sources": [ { "repo": "unsloth/Qwen3-Next-80B-A3B-Instruct-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3-Next-80B-A3B-Instruct-FP8", "provider": "Alibaba", "parameter_count": "81.3B", "parameters_raw": 81329784384, "min_ram_gb": 45.4, "recommended_ram_gb": 75.7, "min_vram_gb": 41.7, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 148887, "hf_likes": 82, "release_date": "2025-09-22", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": 5575537949, "_discovered": true }, { "name": "Qwen/Qwen1.5-110B-Chat-AWQ", "provider": "Alibaba", "parameter_count": "111.2B", "parameters_raw": 111209914368, "min_ram_gb": 62.1, "recommended_ram_gb": 103.6, "min_vram_gb": 57.0, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 320397, "hf_likes": 9, "release_date": "2024-04-27", "_discovered": true, "format": "awq" }, { "name": "lmstudio-community/gpt-oss-120b-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "116.8B", "parameters_raw": 116829154368, "min_ram_gb": 65.3, "recommended_ram_gb": 108.8, "min_vram_gb": 59.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_oss", "hf_downloads": 61730, "hf_likes": 12, "release_date": "2025-08-05", "is_moe": true, "num_experts": 128, "active_experts": 4, "active_parameters": 9309823238, "_discovered": true }, { "name": "axolotl-ai-co/gpt-oss-120b-dequantized", "provider": "axolotl-ai-co", "parameter_count": "116.8B", "parameters_raw": 116829156672, "min_ram_gb": 65.3, "recommended_ram_gb": 108.8, "min_vram_gb": 59.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gpt_oss", "hf_downloads": 34254, "hf_likes": 0, "release_date": "2025-08-07", "is_moe": true, "num_experts": 128, "active_experts": 4, "active_parameters": 9309823421, "_discovered": true }, { "name": "openai/gpt-oss-120b", "provider": "openai", "parameter_count": "117B", "parameters_raw": 117000000000, "min_ram_gb": 80.0, "recommended_ram_gb": 96.0, "min_vram_gb": 80.0, "quantization": "BF16", "context_length": 131072, "use_case": "Chat, reasoning, tool use", "is_moe": true, "num_experts": 128, "active_experts": 4, "active_parameters": 5100000000, "release_date": "2025-08-08", "pipeline_tag": "text-generation", "architecture": "gpt_oss", "hf_downloads": 4628743, "hf_likes": 4600, "gguf_sources": [ { "repo": "ggml-org/gpt-oss-120b-GGUF", "provider": "ggml-org" }, { "repo": "unsloth/gpt-oss-120b-GGUF", "provider": "unsloth" } ], "capabilities": [ "tool_use" ] }, { "name": "Qwen/Qwen3.5-122B-A10B", "provider": "Alibaba", "parameter_count": "125.1B", "parameters_raw": 125086497008, "min_ram_gb": 69.9, "recommended_ram_gb": 116.5, "min_vram_gb": 64.1, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 171055, "hf_likes": 389, "release_date": "2026-02-24", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 10000000000, "gguf_sources": [ { "repo": "unsloth/Qwen3.5-122B-A10B-GGUF", "provider": "unsloth" } ] }, { "name": "mistralai/Mixtral-8x22B-Instruct-v0.1", "provider": "Mistral AI", "parameter_count": "140.6B", "parameters_raw": 140630071296, "min_ram_gb": 78.6, "recommended_ram_gb": 131.0, "min_vram_gb": 72.0, "quantization": "Q4_K_M", "context_length": 65536, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "unknown", "architecture": "mixtral", "hf_downloads": 15022, "hf_likes": 746, "release_date": "2024-04-16", "is_moe": true, "num_experts": 8, "active_experts": 2, "active_parameters": 39100000000 }, { "name": "MaziyarPanahi/Mixtral-8x22B-Instruct-v0.1-AWQ", "provider": "maziyarpanahi", "parameter_count": "140.6B", "parameters_raw": 140630071296, "min_ram_gb": 78.6, "recommended_ram_gb": 131.0, "min_vram_gb": 72.0, "quantization": "AWQ-4bit", "context_length": 65536, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mixtral", "hf_downloads": 40221, "hf_likes": 13, "release_date": "2024-04-18", "is_moe": true, "num_experts": 8, "active_experts": 2, "active_parameters": 40431145496, "_discovered": true, "format": "awq" }, { "name": "rednote-hilab/dots.llm1.inst", "provider": "rednote-hilab", "parameter_count": "142.8B", "parameters_raw": 142774381696, "min_ram_gb": 79.8, "recommended_ram_gb": 133.0, "min_vram_gb": 73.1, "quantization": "Q4_K_M", "context_length": 32768, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "dots1", "hf_downloads": 5040, "hf_likes": 175, "release_date": "2025-05-14", "gguf_sources": [ { "repo": "unsloth/dots.llm1.inst-GGUF", "provider": "unsloth" } ] }, { "name": "bigscience/bloom", "provider": "bigscience", "parameter_count": "176.2B", "parameters_raw": 176247271424, "min_ram_gb": 98.5, "recommended_ram_gb": 164.1, "min_vram_gb": 90.3, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "bloom", "hf_downloads": 4896, "hf_likes": 4986, "release_date": "2022-05-19" }, { "name": "tiiuae/falcon-180B-chat", "provider": "TII", "parameter_count": "179.5B", "parameters_raw": 179522565120, "min_ram_gb": 100.3, "recommended_ram_gb": 167.2, "min_vram_gb": 92.0, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "falcon", "hf_downloads": 65, "hf_likes": 545, "release_date": "2023-09-04" }, { "name": "stepfun-ai/Step-3.5-Flash", "provider": "stepfun-ai", "parameter_count": "199.4B", "parameters_raw": 199384301376, "min_ram_gb": 111.4, "recommended_ram_gb": 185.7, "min_vram_gb": 102.1, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "step3p5", "hf_downloads": 327178, "hf_likes": 674, "release_date": "2026-02-01", "_discovered": true }, { "name": "lmstudio-community/MiniMax-M2.5-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "228.7B", "parameters_raw": 228689748992, "min_ram_gb": 127.8, "recommended_ram_gb": 213.0, "min_vram_gb": 117.1, "quantization": "Q4_K_M", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 112426, "hf_likes": 1, "release_date": "2026-02-13", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 18223714369, "_discovered": true }, { "name": "lmstudio-community/MiniMax-M2.5-MLX-4bit", "provider": "lmstudio-community", "parameter_count": "228.7B", "parameters_raw": 228689748992, "min_ram_gb": 127.8, "recommended_ram_gb": 213.0, "min_vram_gb": 117.1, "quantization": "Q4_K_M", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 105419, "hf_likes": 0, "release_date": "2026-02-13", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 18223714369, "_discovered": true }, { "name": "lmstudio-community/MiniMax-M2.5-MLX-6bit", "provider": "lmstudio-community", "parameter_count": "228.7B", "parameters_raw": 228689748992, "min_ram_gb": 127.8, "recommended_ram_gb": 213.0, "min_vram_gb": 117.1, "quantization": "Q4_K_M", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 103821, "hf_likes": 0, "release_date": "2026-02-13", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 18223714369, "_discovered": true }, { "name": "lmstudio-community/MiniMax-M2-MLX-8bit", "provider": "lmstudio-community", "parameter_count": "228.7B", "parameters_raw": 228689748992, "min_ram_gb": 127.8, "recommended_ram_gb": 213.0, "min_vram_gb": 117.1, "quantization": "Q4_K_M", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax", "hf_downloads": 19959, "hf_likes": 0, "release_date": "2025-10-29", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 18223714369, "_discovered": true }, { "name": "QuantTrio/MiniMax-M2-AWQ", "provider": "quanttrio", "parameter_count": "228.7B", "parameters_raw": 228689764864, "min_ram_gb": 127.8, "recommended_ram_gb": 213.0, "min_vram_gb": 117.1, "quantization": "AWQ-4bit", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mixtral", "hf_downloads": 586558, "hf_likes": 8, "release_date": "2025-10-28", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 18223715635, "_discovered": true, "format": "awq" }, { "name": "QuantTrio/MiniMax-M2.5-AWQ", "provider": "quanttrio", "parameter_count": "228.7B", "parameters_raw": 228689764864, "min_ram_gb": 127.8, "recommended_ram_gb": 213.0, "min_vram_gb": 117.1, "quantization": "AWQ-4bit", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 45340, "hf_likes": 10, "release_date": "2026-02-15", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 18223715635, "_discovered": true, "format": "awq" }, { "name": "MiniMaxAI/MiniMax-M2.5", "provider": "MiniMaxAI", "parameter_count": "228.7B", "parameters_raw": 228700000000, "min_ram_gb": 240.0, "recommended_ram_gb": 280.0, "min_vram_gb": 240.0, "quantization": "FP8", "context_length": 196608, "use_case": "Chat, reasoning, tool use", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 13600000000, "release_date": "2025-06-01", "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 526151, "hf_likes": 1252, "gguf_sources": [], "capabilities": [ "tool_use" ] }, { "name": "MiniMaxAI/MiniMax-M2", "provider": "minimaxai", "parameter_count": "228.7B", "parameters_raw": 228703644928, "min_ram_gb": 127.8, "recommended_ram_gb": 213.0, "min_vram_gb": 117.1, "quantization": "Q4_K_M", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 275243, "hf_likes": 1485, "release_date": "2025-10-22", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 18224821702, "_discovered": true, "gguf_sources": [ { "repo": "unsloth/MiniMax-M2-GGUF", "provider": "unsloth" } ] }, { "name": "MiniMaxAI/MiniMax-M2.1", "provider": "minimaxai", "parameter_count": "228.7B", "parameters_raw": 228703644928, "min_ram_gb": 127.8, "recommended_ram_gb": 213.0, "min_vram_gb": 117.1, "quantization": "Q4_K_M", "context_length": 196608, "use_case": "Lightweight, edge deployment", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 72189, "hf_likes": 1257, "release_date": "2025-12-20", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 18224821702, "_discovered": true, "gguf_sources": [ { "repo": "unsloth/MiniMax-M2.1-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3-235B-A22B", "provider": "Alibaba", "parameter_count": "235.1B", "parameters_raw": 235093634560, "min_ram_gb": 131.4, "recommended_ram_gb": 218.9, "min_vram_gb": 120.4, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 684371, "hf_likes": 1077, "release_date": "2025-04-27", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 22000000000, "gguf_sources": [ { "repo": "unsloth/Qwen3-235B-A22B-GGUF", "provider": "unsloth" } ] }, { "name": "Qwen/Qwen3-235B-A22B-Instruct-2507-FP8", "provider": "Alibaba", "parameter_count": "235.1B", "parameters_raw": 235107904512, "min_ram_gb": 131.4, "recommended_ram_gb": 219.0, "min_vram_gb": 120.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 802366, "hf_likes": 146, "release_date": "2025-07-21", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 25714927049, "_discovered": true }, { "name": "Qwen/Qwen3-235B-A22B-Thinking-2507-FP8", "provider": "Alibaba", "parameter_count": "235.1B", "parameters_raw": 235107904512, "min_ram_gb": 131.4, "recommended_ram_gb": 219.0, "min_vram_gb": 120.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 77936, "hf_likes": 83, "release_date": "2025-07-25", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 25714927049, "_discovered": true }, { "name": "Qwen/Qwen3-235B-A22B-FP8", "provider": "Alibaba", "parameter_count": "235.1B", "parameters_raw": 235107904512, "min_ram_gb": 131.4, "recommended_ram_gb": 219.0, "min_vram_gb": 120.4, "quantization": "Q4_K_M", "context_length": 40960, "use_case": "General purpose text generation", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 32322, "hf_likes": 90, "release_date": "2025-04-28", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 25714927049, "_discovered": true }, { "name": "casperhansen/deepseek-coder-v2-instruct-awq", "provider": "casperhansen", "parameter_count": "235.7B", "parameters_raw": 235741434880, "min_ram_gb": 131.7, "recommended_ram_gb": 219.6, "min_vram_gb": 120.8, "quantization": "AWQ-4bit", "context_length": 163840, "use_case": "Code generation and completion", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v2", "hf_downloads": 155456, "hf_likes": 11, "release_date": "2024-07-03", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 32782793288, "_discovered": true, "format": "awq" }, { "name": "deepseek-ai/DeepSeek-V2.5", "provider": "DeepSeek", "parameter_count": "235.7B", "parameters_raw": 235741434880, "min_ram_gb": 131.7, "recommended_ram_gb": 219.6, "min_vram_gb": 120.8, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v2", "hf_downloads": 84805, "hf_likes": 733, "release_date": "2024-09-05", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 32782793288, "_discovered": true, "gguf_sources": [ { "repo": "bartowski/DeepSeek-V2.5-GGUF", "provider": "bartowski" } ] }, { "name": "RedHatAI/DeepSeek-V2.5-1210-FP8", "provider": "redhatai", "parameter_count": "235.7B", "parameters_raw": 235741492480, "min_ram_gb": 131.7, "recommended_ram_gb": 219.6, "min_vram_gb": 120.8, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v2", "hf_downloads": 54313, "hf_likes": 4, "release_date": "2025-01-04", "is_moe": true, "num_experts": 64, "active_experts": 6, "active_parameters": 32782801298, "_discovered": true }, { "name": "LGAI-EXAONE/K-EXAONE-236B-A23B", "provider": "lgai-exaone", "parameter_count": "237.1B", "parameters_raw": 237099669632, "min_ram_gb": 132.5, "recommended_ram_gb": 220.8, "min_vram_gb": 121.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "exaone_moe", "hf_downloads": 23695, "hf_likes": 549, "release_date": "2025-12-26", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 25932776361, "_discovered": true }, { "name": "baidu/ERNIE-4.5-300B-A47B-Paddle", "provider": "baidu", "parameter_count": "300.5B", "parameters_raw": 300474051776, "min_ram_gb": 167.9, "recommended_ram_gb": 279.8, "min_vram_gb": 153.9, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "ernie4_5_moe", "hf_downloads": 332, "hf_likes": 12, "release_date": "2025-06-28" }, { "name": "XiaomiMiMo/MiMo-V2-Flash", "provider": "xiaomimimo", "parameter_count": "309.8B", "parameters_raw": 309785318400, "min_ram_gb": 173.1, "recommended_ram_gb": 288.5, "min_vram_gb": 158.7, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mimo_v2_flash", "hf_downloads": 536830, "hf_likes": 636, "release_date": "2025-12-16", "gguf_sources": [ { "repo": "unsloth/MiMo-V2-Flash-GGUF", "provider": "unsloth" } ] }, { "name": "zai-org/GLM-4.6", "provider": "zai-org", "parameter_count": "356.8B", "parameters_raw": 356785898816, "min_ram_gb": 199.4, "recommended_ram_gb": 332.3, "min_vram_gb": 182.8, "quantization": "Q4_K_M", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 81982, "hf_likes": 1204, "release_date": "2025-09-29", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/GLM-4.6-GGUF", "provider": "unsloth" } ] }, { "name": "zai-org/GLM-4.5", "provider": "zai-org", "parameter_count": "358.3B", "parameters_raw": 358337791296, "min_ram_gb": 200.2, "recommended_ram_gb": 333.7, "min_vram_gb": 183.6, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 42566, "hf_likes": 1396, "release_date": "2025-07-20", "_discovered": true, "gguf_sources": [ { "repo": "unsloth/GLM-4.5-GGUF", "provider": "unsloth" } ] }, { "name": "nvidia/DeepSeek-R1-0528-NVFP4-v2", "provider": "nvidia", "parameter_count": "393.6B", "parameters_raw": 393632819968, "min_ram_gb": 220.0, "recommended_ram_gb": 366.6, "min_vram_gb": 201.6, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 142525, "hf_likes": 16, "release_date": "2025-07-21", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 31367615334, "_discovered": true }, { "name": "nvidia/DeepSeek-V3.1-NVFP4", "provider": "nvidia", "parameter_count": "393.6B", "parameters_raw": 393632819968, "min_ram_gb": 220.0, "recommended_ram_gb": 366.6, "min_vram_gb": 201.6, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 37723, "hf_likes": 13, "release_date": "2025-11-21", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 31367615334, "_discovered": true }, { "name": "nvidia/DeepSeek-V3.2-NVFP4", "provider": "nvidia", "parameter_count": "394.5B", "parameters_raw": 394498304256, "min_ram_gb": 220.4, "recommended_ram_gb": 367.4, "min_vram_gb": 202.1, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v32", "hf_downloads": 21598, "hf_likes": 7, "release_date": "2025-12-30", "_discovered": true }, { "name": "nvidia/DeepSeek-V3-0324-NVFP4", "provider": "nvidia", "parameter_count": "396.8B", "parameters_raw": 396767013632, "min_ram_gb": 221.7, "recommended_ram_gb": 369.5, "min_vram_gb": 203.2, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 84851, "hf_likes": 14, "release_date": "2025-05-03", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 31617371393, "_discovered": true }, { "name": "nvidia/DeepSeek-R1-NVFP4", "provider": "nvidia", "parameter_count": "396.8B", "parameters_raw": 396767013632, "min_ram_gb": 221.7, "recommended_ram_gb": 369.5, "min_vram_gb": 203.2, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 43986, "hf_likes": 271, "release_date": "2025-02-21", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 31617371393, "_discovered": true }, { "name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct", "provider": "Meta", "parameter_count": "401.6B", "parameters_raw": 401583781376, "min_ram_gb": 224.4, "recommended_ram_gb": 374.0, "min_vram_gb": 205.7, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "llama4", "hf_downloads": 6341, "hf_likes": 466, "release_date": "2025-04-01", "is_moe": true, "num_experts": 16, "active_experts": 1, "active_parameters": 17000000000 }, { "name": "Qwen/Qwen3.5-397B-A17B", "provider": "Alibaba", "parameter_count": "403.4B", "parameters_raw": 403397928944, "min_ram_gb": 225.4, "recommended_ram_gb": 375.7, "min_vram_gb": 206.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision", "tool_use" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 1291825, "hf_likes": 1214, "release_date": "2026-02-16", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 17000000000 }, { "name": "meta-llama/Llama-3.1-405B-Instruct", "provider": "Meta", "parameter_count": "405.9B", "parameters_raw": 405853388800, "min_ram_gb": 226.8, "recommended_ram_gb": 378.0, "min_vram_gb": 207.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 173410, "hf_likes": 592, "release_date": "2024-07-16" }, { "name": "meta-llama/Llama-3.1-405B-Instruct-FP8", "provider": "Meta", "parameter_count": "405.9B", "parameters_raw": 405868625920, "min_ram_gb": 226.8, "recommended_ram_gb": 378.0, "min_vram_gb": 207.9, "quantization": "Q4_K_M", "context_length": 4096, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 22040, "hf_likes": 193, "release_date": "2024-07-20", "_discovered": true }, { "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", "provider": "Alibaba", "parameter_count": "480.2B", "parameters_raw": 480154875392, "min_ram_gb": 268.3, "recommended_ram_gb": 447.2, "min_vram_gb": 245.9, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Code generation and completion", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 75486, "hf_likes": 1304, "release_date": "2025-07-22", "is_moe": true, "num_experts": 160, "active_experts": 8, "active_parameters": 35000000000 }, { "name": "meituan-longcat/LongCat-Flash-Chat", "provider": "meituan-longcat", "parameter_count": "561.9B", "parameters_raw": 561862880256, "min_ram_gb": 314.0, "recommended_ram_gb": 523.3, "min_vram_gb": 287.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "unknown", "hf_downloads": 30116, "hf_likes": 526, "release_date": "2025-08-29", "_discovered": true }, { "name": "deepseek-ai/DeepSeek-R1", "provider": "DeepSeek", "parameter_count": "684.5B", "parameters_raw": 684531386000, "min_ram_gb": 382.5, "recommended_ram_gb": 637.5, "min_vram_gb": 350.6, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 1026085, "hf_likes": 13108, "release_date": "2025-01-20", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 37000000000, "gguf_sources": [ { "repo": "unsloth/DeepSeek-R1-GGUF", "provider": "unsloth" }, { "repo": "bartowski/DeepSeek-R1-GGUF", "provider": "bartowski" } ] }, { "name": "deepseek-ai/DeepSeek-R1-0528", "provider": "DeepSeek", "parameter_count": "684.5B", "parameters_raw": 684531386000, "min_ram_gb": 382.5, "recommended_ram_gb": 637.5, "min_vram_gb": 350.6, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "Advanced reasoning, chain-of-thought", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 1050237, "hf_likes": 2403, "release_date": "2025-05-28", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 54548594820, "_discovered": true }, { "name": "deepseek-ai/DeepSeek-V3-0324", "provider": "DeepSeek", "parameter_count": "684.5B", "parameters_raw": 684531386000, "min_ram_gb": 382.5, "recommended_ram_gb": 637.5, "min_vram_gb": 350.6, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 270362, "hf_likes": 3088, "release_date": "2025-03-24", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 54548594820, "_discovered": true }, { "name": "deepseek-ai/DeepSeek-V3", "provider": "DeepSeek", "parameter_count": "685B", "parameters_raw": 685000000000, "min_ram_gb": 382.8, "recommended_ram_gb": 638.0, "min_vram_gb": 351.3, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "State-of-the-art, MoE architecture", "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 37000000000, "hf_downloads": 0, "hf_likes": 0, "release_date": null }, { "name": "deepseek-ai/DeepSeek-V3.2-Speciale", "provider": "DeepSeek", "parameter_count": "685B", "parameters_raw": 685000000000, "min_ram_gb": 383.2, "recommended_ram_gb": 638.7, "min_vram_gb": 351.3, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Advanced reasoning, chain-of-thought", "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 37000000000, "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-12-01" }, { "name": "QuantTrio/DeepSeek-V3.2-AWQ", "provider": "quanttrio", "parameter_count": "685.0B", "parameters_raw": 685011996928, "min_ram_gb": 382.8, "recommended_ram_gb": 638.0, "min_vram_gb": 350.9, "quantization": "AWQ-4bit", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v32", "hf_downloads": 103286, "hf_likes": 11, "release_date": "2025-12-03", "_discovered": true, "format": "awq" }, { "name": "deepseek-ai/DeepSeek-V3.2", "provider": "DeepSeek", "parameter_count": "685.4B", "parameters_raw": 685396921376, "min_ram_gb": 383.0, "recommended_ram_gb": 638.3, "min_vram_gb": 351.1, "quantization": "Q4_K_M", "context_length": 163840, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v32", "hf_downloads": 362520, "hf_likes": 1280, "release_date": "2025-12-01" }, { "name": "zai-org/GLM-5", "provider": "zai-org", "parameter_count": "753.9B", "parameters_raw": 753864139008, "min_ram_gb": 421.3, "recommended_ram_gb": 702.1, "min_vram_gb": 386.1, "quantization": "BF16", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm_moe_dsa", "hf_downloads": 205187, "hf_likes": 1698, "release_date": "2026-02-11" }, { "name": "zai-org/GLM-5.1", "provider": "zai-org", "parameter_count": "753.9B", "parameters_raw": 753864139008, "min_ram_gb": 421.3, "recommended_ram_gb": 702.1, "min_vram_gb": 386.1, "quantization": "BF16", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm_moe_dsa", "hf_downloads": 141194, "hf_likes": 0, "release_date": "2026-04-03" }, { "name": "moonshotai/Kimi-K2-Instruct", "provider": "moonshotai", "parameter_count": "1026.5B", "parameters_raw": 1026470731056, "min_ram_gb": 573.6, "recommended_ram_gb": 956.0, "min_vram_gb": 525.8, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "kimi_k2", "hf_downloads": 151155, "hf_likes": 2324, "release_date": "2025-07-11" }, { "name": "moonshotai/Kimi-K2-Instruct-0905", "provider": "moonshotai", "parameter_count": "1026.5B", "parameters_raw": 1026470735448, "min_ram_gb": 573.6, "recommended_ram_gb": 956.0, "min_vram_gb": 525.8, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "kimi_k2", "hf_downloads": 28801, "hf_likes": 683, "release_date": "2025-09-03", "_discovered": true }, { "name": "moonshotai/Kimi-K2.5", "provider": "moonshotai", "parameter_count": "1058.6B", "parameters_raw": 1058589420528, "min_ram_gb": 591.5, "recommended_ram_gb": 985.9, "min_vram_gb": 542.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose", "capabilities": [ "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "kimi_k25", "hf_downloads": 1899549, "hf_likes": 2220, "release_date": "2026-01-01", "gguf_sources": [ { "repo": "unsloth/Kimi-K2.5-GGUF", "provider": "unsloth" } ] }, { "name": "QuantTrio/Qwen3.5-27B-AWQ", "provider": "QuantTrio", "parameter_count": "27.3B", "parameters_raw": 27300000000, "min_ram_gb": 14.2, "recommended_ram_gb": 18.4, "min_vram_gb": 14.2, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3.5-35B-A3B-AWQ", "provider": "QuantTrio", "parameter_count": "35.2B", "parameters_raw": 35200000000, "min_ram_gb": 18.1, "recommended_ram_gb": 23.5, "min_vram_gb": 18.1, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3.5-122B-A10B-AWQ", "provider": "QuantTrio", "parameter_count": "125.1B", "parameters_raw": 125100000000, "min_ram_gb": 63.0, "recommended_ram_gb": 82.0, "min_vram_gb": 63.0, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 10000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3.5-9B-AWQ", "provider": "QuantTrio", "parameter_count": "9.4B", "parameters_raw": 9400000000, "min_ram_gb": 5.2, "recommended_ram_gb": 6.8, "min_vram_gb": 5.2, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/GLM-4.5-Air-AWQ-FP16Mix", "provider": "QuantTrio", "parameter_count": "9.4B", "parameters_raw": 9400000000, "min_ram_gb": 5.2, "recommended_ram_gb": 6.8, "min_vram_gb": 5.2, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/GLM-4.5-AWQ", "provider": "QuantTrio", "parameter_count": "31.2B", "parameters_raw": 31200000000, "min_ram_gb": 16.1, "recommended_ram_gb": 20.9, "min_vram_gb": 16.1, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/GLM-4.5V-AWQ", "provider": "QuantTrio", "parameter_count": "31.2B", "parameters_raw": 31200000000, "min_ram_gb": 16.1, "recommended_ram_gb": 20.9, "min_vram_gb": 16.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/KAT-V1-40B-AWQ", "provider": "QuantTrio", "parameter_count": "40.0B", "parameters_raw": 40000000000, "min_ram_gb": 20.5, "recommended_ram_gb": 26.7, "min_vram_gb": 20.5, "quantization": "AWQ-4bit", "context_length": 65536, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/DeepSeek-V3.1-AWQ", "provider": "QuantTrio", "parameter_count": "685.0B", "parameters_raw": 685000000000, "min_ram_gb": 343.0, "recommended_ram_gb": 445.9, "min_vram_gb": 343.0, "quantization": "AWQ-4bit", "context_length": 163840, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 37000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/DeepSeek-V3.1-AWQ-Fp16Mix", "provider": "QuantTrio", "parameter_count": "685.0B", "parameters_raw": 685000000000, "min_ram_gb": 343.0, "recommended_ram_gb": 445.9, "min_vram_gb": 343.0, "quantization": "AWQ-4bit", "context_length": 163840, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 37000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/DeepSeek-V3.1-AWQ-Lite", "provider": "QuantTrio", "parameter_count": "685.0B", "parameters_raw": 685000000000, "min_ram_gb": 343.0, "recommended_ram_gb": 445.9, "min_vram_gb": 343.0, "quantization": "AWQ-4bit", "context_length": 163840, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 37000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/DeepSeek-V3.2-Exp-AWQ", "provider": "QuantTrio", "parameter_count": "486.0B", "parameters_raw": 486000000000, "min_ram_gb": 243.5, "recommended_ram_gb": 316.6, "min_vram_gb": 243.5, "quantization": "AWQ-4bit", "context_length": 163840, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 37000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/DeepSeek-V3.2-Exp-AWQ-Lite", "provider": "QuantTrio", "parameter_count": "486.0B", "parameters_raw": 486000000000, "min_ram_gb": 243.5, "recommended_ram_gb": 316.6, "min_vram_gb": 243.5, "quantization": "AWQ-4bit", "context_length": 163840, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 37000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/GLM-4.6-AWQ", "provider": "QuantTrio", "parameter_count": "31.2B", "parameters_raw": 31200000000, "min_ram_gb": 16.1, "recommended_ram_gb": 20.9, "min_vram_gb": 16.1, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/MiniMax-M2-REAP-162B-A10B-AWQ", "provider": "QuantTrio", "parameter_count": "162.0B", "parameters_raw": 162000000000, "min_ram_gb": 81.5, "recommended_ram_gb": 106.0, "min_vram_gb": 81.5, "quantization": "AWQ-4bit", "context_length": 1048576, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 10000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/DeepSeek-V3.2-Speciale-AWQ", "provider": "QuantTrio", "parameter_count": "685.0B", "parameters_raw": 685000000000, "min_ram_gb": 343.0, "recommended_ram_gb": 445.9, "min_vram_gb": 343.0, "quantization": "AWQ-4bit", "context_length": 163840, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 37000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/GLM-4.7-AWQ", "provider": "QuantTrio", "parameter_count": "31.2B", "parameters_raw": 31200000000, "min_ram_gb": 16.1, "recommended_ram_gb": 20.9, "min_vram_gb": 16.1, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/MiniMax-M2.1-AWQ", "provider": "QuantTrio", "parameter_count": "228.7B", "parameters_raw": 228700000000, "min_ram_gb": 114.8, "recommended_ram_gb": 149.3, "min_vram_gb": 114.8, "quantization": "AWQ-4bit", "context_length": 1048576, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 40000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Step3-VL-10B-AWQ", "provider": "QuantTrio", "parameter_count": "10.0B", "parameters_raw": 10000000000, "min_ram_gb": 5.5, "recommended_ram_gb": 7.2, "min_vram_gb": 5.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3.5-397B-A17B-AWQ", "provider": "QuantTrio", "parameter_count": "403.4B", "parameters_raw": 403400000000, "min_ram_gb": 202.2, "recommended_ram_gb": 262.9, "min_vram_gb": 202.2, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 17000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/GLM-5-AWQ", "provider": "QuantTrio", "parameter_count": "753.9B", "parameters_raw": 753900000000, "min_ram_gb": 377.4, "recommended_ram_gb": 490.7, "min_vram_gb": 377.4, "quantization": "AWQ-4bit", "context_length": 202752, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 35000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3.5-4B-AWQ", "provider": "QuantTrio", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.5, "recommended_ram_gb": 3.2, "min_vram_gb": 2.5, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3.5-2B-AWQ", "provider": "QuantTrio", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.5, "recommended_ram_gb": 2.0, "min_vram_gb": 1.5, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/sarvam-30b-AWQ", "provider": "QuantTrio", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Chat, multilingual", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/sarvam-105b-AWQ", "provider": "QuantTrio", "parameter_count": "105.0B", "parameters_raw": 105000000000, "min_ram_gb": 36.8, "recommended_ram_gb": 73.7, "min_vram_gb": 61.4, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Chat, multilingual", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3500000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3.5-35B-A3B-FP8", "provider": "Qwen", "parameter_count": "35.2B", "parameters_raw": 35200000000, "min_ram_gb": 35.7, "recommended_ram_gb": 46.4, "min_vram_gb": 35.7, "quantization": "FP8", "context_length": 131072, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3.5-27B-FP8", "provider": "Qwen", "parameter_count": "27.3B", "parameters_raw": 27300000000, "min_ram_gb": 27.8, "recommended_ram_gb": 36.1, "min_vram_gb": 27.8, "quantization": "FP8", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3.5-397B-A17B-FP8", "provider": "Qwen", "parameter_count": "403.4B", "parameters_raw": 403400000000, "min_ram_gb": 403.9, "recommended_ram_gb": 525.1, "min_vram_gb": 403.9, "quantization": "FP8", "context_length": 262144, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 17000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3.5-122B-A10B-FP8", "provider": "Qwen", "parameter_count": "125.1B", "parameters_raw": 125100000000, "min_ram_gb": 125.6, "recommended_ram_gb": 163.3, "min_vram_gb": 125.6, "quantization": "FP8", "context_length": 131072, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 10000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-30B-A3B-FP8", "provider": "Qwen", "parameter_count": "30.5B", "parameters_raw": 30500000000, "min_ram_gb": 31.0, "recommended_ram_gb": 40.3, "min_vram_gb": 31.0, "quantization": "FP8", "context_length": 131072, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-32B-FP8", "provider": "Qwen", "parameter_count": "32.8B", "parameters_raw": 32800000000, "min_ram_gb": 33.3, "recommended_ram_gb": 43.3, "min_vram_gb": 33.3, "quantization": "FP8", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-14B-FP8", "provider": "Qwen", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 14.5, "recommended_ram_gb": 18.9, "min_vram_gb": 14.5, "quantization": "FP8", "context_length": 131072, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-VL-32B-Instruct-AWQ", "provider": "QuantTrio", "parameter_count": "32.8B", "parameters_raw": 32800000000, "min_ram_gb": 16.9, "recommended_ram_gb": 22.0, "min_vram_gb": 16.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-235B-A22B-Instruct-2507-AWQ", "provider": "QuantTrio", "parameter_count": "234.6B", "parameters_raw": 234600000000, "min_ram_gb": 117.8, "recommended_ram_gb": 153.1, "min_vram_gb": 117.8, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 22000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/GLM-4.1V-9B-Thinking-AWQ", "provider": "QuantTrio", "parameter_count": "9.4B", "parameters_raw": 9400000000, "min_ram_gb": 5.2, "recommended_ram_gb": 6.8, "min_vram_gb": 5.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Multimodal, vision, reasoning", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-Coder-480B-A35B-Instruct-AWQ", "provider": "QuantTrio", "parameter_count": "480.2B", "parameters_raw": 480200000000, "min_ram_gb": 240.6, "recommended_ram_gb": 312.8, "min_vram_gb": 240.6, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Coding", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 35000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-235B-A22B-Thinking-2507-AWQ", "provider": "QuantTrio", "parameter_count": "234.6B", "parameters_raw": 234600000000, "min_ram_gb": 117.8, "recommended_ram_gb": 153.1, "min_vram_gb": 117.8, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Reasoning", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 22000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-30B-A3B-Thinking-2507-AWQ-BF16Mix", "provider": "QuantTrio", "parameter_count": "30.5B", "parameters_raw": 30500000000, "min_ram_gb": 15.8, "recommended_ram_gb": 20.5, "min_vram_gb": 15.8, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Reasoning", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-30B-A3B-Thinking-2507-AWQ", "provider": "QuantTrio", "parameter_count": "30.5B", "parameters_raw": 30500000000, "min_ram_gb": 15.8, "recommended_ram_gb": 20.5, "min_vram_gb": 15.8, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "Reasoning", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Seed-OSS-36B-Instruct-AWQ", "provider": "QuantTrio", "parameter_count": "36.0B", "parameters_raw": 36000000000, "min_ram_gb": 18.5, "recommended_ram_gb": 24.1, "min_vram_gb": 18.5, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "General", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-VL-235B-A22B-Instruct-AWQ", "provider": "QuantTrio", "parameter_count": "234.6B", "parameters_raw": 234600000000, "min_ram_gb": 117.8, "recommended_ram_gb": 153.1, "min_vram_gb": 117.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 22000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-VL-235B-A22B-Thinking-AWQ", "provider": "QuantTrio", "parameter_count": "234.6B", "parameters_raw": 234600000000, "min_ram_gb": 117.8, "recommended_ram_gb": 153.1, "min_vram_gb": 117.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Multimodal, vision, reasoning", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 22000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-VL-30B-A3B-Thinking-AWQ", "provider": "QuantTrio", "parameter_count": "31.1B", "parameters_raw": 31100000000, "min_ram_gb": 16.1, "recommended_ram_gb": 20.9, "min_vram_gb": 16.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Multimodal, vision, reasoning", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3-VL-32B-Thinking-AWQ", "provider": "QuantTrio", "parameter_count": "32.8B", "parameters_raw": 32800000000, "min_ram_gb": 16.9, "recommended_ram_gb": 22.0, "min_vram_gb": 16.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Multimodal, vision, reasoning", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-VL-8B-Instruct-FP8", "provider": "Qwen", "parameter_count": "8.2B", "parameters_raw": 8200000000, "min_ram_gb": 8.7, "recommended_ram_gb": 11.3, "min_vram_gb": 8.7, "quantization": "FP8", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-VL-32B-Instruct-FP8", "provider": "Qwen", "parameter_count": "32.8B", "parameters_raw": 32800000000, "min_ram_gb": 33.3, "recommended_ram_gb": 43.3, "min_vram_gb": 33.3, "quantization": "FP8", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-VL-30B-A3B-Instruct-FP8", "provider": "Qwen", "parameter_count": "31.1B", "parameters_raw": 31100000000, "min_ram_gb": 31.6, "recommended_ram_gb": 41.1, "min_vram_gb": 31.6, "quantization": "FP8", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-4B-Thinking-2507-FP8", "provider": "Qwen", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 4.5, "recommended_ram_gb": 5.9, "min_vram_gb": 4.5, "quantization": "FP8", "context_length": 32768, "use_case": "Reasoning", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", "provider": "Qwen", "parameter_count": "234.6B", "parameters_raw": 234600000000, "min_ram_gb": 235.1, "recommended_ram_gb": 305.6, "min_vram_gb": 235.1, "quantization": "FP8", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 22000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", "provider": "Qwen", "parameter_count": "480.2B", "parameters_raw": 480200000000, "min_ram_gb": 480.7, "recommended_ram_gb": 624.9, "min_vram_gb": 480.7, "quantization": "FP8", "context_length": 262144, "use_case": "Coding", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 35000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-30B-A3B-Thinking-2507-FP8", "provider": "Qwen", "parameter_count": "30.5B", "parameters_raw": 30500000000, "min_ram_gb": 31.0, "recommended_ram_gb": 40.3, "min_vram_gb": 31.0, "quantization": "FP8", "context_length": 131072, "use_case": "Reasoning", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-VL-30B-A3B-Thinking-FP8", "provider": "Qwen", "parameter_count": "31.1B", "parameters_raw": 31100000000, "min_ram_gb": 31.6, "recommended_ram_gb": 41.1, "min_vram_gb": 31.6, "quantization": "FP8", "context_length": 32768, "use_case": "Multimodal, vision, reasoning", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3-VL-2B-Instruct-FP8", "provider": "Qwen", "parameter_count": "2.7B", "parameters_raw": 2700000000, "min_ram_gb": 3.2, "recommended_ram_gb": 4.2, "min_vram_gb": 3.2, "quantization": "FP8", "context_length": 32768, "use_case": "Multimodal, vision", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "release_date": "2025-07-01", "gguf_sources": [], "capabilities": [] }, { "name": "zai-org/GLM-4.7-Flash", "provider": "zai-org", "parameter_count": "31.2B", "parameters_raw": 31221488576, "min_ram_gb": 17.4, "recommended_ram_gb": 29.1, "min_vram_gb": 16.0, "quantization": "Q4_K_M", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe_lite", "hf_downloads": 1709725, "hf_likes": 1617, "release_date": "2026-01-29", "is_moe": true, "num_experts": 64, "active_experts": 4, "active_parameters": null, "_discovered": true, "gguf_sources": [] }, { "name": "cyankiwi/Qwen3.5-35B-A3B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "35.0B", "parameters_raw": 35000000000, "min_ram_gb": 4.4, "recommended_ram_gb": 7.3, "min_vram_gb": 4.0, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 651639, "hf_likes": 30, "release_date": "2026-02-25", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-VL-4B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 583536, "hf_likes": 6, "release_date": "2025-10-14", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-Coder-Next-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "79.7B", "parameters_raw": 79674391296, "min_ram_gb": 44.5, "recommended_ram_gb": 74.2, "min_vram_gb": 40.8, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Coding", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 248200, "hf_likes": 18, "release_date": "2026-02-04", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-9B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 5.5, "recommended_ram_gb": 9.2, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 183369, "hf_likes": 13, "release_date": "2026-03-02", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-27B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "27.0B", "parameters_raw": 27000000000, "min_ram_gb": 3.9, "recommended_ram_gb": 6.5, "min_vram_gb": 3.6, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 149004, "hf_likes": 19, "release_date": "2026-02-25", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-122B-A10B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "122.0B", "parameters_raw": 122000000000, "min_ram_gb": 71.9, "recommended_ram_gb": 119.9, "min_vram_gb": 66.0, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 137640, "hf_likes": 22, "release_date": "2026-02-25", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 10000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-VL-8B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 1.6, "recommended_ram_gb": 2.7, "min_vram_gb": 1.5, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 90955, "hf_likes": 13, "release_date": "2025-10-14", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-27B-AWQ-BF16-INT8", "provider": "cyankiwi", "parameter_count": "27.0B", "parameters_raw": 27000000000, "min_ram_gb": 7.8, "recommended_ram_gb": 13.1, "min_vram_gb": 7.2, "quantization": "AWQ-8bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 82325, "hf_likes": 8, "release_date": "2026-02-24", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-Omni-30B-A3B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 9.3, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 65536, "use_case": "Multimodal, any-to-any", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "qwen3_omni_moe", "hf_downloads": 68670, "hf_likes": 45, "release_date": "2025-09-28", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-30B-A3B-Instruct-2507-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 5.1, "recommended_ram_gb": 8.4, "min_vram_gb": 4.6, "quantization": "AWQ-8bit", "context_length": 262144, "use_case": "Instruction following, chat", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 44772, "hf_likes": 2, "release_date": "2025-08-08", "is_moe": true, "num_experts": 128, "active_experts": 8, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-27B-AWQ-BF16-INT4", "provider": "cyankiwi", "parameter_count": "27.0B", "parameters_raw": 27000000000, "min_ram_gb": 6.5, "recommended_ram_gb": 10.8, "min_vram_gb": 6.0, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 42645, "hf_likes": 30, "release_date": "2026-02-24", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-4B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.7, "recommended_ram_gb": 4.4, "min_vram_gb": 2.4, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 35275, "hf_likes": 7, "release_date": "2026-03-02", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Devstral-2-123B-Instruct-2512-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "123.0B", "parameters_raw": 123000000000, "min_ram_gb": 12.4, "recommended_ram_gb": 20.7, "min_vram_gb": 11.4, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Coding", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "ministral3", "hf_downloads": 31584, "hf_likes": 15, "release_date": "2025-12-11", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-35B-A3B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "35.0B", "parameters_raw": 35000000000, "min_ram_gb": 6.7, "recommended_ram_gb": 11.2, "min_vram_gb": 6.2, "quantization": "AWQ-8bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 21278, "hf_likes": 7, "release_date": "2026-02-25", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/InternVL3_5-38B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "38.0B", "parameters_raw": 38000000000, "min_ram_gb": 6.7, "recommended_ram_gb": 11.2, "min_vram_gb": 6.2, "quantization": "AWQ-4bit", "context_length": 40960, "use_case": "Multimodal, vision", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "internvl_chat", "hf_downloads": 20665, "hf_likes": 1, "release_date": "2025-08-29", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3-VL-4B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.9, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, reasoning", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 17082, "hf_likes": 1, "release_date": "2025-10-14", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-4B-AWQ-BF16-INT4", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.6, "recommended_ram_gb": 4.4, "min_vram_gb": 2.4, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 14400, "hf_likes": 1, "release_date": "2026-03-02", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/Qwen3.5-2B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.3, "recommended_ram_gb": 2.2, "min_vram_gb": 1.2, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Multimodal, vision, chat", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 14333, "hf_likes": 1, "release_date": "2026-03-02", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/LFM2-24B-A2B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "24.0B", "parameters_raw": 24000000000, "min_ram_gb": 2.5, "recommended_ram_gb": 4.1, "min_vram_gb": 2.2, "quantization": "AWQ-4bit", "context_length": 128000, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 13987, "hf_likes": 1, "release_date": "2026-02-25", "is_moe": true, "num_experts": 64, "active_experts": 4, "active_parameters": 2000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/OmniCoder-9B-AWQ-BF16-INT4", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 5.3, "recommended_ram_gb": 8.9, "min_vram_gb": 4.9, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Coding, reasoning", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_5", "hf_downloads": 12121, "hf_likes": 0, "release_date": "2026-03-14", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/GLM-4.7-Flash-REAP-23B-A3B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "23.0B", "parameters_raw": 23000000000, "min_ram_gb": 2.6, "recommended_ram_gb": 4.3, "min_vram_gb": 2.3, "quantization": "AWQ-4bit", "context_length": 202752, "use_case": "General purpose text generation", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe_lite", "hf_downloads": 10101, "hf_likes": 2, "release_date": "2026-01-25", "is_moe": true, "num_experts": 49, "active_experts": 4, "active_parameters": 3000000000, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/OmniCoder-9B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 5.4, "recommended_ram_gb": 9.0, "min_vram_gb": 4.9, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "Coding, reasoning", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_5", "hf_downloads": 9212, "hf_likes": 2, "release_date": "2026-03-14", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "Qwen/Qwen3.6-27B", "provider": "Qwen", "parameter_count": "27.8B", "parameters_raw": 27781427952, "min_ram_gb": 16.6, "recommended_ram_gb": 21.6, "min_vram_gb": 16.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, coding", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "architecture": "qwen3", "pipeline_tag": "text-generation", "release_date": "2026-04-01", "gguf_sources": [ { "repo": "unsloth/Qwen3.6-27B-GGUF", "provider": "unsloth", "file": "Qwen3.6-27B-Q4_K_M.gguf" } ], "capabilities": [] }, { "name": "Qwen/Qwen3.6-27B-FP8", "provider": "Qwen", "parameter_count": "27.8B", "parameters_raw": 27781427952, "min_ram_gb": 28.3, "recommended_ram_gb": 36.8, "min_vram_gb": 28.3, "quantization": "FP8", "context_length": 262144, "use_case": "General purpose, coding", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "architecture": "qwen3", "pipeline_tag": "text-generation", "release_date": "2026-04-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3.6-27B-AWQ", "provider": "QuantTrio", "parameter_count": "27.8B", "parameters_raw": 27781427952, "min_ram_gb": 14.4, "recommended_ram_gb": 18.7, "min_vram_gb": 14.4, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "General purpose, coding", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "architecture": "qwen3", "pipeline_tag": "text-generation", "release_date": "2026-04-01", "gguf_sources": [], "capabilities": [] }, { "name": "Qwen/Qwen3.6-35B-A3B", "provider": "Qwen", "parameter_count": "36.0B", "parameters_raw": 35951822704, "min_ram_gb": 21.4, "recommended_ram_gb": 27.8, "min_vram_gb": 21.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose (MoE)", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "architecture": "qwen3_moe", "pipeline_tag": "text-generation", "release_date": "2026-04-01", "gguf_sources": [ { "repo": "unsloth/Qwen3.6-35B-A3B-GGUF", "provider": "unsloth", "file": "Qwen3.6-35B-A3B-UD-Q4_K_M.gguf" } ], "capabilities": [] }, { "name": "Qwen/Qwen3.6-35B-A3B-FP8", "provider": "Qwen", "parameter_count": "36.0B", "parameters_raw": 35951822704, "min_ram_gb": 36.5, "recommended_ram_gb": 47.5, "min_vram_gb": 36.5, "quantization": "FP8", "context_length": 262144, "use_case": "General purpose (MoE)", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "architecture": "qwen3_moe", "pipeline_tag": "text-generation", "release_date": "2026-04-01", "gguf_sources": [], "capabilities": [] }, { "name": "QuantTrio/Qwen3.6-35B-A3B-AWQ", "provider": "QuantTrio", "parameter_count": "36.0B", "parameters_raw": 35951822704, "min_ram_gb": 18.5, "recommended_ram_gb": 24.1, "min_vram_gb": 18.5, "quantization": "AWQ-4bit", "context_length": 262144, "use_case": "General purpose (MoE)", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "architecture": "qwen3_moe", "pipeline_tag": "text-generation", "release_date": "2026-04-01", "gguf_sources": [], "capabilities": [] }, { "name": "google/gemma-4-E2B-it", "provider": "Google", "parameter_count": "5.1B", "parameters_raw": 5123178051, "min_ram_gb": 3.5, "recommended_ram_gb": 4.5, "min_vram_gb": 3.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "On-device, multimodal", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "architecture": "gemma4", "pipeline_tag": "image-text-to-text", "release_date": "2026-04-01", "gguf_sources": [ { "repo": "unsloth/gemma-4-E2B-it-GGUF", "provider": "unsloth" } ], "capabilities": [ "vision" ] }, { "name": "google/gemma-4-E4B-it", "provider": "Google", "parameter_count": "8.0B", "parameters_raw": 7996156490, "min_ram_gb": 5.1, "recommended_ram_gb": 6.6, "min_vram_gb": 5.1, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "On-device, multimodal", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "architecture": "gemma4", "pipeline_tag": "image-text-to-text", "release_date": "2026-04-01", "gguf_sources": [ { "repo": "unsloth/gemma-4-E4B-it-GGUF", "provider": "unsloth" } ], "capabilities": [ "vision" ] }, { "name": "google/gemma-4-31B-it", "provider": "Google", "parameter_count": "32.7B", "parameters_raw": 32682372656, "min_ram_gb": 19.5, "recommended_ram_gb": 25.4, "min_vram_gb": 19.5, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "General purpose, multimodal", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "architecture": "gemma4", "pipeline_tag": "image-text-to-text", "release_date": "2026-04-01", "gguf_sources": [ { "repo": "unsloth/gemma-4-31B-it-GGUF", "provider": "unsloth" } ], "capabilities": [ "vision" ] }, { "name": "google/gemma-4-26B-A4B-it", "provider": "Google", "parameter_count": "26.5B", "parameters_raw": 26544131376, "min_ram_gb": 15.9, "recommended_ram_gb": 20.7, "min_vram_gb": 15.9, "quantization": "Q4_K_M", "context_length": 131072, "use_case": "High-throughput, multimodal (MoE)", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 4000000000, "architecture": "gemma4", "pipeline_tag": "image-text-to-text", "release_date": "2026-04-01", "gguf_sources": [ { "repo": "unsloth/gemma-4-26B-A4B-it-GGUF", "provider": "unsloth" } ], "capabilities": [ "vision" ] }, { "name": "cyankiwi/gemma-4-31B-it-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "31.0B", "parameters_raw": 31000000000, "min_ram_gb": 16.8, "recommended_ram_gb": 21.8, "min_vram_gb": 16.8, "quantization": "AWQ-4bit", "context_length": 131072, "use_case": "General purpose, multimodal", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "architecture": "gemma4", "pipeline_tag": "image-text-to-text", "release_date": "2026-04-01", "gguf_sources": [], "capabilities": [ "vision" ] }, { "name": "cyankiwi/Qwen3.6-27B-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "27.0B", "parameters_raw": 27000000000, "min_ram_gb": 9.7, "recommended_ram_gb": 19.4, "min_vram_gb": 16.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 1370875, "hf_likes": 66, "release_date": "2026-04-22", "_discovered": true }, { "name": "cyankiwi/gemma-4-26B-A4B-it-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "26.0B", "parameters_raw": 26000000000, "min_ram_gb": 9.4, "recommended_ram_gb": 18.7, "min_vram_gb": 15.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "gemma4", "hf_downloads": 4146360, "hf_likes": 71, "release_date": "2026-04-03", "_discovered": true, "is_moe": true, "active_parameters": 4000000000 }, { "name": "cyankiwi/Qwen3.6-35B-A3B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "35.0B", "parameters_raw": 35000000000, "min_ram_gb": 12.5, "recommended_ram_gb": 25.0, "min_vram_gb": 20.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 881182, "hf_likes": 67, "release_date": "2026-04-16", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3.6-27B-AWQ-BF16-INT4", "provider": "cyankiwi", "parameter_count": "27.0B", "parameters_raw": 27000000000, "min_ram_gb": 9.7, "recommended_ram_gb": 19.4, "min_vram_gb": 16.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 285756, "hf_likes": 30, "release_date": "2026-04-22", "_discovered": true }, { "name": "cyankiwi/Qwen3.6-27B-AWQ-BF16-INT8", "provider": "cyankiwi", "parameter_count": "27.0B", "parameters_raw": 27000000000, "min_ram_gb": 18.1, "recommended_ram_gb": 36.2, "min_vram_gb": 30.2, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 4433, "hf_likes": 5, "release_date": "2026-05-06", "_discovered": true }, { "name": "cyankiwi/MiniMax-M2.7-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "228.7B", "parameters_raw": 228700000000, "min_ram_gb": 79.9, "recommended_ram_gb": 159.7, "min_vram_gb": 133.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 266548, "hf_likes": 32, "release_date": "2026-04-13", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-30B-A3B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl_moe", "hf_downloads": 31781, "hf_likes": 10, "release_date": "2025-10-06", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/MiMo-V2-Flash-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "50.9B", "parameters_raw": 50919007194, "min_ram_gb": 18.0, "recommended_ram_gb": 36.0, "min_vram_gb": 30.0, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "custom_code", "hf_downloads": 1650, "hf_likes": 9, "release_date": "2025-12-18", "_discovered": true }, { "name": "cyankiwi/GLM-4.7-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "59.1B", "parameters_raw": 59092091016, "min_ram_gb": 20.9, "recommended_ram_gb": 41.8, "min_vram_gb": 34.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 251, "hf_likes": 5, "release_date": "2025-12-24", "_discovered": true }, { "name": "cyankiwi/GLM-4.7-REAP-218B-A32B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "218.0B", "parameters_raw": 218000000000, "min_ram_gb": 76.1, "recommended_ram_gb": 152.3, "min_vram_gb": 126.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 29, "hf_likes": 10, "release_date": "2026-01-16", "_discovered": true, "is_moe": true, "active_parameters": 32000000000 }, { "name": "cyankiwi/GLM-4.7-REAP-268B-A32B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "268.0B", "parameters_raw": 268000000000, "min_ram_gb": 93.5, "recommended_ram_gb": 187.1, "min_vram_gb": 155.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 16, "hf_likes": 6, "release_date": "2026-01-26", "_discovered": true, "is_moe": true, "active_parameters": 32000000000 }, { "name": "cyankiwi/MiniMax-M2.1-REAP-139B-A10B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "139.0B", "parameters_raw": 139000000000, "min_ram_gb": 48.7, "recommended_ram_gb": 97.3, "min_vram_gb": 81.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 2, "hf_likes": 1, "release_date": "2026-02-03", "_discovered": true, "is_moe": true, "active_parameters": 10000000000 }, { "name": "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "120.0B", "parameters_raw": 120000000000, "min_ram_gb": 42.1, "recommended_ram_gb": 84.1, "min_vram_gb": 70.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron_h", "hf_downloads": 1185, "hf_likes": 6, "release_date": "2026-03-16", "_discovered": true, "is_moe": true, "active_parameters": 12000000000 }, { "name": "cyankiwi/Mistral-Small-4-119B-2603-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "119.0B", "parameters_raw": 119000000000, "min_ram_gb": 41.7, "recommended_ram_gb": 83.4, "min_vram_gb": 69.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 2022, "hf_likes": 7, "release_date": "2026-03-18", "_discovered": true }, { "name": "cyankiwi/gemma-4-31B-it-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "31.0B", "parameters_raw": 31000000000, "min_ram_gb": 20.8, "recommended_ram_gb": 41.5, "min_vram_gb": 34.6, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "gemma4", "hf_downloads": 61491, "hf_likes": 16, "release_date": "2026-04-02", "_discovered": true }, { "name": "cyankiwi/Nemotron-Cascade-2-30B-A3B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nvidia", "hf_downloads": 219, "hf_likes": 2, "release_date": "2026-04-08", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Laguna-XS.2-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "33.4B", "parameters_raw": 33442617088, "min_ram_gb": 11.9, "recommended_ram_gb": 23.9, "min_vram_gb": 19.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "laguna", "hf_downloads": 4344, "hf_likes": 1, "release_date": "2026-05-02", "_discovered": true }, { "name": "cyankiwi/gemma-4-E2B-it-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "gemma4", "hf_downloads": 15565, "hf_likes": 3, "release_date": "2026-05-03", "_discovered": true }, { "name": "cyankiwi/Mistral-Medium-3.5-128B-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "128.0B", "parameters_raw": 128000000000, "min_ram_gb": 44.8, "recommended_ram_gb": 89.6, "min_vram_gb": 74.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 17040, "hf_likes": 2, "release_date": "2026-05-04", "_discovered": true }, { "name": "cyankiwi/Devstral-Small-2507-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "23.6B", "parameters_raw": 23572403200, "min_ram_gb": 8.5, "recommended_ram_gb": 17.0, "min_vram_gb": 14.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 1340, "hf_likes": 9, "release_date": "2025-07-12", "_discovered": true }, { "name": "cyankiwi/KAT-V1-40B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "40.0B", "parameters_raw": 40000000000, "min_ram_gb": 14.2, "recommended_ram_gb": 28.4, "min_vram_gb": 23.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 2, "hf_likes": 2, "release_date": "2025-07-24", "_discovered": true }, { "name": "cyankiwi/Magistral-Small-2507-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "23.6B", "parameters_raw": 23572403200, "min_ram_gb": 8.5, "recommended_ram_gb": 17.0, "min_vram_gb": 14.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral", "hf_downloads": 25, "hf_likes": 0, "release_date": "2025-07-25", "_discovered": true }, { "name": "cyankiwi/Llama-3_3-Nemotron-Super-49B-v1_5-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "49.0B", "parameters_raw": 49000000000, "min_ram_gb": 17.3, "recommended_ram_gb": 34.7, "min_vram_gb": 28.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nemotron_nas", "hf_downloads": 311, "hf_likes": 3, "release_date": "2025-07-27", "_discovered": true }, { "name": "cyankiwi/Qwen3-30B-A3B-Thinking-2507-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 73546, "hf_likes": 15, "release_date": "2025-07-30", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-4B-Instruct-2507-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 1.7, "recommended_ram_gb": 3.4, "min_vram_gb": 2.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 142168, "hf_likes": 7, "release_date": "2025-08-06", "_discovered": true }, { "name": "cyankiwi/Qwen3-4B-Thinking-2507-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 1.7, "recommended_ram_gb": 3.4, "min_vram_gb": 2.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 671, "hf_likes": 5, "release_date": "2025-08-06", "_discovered": true }, { "name": "cyankiwi/Qwen3-4B-Thinking-2507-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 60, "hf_likes": 4, "release_date": "2025-08-08", "_discovered": true }, { "name": "cyankiwi/Qwen3-4B-Instruct-2507-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1539, "hf_likes": 1, "release_date": "2025-08-08", "_discovered": true }, { "name": "cyankiwi/Qwen3-Coder-30B-A3B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 573, "hf_likes": 2, "release_date": "2025-08-08", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-30B-A3B-Thinking-2507-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 88, "hf_likes": 2, "release_date": "2025-08-08", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/GLM-4.5-Air-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "31.7B", "parameters_raw": 31696906344, "min_ram_gb": 21.2, "recommended_ram_gb": 42.5, "min_vram_gb": 35.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 67, "hf_likes": 2, "release_date": "2025-08-08", "_discovered": true }, { "name": "cyankiwi/Jan-v1-4B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 3, "hf_likes": 1, "release_date": "2025-08-12", "_discovered": true }, { "name": "cyankiwi/Jan-v1-4B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 1.7, "recommended_ram_gb": 3.4, "min_vram_gb": 2.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 2, "release_date": "2025-08-12", "_discovered": true }, { "name": "cyankiwi/GLM-4.5V-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "19.5B", "parameters_raw": 19485088360, "min_ram_gb": 7.1, "recommended_ram_gb": 14.2, "min_vram_gb": 11.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "glm4v_moe", "hf_downloads": 664, "hf_likes": 4, "release_date": "2025-08-13", "_discovered": true }, { "name": "cyankiwi/GLM-4.5V-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.6B", "parameters_raw": 32555588200, "min_ram_gb": 21.8, "recommended_ram_gb": 43.6, "min_vram_gb": 36.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "glm4v_moe", "hf_downloads": 54, "hf_likes": 3, "release_date": "2025-08-13", "_discovered": true }, { "name": "cyankiwi/Kimi-Dev-72B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "72.0B", "parameters_raw": 72000000000, "min_ram_gb": 25.4, "recommended_ram_gb": 50.8, "min_vram_gb": 42.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 881, "hf_likes": 3, "release_date": "2025-08-19", "_discovered": true }, { "name": "cyankiwi/Kimi-Dev-72B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "72.0B", "parameters_raw": 72000000000, "min_ram_gb": 47.8, "recommended_ram_gb": 95.6, "min_vram_gb": 79.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 729, "hf_likes": 1, "release_date": "2025-08-19", "_discovered": true }, { "name": "cyankiwi/Seed-OSS-36B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "36.0B", "parameters_raw": 36000000000, "min_ram_gb": 24.1, "recommended_ram_gb": 48.1, "min_vram_gb": 40.1, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "seed_oss", "hf_downloads": 2, "hf_likes": 0, "release_date": "2025-08-23", "_discovered": true }, { "name": "cyankiwi/Seed-OSS-36B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "36.0B", "parameters_raw": 36000000000, "min_ram_gb": 12.8, "recommended_ram_gb": 25.7, "min_vram_gb": 21.4, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "seed_oss", "hf_downloads": 43, "hf_likes": 0, "release_date": "2025-08-23", "_discovered": true }, { "name": "cyankiwi/command-a-reasoning-08-2025-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "23.2B", "parameters_raw": 23153357696, "min_ram_gb": 8.3, "recommended_ram_gb": 16.7, "min_vram_gb": 13.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "cohere2", "hf_downloads": 206, "hf_likes": 3, "release_date": "2025-08-23", "_discovered": true }, { "name": "cyankiwi/command-a-reasoning-08-2025-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "36.6B", "parameters_raw": 36642239360, "min_ram_gb": 24.5, "recommended_ram_gb": 49.0, "min_vram_gb": 40.8, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "cohere2", "hf_downloads": 5, "hf_likes": 0, "release_date": "2025-08-24", "_discovered": true }, { "name": "cyankiwi/Hermes-4-70B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "70.0B", "parameters_raw": 70000000000, "min_ram_gb": 24.7, "recommended_ram_gb": 49.3, "min_vram_gb": 41.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 45819, "hf_likes": 6, "release_date": "2025-08-27", "_discovered": true }, { "name": "cyankiwi/Hermes-4-70B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "70.0B", "parameters_raw": 70000000000, "min_ram_gb": 46.5, "recommended_ram_gb": 93.0, "min_vram_gb": 77.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 1, "hf_likes": 1, "release_date": "2025-08-27", "_discovered": true }, { "name": "cyankiwi/InternVL3_5-8B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "internvl_chat", "hf_downloads": 923, "hf_likes": 1, "release_date": "2025-08-29", "_discovered": true }, { "name": "cyankiwi/InternVL3_5-14B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 5.2, "recommended_ram_gb": 10.3, "min_vram_gb": 8.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "internvl_chat", "hf_downloads": 829, "hf_likes": 4, "release_date": "2025-08-29", "_discovered": true }, { "name": "cyankiwi/InternVL3_5-38B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "38.0B", "parameters_raw": 38000000000, "min_ram_gb": 25.4, "recommended_ram_gb": 50.8, "min_vram_gb": 42.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "internvl_chat", "hf_downloads": 782, "hf_likes": 0, "release_date": "2025-08-30", "_discovered": true }, { "name": "cyankiwi/InternVL3_5-14B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 9.5, "recommended_ram_gb": 19.1, "min_vram_gb": 15.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "internvl_chat", "hf_downloads": 27, "hf_likes": 2, "release_date": "2025-08-30", "_discovered": true }, { "name": "cyankiwi/InternVL3_5-8B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "internvl_chat", "hf_downloads": 27783, "hf_likes": 1, "release_date": "2025-08-30", "_discovered": true }, { "name": "cyankiwi/NVIDIA-Nemotron-Nano-9B-v2-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 3.4, "recommended_ram_gb": 6.8, "min_vram_gb": 5.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nvidia", "hf_downloads": 75, "hf_likes": 3, "release_date": "2025-08-31", "_discovered": true }, { "name": "cyankiwi/NVIDIA-Nemotron-Nano-12B-v2-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "12.0B", "parameters_raw": 12000000000, "min_ram_gb": 4.5, "recommended_ram_gb": 9.0, "min_vram_gb": 7.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nvidia", "hf_downloads": 1114, "hf_likes": 4, "release_date": "2025-08-31", "_discovered": true }, { "name": "cyankiwi/NVIDIA-Nemotron-Nano-12B-v2-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "12.0B", "parameters_raw": 12000000000, "min_ram_gb": 8.2, "recommended_ram_gb": 16.4, "min_vram_gb": 13.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nvidia", "hf_downloads": 1030, "hf_likes": 1, "release_date": "2025-08-31", "_discovered": true }, { "name": "cyankiwi/NVIDIA-Nemotron-Nano-9B-v2-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 6.2, "recommended_ram_gb": 12.5, "min_vram_gb": 10.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nvidia", "hf_downloads": 33, "hf_likes": 0, "release_date": "2025-08-31", "_discovered": true }, { "name": "cyankiwi/Hermes-4-14B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 5.2, "recommended_ram_gb": 10.3, "min_vram_gb": 8.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 6866, "hf_likes": 4, "release_date": "2025-09-03", "_discovered": true }, { "name": "cyankiwi/Hermes-4-14B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 9.5, "recommended_ram_gb": 19.1, "min_vram_gb": 15.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 2, "hf_likes": 0, "release_date": "2025-09-03", "_discovered": true }, { "name": "cyankiwi/ERNIE-4.5-21B-A3B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "21.0B", "parameters_raw": 21000000000, "min_ram_gb": 14.2, "recommended_ram_gb": 28.3, "min_vram_gb": 23.6, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "ernie4_5_moe", "hf_downloads": 10, "hf_likes": 4, "release_date": "2025-09-09", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/ERNIE-4.5-21B-A3B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "21.0B", "parameters_raw": 21000000000, "min_ram_gb": 7.6, "recommended_ram_gb": 15.2, "min_vram_gb": 12.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "ernie4_5_moe", "hf_downloads": 89, "hf_likes": 4, "release_date": "2025-09-09", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Jan-v1-2509-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "1.3B", "parameters_raw": 1345814520, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 4, "hf_likes": 1, "release_date": "2025-09-09", "_discovered": true }, { "name": "cyankiwi/Tongyi-DeepResearch-30B-A3B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 358, "hf_likes": 4, "release_date": "2025-09-17", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Tongyi-DeepResearch-30B-A3B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 11, "hf_likes": 4, "release_date": "2025-09-17", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Magistral-Small-2509-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "5.3B", "parameters_raw": 5254958640, "min_ram_gb": 2.1, "recommended_ram_gb": 4.2, "min_vram_gb": 3.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 271, "hf_likes": 3, "release_date": "2025-09-20", "_discovered": true }, { "name": "cyankiwi/Magistral-Small-2509-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8033685040, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 0, "hf_likes": 1, "release_date": "2025-09-20", "_discovered": true }, { "name": "cyankiwi/Qwen3-Next-80B-A3B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "80.0B", "parameters_raw": 80000000000, "min_ram_gb": 53.1, "recommended_ram_gb": 106.2, "min_vram_gb": 88.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 80, "hf_likes": 5, "release_date": "2025-09-23", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-Next-80B-A3B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "80.0B", "parameters_raw": 80000000000, "min_ram_gb": 53.1, "recommended_ram_gb": 106.2, "min_vram_gb": 88.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 74, "hf_likes": 4, "release_date": "2025-09-23", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/KAT-Dev-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "6.4B", "parameters_raw": 6432380800, "min_ram_gb": 2.5, "recommended_ram_gb": 5.0, "min_vram_gb": 4.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-09-28", "_discovered": true }, { "name": "cyankiwi/KAT-Dev-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "10.3B", "parameters_raw": 10333083520, "min_ram_gb": 7.1, "recommended_ram_gb": 14.3, "min_vram_gb": 11.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 2, "hf_likes": 0, "release_date": "2025-09-28", "_discovered": true }, { "name": "cyankiwi/cwm-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "6.4B", "parameters_raw": 6421224320, "min_ram_gb": 2.5, "recommended_ram_gb": 5.0, "min_vram_gb": 4.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 7, "hf_likes": 1, "release_date": "2025-09-28", "_discovered": true }, { "name": "cyankiwi/cwm-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "10.3B", "parameters_raw": 10296761216, "min_ram_gb": 7.1, "recommended_ram_gb": 14.2, "min_vram_gb": 11.8, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 2, "hf_likes": 0, "release_date": "2025-09-28", "_discovered": true }, { "name": "cyankiwi/Qwen3-Omni-30B-A3B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "qwen3_omni_moe", "hf_downloads": 7136, "hf_likes": 8, "release_date": "2025-09-28", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-Omni-30B-A3B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "qwen3_omni_moe", "hf_downloads": 486, "hf_likes": 1, "release_date": "2025-09-29", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-Omni-30B-A3B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "qwen3_omni_moe", "hf_downloads": 2081, "hf_likes": 7, "release_date": "2025-09-29", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-Omni-30B-A3B-Captioner-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "qwen3_omni_moe", "hf_downloads": 660, "hf_likes": 7, "release_date": "2025-10-01", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-Omni-30B-A3B-Captioner-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "qwen3_omni_moe", "hf_downloads": 12, "hf_likes": 0, "release_date": "2025-10-01", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Apriel-1.5-15b-Thinker-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "15.0B", "parameters_raw": 15000000000, "min_ram_gb": 5.5, "recommended_ram_gb": 11.0, "min_vram_gb": 9.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llava", "hf_downloads": 5, "hf_likes": 2, "release_date": "2025-10-02", "_discovered": true }, { "name": "cyankiwi/Apriel-1.5-15b-Thinker-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "15.0B", "parameters_raw": 15000000000, "min_ram_gb": 10.2, "recommended_ram_gb": 20.4, "min_vram_gb": 17.0, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llava", "hf_downloads": 0, "hf_likes": 1, "release_date": "2025-10-02", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-30B-A3B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl_moe", "hf_downloads": 19000, "hf_likes": 5, "release_date": "2025-10-06", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-VL-30B-A3B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl_moe", "hf_downloads": 205, "hf_likes": 3, "release_date": "2025-10-07", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-VL-30B-A3B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl_moe", "hf_downloads": 16, "hf_likes": 4, "release_date": "2025-10-07", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/granite-4.0-h-micro-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "0.9B", "parameters_raw": 878516304, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.0, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granitemoehybrid", "hf_downloads": 44, "hf_likes": 0, "release_date": "2025-10-08", "_discovered": true }, { "name": "cyankiwi/granite-4.0-h-micro-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "1.3B", "parameters_raw": 1251612752, "min_ram_gb": 1.1, "recommended_ram_gb": 2.3, "min_vram_gb": 1.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granitemoehybrid", "hf_downloads": 52, "hf_likes": 0, "release_date": "2025-10-08", "_discovered": true }, { "name": "cyankiwi/KAT-Dev-72B-Exp-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "72.0B", "parameters_raw": 72000000000, "min_ram_gb": 25.4, "recommended_ram_gb": 50.8, "min_vram_gb": 42.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1, "hf_likes": 2, "release_date": "2025-10-11", "_discovered": true }, { "name": "cyankiwi/granite-4.0-h-tiny-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "2.8B", "parameters_raw": 2752073520, "min_ram_gb": 2.1, "recommended_ram_gb": 4.2, "min_vram_gb": 3.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granitemoehybrid", "hf_downloads": 326, "hf_likes": 0, "release_date": "2025-10-13", "_discovered": true }, { "name": "cyankiwi/granite-4.0-h-small-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "9.7B", "parameters_raw": 9686022896, "min_ram_gb": 3.7, "recommended_ram_gb": 7.3, "min_vram_gb": 6.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granitemoehybrid", "hf_downloads": 78, "hf_likes": 1, "release_date": "2025-10-13", "_discovered": true }, { "name": "cyankiwi/granite-4.0-h-small-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "13.1B", "parameters_raw": 13083409136, "min_ram_gb": 8.9, "recommended_ram_gb": 17.9, "min_vram_gb": 14.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granitemoehybrid", "hf_downloads": 1, "hf_likes": 1, "release_date": "2025-10-13", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-8B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 2351, "hf_likes": 4, "release_date": "2025-10-14", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-8B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 847, "hf_likes": 2, "release_date": "2025-10-14", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-8B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 67, "hf_likes": 4, "release_date": "2025-10-14", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-4B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 199, "hf_likes": 3, "release_date": "2025-10-14", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-4B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 9, "hf_likes": 0, "release_date": "2025-10-14", "_discovered": true }, { "name": "cyankiwi/LFM2-8B-A1B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 34, "hf_likes": 1, "release_date": "2025-10-20", "_discovered": true, "is_moe": true, "active_parameters": 1000000000 }, { "name": "cyankiwi/LFM2-8B-A1B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 8, "hf_likes": 0, "release_date": "2025-10-20", "_discovered": true, "is_moe": true, "active_parameters": 1000000000 }, { "name": "cyankiwi/Qwen3-VL-32B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 11.5, "recommended_ram_gb": 22.9, "min_vram_gb": 19.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 6631, "hf_likes": 5, "release_date": "2025-10-21", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-32B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 11.5, "recommended_ram_gb": 22.9, "min_vram_gb": 19.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 112, "hf_likes": 2, "release_date": "2025-10-21", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-32B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 21.4, "recommended_ram_gb": 42.8, "min_vram_gb": 35.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 502, "hf_likes": 1, "release_date": "2025-10-22", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-32B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 21.4, "recommended_ram_gb": 42.8, "min_vram_gb": 35.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 898, "hf_likes": 3, "release_date": "2025-10-22", "_discovered": true }, { "name": "cyankiwi/JanusCoder-14B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 5.2, "recommended_ram_gb": 10.3, "min_vram_gb": 8.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-10-29", "_discovered": true }, { "name": "cyankiwi/JanusCoder-14B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 9.5, "recommended_ram_gb": 19.1, "min_vram_gb": 15.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-10-29", "_discovered": true }, { "name": "cyankiwi/JanusCoder-8B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-10-29", "_discovered": true }, { "name": "cyankiwi/JanusCoder-8B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-10-29", "_discovered": true }, { "name": "cyankiwi/Qwen3-Nemotron-32B-RLBFF-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 11.5, "recommended_ram_gb": 22.9, "min_vram_gb": 19.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 2, "hf_likes": 0, "release_date": "2025-10-30", "_discovered": true }, { "name": "cyankiwi/Qwen3-Nemotron-32B-RLBFF-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 21.4, "recommended_ram_gb": 42.8, "min_vram_gb": 35.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 0, "hf_likes": 0, "release_date": "2025-10-30", "_discovered": true }, { "name": "cyankiwi/Kimi-Linear-48B-A3B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "48.0B", "parameters_raw": 48000000000, "min_ram_gb": 17.0, "recommended_ram_gb": 34.0, "min_vram_gb": 28.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "kimi_linear", "hf_downloads": 1653, "hf_likes": 18, "release_date": "2025-10-30", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Kimi-Linear-48B-A3B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "48.0B", "parameters_raw": 48000000000, "min_ram_gb": 32.0, "recommended_ram_gb": 64.0, "min_vram_gb": 53.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "kimi_linear", "hf_downloads": 45, "hf_likes": 4, "release_date": "2025-10-31", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/MiniMax-M2-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "36.8B", "parameters_raw": 36811839984, "min_ram_gb": 13.1, "recommended_ram_gb": 26.3, "min_vram_gb": 21.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 69, "hf_likes": 4, "release_date": "2025-11-10", "_discovered": true }, { "name": "cyankiwi/ERNIE-4.5-VL-28B-A3B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "28.0B", "parameters_raw": 28000000000, "min_ram_gb": 10.0, "recommended_ram_gb": 20.0, "min_vram_gb": 16.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "ernie4_5_moe_vl", "hf_downloads": 24, "hf_likes": 12, "release_date": "2025-11-13", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/ERNIE-4.5-VL-28B-A3B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "28.0B", "parameters_raw": 28000000000, "min_ram_gb": 18.8, "recommended_ram_gb": 37.6, "min_vram_gb": 31.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "ernie4_5_moe_vl", "hf_downloads": 21, "hf_likes": 3, "release_date": "2025-11-13", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/MiniMax-M2-REAP-162B-A10B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "162.0B", "parameters_raw": 162000000000, "min_ram_gb": 56.7, "recommended_ram_gb": 113.4, "min_vram_gb": 94.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 55, "hf_likes": 4, "release_date": "2025-11-18", "_discovered": true, "is_moe": true, "active_parameters": 10000000000 }, { "name": "cyankiwi/MiroThinker-v1.0-72B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "72.0B", "parameters_raw": 72000000000, "min_ram_gb": 25.4, "recommended_ram_gb": 50.8, "min_vram_gb": 42.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 5, "hf_likes": 4, "release_date": "2025-11-18", "_discovered": true }, { "name": "cyankiwi/MiroThinker-v1.0-30B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 35, "hf_likes": 2, "release_date": "2025-11-18", "_discovered": true }, { "name": "cyankiwi/MiroThinker-v1.0-30B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 16, "hf_likes": 0, "release_date": "2025-11-19", "_discovered": true }, { "name": "cyankiwi/MiroThinker-v1.0-72B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "72.0B", "parameters_raw": 72000000000, "min_ram_gb": 47.8, "recommended_ram_gb": 95.6, "min_vram_gb": 79.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-11-19", "_discovered": true }, { "name": "cyankiwi/Jan-v2-VL-high-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "2.9B", "parameters_raw": 2906632936, "min_ram_gb": 1.3, "recommended_ram_gb": 2.6, "min_vram_gb": 2.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 3, "hf_likes": 2, "release_date": "2025-11-20", "_discovered": true }, { "name": "cyankiwi/Jan-v2-VL-high-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "3.8B", "parameters_raw": 3774853864, "min_ram_gb": 2.8, "recommended_ram_gb": 5.6, "min_vram_gb": 4.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 6, "hf_likes": 1, "release_date": "2025-11-20", "_discovered": true }, { "name": "cyankiwi/Olmo-3-32B-Think-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 11.5, "recommended_ram_gb": 22.9, "min_vram_gb": 19.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 172, "hf_likes": 2, "release_date": "2025-11-20", "_discovered": true }, { "name": "cyankiwi/Olmo-3-32B-Think-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 21.4, "recommended_ram_gb": 42.8, "min_vram_gb": 35.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-11-20", "_discovered": true }, { "name": "cyankiwi/GLM-4.5-Air-Derestricted-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "18.6B", "parameters_raw": 18626406504, "min_ram_gb": 6.8, "recommended_ram_gb": 13.6, "min_vram_gb": 11.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 650, "hf_likes": 3, "release_date": "2025-11-28", "_discovered": true }, { "name": "cyankiwi/GLM-4.5-Air-Derestricted-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "31.7B", "parameters_raw": 31696906344, "min_ram_gb": 21.2, "recommended_ram_gb": 42.5, "min_vram_gb": 35.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 21, "hf_likes": 1, "release_date": "2025-11-28", "_discovered": true }, { "name": "cyankiwi/INTELLECT-3-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "18.6B", "parameters_raw": 18626406504, "min_ram_gb": 6.8, "recommended_ram_gb": 13.6, "min_vram_gb": 11.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 27, "hf_likes": 3, "release_date": "2025-11-29", "_discovered": true }, { "name": "cyankiwi/INTELLECT-3-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "31.7B", "parameters_raw": 31696906344, "min_ram_gb": 21.2, "recommended_ram_gb": 42.5, "min_vram_gb": 35.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 14, "hf_likes": 2, "release_date": "2025-11-29", "_discovered": true }, { "name": "cyankiwi/Nemotron-Orchestrator-8B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 437, "hf_likes": 3, "release_date": "2025-12-03", "_discovered": true }, { "name": "cyankiwi/Nemotron-Orchestrator-8B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 28296, "hf_likes": 4, "release_date": "2025-12-03", "_discovered": true }, { "name": "cyankiwi/Trinity-Mini-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "5.0B", "parameters_raw": 5049586220, "min_ram_gb": 2.0, "recommended_ram_gb": 4.1, "min_vram_gb": 3.4, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "afmoe", "hf_downloads": 16, "hf_likes": 0, "release_date": "2025-12-03", "_discovered": true }, { "name": "cyankiwi/Trinity-Mini-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.2B", "parameters_raw": 8171721260, "min_ram_gb": 5.7, "recommended_ram_gb": 11.4, "min_vram_gb": 9.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "afmoe", "hf_downloads": 54, "hf_likes": 1, "release_date": "2025-12-03", "_discovered": true }, { "name": "cyankiwi/Hermes-4.3-36B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "36.0B", "parameters_raw": 36000000000, "min_ram_gb": 24.1, "recommended_ram_gb": 48.1, "min_vram_gb": 40.1, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "seed_oss", "hf_downloads": 96, "hf_likes": 0, "release_date": "2025-12-03", "_discovered": true }, { "name": "cyankiwi/Hermes-4.3-36B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "36.0B", "parameters_raw": 36000000000, "min_ram_gb": 12.8, "recommended_ram_gb": 25.7, "min_vram_gb": 21.4, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "seed_oss", "hf_downloads": 1560, "hf_likes": 1, "release_date": "2025-12-03", "_discovered": true }, { "name": "cyankiwi/Ministral-3-8B-Instruct-2512-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 44802, "hf_likes": 2, "release_date": "2025-12-04", "_discovered": true }, { "name": "cyankiwi/Ministral-3-8B-Instruct-2512-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 222, "hf_likes": 1, "release_date": "2025-12-04", "_discovered": true }, { "name": "cyankiwi/Ministral-3-8B-Reasoning-2512-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 201, "hf_likes": 0, "release_date": "2025-12-04", "_discovered": true }, { "name": "cyankiwi/Ministral-3-8B-Reasoning-2512-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 91, "hf_likes": 1, "release_date": "2025-12-04", "_discovered": true }, { "name": "cyankiwi/Ministral-3-14B-Instruct-2512-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 5.2, "recommended_ram_gb": 10.3, "min_vram_gb": 8.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 11586, "hf_likes": 6, "release_date": "2025-12-04", "_discovered": true }, { "name": "cyankiwi/Ministral-3-14B-Instruct-2512-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 9.5, "recommended_ram_gb": 19.1, "min_vram_gb": 15.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 73, "hf_likes": 0, "release_date": "2025-12-04", "_discovered": true }, { "name": "cyankiwi/Ministral-3-14B-Reasoning-2512-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 5.2, "recommended_ram_gb": 10.3, "min_vram_gb": 8.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 136375, "hf_likes": 1, "release_date": "2025-12-04", "_discovered": true }, { "name": "cyankiwi/Ministral-3-14B-Reasoning-2512-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 9.5, "recommended_ram_gb": 19.1, "min_vram_gb": 15.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 193, "hf_likes": 0, "release_date": "2025-12-04", "_discovered": true }, { "name": "cyankiwi/Ministral-3-3B-Instruct-2512-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "3.0B", "parameters_raw": 3000000000, "min_ram_gb": 1.3, "recommended_ram_gb": 2.6, "min_vram_gb": 2.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 429, "hf_likes": 0, "release_date": "2025-12-05", "_discovered": true }, { "name": "cyankiwi/Ministral-3-3B-Instruct-2512-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "3.0B", "parameters_raw": 3000000000, "min_ram_gb": 2.3, "recommended_ram_gb": 4.6, "min_vram_gb": 3.8, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 80, "hf_likes": 1, "release_date": "2025-12-05", "_discovered": true }, { "name": "cyankiwi/Ministral-3-3B-Reasoning-2512-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "3.0B", "parameters_raw": 3000000000, "min_ram_gb": 1.3, "recommended_ram_gb": 2.6, "min_vram_gb": 2.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 44, "hf_likes": 0, "release_date": "2025-12-05", "_discovered": true }, { "name": "cyankiwi/Ministral-3-3B-Reasoning-2512-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "3.0B", "parameters_raw": 3000000000, "min_ram_gb": 2.3, "recommended_ram_gb": 4.6, "min_vram_gb": 3.8, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 41, "hf_likes": 0, "release_date": "2025-12-05", "_discovered": true }, { "name": "cyankiwi/rnj-1-instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "2.3B", "parameters_raw": 2267558336, "min_ram_gb": 1.1, "recommended_ram_gb": 2.2, "min_vram_gb": 1.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma3_text", "hf_downloads": 3, "hf_likes": 2, "release_date": "2025-12-06", "_discovered": true }, { "name": "cyankiwi/rnj-1-instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "3.2B", "parameters_raw": 3240636864, "min_ram_gb": 2.5, "recommended_ram_gb": 4.9, "min_vram_gb": 4.1, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "gemma3_text", "hf_downloads": 10, "hf_likes": 1, "release_date": "2025-12-06", "_discovered": true }, { "name": "cyankiwi/GLM-4.6V-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "19.5B", "parameters_raw": 19485088360, "min_ram_gb": 7.1, "recommended_ram_gb": 14.2, "min_vram_gb": 11.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "glm4v_moe", "hf_downloads": 1412, "hf_likes": 12, "release_date": "2025-12-08", "_discovered": true }, { "name": "cyankiwi/GLM-4.6V-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.6B", "parameters_raw": 32555588200, "min_ram_gb": 21.8, "recommended_ram_gb": 43.6, "min_vram_gb": 36.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "glm4v_moe", "hf_downloads": 22, "hf_likes": 1, "release_date": "2025-12-08", "_discovered": true }, { "name": "cyankiwi/GLM-4.6V-Flash-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "3.4B", "parameters_raw": 3409531872, "min_ram_gb": 1.5, "recommended_ram_gb": 3.0, "min_vram_gb": 2.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "glm4v", "hf_downloads": 1157, "hf_likes": 2, "release_date": "2025-12-08", "_discovered": true }, { "name": "cyankiwi/GLM-4.6V-Flash-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "4.4B", "parameters_raw": 4429272032, "min_ram_gb": 3.2, "recommended_ram_gb": 6.5, "min_vram_gb": 5.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "glm4v", "hf_downloads": 1062, "hf_likes": 0, "release_date": "2025-12-08", "_discovered": true }, { "name": "cyankiwi/Devstral-Small-2-24B-Instruct-2512-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "24.0B", "parameters_raw": 24000000000, "min_ram_gb": 8.6, "recommended_ram_gb": 17.3, "min_vram_gb": 14.4, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "mistral3", "hf_downloads": 114314, "hf_likes": 11, "release_date": "2025-12-10", "_discovered": true }, { "name": "cyankiwi/Apriel-1.6-15b-Thinker-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "15.0B", "parameters_raw": 15000000000, "min_ram_gb": 5.5, "recommended_ram_gb": 11.0, "min_vram_gb": 9.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "llava", "hf_downloads": 130, "hf_likes": 2, "release_date": "2025-12-10", "_discovered": true }, { "name": "cyankiwi/Apriel-1.6-15b-Thinker-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "15.0B", "parameters_raw": 15000000000, "min_ram_gb": 10.2, "recommended_ram_gb": 20.4, "min_vram_gb": 17.0, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "llava", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-12-11", "_discovered": true }, { "name": "cyankiwi/Olmo-3.1-32B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 11.5, "recommended_ram_gb": 22.9, "min_vram_gb": 19.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 470, "hf_likes": 1, "release_date": "2025-12-14", "_discovered": true }, { "name": "cyankiwi/Olmo-3.1-32B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 21.4, "recommended_ram_gb": 42.8, "min_vram_gb": 35.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 2, "hf_likes": 0, "release_date": "2025-12-14", "_discovered": true }, { "name": "cyankiwi/Olmo-3.1-32B-Think-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 11.5, "recommended_ram_gb": 22.9, "min_vram_gb": 19.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 66, "hf_likes": 0, "release_date": "2025-12-14", "_discovered": true }, { "name": "cyankiwi/Olmo-3.1-32B-Think-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.0B", "parameters_raw": 32000000000, "min_ram_gb": 21.4, "recommended_ram_gb": 42.8, "min_vram_gb": 35.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "olmo3", "hf_downloads": 11, "hf_likes": 0, "release_date": "2025-12-14", "_discovered": true }, { "name": "cyankiwi/Nemotron-Cascade-14B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 5.2, "recommended_ram_gb": 10.3, "min_vram_gb": 8.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 22, "hf_likes": 1, "release_date": "2025-12-18", "_discovered": true }, { "name": "cyankiwi/Nemotron-Cascade-14B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 9.5, "recommended_ram_gb": 19.1, "min_vram_gb": 15.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 4, "hf_likes": 0, "release_date": "2025-12-18", "_discovered": true }, { "name": "cyankiwi/Nemotron-Cascade-8B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 0, "release_date": "2025-12-18", "_discovered": true }, { "name": "cyankiwi/Nemotron-Cascade-8B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 4, "hf_likes": 0, "release_date": "2025-12-18", "_discovered": true }, { "name": "cyankiwi/QwenLong-L1.5-30B-A3B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 58, "hf_likes": 2, "release_date": "2025-12-18", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Nemotron-Cascade-8B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 78, "hf_likes": 1, "release_date": "2025-12-18", "_discovered": true }, { "name": "cyankiwi/Nemotron-Cascade-8B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 5.6, "recommended_ram_gb": 11.2, "min_vram_gb": 9.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 1, "release_date": "2025-12-18", "_discovered": true }, { "name": "cyankiwi/nomos-1-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "5.3B", "parameters_raw": 5306567040, "min_ram_gb": 2.2, "recommended_ram_gb": 4.3, "min_vram_gb": 3.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 5, "hf_likes": 1, "release_date": "2025-12-23", "_discovered": true }, { "name": "cyankiwi/nomos-1-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9043691904, "min_ram_gb": 6.2, "recommended_ram_gb": 12.5, "min_vram_gb": 10.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 2, "hf_likes": 0, "release_date": "2025-12-23", "_discovered": true }, { "name": "cyankiwi/Solar-Open-100B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "100.0B", "parameters_raw": 100000000000, "min_ram_gb": 35.1, "recommended_ram_gb": 70.2, "min_vram_gb": 58.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "solar_open", "hf_downloads": 393, "hf_likes": 1, "release_date": "2026-01-01", "_discovered": true }, { "name": "cyankiwi/Solar-Open-100B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "100.0B", "parameters_raw": 100000000000, "min_ram_gb": 66.3, "recommended_ram_gb": 132.6, "min_vram_gb": 110.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "solar_open", "hf_downloads": 17, "hf_likes": 2, "release_date": "2026-01-01", "_discovered": true }, { "name": "cyankiwi/IQuest-Coder-V1-40B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "40.0B", "parameters_raw": 40000000000, "min_ram_gb": 14.2, "recommended_ram_gb": 28.4, "min_vram_gb": 23.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "iquestcoder", "hf_downloads": 33, "hf_likes": 2, "release_date": "2026-01-02", "_discovered": true }, { "name": "cyankiwi/IQuest-Coder-V1-40B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "40.0B", "parameters_raw": 40000000000, "min_ram_gb": 26.7, "recommended_ram_gb": 53.4, "min_vram_gb": 44.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "iquestcoder", "hf_downloads": 14, "hf_likes": 5, "release_date": "2026-01-02", "_discovered": true }, { "name": "cyankiwi/QwenLong-L1.5-30B-A3B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 1, "hf_likes": 1, "release_date": "2026-01-03", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/bu-30b-a3b-preview-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl_moe", "hf_downloads": 880, "hf_likes": 0, "release_date": "2026-01-05", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/bu-30b-a3b-preview-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl_moe", "hf_downloads": 3, "hf_likes": 0, "release_date": "2026-01-05", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/MiroThinker-v1.5-30B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 6, "hf_likes": 2, "release_date": "2026-01-06", "_discovered": true }, { "name": "cyankiwi/MiroThinker-v1.5-235B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "235.0B", "parameters_raw": 235000000000, "min_ram_gb": 82.1, "recommended_ram_gb": 164.2, "min_vram_gb": 136.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 7, "hf_likes": 3, "release_date": "2026-01-06", "_discovered": true }, { "name": "cyankiwi/MiroThinker-v1.5-235B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "235.0B", "parameters_raw": 235000000000, "min_ram_gb": 155.4, "recommended_ram_gb": 310.8, "min_vram_gb": 259.0, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 2, "hf_likes": 0, "release_date": "2026-01-06", "_discovered": true }, { "name": "cyankiwi/NousCoder-14B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 5.2, "recommended_ram_gb": 10.3, "min_vram_gb": 8.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 3, "hf_likes": 0, "release_date": "2026-01-08", "_discovered": true }, { "name": "cyankiwi/NousCoder-14B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "14.0B", "parameters_raw": 14000000000, "min_ram_gb": 9.5, "recommended_ram_gb": 19.1, "min_vram_gb": 15.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 1, "hf_likes": 0, "release_date": "2026-01-08", "_discovered": true }, { "name": "cyankiwi/AI21-Jamba2-Mini-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "13.5B", "parameters_raw": 13519598976, "min_ram_gb": 5.0, "recommended_ram_gb": 10.0, "min_vram_gb": 8.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "jamba", "hf_downloads": 4, "hf_likes": 0, "release_date": "2026-01-09", "_discovered": true }, { "name": "cyankiwi/AI21-Jamba2-Mini-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "19.2B", "parameters_raw": 19156743552, "min_ram_gb": 13.0, "recommended_ram_gb": 25.9, "min_vram_gb": 21.6, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "jamba", "hf_downloads": 5, "hf_likes": 1, "release_date": "2026-01-09", "_discovered": true }, { "name": "cyankiwi/IQuest-Coder-V1-40B-Loop-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "40.0B", "parameters_raw": 40000000000, "min_ram_gb": 14.2, "recommended_ram_gb": 28.4, "min_vram_gb": 23.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "iquestloopcoder", "hf_downloads": 613, "hf_likes": 4, "release_date": "2026-01-10", "_discovered": true }, { "name": "cyankiwi/IQuest-Coder-V1-40B-Loop-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "40.0B", "parameters_raw": 40000000000, "min_ram_gb": 26.7, "recommended_ram_gb": 53.4, "min_vram_gb": 44.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "iquestloopcoder", "hf_downloads": 3, "hf_likes": 0, "release_date": "2026-01-10", "_discovered": true }, { "name": "cyankiwi/Baichuan-M3-235B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "235.0B", "parameters_raw": 235000000000, "min_ram_gb": 82.1, "recommended_ram_gb": 164.2, "min_vram_gb": 136.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 5, "hf_likes": 2, "release_date": "2026-01-13", "_discovered": true }, { "name": "cyankiwi/DASD-30B-A3B-Thinking-Preview-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 0, "hf_likes": 0, "release_date": "2026-01-18", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/DASD-30B-A3B-Thinking-Preview-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 4, "hf_likes": 1, "release_date": "2026-01-18", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/AgentCPM-Explore-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "1.3B", "parameters_raw": 1345814520, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 103, "hf_likes": 1, "release_date": "2026-01-18", "_discovered": true }, { "name": "cyankiwi/AgentCPM-Explore-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "1.8B", "parameters_raw": 1799979000, "min_ram_gb": 1.5, "recommended_ram_gb": 3.0, "min_vram_gb": 2.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 5, "hf_likes": 0, "release_date": "2026-01-18", "_discovered": true }, { "name": "cyankiwi/GLM-4.7-Flash-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "32.1B", "parameters_raw": 32140559382, "min_ram_gb": 21.5, "recommended_ram_gb": 43.1, "min_vram_gb": 35.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe_lite", "hf_downloads": 225, "hf_likes": 17, "release_date": "2026-01-19", "_discovered": true }, { "name": "cyankiwi/DASD-4B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 1.7, "recommended_ram_gb": 3.4, "min_vram_gb": 2.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 4, "hf_likes": 1, "release_date": "2026-01-20", "_discovered": true }, { "name": "cyankiwi/DASD-4B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 3, "hf_likes": 0, "release_date": "2026-01-20", "_discovered": true }, { "name": "cyankiwi/Step3-VL-10B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "10.0B", "parameters_raw": 10000000000, "min_ram_gb": 3.8, "recommended_ram_gb": 7.6, "min_vram_gb": 6.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "step_robotics", "hf_downloads": 255, "hf_likes": 0, "release_date": "2026-01-23", "_discovered": true }, { "name": "cyankiwi/Step3-VL-10B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "10.0B", "parameters_raw": 10000000000, "min_ram_gb": 6.9, "recommended_ram_gb": 13.8, "min_vram_gb": 11.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "step_robotics", "hf_downloads": 33, "hf_likes": 1, "release_date": "2026-01-23", "_discovered": true }, { "name": "cyankiwi/GLM-4.7-Flash-REAP-23B-A3B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "23.0B", "parameters_raw": 23000000000, "min_ram_gb": 15.5, "recommended_ram_gb": 31.0, "min_vram_gb": 25.8, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe_lite", "hf_downloads": 53, "hf_likes": 3, "release_date": "2026-01-25", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/AgentCPM-Report-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "1.8B", "parameters_raw": 1786843584, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minicpm", "hf_downloads": 6, "hf_likes": 1, "release_date": "2026-01-26", "_discovered": true }, { "name": "cyankiwi/AgentCPM-Report-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "2.7B", "parameters_raw": 2734756288, "min_ram_gb": 2.1, "recommended_ram_gb": 4.2, "min_vram_gb": 3.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minicpm", "hf_downloads": 4, "hf_likes": 1, "release_date": "2026-01-26", "_discovered": true }, { "name": "cyankiwi/MiniMax-M2.1-REAP-172B-A10B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "172.0B", "parameters_raw": 172000000000, "min_ram_gb": 60.2, "recommended_ram_gb": 120.4, "min_vram_gb": 100.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 28, "hf_likes": 0, "release_date": "2026-02-03", "_discovered": true, "is_moe": true, "active_parameters": 10000000000 }, { "name": "cyankiwi/Qwen3-VL-2B-Instruct-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 32348, "hf_likes": 1, "release_date": "2026-02-05", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-2B-Instruct-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.6, "recommended_ram_gb": 3.2, "min_vram_gb": 2.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 83, "hf_likes": 0, "release_date": "2026-02-05", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-2B-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 438, "hf_likes": 0, "release_date": "2026-02-05", "_discovered": true }, { "name": "cyankiwi/Qwen3-VL-2B-Thinking-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.6, "recommended_ram_gb": 3.2, "min_vram_gb": 2.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_vl", "hf_downloads": 1, "hf_likes": 0, "release_date": "2026-02-05", "_discovered": true }, { "name": "cyankiwi/MiniCPM-SALA-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 1988798976, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minicpm_sala", "hf_downloads": 48, "hf_likes": 1, "release_date": "2026-02-15", "_discovered": true }, { "name": "cyankiwi/MiniCPM-SALA-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "3.1B", "parameters_raw": 3098192384, "min_ram_gb": 2.3, "recommended_ram_gb": 4.7, "min_vram_gb": 3.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minicpm_sala", "hf_downloads": 200, "hf_likes": 0, "release_date": "2026-02-15", "_discovered": true }, { "name": "cyankiwi/Nanbeige4.1-3B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "3.0B", "parameters_raw": 3000000000, "min_ram_gb": 1.3, "recommended_ram_gb": 2.6, "min_vram_gb": 2.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 271, "hf_likes": 1, "release_date": "2026-02-15", "_discovered": true }, { "name": "cyankiwi/VulnLLM-R-7B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "7.0B", "parameters_raw": 7000000000, "min_ram_gb": 2.8, "recommended_ram_gb": 5.5, "min_vram_gb": 4.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 1, "hf_likes": 0, "release_date": "2026-02-18", "_discovered": true }, { "name": "cyankiwi/VulnLLM-R-7B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "7.0B", "parameters_raw": 7000000000, "min_ram_gb": 4.9, "recommended_ram_gb": 9.8, "min_vram_gb": 8.2, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen2", "hf_downloads": 7, "hf_likes": 1, "release_date": "2026-02-18", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-397B-A17B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "397.0B", "parameters_raw": 397000000000, "min_ram_gb": 138.5, "recommended_ram_gb": 277.0, "min_vram_gb": 230.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 1389, "hf_likes": 2, "release_date": "2026-02-18", "_discovered": true, "is_moe": true, "active_parameters": 17000000000 }, { "name": "cyankiwi/INTELLECT-3.1-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "18.6B", "parameters_raw": 18626406504, "min_ram_gb": 6.8, "recommended_ram_gb": 13.6, "min_vram_gb": 11.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 13, "hf_likes": 0, "release_date": "2026-02-18", "_discovered": true }, { "name": "cyankiwi/JoyAI-LLM-Flash-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "8.3B", "parameters_raw": 8326243206, "min_ram_gb": 3.2, "recommended_ram_gb": 6.4, "min_vram_gb": 5.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 2, "hf_likes": 3, "release_date": "2026-02-18", "_discovered": true }, { "name": "cyankiwi/Qwen3-Coder-Next-REAM-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "79.7B", "parameters_raw": 79674391296, "min_ram_gb": 22.3, "recommended_ram_gb": 44.6, "min_vram_gb": 40.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "Coding", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 695, "hf_likes": 10, "release_date": "2026-02-19", "is_moe": true, "num_experts": 512, "active_experts": 10, "active_parameters": null, "_discovered": true, "format": "awq" }, { "name": "cyankiwi/INTELLECT-3.1-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "31.7B", "parameters_raw": 31696906344, "min_ram_gb": 21.2, "recommended_ram_gb": 42.5, "min_vram_gb": 35.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm4_moe", "hf_downloads": 4, "hf_likes": 0, "release_date": "2026-02-20", "_discovered": true }, { "name": "cyankiwi/JoyAI-LLM-Flash-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "14.3B", "parameters_raw": 14343480198, "min_ram_gb": 9.8, "recommended_ram_gb": 19.6, "min_vram_gb": 16.3, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "deepseek_v3", "hf_downloads": 0, "hf_likes": 0, "release_date": "2026-02-20", "_discovered": true }, { "name": "cyankiwi/Ovis2.6-30B-A3B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "ovis2_6_moe", "hf_downloads": 65, "hf_likes": 0, "release_date": "2026-02-20", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Ovis2.6-30B-A3B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "ovis2_6_moe", "hf_downloads": 241, "hf_likes": 1, "release_date": "2026-02-20", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Qwen3-Coder-Next-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "24.1B", "parameters_raw": 24108399360, "min_ram_gb": 16.2, "recommended_ram_gb": 32.4, "min_vram_gb": 27.0, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 826, "hf_likes": 5, "release_date": "2026-02-20", "_discovered": true }, { "name": "cyankiwi/MiniMax-M2.5-REAP-139B-A10B-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "139.0B", "parameters_raw": 139000000000, "min_ram_gb": 48.7, "recommended_ram_gb": 97.3, "min_vram_gb": 81.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 121866, "hf_likes": 13, "release_date": "2026-02-25", "_discovered": true, "is_moe": true, "active_parameters": 10000000000 }, { "name": "cyankiwi/LFM2-24B-A2B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "24.0B", "parameters_raw": 24000000000, "min_ram_gb": 16.1, "recommended_ram_gb": 32.3, "min_vram_gb": 26.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "lfm2_moe", "hf_downloads": 52, "hf_likes": 0, "release_date": "2026-02-25", "_discovered": true, "is_moe": true, "active_parameters": 2000000000 }, { "name": "cyankiwi/Qwen3.5-122B-A10B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "122.0B", "parameters_raw": 122000000000, "min_ram_gb": 80.8, "recommended_ram_gb": 161.6, "min_vram_gb": 134.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 4323, "hf_likes": 4, "release_date": "2026-03-01", "_discovered": true, "is_moe": true, "active_parameters": 10000000000 }, { "name": "cyankiwi/Jan-code-4b-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 1.7, "recommended_ram_gb": 3.4, "min_vram_gb": 2.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 9, "hf_likes": 0, "release_date": "2026-03-02", "_discovered": true }, { "name": "cyankiwi/Jan-code-4b-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3", "hf_downloads": 10, "hf_likes": 2, "release_date": "2026-03-02", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-9B-AWQ-BF16-INT4", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 3.4, "recommended_ram_gb": 6.8, "min_vram_gb": 5.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 8058, "hf_likes": 7, "release_date": "2026-03-02", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-2B-AWQ-BF16-INT4", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 1.7, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 210, "hf_likes": 1, "release_date": "2026-03-02", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-2B-AWQ-BF16-INT8", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.6, "recommended_ram_gb": 3.2, "min_vram_gb": 2.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 828, "hf_likes": 1, "release_date": "2026-03-02", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-4B-AWQ-BF16-INT8", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 4421, "hf_likes": 3, "release_date": "2026-03-02", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-9B-AWQ-BF16-INT8", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 6.2, "recommended_ram_gb": 12.5, "min_vram_gb": 10.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 20406, "hf_likes": 0, "release_date": "2026-03-02", "_discovered": true }, { "name": "cyankiwi/GLM-5-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "766.9B", "parameters_raw": 766947340782, "min_ram_gb": 267.2, "recommended_ram_gb": 534.4, "min_vram_gb": 445.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm_moe_dsa", "hf_downloads": 2, "hf_likes": 0, "release_date": "2026-03-06", "_discovered": true }, { "name": "cyankiwi/SVD-Qwen3-Coder-Next-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "14.4B", "parameters_raw": 14444722944, "min_ram_gb": 5.3, "recommended_ram_gb": 10.7, "min_vram_gb": 8.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_next", "hf_downloads": 30, "hf_likes": 2, "release_date": "2026-03-09", "_discovered": true }, { "name": "cyankiwi/OmniCoder-9B-AWQ-BF16-INT8", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 6.2, "recommended_ram_gb": 12.5, "min_vram_gb": 10.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_5", "hf_downloads": 132, "hf_likes": 1, "release_date": "2026-03-14", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-27B-AWQ-INT8-INT4", "provider": "cyankiwi", "parameter_count": "27.0B", "parameters_raw": 27000000000, "min_ram_gb": 18.1, "recommended_ram_gb": 36.2, "min_vram_gb": 30.2, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 531, "hf_likes": 2, "release_date": "2026-03-29", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-9B-AWQ-INT8-INT4", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9000000000, "min_ram_gb": 6.2, "recommended_ram_gb": 12.5, "min_vram_gb": 10.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 3925, "hf_likes": 2, "release_date": "2026-03-29", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-4B-AWQ-INT8-INT4", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 20289, "hf_likes": 2, "release_date": "2026-03-29", "_discovered": true }, { "name": "cyankiwi/Qwen3.5-2B-AWQ-INT8-INT4", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.6, "recommended_ram_gb": 3.2, "min_vram_gb": 2.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 397, "hf_likes": 1, "release_date": "2026-03-29", "_discovered": true }, { "name": "cyankiwi/MiroThinker-1.7-mini-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "5.3B", "parameters_raw": 5306567040, "min_ram_gb": 2.2, "recommended_ram_gb": 4.3, "min_vram_gb": 3.6, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 44, "hf_likes": 1, "release_date": "2026-04-01", "_discovered": true }, { "name": "cyankiwi/MiroThinker-1.7-mini-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "9.0B", "parameters_raw": 9043691904, "min_ram_gb": 6.2, "recommended_ram_gb": 12.5, "min_vram_gb": 10.4, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "qwen3_moe", "hf_downloads": 3, "hf_likes": 0, "release_date": "2026-04-01", "_discovered": true }, { "name": "cyankiwi/gemma-4-26B-A4B-it-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "26.0B", "parameters_raw": 26000000000, "min_ram_gb": 17.5, "recommended_ram_gb": 34.9, "min_vram_gb": 29.1, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "gemma4", "hf_downloads": 291580, "hf_likes": 8, "release_date": "2026-04-03", "_discovered": true, "is_moe": true, "active_parameters": 4000000000 }, { "name": "cyankiwi/Nemotron-Cascade-2-30B-A3B-AWQ-8bit", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 20.1, "recommended_ram_gb": 40.2, "min_vram_gb": 33.5, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "nvidia", "hf_downloads": 111, "hf_likes": 1, "release_date": "2026-04-08", "_discovered": true, "is_moe": true, "active_parameters": 3000000000 }, { "name": "cyankiwi/Trinity-Large-Thinking-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "65.5B", "parameters_raw": 65542882332, "min_ram_gb": 23.1, "recommended_ram_gb": 46.2, "min_vram_gb": 38.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "afmoe", "hf_downloads": 175, "hf_likes": 2, "release_date": "2026-04-08", "_discovered": true }, { "name": "cyankiwi/GLM-5.1-AWQ-4bit", "provider": "cyankiwi", "parameter_count": "766.9B", "parameters_raw": 766909554882, "min_ram_gb": 267.2, "recommended_ram_gb": 534.4, "min_vram_gb": 445.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "glm_moe_dsa", "hf_downloads": 8512, "hf_likes": 11, "release_date": "2026-04-10", "_discovered": true }, { "name": "cyankiwi/granite-4.1-8b-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granite", "hf_downloads": 1920, "hf_likes": 1, "release_date": "2026-05-01", "_discovered": true }, { "name": "cyankiwi/granite-4.1-30b-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "30.0B", "parameters_raw": 30000000000, "min_ram_gb": 10.7, "recommended_ram_gb": 21.5, "min_vram_gb": 17.9, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granite", "hf_downloads": 1318, "hf_likes": 1, "release_date": "2026-05-03", "_discovered": true }, { "name": "cyankiwi/gemma-4-E4B-it-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 1.7, "recommended_ram_gb": 3.4, "min_vram_gb": 2.8, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "gemma4", "hf_downloads": 188508, "hf_likes": 2, "release_date": "2026-05-03", "_discovered": true }, { "name": "cyankiwi/GRM-2.6-Plus-AWQ-BF16-INT4", "provider": "cyankiwi", "parameter_count": "29.0B", "parameters_raw": 28979098878, "min_ram_gb": 10.4, "recommended_ram_gb": 20.8, "min_vram_gb": 17.3, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 237, "hf_likes": 1, "release_date": "2026-05-04", "_discovered": true }, { "name": "cyankiwi/GRM-2.6-Plus-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "29.3B", "parameters_raw": 29325129246, "min_ram_gb": 10.5, "recommended_ram_gb": 21.0, "min_vram_gb": 17.5, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 1528, "hf_likes": 0, "release_date": "2026-05-04", "_discovered": true }, { "name": "cyankiwi/granite-4.1-3b-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "3.0B", "parameters_raw": 3000000000, "min_ram_gb": 1.3, "recommended_ram_gb": 2.6, "min_vram_gb": 2.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "granite", "hf_downloads": 143, "hf_likes": 0, "release_date": "2026-05-05", "_discovered": true }, { "name": "cyankiwi/gemma-4-E4B-it-AWQ-INT8", "provider": "cyankiwi", "parameter_count": "4.0B", "parameters_raw": 4000000000, "min_ram_gb": 2.9, "recommended_ram_gb": 5.9, "min_vram_gb": 4.9, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "gemma4", "hf_downloads": 9631, "hf_likes": 0, "release_date": "2026-05-06", "_discovered": true }, { "name": "cyankiwi/gemma-4-E2B-it-AWQ-INT8", "provider": "cyankiwi", "parameter_count": "2.0B", "parameters_raw": 2000000000, "min_ram_gb": 1.6, "recommended_ram_gb": 3.2, "min_vram_gb": 2.7, "quantization": "AWQ-8bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "any-to-any", "architecture": "gemma4", "hf_downloads": 242, "hf_likes": 0, "release_date": "2026-05-06", "_discovered": true }, { "name": "cyankiwi/Llama-3.3-70B-Instruct-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "70.0B", "parameters_raw": 70000000000, "min_ram_gb": 24.7, "recommended_ram_gb": 49.3, "min_vram_gb": 41.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 33, "hf_likes": 0, "release_date": "2026-05-07", "_discovered": true }, { "name": "cyankiwi/Llama-3.1-8B-Instruct-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "8.0B", "parameters_raw": 8000000000, "min_ram_gb": 3.1, "recommended_ram_gb": 6.1, "min_vram_gb": 5.1, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 149, "hf_likes": 0, "release_date": "2026-05-12", "_discovered": true }, { "name": "cyankiwi/Llama-3.2-3B-Instruct-AWQ-INT4", "provider": "cyankiwi", "parameter_count": "3.0B", "parameters_raw": 3000000000, "min_ram_gb": 1.3, "recommended_ram_gb": 2.6, "min_vram_gb": 2.2, "quantization": "AWQ-4bit", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "llama", "hf_downloads": 425, "hf_likes": 0, "release_date": "2026-05-12", "_discovered": true }, { "name": "MiniMaxAI/MiniMax-M2.7", "provider": "MiniMaxAI", "parameter_count": "228.7B", "parameters_raw": 228700000000, "min_ram_gb": 240.0, "recommended_ram_gb": 280.0, "min_vram_gb": 240.0, "quantization": "FP8", "context_length": 196608, "use_case": "Chat, reasoning, tool use", "capabilities": [ "tool_use" ], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 534825, "hf_likes": 1134, "release_date": "2026-04-09", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 13600000000 }, { "name": "bullerwins/MiniMax-M2.7-REAP-172B-fp8", "provider": "bullerwins", "parameter_count": "172B", "parameters_raw": 172000000000, "min_ram_gb": 113.8, "recommended_ram_gb": 227.6, "min_vram_gb": 189.7, "quantization": "FP8", "context_length": 32768, "use_case": "General purpose", "capabilities": [], "pipeline_tag": "text-generation", "architecture": "minimax_m2", "hf_downloads": 9, "hf_likes": 0, "release_date": "2026-04-19", "_discovered": true }, { "name": "Qwen/Qwen3.6-27B-MTP", "provider": "Qwen", "parameter_count": "27.8B", "parameters_raw": 27781427952, "min_ram_gb": 16.6, "recommended_ram_gb": 21.6, "min_vram_gb": 16.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, coding, MTP", "is_moe": false, "num_experts": null, "active_experts": null, "active_parameters": null, "architecture": "qwen3", "pipeline_tag": "text-generation", "release_date": "2026-04-01", "gguf_sources": [ { "repo": "unsloth/Qwen3.6-27B-MTP-GGUF", "provider": "unsloth" } ], "capabilities": [ "mtp" ], "_discovered": true }, { "name": "Qwen/Qwen3.6-35B-A3B-MTP", "provider": "Qwen", "parameter_count": "36.0B", "parameters_raw": 35951822704, "min_ram_gb": 21.4, "recommended_ram_gb": 27.8, "min_vram_gb": 21.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose (MoE), MTP", "is_moe": true, "num_experts": null, "active_experts": null, "active_parameters": 3000000000, "architecture": "qwen3_moe", "pipeline_tag": "text-generation", "release_date": "2026-04-01", "gguf_sources": [ { "repo": "unsloth/Qwen3.6-35B-A3B-MTP-GGUF", "provider": "unsloth" } ], "capabilities": [ "mtp" ], "_discovered": true }, { "name": "Qwen/Qwen3.5-0.8B-MTP", "provider": "Qwen", "parameter_count": "873M", "parameters_raw": 873438784, "min_ram_gb": 1.0, "recommended_ram_gb": 2.0, "min_vram_gb": 0.5, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, MTP", "capabilities": [ "mtp", "tool_use", "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 93448, "hf_likes": 208, "release_date": "2026-02-28", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-0.8B-MTP-GGUF", "provider": "unsloth" } ], "_discovered": true }, { "name": "Qwen/Qwen3.5-2B-MTP", "provider": "Qwen", "parameter_count": "2.3B", "parameters_raw": 2274069824, "min_ram_gb": 1.3, "recommended_ram_gb": 2.1, "min_vram_gb": 1.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, MTP", "capabilities": [ "mtp", "tool_use", "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 46974, "hf_likes": 115, "release_date": "2026-02-28", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-2B-MTP-GGUF", "provider": "unsloth" } ], "_discovered": true }, { "name": "Qwen/Qwen3.5-4B-MTP", "provider": "Qwen", "parameter_count": "4.7B", "parameters_raw": 4659865088, "min_ram_gb": 2.6, "recommended_ram_gb": 4.3, "min_vram_gb": 2.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, MTP", "capabilities": [ "mtp", "tool_use", "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 99087, "hf_likes": 202, "release_date": "2026-02-27", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-4B-MTP-GGUF", "provider": "unsloth" } ], "_discovered": true }, { "name": "Qwen/Qwen3.5-9B-MTP", "provider": "Qwen", "parameter_count": "9.7B", "parameters_raw": 9653104368, "min_ram_gb": 5.4, "recommended_ram_gb": 9.0, "min_vram_gb": 4.9, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, MTP", "capabilities": [ "mtp", "tool_use", "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 172298, "hf_likes": 345, "release_date": "2026-02-27", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-9B-MTP-GGUF", "provider": "unsloth" } ], "_discovered": true }, { "name": "Qwen/Qwen3.5-27B-MTP", "provider": "Qwen", "parameter_count": "27.8B", "parameters_raw": 27781427952, "min_ram_gb": 15.5, "recommended_ram_gb": 25.9, "min_vram_gb": 14.2, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, MTP", "capabilities": [ "mtp", "tool_use", "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5", "hf_downloads": 406808, "hf_likes": 565, "release_date": "2026-02-24", "gguf_sources": [ { "repo": "unsloth/Qwen3.5-27B-MTP-GGUF", "provider": "unsloth" } ], "_discovered": true }, { "name": "Qwen/Qwen3.5-35B-A3B-MTP", "provider": "Qwen", "parameter_count": "36.0B", "parameters_raw": 35951822704, "min_ram_gb": 20.1, "recommended_ram_gb": 33.5, "min_vram_gb": 18.4, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, MTP", "capabilities": [ "mtp", "tool_use", "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 769032, "hf_likes": 905, "release_date": "2026-02-24", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 3000000000, "gguf_sources": [ { "repo": "unsloth/Qwen3.5-35B-A3B-MTP-GGUF", "provider": "unsloth" } ], "_discovered": true }, { "name": "Qwen/Qwen3.5-122B-A10B-MTP", "provider": "Qwen", "parameter_count": "125.1B", "parameters_raw": 125086497008, "min_ram_gb": 69.9, "recommended_ram_gb": 116.5, "min_vram_gb": 64.1, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, MTP", "capabilities": [ "mtp", "tool_use", "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 171055, "hf_likes": 389, "release_date": "2026-02-24", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 10000000000, "gguf_sources": [ { "repo": "unsloth/Qwen3.5-122B-A10B-MTP-GGUF", "provider": "unsloth" } ], "_discovered": true }, { "name": "Qwen/Qwen3.5-397B-A17B-MTP", "provider": "Qwen", "parameter_count": "403.4B", "parameters_raw": 403397928944, "min_ram_gb": 225.4, "recommended_ram_gb": 375.7, "min_vram_gb": 206.6, "quantization": "Q4_K_M", "context_length": 262144, "use_case": "General purpose, MTP", "capabilities": [ "mtp", "tool_use", "vision" ], "pipeline_tag": "image-text-to-text", "architecture": "qwen3_5_moe", "hf_downloads": 1291825, "hf_likes": 1214, "release_date": "2026-02-16", "is_moe": true, "num_experts": 256, "active_experts": 8, "active_parameters": 17000000000, "gguf_sources": [ { "repo": "unsloth/Qwen3.5-397B-A17B-MTP-GGUF", "provider": "unsloth" } ], "_discovered": true } ]