- 
		
- 
		
- 
		
- 
		
- 
		
- 
		
Inference Providers
				
			 
		
	
		Active filters: 
					4-bit
				
			 
				MaziyarPanahi/Mistral-7B-Instruct-v0.3-GGUF
				
				
			
			Text Generation
			
• 
		
				7B
			• 
	
				Updated
					
				
				• 
					
					94.1k
				
	
				
• 
					
					126
				
 
				Qwen/Qwen3-14B-AWQ
				
				
			
			Text Generation
			
• 
		
				3B
			• 
	
				Updated
					
				
				• 
					
					126k
				
	
				
• 
					
					39
				
 
				dousery/medical-reasoning-gpt-oss-20b
				
				
			
			Text Generation
			
• 
		
				21B
			• 
	
				Updated
					
				
				• 
					
					1.76k
				
	
				
• 
					
					41
				
 
				Intel/Qwen3-Next-80B-A3B-Instruct-int4-mixed-AutoRound
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1.16k
				
	
				
• 
					
					20
				
 
				mlx-community/GLM-4.6-4bit
				
				
			
			Text Generation
			
• 
		
				353B
			• 
	
				Updated
					
				
				• 
					
					3.83k
				
	
				
• 
					
					10
				
 
				nightmedia/VCoder-120b-1.0-qx86-hi-mlx
				
				
			
			Text Generation
			
• 
		
				117B
			• 
	
				Updated
					
				
				• 
					
					82
				
	
				
• 
					
					3
				
 
				unsloth/Qwen3-VL-8B-Instruct-unsloth-bnb-4bit
				
				
			
			Image-Text-to-Text
			
• 
		
				9B
			• 
	
				Updated
					
				
				• 
					
					15.4k
				
	
				
• 
					
					6
				
 
				TheBloke/MythoMax-L2-13B-GPTQ
				
				
			
			Text Generation
			
• 
		
				2B
			• 
	
				Updated
					
				
				• 
					
					1.02k
				
	
				
• 
					
					215
				
 
				unsloth/mistral-7b-instruct-v0.3-bnb-4bit
				
				
			
			Text Generation
			
• 
		
				4B
			• 
	
				Updated
					
				
				• 
					
					44.3k
				
	
				
• 
					
					33
				
 
				MaziyarPanahi/gemma-3-1b-it-GGUF
				
				
			
			Text Generation
			
• 
		
				1.0B
			• 
	
				Updated
					
				
				• 
					
					73k
				
	
				
• 
					
					10
				
 
				Qwen/Qwen3-30B-A3B-GPTQ-Int4
				
				
			
			Text Generation
			
• 
		
				5B
			• 
	
				Updated
					
				
				• 
					
					62.4k
				
	
				
• 
					
					36
				
 
				Intel/Qwen3-30B-A3B-Thinking-2507-int4-AutoRound
				
				
			
		
				0.6B
			• 
	
				Updated
					
				
				• 
					
					1.56k
				
	
				
• 
					
					8
				
  
				QuantTrio/Qwen3-VL-235B-A22B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					5.38k
				
	
				
• 
					
					7
				
 
				QuantTrio/GLM-4.6-GPTQ-Int4-Int8Mix
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					367
				
	
				
• 
					
					2
				
 
				bullpoint/GLM-4.6-AWQ
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					3.72k
				
	
				
• 
					
					3
				
 
				Kavyaah/medical-coding-llm
				
				
			
		
				4B
			• 
	
				Updated
					
				
				• 
					
					77
				
	
				
• 
					
					4
				
  
				Edison2525/Qwen3-8B-AWQ
				
				
			
		
				8B
			• 
	
				Updated
					
				
				• 
					
					66
				
	
				
• 
					
					2
				
  
				manasmisra/GLM-4.5-Air-REAP-82B-A12B-mlx-4Bit
				
				
			
			Text Generation
			
• 
		
				82B
			• 
	
				Updated
					
				
				• 
					
					365
				
	
				
• 
					
					2
				
 
				unsloth/Qwen3-VL-2B-Instruct-unsloth-bnb-4bit
				
				
			
			Image-Text-to-Text
			
• 
		
				2B
			• 
	
				Updated
					
				
				• 
					
					583
				
	
				
• 
					
					2
				
 
				QuantTrio/Qwen3-VL-32B-Instruct-AWQ
				
				
			
			Image-Text-to-Text
			
• 
		
				33B
			• 
	
				Updated
					
				
				• 
					
					762
				
	
				
• 
					
					2
				
 
				TheBloke/Wizard-Vicuna-30B-Uncensored-GPTQ
				
				
			
			Text Generation
			
• 
		
				4B
			• 
	
				Updated
					
				
				• 
					
					558
				
	
				
• 
					
					586
				
 
				TheBloke/leo-hessianai-13B-chat-AWQ
				
				
			
			Text Generation
			
• 
		
				2B
			• 
	
				Updated
					
				
				• 
					
					35
				
	
				
• 
					
					1
				
 
				TheBloke/Psyfighter-13B-GPTQ
				
				
			
			Text Generation
			
• 
		
				2B
			• 
	
				Updated
					
				
				• 
					
					13
				
	
				
• 
					
					7
				
 
				TheBloke/Mistral-7B-Instruct-v0.2-AWQ
				
				
			
			Text Generation
			
• 
		
				1B
			• 
	
				Updated
					
				
				• 
					
					55.8k
				
	
				
• 
					
					51
				
 
				MaziyarPanahi/Mistral-7B-Instruct-Aya-101-GGUF
				
				
			
			Text Generation
			
• 
		
				7B
			• 
	
				Updated
					
				
				• 
					
					252
				
	
				
• 
					
					10
				
 
				macadeliccc/Hermes-2-Pro-Mistral-7B-AWQ
				
				
			
			Text Generation
			
• 
		
				1B
			• 
	
				Updated
					
				
				• 
					
					1
				
	
				
• 
					
					1
				
 
				unsloth/llama-3-8b-bnb-4bit
				
				
			
			Text Generation
			
• 
		
				5B
			• 
	
				Updated
					
				
				• 
					
					37.2k
				
	
				
• 
					
					202
				
 
				Qwen/Qwen1.5-110B-Chat-GPTQ-Int4
				
				
			
			Text Generation
			
• 
		
				17B
			• 
	
				Updated
					
				
				• 
					
					10.8k
				
	
				
• 
					
					18
				
 
				unsloth/Phi-3-mini-4k-instruct-bnb-4bit
				
				
			
			Text Generation
			
• 
		
				2B
			• 
	
				Updated
					
				
				• 
					
					50.1k
				
	
				
• 
					
					36
				
 
				RichardErkhov/akdeniz27_-_roberta-base-cuad-4bits
				
				
			
			Text Generation
			
• 
		
				83.6M
			• 
	
				Updated
					
				
				
				
	
				• 
					
					1