- 
		
 - 
		
 - 
		
 - 
		
 - 
		
 - 
		
 
Inference Providers
				
			 
	 
 
		
	
		Active filters: 
					awq
				 
		
			
				QuantTrio/MiniMax-M2-AWQ
				
				
			
			Text Generation
			
• 
		
				229B
			• 
	
				Updated
					
				
				• 
					
					3.12k
				
	
				
• 
					
					4
				
 
		
	
			
				QuantTrio/Qwen3-VL-30B-A3B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
				31B
			• 
	
				Updated
					
				
				• 
					
					105k
				
	
				
• 
					
					27
				
 
		
	
			
				Qwen/Qwen2.5-7B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
				2B
			• 
	
				Updated
					
				
				• 
					
					588k
				
	
				
• 
					
					32
				
 
		
	
			
				Qwen/Qwen2.5-Omni-7B-AWQ
				
				
			
			Any-to-Any
			
• 
		
				5B
			• 
	
				Updated
					
				
				• 
					
					18k
				
	
				
• 
					
					13
				
 
		
	
			
				TheBloke/LLaMA-Pro-8B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
				1B
			• 
	
				Updated
					
				
				• 
					
					217
				
	
				
• 
					
					2
				
 
		
	
			
				Qwen/Qwen1.5-72B-Chat-AWQ
				
				
			
			Text Generation
			
• 
		
				12B
			• 
	
				Updated
					
				
				• 
					
					1.29k
				
	
				
• 
					
					25
				
 
		
	
			
				nateraw/defog-sqlcoder-70b-alpha-awq
				
				
			
			Text Generation
			
• 
		
				10B
			• 
	
				Updated
					
				
				• 
					
					5
				
	
				
• 
					
					2
				
 
		
	
			
				hugging-quants/Meta-Llama-3.1-405B-Instruct-AWQ-INT4
				
				
			
			Text Generation
			
• 
		
				59B
			• 
	
				Updated
					
				
				• 
					
					781
				
	
				
• 
					
					36
				
 
		
	
			
				vessl/gemma-2-9b-mental-counselor-marlin-awq
				
				
			
		
				3B
			• 
	
				Updated
					
				
				
				
	
				• 
					
					3
				
  
		
	
			
				Qwen/Qwen2.5-3B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
				1.0B
			• 
	
				Updated
					
				
				• 
					
					68.9k
				
	
				
• 
					
					13
				
 
		
	
			
				Qwen/Qwen2.5-14B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
				3B
			• 
	
				Updated
					
				
				• 
					
					111k
				
	
				
• 
					
					26
				
 
		
	
			
				AMead10/Llama-3.2-3B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
				1B
			• 
	
				Updated
					
				
				• 
					
					794
				
	
				
• 
					
					3
				
 
		
	
			
				QuixiAI/DeepSeek-R1-AWQ
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					348
				
	
				
• 
					
					86
				
 
		
	
			
				gaunernst/gemma-3-27b-it-int4-awq
				
				
			
			Image-Text-to-Text
			
• 
		
				6B
			• 
	
				Updated
					
				
				• 
					
					19.2k
				
	
				
• 
					
					33
				
 
		
	
			
				Qwen/Qwen2.5-VL-32B-Instruct-AWQ
				
				
			
			Image-Text-to-Text
			
• 
		
				6B
			• 
	
				Updated
					
				
				• 
					
					70.4k
				
	
				
• 
					
					60
				
 
		
	
			
				Qwen/Qwen3-32B-AWQ
				
				
			
			Text Generation
			
• 
		
				6B
			• 
	
				Updated
					
				
				• 
					
					442k
				
	
				
• 
					
					113
				
 
		
	
			
				ELVISIO/Qwen3-30B-A3B-AWQ
				
				
			
		
				5B
			• 
	
				Updated
					
				
				• 
					
					435
				
	
				
• 
					
					4
				
  
		
	
			
				ReadyArt/Mistral-Small-3.1-DRAFT-0.5B-AWQ
				
				
			
			Text Generation
			
• 
		
				0.6B
			• 
	
				Updated
					
				
				• 
					
					46
				
	
				
• 
					
					1
				
 
		
	
			
				QuantTrio/Qwen3-Coder-480B-A35B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
				66B
			• 
	
				Updated
					
				
				• 
					
					1.45k
				
	
				
• 
					
					6
				
 
		
	
			
				QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ
				
				
			
			Text Generation
			
• 
		
				5B
			• 
	
				Updated
					
				
				• 
					
					2.98k
				
	
				
• 
					
					4
				
 
		
	
			
				openbmb/MiniCPM-V-4_5-AWQ
				
				
			
			Image-Text-to-Text
			
• 
		
				3B
			• 
	
				Updated
					
				
				• 
					
					5.43k
				
	
				
• 
					
					10
				
 
		
	
			
				yapwithai/orpheus-3b-trt-int4-awq
				
				
			
			Text-to-Speech
			
• 
		
	
				Updated
					
				
				
				
	
				• 
					
					2
				
 
		
	
			
				yapwithai/impish-12b-awq
				
				
			
			Text Generation
			
• 
		
				12B
			• 
	
				Updated
					
				
				• 
					
					64
				
	
				
• 
					
					1
				
 
		
	
			
				QuantTrio/Qwen3-VL-32B-Instruct-AWQ
				
				
			
			Image-Text-to-Text
			
• 
		
				33B
			• 
	
				Updated
					
				
				• 
					
					2.15k
				
	
				
• 
					
					3
				
 
		
	
			
				ModelCloud/Marin-32B-Base-GPTQMODEL-AWQ-W4A16
				
				
			
			Text Generation
			
• 
		
				33B
			• 
	
				Updated
					
				
				• 
					
					26
				
	
				
• 
					
					1
				
 
		
	
			
				casperhansen/mpt-7b-8k-chat-awq
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					5
				
	
				
• 
					
					3
				
 
		
	
			
				casperhansen/falcon-7b-awq
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				
				
	
				• 
					
					1
				
 
		
	
			
				casperhansen/vicuna-7b-v1.5-awq
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					11
				
	
				
• 
					
					3
				
 
		
	
			
				casperhansen/vicuna-7b-v1.5-awq-gemv
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					2
				
	
				
• 
					
					1
				
 
		
	
			
				casperhansen/mpt-7b-8k-chat-awq-gemv
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1