- 
		
 - 
		
 - 
		
 - 
		
 - 
		
 - 
		
 
Inference Providers
				
			 
	 
 
		
	
		Active filters: 
					fp8
				 
		
			
				FlorianJc/Mistral-Nemo-Instruct-2407-vllm-fp8
				
				
			
			Text Generation
			
• 
		
				12B
			• 
	
				Updated
					
				
				• 
					
					6
				
	
				
• 
					
					8
				
 
		
	
			
				mgoin/Nemotron-4-340B-Instruct-FP8-Dynamic
				
				
			
			Text Generation
			
• 
		
				341B
			• 
	
				Updated
					
				
				
				
	
				
				 
		
	
			
				RedHatAI/DeepSeek-Coder-V2-Base-FP8
				
				
			
			Text Generation
			
• 
		
				236B
			• 
	
				Updated
					
				
				• 
					
					4
				
	
				
				
 
		
	
			
				RedHatAI/DeepSeek-Coder-V2-Instruct-FP8
				
				
			
			Text Generation
			
• 
		
				236B
			• 
	
				Updated
					
				
				• 
					
					190
				
	
				
• 
					
					7
				
 
		
	
			
				mgoin/Minitron-4B-Base-FP8
				
				
			
			Text Generation
			
• 
		
				4B
			• 
	
				Updated
					
				
				• 
					
					2
				
	
				
• 
					
					3
				
 
		
	
			
				mgoin/Minitron-8B-Base-FP8
				
				
			
			Text Generation
			
• 
		
				8B
			• 
	
				Updated
					
				
				• 
					
					1
				
	
				
• 
					
					3
				
 
		
	
			
				nm-testing/Qwen2-0.5B-Instruct-FP8-SkipQKV
				
				
			
			Text Generation
			
• 
		
				0.5B
			• 
	
				Updated
					
				
				• 
					
					3.47k
				
	
				
				
 
		
	
			
				RedHatAI/Meta-Llama-3.1-8B-Instruct-FP8
				
				
			
			Text Generation
			
• 
		
				8B
			• 
	
				Updated
					
				
				• 
					
					154k
				
	
				
• 
					
					42
				
 
		
	
			
				RedHatAI/Meta-Llama-3.1-70B-Instruct-FP8-dynamic
				
				
			
			Text Generation
			
• 
		
				71B
			• 
	
				Updated
					
				
				• 
					
					1.75k
				
	
				
• 
					
					7
				
 
		
	
			
				PrimeIntellect/Meta-Llama-3.1-8B-Instruct-FP8
				
				
			
			Text Generation
			
• 
		
				8B
			• 
	
				Updated
					
				
				• 
					
					8
				
	
				
				
 
		
	
			
				RedHatAI/Meta-Llama-3.1-70B-Instruct-FP8
				
				
			
			Text Generation
			
• 
		
				71B
			• 
	
				Updated
					
				
				• 
					
					5.62k
				
	
				
• 
					
					50
				
 
		
	
			
				RedHatAI/Meta-Llama-3.1-405B-Instruct-FP8
				
				
			
			Text Generation
			
• 
		
				406B
			• 
	
				Updated
					
				
				• 
					
					692
				
	
				
• 
					
					31
				
 
		
	
			
				RedHatAI/Meta-Llama-3.1-405B-Instruct-FP8-dynamic
				
				
			
			Text Generation
			
• 
		
				406B
			• 
	
				Updated
					
				
				• 
					
					2.25k
				
	
				
• 
					
					15
				
 
		
	
			
				mgoin/Nemotron-4-340B-Base-hf-FP8
				
				
			
			Text Generation
			
• 
		
				341B
			• 
	
				Updated
					
				
				• 
					
					106
				
	
				
• 
					
					2
				
 
		
	
			
				mgoin/Nemotron-4-340B-Instruct-hf-FP8
				
				
			
			Text Generation
			
• 
		
				341B
			• 
	
				Updated
					
				
				• 
					
					2
				
	
				
• 
					
					3
				
 
		
	
			
				FlorianJc/ghost-8b-beta-vllm-fp8
				
				
			
			Text Generation
			
• 
		
				8B
			• 
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
			
				FlorianJc/Meta-Llama-3.1-8B-Instruct-vllm-fp8
				
				
			
			Text Generation
			
• 
		
				8B
			• 
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
			
				AuriAetherwiing/L3.1-8B-Celeste-V1.5-fp8-dynamic
				
				
			
			Text Generation
			
• 
		
				8B
			• 
	
				Updated
					
				
				
				
	
				
				 
		
	
			
				AuriAetherwiing/Celeste-12B-V1.6-fp8-dynamic
				
				
			
			Text Generation
			
• 
		
				12B
			• 
	
				Updated
					
				
				
				
	
				
				 
		
	
			
				AuriAetherwiing/magnum-72b-v1-fp8-dynamic
				
				
			
			Text Generation
			
• 
		
				73B
			• 
	
				Updated
					
				
				
				
	
				
				 
		
	
			
				PrimeIntellect/Meta-Llama-3.1-70B-Instruct-FP8
				
				
			
			Text Generation
			
• 
		
				71B
			• 
	
				Updated
					
				
				• 
					
					89
				
	
				
				
 
		
	
			
				RedHatAI/Meta-Llama-3.1-8B-FP8
				
				
			
			Text Generation
			
• 
		
				8B
			• 
	
				Updated
					
				
				• 
					
					8.83k
				
	
				
• 
					
					9
				
 
		
	
			
				RedHatAI/Meta-Llama-3.1-70B-FP8
				
				
			
			Text Generation
			
• 
		
				71B
			• 
	
				Updated
					
				
				• 
					
					428
				
	
				
• 
					
					2
				
 
		
	
			
				AuriAetherwiing/Llama-3-TenyxChat-DaybreakStorywriter-70B-fp8-dynamic
				
				
			
			Text Generation
			
• 
		
				71B
			• 
	
				Updated
					
				
				
				
	
				
				 
		
	
			
				Infermatic/L3-70B-Euryale-v2.1-fp8-dynamic
				
				
			
			Text Generation
			
• 
		
				71B
			• 
	
				Updated
					
				
				• 
					
					344
				
• 
			
	
				
				 
		
	
			
				RedHatAI/starcoder2-15b-FP8
				
				
			
			Text Generation
			
• 
		
				16B
			• 
	
				Updated
					
				
				• 
					
					6
				
	
				
				
 
		
	
			
				RedHatAI/starcoder2-7b-FP8
				
				
			
			Text Generation
			
• 
		
				7B
			• 
	
				Updated
					
				
				• 
					
					5
				
	
				
				
 
		
	
			
				RedHatAI/starcoder2-3b-FP8
				
				
			
			Text Generation
			
• 
		
				3B
			• 
	
				Updated
					
				
				• 
					
					6
				
	
				
				
 
		
	
			
				AuriAetherwiing/MN-12B-Celeste-V1.9-fp8-dynamic
				
				
			
			Text Generation
			
• 
		
				12B
			• 
	
				Updated
					
				
				• 
					
					2
				
	
				
				
 
		
	
			
				Svak/miquliz-120b-v2.0-FP8-Dynamic
				
				
			
			Text Generation
			
• 
		
				120B
			• 
	
				Updated
					
				
				• 
					
					1