Text Generation
	
	
	
	
	Transformers
	
	
	
	
	GGUF
	
	
	
	
	Safetensors
	
	
	
	
	mistral
	
	
	
	
	quantized
	
	
	
	
	2-bit
	
	
	
	
	3-bit
	
	
	
		
	
	
		4-bit precision
	
	
	
	
	5-bit
	
	
	
	
	6-bit
	
	
	
		
	
	
		8-bit precision
	
	
	
	
	GGUF
	
	
	
	
	gemma
	
	
	
	
	conversational
	
	
	
	
	arxiv:2312.11805
	
	
	
	
	arxiv:2009.03300
	
	
	
	
	arxiv:1905.07830
	
	
	
	
	arxiv:1911.11641
	
	
	
	
	arxiv:1904.09728
	
	
	
	
	arxiv:1905.10044
	
	
	
	
	arxiv:1907.10641
	
	
	
	
	arxiv:1811.00937
	
	
	
	
	arxiv:1809.02789
	
	
	
	
	arxiv:1911.01547
	
	
	
	
	arxiv:1705.03551
	
	
	
	
	arxiv:2107.03374
	
	
	
	
	arxiv:2108.07732
	
	
	
	
	arxiv:2110.14168
	
	
	
	
	arxiv:2304.06364
	
	
	
	
	arxiv:2206.04615
	
	
	
	
	arxiv:1804.06876
	
	
	
	
	arxiv:2110.08193
	
	
	
	
	has_space
	
	
	
		
	
	text-generation-inference
	
	
