mirror of
				https://github.com/huggingface/text-generation-inference.git
				synced 2023-08-15 01:09:35 +03:00 
			
		
		
		
	Cargo fmt
This commit is contained in:
		| @@ -104,7 +104,7 @@ struct Args { | |||||||
|     num_shard: Option<usize>, |     num_shard: Option<usize>, | ||||||
|  |  | ||||||
|     /// Whether you want the model to be quantized. This will use `bitsandbytes` for |     /// Whether you want the model to be quantized. This will use `bitsandbytes` for | ||||||
|     /// quantization on the fly, or `gptq`. 4bit quantization is available through  |     /// quantization on the fly, or `gptq`. 4bit quantization is available through | ||||||
|     /// `bitsandbytes` by providing the `bitsandbytes-fp4` or `bitsandbytes-nf4` options. |     /// `bitsandbytes` by providing the `bitsandbytes-fp4` or `bitsandbytes-nf4` options. | ||||||
|     #[clap(long, env, value_enum)] |     #[clap(long, env, value_enum)] | ||||||
|     quantize: Option<Quantization>, |     quantize: Option<Quantization>, | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Nicolas Patry
					Nicolas Patry