Spaces:

bsmit1659
/

certifaier

Sleeping

Adding vllm package

ca1ecab over 1 year ago

778 Bytes

	from typing import Type

	from vllm.model_executor.layers.quantization.base_config import QuantizationConfig
	from vllm.model_executor.layers.quantization.awq import AWQConfig
	from vllm.model_executor.layers.quantization.gptq import GPTQConfig
	from vllm.model_executor.layers.quantization.squeezellm import SqueezeLLMConfig

	# Lookup table from a quantization method name (the string accepted by
	# get_quantization_config) to the config class imported above for it.
	# Supporting another method means importing its config class and adding
	# one entry here.
	_QUANTIZATION_CONFIG_REGISTRY = {
	"awq": AWQConfig,
	"gptq": GPTQConfig,
	"squeezellm": SqueezeLLMConfig,
	}


	def get_quantization_config(quantization: str) -> Type[QuantizationConfig]:
	    """Return the config class registered for a quantization method name.

	    Args:
	        quantization: Name to look up in ``_QUANTIZATION_CONFIG_REGISTRY``.

	    Returns:
	        The class stored in the registry under ``quantization`` (the class
	        itself, not an instance).

	    Raises:
	        ValueError: If ``quantization`` is not a key of the registry.
	    """
	    # Happy path first; anything not registered falls through to the error.
	    if quantization in _QUANTIZATION_CONFIG_REGISTRY:
	        return _QUANTIZATION_CONFIG_REGISTRY[quantization]
	    raise ValueError(f"Invalid quantization method: {quantization}")


	# Names exported by `from <this module> import *`: the QuantizationConfig
	# name imported above and the lookup function defined in this file. The
	# registry itself is underscore-prefixed and is not listed here.
	__all__ = [
	"QuantizationConfig",
	"get_quantization_config",
	]