diff --git a/server/text_generation_server/utils/gptq/quantize.py b/server/text_generation_server/utils/gptq/quantize.py index d379e5f3..abde0b02 100644 --- a/server/text_generation_server/utils/gptq/quantize.py +++ b/server/text_generation_server/utils/gptq/quantize.py @@ -15,7 +15,7 @@ import numpy as np import torch from text_generation_server.utils.gptq.quant_linear import QuantLinear from loguru import logger -from typings import Optional +from typing import Optional DEV = torch.device("cuda:0")