Skip to content

Commit

Permalink
Fix text-generation-server quantize
Browse files Browse the repository at this point in the history
The subcommand did not work due to some broken imports.
  • Loading branch information
danieldk committed Jun 21, 2024
1 parent bcb3faa commit dc58c33
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion server/text_generation_server/cli.py
Original file line number Diff line number Diff line change
Expand Up @@ -316,7 +316,7 @@ def quantize(
logger_level=logger_level,
json_output=json_output,
)
-from text_generation_server.utils.gptq.quantize import quantize
+from text_generation_server.layers.gptq.quantize import quantize

quantize(
model_id=model_id,
Expand Down
2 changes: 1 addition & 1 deletion server/text_generation_server/layers/gptq/quantize.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@
from accelerate import init_empty_weights
from text_generation_server.utils import initialize_torch_distributed, Weights
from text_generation_server.utils.hub import weight_files
-from text_generation_server.utils.gptq.quant_linear import QuantLinear
+from text_generation_server.layers.gptq.quant_linear import QuantLinear
from loguru import logger
from typing import Optional

Expand Down

0 comments on commit dc58c33

Please sign in to comment.