Skip to content

Commit

Permalink
Fix incorrect layer device when using auto_gptq
Browse files — browse the repository at this point in the history
  • Loading branch information
ZX-ModelCloud committed Dec 21, 2024
1 parent d21256c commit d3199ea
Showing 1 changed file with 0 additions and 4 deletions.
4 changes: 0 additions & 4 deletions optimum/gptq/quantizer.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -519,8 +519,6 @@ def quantize_model(self, model: nn.Module, tokenizer: Optional[Any] = None):
blocks = recurse_getattr(model, self.block_name_to_quantize)

cur_layer_device = get_device(blocks[0])
if not is_gptqmodel_available():
cur_layer_device = 0

if not has_device_map:
# put modules from module_name_preceding_first_block on cuda or xpu or cpu
Expand Down Expand Up @@ -591,8 +589,6 @@ def store_input_hook(_, input, *args):
block = block.to(0)
layers = get_layers(block)
block_device = get_device(block)
if not is_gptqmodel_available():
block_device = 0
if isinstance(self.modules_in_block_to_quantize, list) and len(self.modules_in_block_to_quantize) > 0:
if self.true_sequential:
layers_name_list = self.modules_in_block_to_quantize
Expand Down

0 comments on commit d3199ea

Please sign in to comment.