Skip to content

Commit

Permalink
After rebase.
Browse files (browse the repository at this point in the history)
  • Loading branch information
Narsil committed Jul 25, 2023
1 parent 95583ee commit 0635d0e
Showing 1 changed file with 2 additions and 5 deletions.
7 changes: 2 additions & 5 deletions server/text_generation_server/utils/weights.py
Original file line number | Diff line number | Diff line change
@@ -187,11 +187,8 @@ def get_multi_weights_row(self, prefix: str, quantize: str):
qzeros = self.get_sharded(f"{prefix}.qzeros", dim=0)
scales = self.get_sharded(f"{prefix}.scales", dim=0)
else:
- raise RuntimeError(
- "Using exllama GPTQ kernel with groupsize<1 is not supported"
- )
- # qzeros = self.get_tensor(f"{prefix}.qzeros")
- # scales = self.get_tensor(f"{prefix}.scales")
+ qzeros = self.get_tensor(f"{prefix}.qzeros")
+ scales = self.get_tensor(f"{prefix}.scales")

# For tp > 1, at this point we know we do not use act-order
if self.process_group.size() == 1:
Expand Down

0 comments on commit 0635d0e

Please sign in to comment.