Skip to content

Commit

Permalink
Fixing the other pathways.
Browse files (browse the repository at this point in the history)
  • Loading branch information
Narsil committed Aug 14, 2024
1 parent c904766 commit 5c598cc
Showing 1 changed file with 13 additions and 11 deletions.
24 changes: 13 additions & 11 deletions server/text_generation_server/layers/gptq/exllamav2.py
Original file line number Diff line number Diff line change
Expand Up @@ -115,29 +115,31 @@ def ext_make_q_matrix(
  w.qweight,
  extra.q_perm,
  extra.q_invperm,
- none_tensor,
- none_tensor,
- none_tensor,
- none_tensor,
+ none_tensor, # q_scale
+ none_tensor, # q_scale_max
+ none_tensor, # q_groups
+ none_tensor, # q_group_map
  w.qzeros,
  w.scales,
  w.g_idx.cpu(),
+ none_tensor, # bias
  temp_dq,
  max_dq_rows,
  )
  # GPTQ without g_idx
  else:
  return make_q_matrix(
  w.qweight,
- none_tensor,
- none_tensor,
- none_tensor,
- none_tensor,
- none_tensor,
- none_tensor,
+ none_tensor, # q_perm
+ none_tensor, # q_invperm
+ none_tensor, # q_scale
+ none_tensor, # q_scale_max
+ none_tensor, # q_groups
+ none_tensor, # q_group_map
  w.qzeros,
  w.scales,
- none_tensor,
+ none_tensor, # g_idx
+ none_tensor, # bias
  temp_dq,
  max_dq_rows,
  )
Expand Down

0 comments on commit 5c598cc

Please sign in to comment.