Skip to content

Commit 03f7546

Browse files
added TODOs
Signed-off-by: Brian Dellabetta <bdellabe@redhat.com>
1 parent a9c1cbe commit 03f7546

File tree

2 files changed

+5
-5
lines changed

2 files changed

+5
-5
lines changed

src/llmcompressor/modifiers/awq/base.py

+1
Original file line number | Diff line number | Diff line change
@@ -25,6 +25,7 @@
2525
__all__ = ["AWQModifier"]
2626

2727

28+
# TODO (Brian INFERENG-531) Add support for offloaded models
2829
class AWQModifier(Modifier):
2930
"""
3031
Implements the AWQ (Activation-aware Weight Quantization) algorithm,

src/llmcompressor/modifiers/awq/mappings.py

+4-5
Original file line number | Diff line number | Diff line change
@@ -28,8 +28,8 @@ class AWQMapping:
2828
"re:.*input_layernorm",
2929
["re:.*q_proj", "re:.*k_proj", "re:.*v_proj"],
3030
),
31-
# TODO this should only be added if v_proj/o_proj shapes match up
32-
# should we check during validation and skip if this is not the case?
31+
# TODO (Brian INFERENG-530) when resolving, only add
32+
# if v_proj/o_proj shapes match up
3333
AWQMapping("re:.*v_proj", ["re:.*o_proj"]),
3434
AWQMapping(
3535
"re:.*post_attention_layernorm",
@@ -40,9 +40,8 @@ class AWQMapping:
4040
["re:.*down_proj"],
4141
),
4242
],
43-
"Qwen": [
44-
# TODO add Qwen mappings
45-
],
43+
# TODO (Brian INFERENG-529) Add Qwen mappings
44+
# "Qwen": [ ],
4645
}
4746

4847

0 commit comments

Comments
 (0)