We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 67a1e18, commit d75e16f (Copy full SHA for d75e16f)
dlinfer/framework/lmdeploy_ext/quants/ascend_awq.py
@@ -137,6 +137,7 @@ def AscendMergedAwqLinear__init__(
137
replicate = tuple(False for _ in all_out_features)
138
139
self.split_section_s = all_out_features
140
+ self.is_tp = is_tp
141
elem_per_int = 32 // w_bit
142
self.split_section_wz = [size // elem_per_int for size in all_out_features]
143
0 commit comments