We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 9d4368d, commit af40d33 (Copy full SHA for af40d33)
vllm/model_executor/layers/quantization/utils/w8a8_utils.py
@@ -146,7 +146,8 @@ def __init__(self,
146
# as it breaks with dynamic shapes.
147
if pad_output is None:
148
config = get_current_vllm_config().compilation_config
149
- pad_output = config.level < CompilationLevel.PIECEWISE
+ pad_output = (not current_platform.is_rocm()
150
+ and config.level < CompilationLevel.PIECEWISE)
151
self.output_padding = 17 if pad_output else None
152
153
def apply(
0 commit comments