We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ac3ed5a · commit a5464dc · Copy full SHA for a5464dc
vllm/model_executor/layers/quantization/compressed_tensors/transform/linear.py
@@ -163,7 +163,7 @@ def apply(
163
if self.output_transform is not None:
164
for part_id, (start, length) in enumerate(self.partition_ranges):
165
x[:, start : start + length] = self.output_transform(
166
- x[:, start : start + length].contiguous(), part_id=part_id
+ x[:, start : start + length].clone(), part_id=part_id
167
)
168
169
return x
0 commit comments