We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7a16eb9 commit e6b7eae Copy full SHA for e6b7eae
vllm/model_executor/layers/layernorm.py
@@ -113,11 +113,18 @@ def forward_hpu(
113
orig_shape = x.shape
114
residual += x.view(residual.shape)
115
# Note: HPUFusedRMSNorm requires 3D tensors as inputs
116
+ residual_shape = residual.shape
117
+ if len(residual_shape) == 2:
118
+ residual = residual.unsqueeze(0)
119
x = HPUFusedRMSNorm.apply(residual, self.weight,
120
self.variance_epsilon)
- return x.view(orig_shape), residual
121
+ return x.view(orig_shape), residual.view(residual_shape)
122
123
+ orig_shape = x.shape
124
+ if len(orig_shape) == 2:
125
+ x = x.unsqueeze(0)
126
x = HPUFusedRMSNorm.apply(x, self.weight, self.variance_epsilon)
127
+ x = x.view(orig_shape)
128
return x
129
130
def forward_xpu(
0 commit comments