Skip to content

Commit ecda000

Browse files
remove atomic
1 parent fe60c8e commit ecda000

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

src/operator/contrib/multi_lamb-inl.h

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -302,10 +302,10 @@ inline void multiLAMB(const nnvm::NodeAttrs& attrs,
302 302
Tensor<xpu, 1, int> block_to_chunk(reinterpret_cast<int*>(&workspace[pos_wspace]),
303 303
Shape1(kernel_params.nchunks), s);
304 304

305-
MultiSumSqRun<xpu>(weights, kernel_params.ntensors, r1.dptr_, s);
305+
MultiSumSqRun<xpu>(weights, kernel_params.ntensors, r1.dptr_, ctx);
306 306
call_kernel1<MPDType, DType>(s, kernel_params, param, block_to_tensor.dptr_,
307 307
block_to_chunk.dptr_);
308-
MultiSumSqRun<xpu>(temp_g, kernel_params.ntensors, r2.dptr_, s);
308+
MultiSumSqRun<xpu>(temp_g, kernel_params.ntensors, r2.dptr_, ctx);
309 309
call_kernel2<MPDType, DType>(s, kernel_params, param, r1.dptr_, r2.dptr_,
310 310
block_to_tensor.dptr_, block_to_chunk.dptr_,
311 311
req[0]);

0 commit comments

Comments
 (0)