mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-08-27 20:22:09 +00:00
fix format (#564)
This commit is contained in:
parent
e014144c44
commit
5835631218
@@ -304,7 +304,8 @@ __global__ void ker_attn_softmax_bw(T *grad, const T *inp, int softmax_length) {
|
|||||||
cg::thread_block b = cg::this_thread_block();
|
cg::thread_block b = cg::this_thread_block();
|
||||||
cg::thread_block_tile<WARP_SIZE> g = cg::tiled_partition<WARP_SIZE>(b);
|
cg::thread_block_tile<WARP_SIZE> g = cg::tiled_partition<WARP_SIZE>(b);
|
||||||
|
|
||||||
for (int i = 1; i < WARP_SIZE; i <<= 1) sum += g.shfl_xor(sum, i);
|
for (int i = 1; i < WARP_SIZE; i <<= 1)
|
||||||
|
sum += g.shfl_xor(sum, i);
|
||||||
|
|
||||||
#pragma unroll
|
#pragma unroll
|
||||||
for (int i = 0; i < ITERATIONS; ++i) {
|
for (int i = 0; i < ITERATIONS; ++i) {
|
||||||
|
Loading…
Reference in New Issue
Block a user