Skip to content

Commit 0080d5a

Browse files
committed
upd
1 parent 7c09ea8 commit 0080d5a

File tree

2 files changed

+7
-7
lines changed

2 files changed

+7
-7
lines changed

sgl-kernel/csrc/attention/cutlass_mla_kernel.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -54,13 +54,13 @@ struct IsPersistent {
54 54
static const bool value = v;
55 55
};
56 56

57-
template <typename T, typename PersistenceOption = IsPersistent<true>>
57+
template <typename T, typename PersistenceOption = IsPersistent<true> >
58 58
struct MlaSm100 {
59 59
using Element = T;
60 60
using ElementAcc = float;
61 61
using ElementOut = T;
62 62

63-
using TileShape = Shape<_128, _128, Shape<_512, _64>>;
63+
using TileShape = Shape<_128, _128, Shape<_512, _64> >;
64 64
using TileShapeH = cute::tuple_element_t<0, TileShape>;
65 65
using TileShapeD = cute::tuple_element_t<2, TileShape>;
66 66

sgl-kernel/csrc/grammar/apply_token_bitmask_inplace_cuda.cu

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -118,7 +118,7 @@ __global__ void __launch_bounds__(THREADS_PER_THREAD_BLOCK) LogitsBitmaskKernel(
118 118
}
119 119
}
120 120

121-
template <typename T, typename = std::enable_if_t<std::is_integral<T>::value>>
121+
template <typename T, typename = std::enable_if_t<std::is_integral<T>::value> >
122 122
constexpr auto CeilDiv(T numerator, T denominator) {
123 123
return (numerator + denominator - 1) / denominator;
124 124
}
@@ -142,19 +142,19 @@ void ApplyTokenBitmaskInplaceDispatchToBitsPerThread(
142 142
if (num_bits_per_thread <= 4 && kAlignment <= 4) {
143 143
const dim3 grid(CeilDiv(vocab_size, THREADS_PER_THREAD_BLOCK * 4), num_rows);
144 144
LogitsBitmaskKernel<T, PackedT, 4>
145-
<<<grid, block, 0, stream>>>(logits, bitmask, indices, vocab_size, logits_stride, bitmask_stride);
145+
<<<grid, block, 0, stream> > >(logits, bitmask, indices, vocab_size, logits_stride, bitmask_stride);
146 146
} else if (num_bits_per_thread <= 8 && kAlignment <= 8) {
147 147
const dim3 grid(CeilDiv(vocab_size, THREADS_PER_THREAD_BLOCK * 8), num_rows);
148 148
LogitsBitmaskKernel<T, PackedT, 8>
149-
<<<grid, block, 0, stream>>>(logits, bitmask, indices, vocab_size, logits_stride, bitmask_stride);
149+
<<<grid, block, 0, stream> > >(logits, bitmask, indices, vocab_size, logits_stride, bitmask_stride);
150 150
} else if (num_bits_per_thread <= 16 && kAlignment <= 16) {
151 151
const dim3 grid(CeilDiv(vocab_size, THREADS_PER_THREAD_BLOCK * 16), num_rows);
152 152
LogitsBitmaskKernel<T, PackedT, 16>
153-
<<<grid, block, 0, stream>>>(logits, bitmask, indices, vocab_size, logits_stride, bitmask_stride);
153+
<<<grid, block, 0, stream> > >(logits, bitmask, indices, vocab_size, logits_stride, bitmask_stride);
154 154
} else {
155 155
const dim3 grid(CeilDiv(vocab_size, THREADS_PER_THREAD_BLOCK * 32), num_rows);
156 156
LogitsBitmaskKernel<T, PackedT, 32>
157-
<<<grid, block, 0, stream>>>(logits, bitmask, indices, vocab_size, logits_stride, bitmask_stride);
157+
<<<grid, block, 0, stream> > >(logits, bitmask, indices, vocab_size, logits_stride, bitmask_stride);
158 158
}
159 159
}
160 160

0 commit comments

Comments (0)