Skip to content

Commit cdf7c1a

Browse files
aakhundov authored and facebook-github-bot committed
Add meta-functions for asynchronous_*_cumsum ops (pytorch#2028)
Summary: ATT Differential Revision: D49467255
1 parent e41a2c5 commit cdf7c1a

File tree

1 file changed

+14
-0
lines changed

1 file changed

+14
-0
lines changed

fbgemm_gpu/src/sparse_ops/sparse_ops_meta.cpp

Lines changed: 14 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -46,12 +46,26 @@ Tensor batched_unary_embeddings_forward_meta(
4646
return at::empty_symint({N, B, T}, weight.options());
4747
}
4848

49+
// Meta implementation for the "asynchronous_inclusive_cumsum" op (registered
// under the Meta dispatch key in TORCH_LIBRARY_IMPL below).
//
// No cumulative sum is computed here: the function only allocates an output
// via at::empty_symint, using the symbolic sizes and tensor options of the
// input.
//
// @param t_in  Input tensor; only its sym_sizes() and options() are read.
// @return      A new tensor with the same symbolic sizes and options as t_in.
Tensor asynchronous_inclusive_cumsum_meta(const Tensor& t_in) {
50+
return at::empty_symint(t_in.sym_sizes(), t_in.options());
51+
}
52+
53+
// Meta implementation for the "asynchronous_exclusive_cumsum" op (registered
// under the Meta dispatch key in TORCH_LIBRARY_IMPL below).
//
// No cumulative sum is computed here: the function only allocates an output
// via at::empty_symint, using the symbolic sizes and tensor options of the
// input.
//
// @param t_in  Input tensor; only its sym_sizes() and options() are read.
// @return      A new tensor with the same symbolic sizes and options as t_in.
Tensor asynchronous_exclusive_cumsum_meta(const Tensor& t_in) {
54+
return at::empty_symint(t_in.sym_sizes(), t_in.options());
55+
}
56+
4957
} // namespace
5058

5159
} // namespace fbgemm_gpu
5260

5361
TORCH_LIBRARY_IMPL(fbgemm, Meta, m) {
5462
m.impl("pack_segments", TORCH_FN(fbgemm_gpu::pack_segments_forward_meta));
63+
m.impl(
64+
"asynchronous_inclusive_cumsum",
65+
TORCH_FN(fbgemm_gpu::asynchronous_inclusive_cumsum_meta));
66+
m.impl(
67+
"asynchronous_exclusive_cumsum",
68+
TORCH_FN(fbgemm_gpu::asynchronous_exclusive_cumsum_meta));
5569
m.impl(
5670
"asynchronous_complete_cumsum",
5771
TORCH_FN(fbgemm_gpu::asynchronous_complete_cumsum_meta));

0 commit comments

Comments
 (0)