We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 48c9a35 · commit 86aaf3c · Copy full SHA for 86aaf3c
src/tl_templates/cuda/common.h
@@ -18,6 +18,8 @@ using int4_t = int4;
18
#define hexp cutlass::fast_exp
19
#define hlog cutlass::fast_log
20
#define hsqrt cutlass::fast_sqrt
21
+#define hsin cutlass::fast_sin
22
+#define hcos cutlass::fast_cos
23
#define htanh cutlass::fast_tanh
24
#define hpow powf
25
0 commit comments