We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a0170cc commit 610027dCopy full SHA for 610027d
transformer_engine/common/comm_gemm_overlap/userbuffers/userbuffers.cu
@@ -1366,7 +1366,7 @@ __global__ void __launch_bounds__(MAX_THREADS)
1366
cfg.attrs = attribute_ub; \
1367
cfg.numAttrs = comm->sm_arch >= 9 ? 2 : 1;
1368
1369
-#if defined(__CUDA_ARCH__) && (__CUDA_ARCH__ >= 900) && (CUDART_VERSION >= 12030)
+#if (CUDART_VERSION >= 12030)
1370
#define ADD_LAUNCH_COMPLETION_EVENT(attribute_ub, comm_launch_event) \
1371
attribute_ub[2].id = cudaLaunchAttributeLaunchCompletionEvent; \
1372
attribute_ub[2].val.launchCompletionEvent.event = comm_launch_event;
0 commit comments