suppress kernel loading output (8fca9b49) · Commits · candle / Megatron-LM

megatron/fused_kernels/__init__.py

+2 −4

Original line number	Diff line number	Diff line
		@@ -69,8 +69,7 @@ def load_scaled_upper_triang_masked_softmax_fusion_kernel():
		'-U__CUDA_NO_HALF_CONVERSIONS__',
		'--expt-relaxed-constexpr',
		'--expt-extended-lambda',
		- '--use_fast_math'] + cc_flag,
		- verbose=True)
		+ '--use_fast_math'] + cc_flag)

		def load_scaled_masked_softmax_fusion_kernel():

		@@ -98,5 +97,4 @@ def load_scaled_masked_softmax_fusion_kernel():
		'-U__CUDA_NO_HALF_CONVERSIONS__',
		'--expt-relaxed-constexpr',
		'--expt-extended-lambda',
		- '--use_fast_math'] + cc_flag,
		- verbose=True)
		+ '--use_fast_math'] + cc_flag)