Updates to fused epilogue (#383)

* Enhancements and fixes to fused GEMM and Convolution epilogue.
* Need to explicitly list cudart as a unit test library dependency.
This commit is contained in:
Andrew Kerr
2021-12-17 16:04:43 -05:00
committed by GitHub
parent 4e666e1dfd
commit ec4f7e5194
24 changed files with 372 additions and 193 deletions

View File

@@ -1056,7 +1056,6 @@ def GenerateSM75_TensorOp_8832_TN(manifest, args):
min_cc = 75
max_cc = 1024
alignment_constraints = [32,]
for math_inst in math_instructions:
@@ -1136,7 +1135,6 @@ def GenerateSM75_TensorOp_8832_Interleaved(manifest, args):
min_cc = 75
max_cc = 1024
alignment_constraints = [32,]
for math_inst in math_instructions:
@@ -1907,7 +1905,6 @@ def GenerateSM80_TensorOp_16864_Interleaved(manifest, args):
min_cc = 80
max_cc = 1024
alignment_constraints = [32,]
for math_inst in math_instructions: