CUTLASS 2.2 (#96)

Adds support for NVIDIA Ampere Architecture features. CUDA 11 Toolkit recommended.
2020-06-08 16:17:35 -07:00
parent e33d90b361
commit 86931fef85
584 changed files with 51080 additions and 3373 deletions
--- a/test/unit/core/array.cu
+++ b/test/unit/core/array.cu
@@ -1,5 +1,5 @@
 /***************************************************************************************************
- * Copyright (c) 2017-2019, NVIDIA CORPORATION.  All rights reserved.
+ * Copyright (c) 2017-2020, NVIDIA CORPORATION.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without modification, are permitted
 * provided that the following conditions are met:
@@ -228,6 +228,14 @@ TEST(Array, Float16x8) {
 }
 #endif

+TEST(Array, FloatBF16x8) {
+  TestArray<cutlass::bfloat16_t, 8>().run();
+}
+
+TEST(Array, FloatTF32x4) {
+  TestArray<cutlass::tfloat32_t, 4>().run();
+}
+
 TEST(Array, Float32x4) {
  TestArray<float, 4>().run();
 }