3.6.0 update (#2005)
* 3.6.0 update * doc and swap stuff --------- Co-authored-by: yuzhai <yuzhai@nvidia.com> Co-authored-by: Haicheng Wu <haichengw@nvidia.com>
This commit is contained in:
@ -100,7 +100,7 @@ void
|
||||
copy(Tensor<TA, ALayout> const& src, // Any logical shape
|
||||
Tensor<TB, BLayout> & dst) // Any logical shape
|
||||
{
|
||||
for (int i = 0; i < size(src); ++i) {
|
||||
for (int i = 0; i < size(dst); ++i) {
|
||||
dst(i) = src(i);
|
||||
}
|
||||
}
|
||||
|
||||
@ -185,7 +185,6 @@ $ cmake .. -DCUTLASS_NVCC_ARCHS=90a # compiles for NVIDIA Hopper GP
|
||||
```
|
||||
|
||||
**NVIDIA Ampere Architecture.**
|
||||
|
||||
```bash
|
||||
$ cmake .. -DCUTLASS_NVCC_ARCHS=80 # compiles for NVIDIA Ampere GPU architecture
|
||||
```
|
||||
|
||||
Reference in New Issue
Block a user