Skip to content

Commit 2332df4

Browse files
authored
Merge pull request #30 from NVIDIA/fix_utilities_example
Fixed cutlass_utilities example.
2 parents 6877595 + cfe4b93 commit 2332df4

File tree

1 file changed

+9
-9
lines changed

1 file changed

+9
-9
lines changed

examples/02_cutlass_utilities/cutlass_utilities.cu

Lines changed: 9 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -144,18 +144,18 @@ cudaError_t Cutlass_FP16_SgemmNN(
144144
typename Gemm::Params params;
145145

146146
int result = params.initialize(
147-
M, // GEMM M dimension
148-
N, // GEMM N dimension
149-
K, // GEMM K dimension
150-
half(float(alpha)), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
151-
A, // matrix A operand
147+
M, // GEMM M dimension
148+
N, // GEMM N dimension
149+
K, // GEMM K dimension
150+
reinterpret_cast<half const &>(alpha), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
151+
A, // matrix A operand
152152
lda,
153-
B, // matrix B operand
153+
B, // matrix B operand
154154
ldb,
155-
half(float(beta)), // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
156-
C, // source matrix C
155+
reinterpret_cast<half const &>(beta), // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
156+
C, // source matrix C
157157
ldc,
158-
C, // destination matrix C (may be different memory than source C matrix)
158+
C, // destination matrix C (may be different memory than source C matrix)
159159
ldc
160160
);
161161

0 commit comments

Comments
 (0)