@@ -1776,7 +1776,7 @@ def GPU_Create2To4SpMatOp : GPU_Op<"create_2to4_spmat", [GPU_AsyncOpInterface]>
1776
1776
Index:$cols,
1777
1777
GPU_Prune2To4SpMatFlagAttr:$pruneFlag,
1778
1778
AnyMemRef:$memref);
1779
- let results = (outs Res<GPU_SparseSpMatHandle>:$spMat,
1779
+ let results = (outs Res<GPU_SparseSpMatHandle>:$spMat,
1780
1780
Optional<GPU_AsyncToken>:$asyncToken);
1781
1781
1782
1782
let assemblyFormat = [{
@@ -2176,14 +2176,14 @@ def GPU_SpGEMMWorkEstimationOrComputeKind : I32EnumAttr<"SpGEMMWorkEstimationOrC
2176
2176
let cppNamespace = GPU_Dialect.cppNamespace;
2177
2177
}
2178
2178
2179
- def GPU_SpGEMMWorkEstimationOrComputeKindAttr : EnumAttr<GPU_Dialect,
2180
- GPU_SpGEMMWorkEstimationOrComputeKind,
2179
+ def GPU_SpGEMMWorkEstimationOrComputeKindAttr : EnumAttr<GPU_Dialect,
2180
+ GPU_SpGEMMWorkEstimationOrComputeKind,
2181
2181
"spgemm_work_estimation_or_compute_kind"> {}
2182
2182
2183
2183
def GPU_SpGEMMCreateDescrOp : GPU_Op<"spgemm_create_descr", [GPU_AsyncOpInterface]> {
2184
2184
let summary = "SpGEMM Create Descr operation";
2185
2185
let description = [{
2186
- The `gpu.spgemm_create_descr` creates a descriptor for the SpGEMM operation.
2186
+ The `gpu.spgemm_create_descr` creates a descriptor for the SpGEMM operation.
2187
2187
The descriptor describes the SpGEMM operation and stores the internal data
2188
2188
throughout the computation. It needs to be passed as an argument to
2189
2189
spgemm_* operations.
@@ -2238,11 +2238,11 @@ def GPU_SpGEMMDestroyDescrOp : GPU_Op<"spgemm_destroy_descr", [GPU_AsyncOpInterf
2238
2238
def GPU_SpGEMMWorkEstimationOrComputeOp : GPU_Op<"spgemm_work_estimation_or_compute", [GPU_AsyncOpInterface]> {
2239
2239
let summary = "SpGEMM work estimation operation";
2240
2240
let description = [{
2241
- The `gpu.spgemm_work_estimation_or_compute` is used to call
2241
+ The `gpu.spgemm_work_estimation_or_compute` is used to call
2242
2242
cusparseSpGEMM_workEstimation or cusparseSpGEMM_compute. Both of them are
2243
2243
for both determining the buffer size and performing the actual computation.
2244
2244
The operation expects handles returned by previous sparse operations to
2245
- construct an environment and the operands for SpGEMM.
2245
+ construct an environment and the operands for SpGEMM.
2246
2246
The buffer must have been allocated on the device.
2247
2247
2248
2248
@@ -2256,8 +2256,8 @@ def GPU_SpGEMMWorkEstimationOrComputeOp : GPU_Op<"spgemm_work_estimation_or_comp
2256
2256
2257
2257
```mlir
2258
2258
%bufferSz, %token = gpu.spgemm_work_estimation_or_compute async [%dep]{COMPUTE}
2259
- %desc, %spmatA{NON_TRANSPOSE}, %spmatB{NON_TRANSPOSE},
2260
- %spmatC, ALG2, %spgemmDesc, %c0, %alloc: f32 into
2259
+ %desc, %spmatA{NON_TRANSPOSE}, %spmatB{NON_TRANSPOSE},
2260
+ %spmatC, ALG2, %spgemmDesc, %c0, %alloc: f32 into
2261
2261
memref<0xi8>
2262
2262
```
2263
2263
@@ -2358,8 +2358,8 @@ def GPU_SpGEMMEstimateMemoryOp : GPU_Op<"spgemm_estimate_memory", [GPU_AsyncOpIn
2358
2358
auto modeA = gpu::TransposeMode::NON_TRANSPOSE;
2359
2359
auto modeB = gpu::TransposeMode::NON_TRANSPOSE;
2360
2360
auto alg = gpu::SpGEMMAlg::ALG1;
2361
- return build($_builder, $_state, bufferSz3New, bufferSz2New, asyncToken,
2362
- asyncDependencies, desc, modeA, modeB, spmatA, spmatB, spmatC,
2361
+ return build($_builder, $_state, bufferSz3New, bufferSz2New, asyncToken,
2362
+ asyncDependencies, desc, modeA, modeB, spmatA, spmatB, spmatC,
2363
2363
computeType, alg, bufferSz3, buffer3, bufferSz2);}]>
2364
2364
];
2365
2365
@@ -2375,7 +2375,7 @@ def GPU_SpGEMMCopyOp : GPU_Op<"spgemm_copy", [GPU_AsyncOpInterface]> {
2375
2375
let description = [{
2376
2376
The `gpu.spgemm_copy` operation copies a sparse matrix, e.g., the result of
2377
2377
the SpGEMM computation.
2378
-
2378
+
2379
2379
If the `async` keyword is present, the op is executed asynchronously (i.e.
2380
2380
it does not block until the execution has finished on the device). In
2381
2381
that case, it returns a `!gpu.async.token` in addition to the environment.
@@ -2430,7 +2430,7 @@ def GPU_SpGEMMGetSizeOp : GPU_Op<"spgemm_get_size", [GPU_AsyncOpInterface]> {
2430
2430
let description = [{
2431
2431
The `gpu.spgemm_get_size` operation retrieves the number of rows, number of
2432
2432
columns, and number of non-zero elements of a sparse matrix.
2433
-
2433
+
2434
2434
If the `async` keyword is present, the op is executed asynchronously (i.e.
2435
2435
it does not block until the execution has finished on the device). In
2436
2436
that case, it returns a `!gpu.async.token` in addition to the environment.
0 commit comments