// RUN: mlir-opt %s -convert-linalg-to-loops | FileCheck %s

// Test that we can lower all the way to LLVM without crashing, don't check results here.
// RUN: mlir-opt %s --convert-linalg-to-llvm -o=/dev/null 2>&1

// NOTE(review): every `memref` type in this file appears to have lost its
// `<...>` parameter list (shape, element type, layout); a bare `memref` is not
// a valid type. Restore the parameters from the original test before running.
// The strided maps captured just below are not referenced by any remaining
// check line, which suggests the stripped parameters used them -- TODO confirm.

// Layout maps expected somewhere in the output (captured for later reference).
// CHECK-DAG: #[[strided1D:.*]] = affine_map<(d0)[s0] -> (d0 + s0)>
// CHECK-DAG: #[[strided2D:.*]] = affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + s0 + d1)>
// CHECK-DAG: #[[strided3D:.*]] = affine_map<(d0, d1, d2)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2 + d2)>
// CHECK-DAG: #[[strided4D:.*]] = affine_map<(d0, d1, d2, d3)[s0, s1, s2, s3] -> (d0 * s1 + s0 + d1 * s2 + d2 * s3 + d3)>

// Index maps used by the convolution tests to combine an output index with a
// window index; the names encode the stride and dilation factors.
// CHECK-DAG: #[[Stride2Dilation1:.*]] = affine_map<(d0, d1) -> (d0 * 2 + d1)>
// CHECK-DAG: #[[Stride2Dilation4:.*]] = affine_map<(d0, d1) -> (d0 * 2 + d1 * 4)>
// CHECK-DAG: #[[Stride3Dilation5:.*]] = affine_map<(d0, d1) -> (d0 * 3 + d1 * 5)>

// linalg.matmul on three views of one buffer. Expected output: a three-deep
// loop nest bounded by M, N and K whose body loads from A and B, multiplies,
// adds the product to the value loaded from C and stores the sum back to C.
func @matmul(%arg0: memref, %M: index, %N: index, %K: index) {
  %c0 = constant 0 : index
  %c1 = constant 1 : index
  %A = view %arg0[%c0][%M, %K] : memref to memref
  %B = view %arg0[%c0][%K, %N] : memref to memref
  %C = view %arg0[%c0][%M, %N] : memref to memref
  linalg.matmul(%A, %B, %C) : memref, memref, memref
  return
}
// CHECK-LABEL: func @matmul(%{{.*}}: memref,
// CHECK-SAME: [[M:arg[0-9]+]]: index
// CHECK-SAME: [[N:arg[0-9]+]]: index
// CHECK-SAME: [[K:arg[0-9]+]]: index
// CHECK: %[[A:.*]] = std.view %{{.*}}[{{.*}}] : memref to memref
// CHECK: %[[B:.*]] = std.view %{{.*}}[{{.*}}] : memref to memref
// CHECK: %[[C:.*]] = std.view %{{.*}}[{{.*}}] : memref to memref
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[M]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[N]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[K]] step %{{.*}} {
// CHECK-DAG: %[[a:.*]] = load %[[A]][%{{.*}}, %{{.*}}] : memref
// CHECK-DAG: %[[b:.*]] = load %[[B]][%{{.*}}, %{{.*}}] : memref
// CHECK-DAG: %[[inc:.*]] = mulf %[[a]], %[[b]] : f32
// CHECK-DAG: %[[c:.*]] = load %[[C]][%{{.*}}, %{{.*}}] : memref
// CHECK-DAG: %[[res:.*]] = addf %[[c]], %[[inc]] : f32
// CHECK: store %[[res]], %[[C]][%{{.*}}, %{{.*}}] : memref

// linalg.matvec on views of one buffer. Expected output: a two-deep loop nest
// with a two-index load, two one-index loads, a multiply-add and a one-index
// store. The second bound is captured as K in the checks (it is %N here).
func @matvec(%arg0: memref, %M: index, %N: index) {
  %c0 = constant 0 : index
  %c1 = constant 1 : index
  %2 = view %arg0[%c0][%M, %N] : memref to memref
  %3 = view %arg0[%c0][%M] : memref to memref
  %4 = view %arg0[%c0][%N] : memref to memref
  linalg.matvec(%2, %3, %4) : memref, memref, memref
  return
}
// CHECK-LABEL: func @matvec(%{{.*}}: memref,
// CHECK-SAME: [[M:arg[0-9]+]]: index
// CHECK-SAME: [[K:arg[0-9]+]]: index
// CHECK: %[[A:.*]] = std.view %{{.*}}[{{.*}}] : memref to memref
// CHECK: %[[B:.*]] = std.view %{{.*}}[{{.*}}] : memref to memref
// CHECK: %[[C:.*]] = std.view %{{.*}}[{{.*}}] : memref to memref
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[M]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[K]] step %{{.*}} {
// CHECK-DAG: %[[a:.*]] = load %[[A]][%{{.*}}, %{{.*}}] : memref
// CHECK-DAG: %[[b:.*]] = load %[[B]][%{{.*}}] : memref
// CHECK-DAG: %[[inc:.*]] = mulf %[[a]], %[[b]] : f32
// CHECK-DAG: %[[c:.*]] = load %[[C]][%{{.*}}] : memref
// CHECK-DAG: %[[res:.*]] = addf %[[c]], %[[inc]] : f32
// CHECK: store %[[res]], %[[C]][%{{.*}}] : memref

// linalg.dot on two one-index views and one zero-index view of one buffer.
// Expected output: a single loop that accumulates the product into the
// zero-index view.
func @dot(%arg0: memref, %M: index) {
  %c0 = constant 0 : index
  %c1 = constant 1 : index
  %1 = view %arg0[%c0][%M] : memref to memref
  %2 = view %arg0[%c0][%M] : memref to memref
  %3 = view %arg0[][] : memref to memref
  linalg.dot(%1, %2, %3) : memref, memref, memref
  return
}
// CHECK-LABEL: func @dot(%{{.*}}: memref,
// CHECK-SAME: [[K:arg[0-9]+]]: index
// CHECK: %[[A:.*]] = std.view %{{.*}}[{{.*}}][{{.*}}] : memref to memref
// CHECK: %[[B:.*]] = std.view %{{.*}}[{{.*}}][{{.*}}] : memref to memref
// CHECK: %[[C:.*]] = std.view %{{.*}}[][] : memref to memref
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[K]] step %{{.*}} {
// CHECK-DAG: %[[a:.*]] = load %[[A]][%{{.*}}] : memref
// CHECK-DAG: %[[b:.*]] = load %[[B]][%{{.*}}] : memref
// CHECK-DAG: %[[inc:.*]] = mulf %[[a]], %[[b]] : f32
// CHECK-DAG: %[[c:.*]] = load %[[C]][] : memref
// CHECK-DAG: %[[res:.*]] = addf %[[c]], %[[inc]] : f32
// CHECK: store %[[res]], %[[C]][] : memref

// linalg.dot applied directly to function arguments. The loop bound is
// expected to come from a `dim` of the first argument.
func @dot_view(%arg0: memref, %arg1: memref, %arg2: memref) {
  linalg.dot(%arg0, %arg1, %arg2) : memref, memref, memref
  return
}
// CHECK-LABEL: func @dot_view(
// CHECK: %{{.*}}: memref, %{{.*}}: memref, %{{.*}}: memref) {
// CHECK: %[[K:.*]] = dim %arg0, 0 : memref
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[K]] step %{{.*}} {
// CHECK-DAG: %[[a:.*]] = load %arg0[%{{.*}}] : memref
// CHECK-DAG: %[[b:.*]] = load %{{.*}}[%{{.*}}] : memref
// CHECK-DAG: %[[inc:.*]] = mulf %[[a]], %[[b]] : f32
// CHECK-DAG: %[[c:.*]] = load %{{.*}}[] : memref
// CHECK-DAG: %[[res:.*]] = addf %[[c]], %[[inc]] : f32
// CHECK: store %[[res]], %{{.*}}[] : memref

// linalg.fill expected to lower to one loop around a one-index store.
func @fill_view(%arg0: memref, %arg1: f32) {
  linalg.fill(%arg0, %arg1) : memref, f32
  return
}
// CHECK-LABEL: func @fill_view(
// CHECK: %{{.*}}: memref, %{{.*}}: f32) {
// CHECK: loop.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} {
// CHECK: store %{{.*}}, %{{.*}}[%{{.*}}] : memref

// linalg.fill expected to lower to a single zero-index store (no loop is
// matched by the checks).
func @fill_view0(%arg0: memref, %arg1: f32) {
  linalg.fill(%arg0, %arg1) : memref, f32
  return
}
// CHECK-LABEL: func @fill_view0(%{{.*}}: memref, %{{.*}}: f32) {
// CHECK: store %{{.*}}, %{{.*}}[] : memref

// linalg.fill expected to lower to three nested loops around a three-index
// store.
func @fill_view3(%arg0: memref, %arg1: f32) {
  linalg.fill(%arg0, %arg1) : memref, f32
  return
}
// CHECK-LABEL: func @fill_view3(
// CHECK: %{{.*}}: memref, %{{.*}}: f32) {
// CHECK: loop.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} {
// CHECK: store %{{.*}}, %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}] : memref

// linalg.copy expected to lower to one loop that loads a value and stores
// that same value.
func @copy_view(%arg0: memref, %arg1: memref) {
  linalg.copy(%arg0, %arg1) : memref, memref
  return
}
// CHECK-LABEL: func @copy_view(
// CHECK: %{{.*}}: memref, %{{.*}}: memref) {
// CHECK: loop.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} {
// CHECK: %[[L:.*]] = load %{{.*}}[%{{.*}}] : memref
// CHECK: store %[[L]], %{{.*}}[%{{.*}}] : memref

// linalg.copy expected to lower to a zero-index load followed by a zero-index
// store (no loop is matched by the checks).
func @copy_view0(%arg0: memref, %arg1: memref) {
  linalg.copy(%arg0, %arg1) : memref, memref
  return
}
// CHECK-LABEL: func @copy_view0(%{{.*}}: memref, %{{.*}}: memref) {
// CHECK: %{{.*}} = load %{{.*}}[] : memref
// CHECK: store %{{.*}}, %{{.*}}[] : memref

// linalg.copy with input and output permutation maps. The checks match three
// nested loops and three-index load/store but do not pin the index order.
func @copy_view3(%arg0: memref, %arg1: memref) {
  linalg.copy(%arg0, %arg1) {inputPermutation = affine_map<(i, j, k) -> (i, k, j)>, outputPermutation = affine_map<(i, j, k) -> (k, j, i)>} : memref, memref
  return
}
// CHECK-LABEL: func @copy_view3
// CHECK: (%{{.*}}: memref, %{{.*}}: memref) {
// CHECK: loop.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} {
// CHECK: %[[L:.*]] = load %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}] : memref
// CHECK: store %[[L]], %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}] : memref

// linalg.conv with strides = [2] on three-index operands. Expected output:
// five nested loops bounded by dims of the three arguments, with one load
// index computed through the Stride2Dilation1 map.
func @conv_view3(%arg0: memref, %arg1: memref, %arg2: memref) {
  linalg.conv(%arg0, %arg1, %arg2) {strides = [2]}: memref, memref, memref
  return
}
// CHECK-LABEL: func @conv_view3(
// CHECK: %{{.*}}: memref, %{{.*}}: memref, %{{.*}}: memref) {
// CHECK: %[[Z0:.*]] = dim %arg0, 0 : memref
// CHECK: %[[Q:.*]] = dim %arg0, 1 : memref
// CHECK: %[[K:.*]] = dim %arg0, 2 : memref
// CHECK: %[[B:.*]] = dim %arg1, 0 : memref
// CHECK: %[[X0:.*]] = dim %arg2, 1 : memref
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[B]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[X0]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[K]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[Q]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[Z0]] step %{{.*}} {
// CHECK: %[[SUM:.*]] = affine.apply #[[Stride2Dilation1]](%{{.*}}, %{{.*}})
// CHECK: %{{.*}} = load %{{.*}}[%{{.*}}, %[[SUM]], %{{.*}}] : memref
// CHECK: %{{.*}} = load %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}] : memref
// CHECK: %{{.*}} = mulf %{{.*}}, %{{.*}} : f32
// CHECK: %{{.*}} = load %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}] : memref
// CHECK: %{{.*}} = addf %{{.*}}, %{{.*}} : f32
// CHECK: store %{{.*}}, %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}] : memref

// linalg.conv with dilations = [4, 5] and strides = [2, 3] on four-index
// operands. Expected output: seven nested loops, with two load indices
// computed through the Stride2Dilation4 and Stride3Dilation5 maps.
func @conv_view4(%arg0: memref, %arg1: memref, %arg2: memref) {
  linalg.conv(%arg0, %arg1, %arg2) {dilations = [4, 5], strides = [2, 3]} : memref, memref, memref
  return
}
// CHECK-LABEL: func @conv_view4(
// CHECK: %{{.*}}: memref, %{{.*}}: memref, %{{.*}}: memref) {
// CHECK: %[[Z0:.*]] = dim %arg0, 0 : memref
// CHECK: %[[Z1:.*]] = dim %arg0, 1 : memref
// CHECK: %[[Q:.*]] = dim %arg0, 2 : memref
// CHECK: %[[K:.*]] = dim %arg0, 3 : memref
// CHECK: %[[B:.*]] = dim %arg1, 0 : memref
// CHECK: %[[X0:.*]] = dim %arg2, 1 : memref
// CHECK: %[[X1:.*]] = dim %arg2, 2 : memref
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[B]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[X0]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[X1]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[K]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[Q]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[Z0]] step %{{.*}} {
// CHECK: loop.for %{{.*}} = %{{.*}} to %[[Z1]] step %{{.*}} {
// CHECK: %[[SUM0:.*]] = affine.apply #[[Stride2Dilation4]](%{{.*}}, %{{.*}})
// CHECK: %[[SUM1:.*]] = affine.apply #[[Stride3Dilation5]](%{{.*}}, %{{.*}})
// CHECK: %{{.*}} = load %{{.*}}[%{{.*}}, %[[SUM0]], %[[SUM1]], %{{.*}}] : memref
// CHECK: %{{.*}} = load %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}, %{{.*}}] : memref
// CHECK: %{{.*}} = mulf %{{.*}}, %{{.*}} : f32
// CHECK: %{{.*}} = load %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}, %{{.*}}] : memref
// CHECK: %{{.*}} = addf %{{.*}}, %{{.*}} : f32
// CHECK: store %{{.*}}, %{{.*}}[%{{.*}}, %{{.*}}, %{{.*}}, %{{.*}}] : memref

// Scalar payload referenced by #trait through `fun`: ignores its three inputs
// and returns the constant 0.0 twice.
func @foo(%0: f32, %1: f32, %2: f32) -> (f32, f32) {
  %f0 = constant 0.0 : f32
  return %f0, %f0 : f32, f32
}
// Indexing maps shared by all generic traits below: A(i, j), B(i, j, k) and
// C(i, k, j) over a three-dimensional iteration space.
#accesses = [
  affine_map<(i, j, k) -> (i, j)>,
  affine_map<(i, j, k) -> (i, j, k)>,
  affine_map<(i, j, k) -> (i, k, j)>
]
#trait = {
  args_in = 1,
  args_out = 2,
  iterator_types = ["parallel", "parallel", "parallel"],
  indexing_maps = #accesses,
  fun = @foo,
  library_call = "some_external_function_name_1",
  doc = "B(i,j,k), C(i,k,j) = foo(A(i, j), B(i,j,k), C(i,k,j))"
}
// linalg.generic whose payload is the function @foo. Expected output: three
// nested loops, three loads, a call to @foo on the loaded values and one store
// per call result.
func @generic_function(%arg0: memref, %arg1: memref, %arg2: memref) {
  linalg.generic #trait %arg0, %arg1, %arg2: memref, memref, memref
  return
}
// CHECK-LABEL: @foo
// CHECK-LABEL: @generic_function
// CHECK: loop.for %[[i:.*]] = {{.*}}
// CHECK: loop.for %[[j:.*]] = {{.*}}
// CHECK: loop.for %[[k:.*]] = {{.*}}
// CHECK: %[[a:.*]] = load %{{.*}}[%[[i]], %[[j]]] : memref
// CHECK: %[[b:.*]] = load %{{.*}}[%[[i]], %[[j]], %[[k]]] : memref
// CHECK: %[[c:.*]] = load %{{.*}}[%[[i]], %[[k]], %[[j]]] : memref
// CHECK: %[[res:.*]]:2 = call @foo(%[[a]], %[[b]], %[[c]]) : (f32, f32, f32) -> (f32, f32)
// CHECK: store %[[res]]#0, %{{.*}}[%[[i]], %[[j]], %[[k]]] : memref
// CHECK: store %[[res]]#1, %{{.*}}[%[[i]], %[[k]], %[[j]]] : memref

// Same shape as #trait but without `fun`: the payload is given as a region.
#trait2 = {
  args_in = 1,
  args_out = 2,
  iterator_types = ["parallel", "parallel", "parallel"],
  indexing_maps = #accesses,
  library_call = "some_external_function_name_2",
  doc = "B(i,j,k), C(i,k,j) = foo(A(i, j), B(i,j,k), C(i,k,j))"
}
// linalg.generic with an inline region. The region's mulf/addf are expected
// to appear in the innermost loop body between the loads and the stores.
func @generic_region(%arg0: memref, %arg1: memref, %arg2: memref) {
  linalg.generic #trait2 %arg0, %arg1, %arg2 {
    ^bb0(%a: f32, %b: f32, %c: f32):
      %d = mulf %a, %b : f32
      %e = addf %c, %d : f32
      linalg.yield %d, %e : f32, f32
  }: memref, memref, memref
  return
}
// CHECK-LABEL: @generic_region
// CHECK: loop.for %[[i:.*]] = {{.*}}
// CHECK: loop.for %[[j:.*]] = {{.*}}
// CHECK: loop.for %[[k:.*]] = {{.*}}
// CHECK: %[[a:.*]] = load %{{.*}}[%[[i]], %[[j]]] : memref
// CHECK: %[[b:.*]] = load %{{.*}}[%[[i]], %[[j]], %[[k]]] : memref
// CHECK: %[[c:.*]] = load %{{.*}}[%[[i]], %[[k]], %[[j]]] : memref
// CHECK: %[[d:.*]] = mulf %[[a]], %[[b]] : f32
// CHECK: %[[e:.*]] = addf %[[c]], %[[d]] : f32
// CHECK: store %[[d]], %{{.*}}[%[[i]], %[[j]], %[[k]]] : memref
// CHECK: store %[[e]], %{{.*}}[%[[i]], %[[k]], %[[j]]] : memref

// Scalar payload referenced by #trait3 through `fun`: takes the three loop
// indices ahead of the three values and returns %i converted to f32, twice.
func @indexed_foo(%i: index, %j: index, %k: index, %0: f32, %1: f32, %2: f32) -> (f32, f32) {
  %i_int = index_cast %i: index to i32
  %i_float = sitofp %i_int : i32 to f32
  return %i_float, %i_float : f32, f32
}
#trait3 = {
  args_in = 1,
  args_out = 2,
  iterator_types = ["parallel", "parallel", "parallel"],
  indexing_maps = #accesses,
  fun = @indexed_foo,
  library_call = "some_external_function_name_1",
  doc = "b(i,j,k), c(i,k,j) = foo(a(i, j), b(i,j,k), c(i,k,j))"
}
// linalg.indexed_generic whose payload is @indexed_foo. The call is expected
// to receive the three loop induction variables followed by the loaded values.
func @indexed_generic_function(
    %arg0: memref, %arg1: memref, %arg2: memref) {
  linalg.indexed_generic #trait3 %arg0, %arg1, %arg2: memref, memref, memref
  return
}
// CHECK-LABEL: @indexed_foo
// CHECK-LABEL: @indexed_generic_function
// CHECK: loop.for %[[i:.*]] = {{.*}}
// CHECK: loop.for %[[j:.*]] = {{.*}}
// CHECK: loop.for %[[k:.*]] = {{.*}}
// CHECK: %[[a:.*]] = load %{{.*}}[%[[i]], %[[j]]] : memref
// CHECK: %[[b:.*]] = load %{{.*}}[%[[i]], %[[j]], %[[k]]] : memref
// CHECK: %[[c:.*]] = load %{{.*}}[%[[i]], %[[k]], %[[j]]] : memref
// CHECK: %[[res:.*]]:2 = call @indexed_foo(%[[i]], %[[j]], %[[k]], %[[a]], %[[b]], %[[c]]) : (index, index, index, f32, f32, f32) -> (f32, f32)
// CHECK: store %[[res]]#0, %{{.*}}[%[[i]], %[[j]], %[[k]]] : memref
// CHECK: store %[[res]]#1, %{{.*}}[%[[i]], %[[k]], %[[j]]] : memref

// Region-based variant of #trait3. Note: the `doc` string writes i * j * k,
// whereas the region below combines the indices with addi (i + j + k).
#trait4 = {
  args_in = 1,
  args_out = 2,
  iterator_types = ["parallel", "parallel", "parallel"],
  indexing_maps = #accesses,
  library_call = "some_external_function_name_2",
  doc = "B(i,j,k), C(i,k,j) = foo(A(i, j) * B(i,j,k), i * j * k + C(i,k,j))"
}
// linalg.indexed_generic with an inline region that uses the loop indices.
// The region's ops are expected in the innermost loop body, with the block's
// index arguments replaced by the loop induction variables.
func @indexed_generic_region(
    %arg0: memref, %arg1: memref, %arg2: memref) {
  linalg.indexed_generic #trait4 %arg0, %arg1, %arg2 {
    ^bb0(%i: index, %j: index, %k: index, %a: f32, %b: f32, %c: f32):
      %result_1 = mulf %a, %b : f32
      %ij = addi %i, %j : index
      %ijk = addi %ij, %k : index
      %ijk_int = index_cast %ijk : index to i32
      %ijk_float = sitofp %ijk_int : i32 to f32
      %result_2 = addf %c, %ijk_float : f32
      linalg.yield %result_1, %result_2 : f32, f32
  }: memref, memref, memref
  return
}
// CHECK-LABEL: @indexed_generic_region
// CHECK: loop.for %[[i:.*]] = {{.*}}
// CHECK: loop.for %[[j:.*]] = {{.*}}
// CHECK: loop.for %[[k:.*]] = {{.*}}
// CHECK: %[[a:.*]] = load %{{.*}}[%[[i]], %[[j]]]
// CHECK: %[[b:.*]] = load %{{.*}}[%[[i]], %[[j]], %[[k]]]
// CHECK: %[[c:.*]] = load %{{.*}}[%[[i]], %[[k]], %[[j]]]
// CHECK: %[[result_1:.*]] = mulf %[[a]], %[[b]] : f32
// CHECK: %[[ij:.*]] = addi %[[i]], %[[j]] : index
// CHECK: %[[ijk:.*]] = addi %[[ij]], %[[k]] : index
// CHECK: %[[ijk_int:.*]] = index_cast %[[ijk]] : index to i32
// CHECK: %[[ijk_float:.*]] = sitofp %[[ijk_int]] : i32 to f32
// CHECK: %[[result_2:.*]] = addf %[[c]], %[[ijk_float]] : f32
// CHECK: store %[[result_1]], %{{.*}}[%[[i]], %[[j]], %[[k]]]
// CHECK: store %[[result_2]], %{{.*}}[%[[i]], %[[k]], %[[j]]]