1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79
|
// RUN: mlir-opt %s -convert-scf-to-std -convert-vector-to-llvm -convert-std-to-llvm | \
// RUN: mlir-cpu-runner -e entry -entry-point-result=void \
// RUN: -shared-libs=%mlir_integration_test_dir/libmlir_c_runner_utils%shlibext | \
// RUN: FileCheck %s
func @entry() {
%f0 = constant 0.0: f32
%f1 = constant 1.0: f32
%f2 = constant 2.0: f32
%f3 = constant 3.0: f32
%f4 = constant 4.0: f32
%f5 = constant 5.0: f32
%f6 = constant 6.0: f32
%f7 = constant 7.0: f32
%f8 = constant 8.0: f32
%f9 = constant 9.0: f32
%f10 = constant 10.0: f32
%f11 = constant 11.0: f32
%f12 = constant 12.0: f32
%f13 = constant 13.0: f32
%f14 = constant 14.0: f32
%f15 = constant 15.0: f32
%a0 = vector.broadcast %f0 : f32 to vector<4x4xf32>
%a1 = vector.insert %f0, %a0[0, 0] : f32 into vector<4x4xf32>
%a2 = vector.insert %f1, %a1[0, 1] : f32 into vector<4x4xf32>
%a3 = vector.insert %f2, %a2[0, 2] : f32 into vector<4x4xf32>
%a4 = vector.insert %f3, %a3[0, 3] : f32 into vector<4x4xf32>
%a5 = vector.insert %f4, %a4[1, 0] : f32 into vector<4x4xf32>
%a6 = vector.insert %f5, %a5[1, 1] : f32 into vector<4x4xf32>
%a7 = vector.insert %f6, %a6[1, 2] : f32 into vector<4x4xf32>
%a8 = vector.insert %f7, %a7[1, 3] : f32 into vector<4x4xf32>
%a9 = vector.insert %f8, %a8[2, 0] : f32 into vector<4x4xf32>
%a10 = vector.insert %f9, %a9[2, 1] : f32 into vector<4x4xf32>
%a11 = vector.insert %f10, %a10[2, 2] : f32 into vector<4x4xf32>
%a12 = vector.insert %f11, %a11[2, 3] : f32 into vector<4x4xf32>
%a13 = vector.insert %f12, %a12[3, 0] : f32 into vector<4x4xf32>
%a14 = vector.insert %f13, %a13[3, 1] : f32 into vector<4x4xf32>
%a15 = vector.insert %f14, %a14[3, 2] : f32 into vector<4x4xf32>
%a16 = vector.insert %f15, %a15[3, 3] : f32 into vector<4x4xf32>
vector.print %a16 : vector<4x4xf32>
//
// test matrix:
//
// CHECK: ( ( 0, 1, 2, 3 ), ( 4, 5, 6, 7 ), ( 8, 9, 10, 11 ), ( 12, 13, 14, 15 ) )
// Tile 4x4 with 3x3 as follows:
//
// +--------+--+
// +0 1 2| 3|
// |4 5 6| 7|
// |8 9 10|11|
// +--------+--+
// |12 13 14|15|
// +--------+--+
//
%es = vector.extract_slices %a16, [3, 3], [1, 1] :
vector<4x4xf32> into tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
%0 = vector.tuple_get %es, 0 : tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
%1 = vector.tuple_get %es, 1 : tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
%2 = vector.tuple_get %es, 2 : tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
%3 = vector.tuple_get %es, 3 : tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
vector.print %0 : vector<3x3xf32>
vector.print %1 : vector<3x1xf32>
vector.print %2 : vector<1x3xf32>
vector.print %3 : vector<1x1xf32>
//
// extract slices:
//
// CHECK: ( ( 0, 1, 2 ), ( 4, 5, 6 ), ( 8, 9, 10 ) )
// CHECK: ( ( 3 ), ( 7 ), ( 11 ) )
// CHECK: ( ( 12, 13, 14 ) )
// CHECK: ( ( 15 ) )
return
}
|