forked from OSchip/llvm-project
80 lines
3.0 KiB
MLIR
80 lines
3.0 KiB
MLIR
// RUN: mlir-opt %s -convert-scf-to-std -convert-vector-to-llvm -convert-std-to-llvm | \
|
|
// RUN: mlir-cpu-runner -e entry -entry-point-result=void \
|
|
// RUN: -shared-libs=%mlir_integration_test_dir/libmlir_c_runner_utils%shlibext | \
|
|
// RUN: FileCheck %s
|
|
|
|
func @entry() {
|
|
%f0 = constant 0.0: f32
|
|
%f1 = constant 1.0: f32
|
|
%f2 = constant 2.0: f32
|
|
%f3 = constant 3.0: f32
|
|
%f4 = constant 4.0: f32
|
|
%f5 = constant 5.0: f32
|
|
%f6 = constant 6.0: f32
|
|
%f7 = constant 7.0: f32
|
|
%f8 = constant 8.0: f32
|
|
%f9 = constant 9.0: f32
|
|
%f10 = constant 10.0: f32
|
|
%f11 = constant 11.0: f32
|
|
%f12 = constant 12.0: f32
|
|
%f13 = constant 13.0: f32
|
|
%f14 = constant 14.0: f32
|
|
%f15 = constant 15.0: f32
|
|
|
|
%a0 = vector.broadcast %f0 : f32 to vector<4x4xf32>
|
|
%a1 = vector.insert %f0, %a0[0, 0] : f32 into vector<4x4xf32>
|
|
%a2 = vector.insert %f1, %a1[0, 1] : f32 into vector<4x4xf32>
|
|
%a3 = vector.insert %f2, %a2[0, 2] : f32 into vector<4x4xf32>
|
|
%a4 = vector.insert %f3, %a3[0, 3] : f32 into vector<4x4xf32>
|
|
%a5 = vector.insert %f4, %a4[1, 0] : f32 into vector<4x4xf32>
|
|
%a6 = vector.insert %f5, %a5[1, 1] : f32 into vector<4x4xf32>
|
|
%a7 = vector.insert %f6, %a6[1, 2] : f32 into vector<4x4xf32>
|
|
%a8 = vector.insert %f7, %a7[1, 3] : f32 into vector<4x4xf32>
|
|
%a9 = vector.insert %f8, %a8[2, 0] : f32 into vector<4x4xf32>
|
|
%a10 = vector.insert %f9, %a9[2, 1] : f32 into vector<4x4xf32>
|
|
%a11 = vector.insert %f10, %a10[2, 2] : f32 into vector<4x4xf32>
|
|
%a12 = vector.insert %f11, %a11[2, 3] : f32 into vector<4x4xf32>
|
|
%a13 = vector.insert %f12, %a12[3, 0] : f32 into vector<4x4xf32>
|
|
%a14 = vector.insert %f13, %a13[3, 1] : f32 into vector<4x4xf32>
|
|
%a15 = vector.insert %f14, %a14[3, 2] : f32 into vector<4x4xf32>
|
|
%a16 = vector.insert %f15, %a15[3, 3] : f32 into vector<4x4xf32>
|
|
|
|
vector.print %a16 : vector<4x4xf32>
|
|
//
|
|
// test matrix:
|
|
//
|
|
// CHECK: ( ( 0, 1, 2, 3 ), ( 4, 5, 6, 7 ), ( 8, 9, 10, 11 ), ( 12, 13, 14, 15 ) )
|
|
|
|
// Tile 4x4 with 3x3 as follows:
|
|
//
|
|
// +--------+--+
|
|
// +0 1 2| 3|
|
|
// |4 5 6| 7|
|
|
// |8 9 10|11|
|
|
// +--------+--+
|
|
// |12 13 14|15|
|
|
// +--------+--+
|
|
//
|
|
%es = vector.extract_slices %a16, [3, 3], [1, 1] :
|
|
vector<4x4xf32> into tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
|
|
|
|
%0 = vector.tuple_get %es, 0 : tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
|
|
%1 = vector.tuple_get %es, 1 : tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
|
|
%2 = vector.tuple_get %es, 2 : tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
|
|
%3 = vector.tuple_get %es, 3 : tuple<vector<3x3xf32>, vector<3x1xf32>, vector<1x3xf32>, vector<1x1xf32>>
|
|
|
|
vector.print %0 : vector<3x3xf32>
|
|
vector.print %1 : vector<3x1xf32>
|
|
vector.print %2 : vector<1x3xf32>
|
|
vector.print %3 : vector<1x1xf32>
|
|
//
|
|
// extract slices:
|
|
//
|
|
// CHECK: ( ( 0, 1, 2 ), ( 4, 5, 6 ), ( 8, 9, 10 ) )
|
|
// CHECK: ( ( 3 ), ( 7 ), ( 11 ) )
|
|
// CHECK: ( ( 12, 13, 14 ) )
|
|
// CHECK: ( ( 15 ) )
|
|
|
|
return
|
|
}
|