// RUN: mlir-opt %s --transform-interpreter --split-input-file | FileCheck %s // CHECK-LABEL: func @lower_permutation_with_mask_fixed_width( // CHECK: %[[vec:.*]] = arith.constant dense<-2.000000e+00> : vector<7x1xf32> // CHECK: %[[mask:.*]] = arith.constant dense<[true, false, true, false, true, true, true]> : vector<7xi1> // CHECK: %[[b:.*]] = vector.broadcast %[[mask]] : vector<7xi1> to vector<1x7xi1> // CHECK: %[[tp:.*]] = vector.transpose %[[b]], [1, 0] : vector<1x7xi1> to vector<7x1xi1> // CHECK: vector.transfer_write %[[vec]], %{{.*}}[%{{.*}}, %{{.*}}], %[[tp]] {in_bounds = [false, true]} : vector<7x1xf32>, memref func.func @lower_permutation_with_mask_fixed_width(%A : memref, %base1 : index, %base2 : index) { %fn1 = arith.constant -2.0 : f32 %vf0 = vector.splat %fn1 : vector<7xf32> %mask = arith.constant dense<[1, 0, 1, 0, 1, 1, 1]> : vector<7xi1> vector.transfer_write %vf0, %A[%base1, %base2], %mask {permutation_map = affine_map<(d0, d1) -> (d0)>, in_bounds = [false]} : vector<7xf32>, memref return } // CHECK-LABEL: func.func @permutation_with_mask_scalable( // CHECK-SAME: %[[ARG_0:.*]]: memref, // CHECK-SAME: %[[IDX_1:.*]]: index, // CHECK-SAME: %[[IDX_2:.*]]: index) -> vector<8x[4]x2xf32> { // CHECK: %[[C0:.*]] = arith.constant 0 : index // CHECK: %[[PASS_THROUGH:.*]] = arith.constant 0.000000e+00 : f32 // CHECK: %[[MASK:.*]] = vector.create_mask %[[IDX_2]], %[[IDX_1]] : vector<2x[4]xi1> // CHECK: %[[T_READ:.*]] = vector.transfer_read %[[ARG_0]]{{\[}}%[[C0]], %[[C0]]], %[[PASS_THROUGH]], %[[MASK]] {in_bounds = [true, true]} : memref, vector<2x[4]xf32> // CHECK: %[[BCAST:.*]] = vector.broadcast %[[T_READ]] : vector<2x[4]xf32> to vector<8x2x[4]xf32> // CHECK: %[[TRANSPOSE:.*]] = vector.transpose %[[BCAST]], [0, 2, 1] : vector<8x2x[4]xf32> to vector<8x[4]x2xf32> // CHECK: return %[[TRANSPOSE]] : vector<8x[4]x2xf32> // CHECK: } func.func @permutation_with_mask_scalable(%2: memref, %dim_1: index, %dim_2: index) -> (vector<8x[4]x2xf32>) { %c0 = arith.constant 0 : index %cst_0 = arith.constant 0.000000e+00 : f32 %mask = vector.create_mask %dim_2, %dim_1 : vector<2x[4]xi1> %1 = vector.transfer_read %2[%c0, %c0], %cst_0, %mask {in_bounds = [true, true, true], permutation_map = affine_map<(d0, d1) -> (0, d1, d0)>} : memref, vector<8x[4]x2xf32> return %1 : vector<8x[4]x2xf32> } module attributes {transform.with_named_sequence} { transform.named_sequence @__transform_main(%module_op: !transform.any_op {transform.readonly}) { %f = transform.structured.match ops{["func.func"]} in %module_op : (!transform.any_op) -> !transform.any_op transform.apply_patterns to %f { transform.apply_patterns.vector.transfer_permutation_patterns } : !transform.any_op transform.yield } }