// RUN: mlir-opt %s -allocate-arm-sme-tiles -split-input-file -verify-diagnostics | FileCheck %s // ----- // CHECK-LABEL: mixed_tiles // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65534 : i32} func.func @mixed_tiles() { // ZA0.Q, ZA2.Q, ZA4.Q, ZA6.Q, ZA8.Q, ZA10.Q, ZA12.Q, ZA14.Q // CHECK-NEXT: tile_id = 0 %za0_h = arm_sme.get_tile : vector<[8]x[8]xi16> // ZA1.Q, ZA5.Q, ZA9.Q, ZA13.Q // CHECK-NEXT: tile_id = 1 %za1_s = arm_sme.get_tile : vector<[4]x[4]xi32> // ZA3.D ZA3.Q, ZA11.Q // CHECK-NEXT: tile_id = 3 %za3_d = arm_sme.get_tile : vector<[2]x[2]xi64> // ZA7.Q // CHECK-NEXT: tile_id = 7 %za7_q = arm_sme.get_tile : vector<[1]x[1]xi128> // ZA15.Q is still free. return } // ----- // CHECK-LABEL: za_b // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65535 : i32} func.func @za_b() { // CHECK-NEXT: tile_id = 0 %za0_b = arm_sme.get_tile : vector<[16]x[16]xi8> return } // ----- func.func @za_b__out_of_tiles() { %za0_b = arm_sme.get_tile : vector<[16]x[16]xi8> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[16]x[16]xi8> return } // ----- func.func @za_b_overlapping_za_q() { %za0_b = arm_sme.get_tile : vector<[16]x[16]xi8> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[1]x[1]xi128> return } // ----- // CHECK-LABEL: za0_h // CHECK-SAME: attributes {arm_sme.tiles_in_use = 43690 : i32} func.func @za0_h() { // CHECK-NEXT: tile_id = 0 %za0_h = arm_sme.get_tile : vector<[8]x[8]xi16> return } // ----- // CHECK-LABEL: za_h // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65535 : i32} func.func @za_h() { // CHECK-NEXT: tile_id = 0 %za0_h = arm_sme.get_tile : vector<[8]x[8]xi16> // CHECK-NEXT: tile_id = 1 %za1_h = arm_sme.get_tile : vector<[8]x[8]xi16> return } // ----- // CHECK-LABEL: za_h__out_of_tiles func.func @za_h__out_of_tiles() { // CHECK-NEXT: tile_id = 0 %za0_h = arm_sme.get_tile : vector<[8]x[8]xi16> // CHECK-NEXT: tile_id = 1 %za1_h = arm_sme.get_tile : vector<[8]x[8]xi16> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[8]x[8]xi16> return } // ----- // CHECK-LABEL: za_h_overlapping_za_s // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65535 : i32} func.func @za_h_overlapping_za_s() { // ZA0.Q, ZA2.Q, ZA4.Q, ZA6.Q, ZA8.Q, ZA10.Q, ZA12.Q, ZA14.Q // CHECK-NEXT: tile_id = 0 %za0_h = arm_sme.get_tile : vector<[8]x[8]xi16> // ZA1.Q, ZA5.Q, ZA9.Q, ZA13.Q // CHECK-NEXT: tile_id = 1 %za1_s = arm_sme.get_tile : vector<[4]x[4]xi32> // ZA3.Q, ZA7.Q, ZA11.Q, ZA15.Q // CHECK-NEXT: tile_id = 3 %za3_s = arm_sme.get_tile : vector<[4]x[4]xi32> return } // ----- // CHECK-LABEL: za_h_overlapping_za_d // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65535 : i32} func.func @za_h_overlapping_za_d() { // ZA0.Q, ZA2.Q, ZA4.Q, ZA6.Q, ZA8.Q, ZA10.Q, ZA12.Q, ZA14.Q // CHECK-NEXT: tile_id = 0 %za0_h = arm_sme.get_tile : vector<[8]x[8]xi16> // ZA1.Q, ZA9.Q // CHECK-NEXT: tile_id = 1 %za1_d = arm_sme.get_tile : vector<[2]x[2]xi64> // ZA3.Q, ZA11.Q // CHECK-NEXT: tile_id = 3 %za3_d = arm_sme.get_tile : vector<[2]x[2]xi64> // ZA5.Q, ZA13.Q // CHECK-NEXT: tile_id = 5 %za5_d = arm_sme.get_tile : vector<[2]x[2]xi64> // ZA7.Q, ZA15.Q // CHECK-NEXT: tile_id = 7 %za7_d = arm_sme.get_tile : vector<[2]x[2]xi64> return } // ----- func.func @za_h_overlapping_za_q() { %za0_h = arm_sme.get_tile : vector<[8]x[8]xi16> %za0_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za2_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za4_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za6_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za8_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za10_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za12_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za14_q = arm_sme.get_tile : vector<[1]x[1]xi128> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[1]x[1]xi128> return } // ----- // CHECK-LABEL: za0_s // CHECK-SAME: attributes {arm_sme.tiles_in_use = 34952 : i32} func.func @za0_s() { // CHECK-NEXT: tile_id = 0 %za0_s = arm_sme.get_tile : vector<[4]x[4]xi32> return } // ----- // CHECK-LABEL: za_s // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65535 : i32} func.func @za_s() { // CHECK-NEXT: tile_id = 0 %za0_s = arm_sme.get_tile : vector<[4]x[4]xi32> // CHECK-NEXT: tile_id = 1 %za1_s = arm_sme.get_tile : vector<[4]x[4]xi32> // CHECK-NEXT: tile_id = 2 %za2_s = arm_sme.get_tile : vector<[4]x[4]xi32> // CHECK-NEXT: tile_id = 3 %za3_s = arm_sme.get_tile : vector<[4]x[4]xi32> return } // ----- func.func @za_s__out_of_tiles() { %za0_s = arm_sme.get_tile : vector<[4]x[4]xi32> %za1_s = arm_sme.get_tile : vector<[4]x[4]xi32> %za2_s = arm_sme.get_tile : vector<[4]x[4]xi32> %za3_s = arm_sme.get_tile : vector<[4]x[4]xi32> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[4]x[4]xi32> return } // ----- // CHECK-LABEL: za_s_overlapping_za_d // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65535 : i32} func.func @za_s_overlapping_za_d() { // ZA0.Q, ZA4.Q, ZA8.Q, ZA12.Q // CHECK-NEXT: tile_id = 0 %za0_s = arm_sme.get_tile : vector<[4]x[4]xi32> // ZA1.Q, ZA5.Q, ZA9.Q, ZA13.Q // CHECK-NEXT: tile_id = 1 %za1_s = arm_sme.get_tile : vector<[4]x[4]xi32> // ZA2.Q, ZA6.Q, ZA10.Q, ZA14.Q // CHECK-NEXT: tile_id = 2 %za2_s = arm_sme.get_tile : vector<[4]x[4]xi32> // ZA3.Q, ZA11.Q // CHECK-NEXT: tile_id = 3 %za3_d = arm_sme.get_tile : vector<[2]x[2]xi64> // ZA7.Q, ZA15.Q // CHECK-NEXT: tile_id = 7 %za7_d = arm_sme.get_tile : vector<[2]x[2]xi64> return } // ----- func.func @za_s_overlapping_za_q() { %za0_s = arm_sme.get_tile : vector<[4]x[4]xi32> %za1_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za2_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za3_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za5_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za6_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za7_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za9_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za10_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za11_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za13_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za14_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za15_q = arm_sme.get_tile : vector<[1]x[1]xi128> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[1]x[1]xi128> return } // ----- // CHECK-LABEL: za0_d // CHECK-SAME: attributes {arm_sme.tiles_in_use = 32896 : i32} func.func @za0_d() { // CHECK-NEXT: tile_id = 0 %za0_d = arm_sme.get_tile : vector<[2]x[2]xi64> return } // ----- // CHECK-LABEL: za_d // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65535 : i32} func.func @za_d() { // CHECK-NEXT: tile_id = 0 %za0_d = arm_sme.get_tile : vector<[2]x[2]xi64> // CHECK-NEXT: tile_id = 1 %za1_d = arm_sme.get_tile : vector<[2]x[2]xi64> // CHECK-NEXT: tile_id = 2 %za2_d = arm_sme.get_tile : vector<[2]x[2]xi64> // CHECK-NEXT: tile_id = 3 %za3_d = arm_sme.get_tile : vector<[2]x[2]xi64> // CHECK-NEXT: tile_id = 4 %za4_d = arm_sme.get_tile : vector<[2]x[2]xi64> // CHECK-NEXT: tile_id = 5 %za5_d = arm_sme.get_tile : vector<[2]x[2]xi64> // CHECK-NEXT: tile_id = 6 %za6_d = arm_sme.get_tile : vector<[2]x[2]xi64> // CHECK-NEXT: tile_id = 7 %za7_d = arm_sme.get_tile : vector<[2]x[2]xi64> return } // ----- func.func @za_d__out_of_tiles() { %za0_d = arm_sme.get_tile : vector<[2]x[2]xi64> %za1_d = arm_sme.get_tile : vector<[2]x[2]xi64> %za2_d = arm_sme.get_tile : vector<[2]x[2]xi64> %za3_d = arm_sme.get_tile : vector<[2]x[2]xi64> %za4_d = arm_sme.get_tile : vector<[2]x[2]xi64> %za5_d = arm_sme.get_tile : vector<[2]x[2]xi64> %za6_d = arm_sme.get_tile : vector<[2]x[2]xi64> %za7_d = arm_sme.get_tile : vector<[2]x[2]xi64> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[2]x[2]xi64> return } // ----- func.func @za_d_overlapping_za_q() { %za0_d = arm_sme.get_tile : vector<[2]x[2]xi64> %za1_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za2_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za3_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za4_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za5_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za6_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za7_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za9_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za10_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za11_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za12_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za13_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za14_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za15_q = arm_sme.get_tile : vector<[1]x[1]xi128> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[1]x[1]xi128> return } // ----- // CHECK-LABEL: za0_q // CHECK-SAME: attributes {arm_sme.tiles_in_use = 32768 : i32} func.func @za0_q() { // CHECK-NEXT: tile_id = 0 %za0_q = arm_sme.get_tile : vector<[1]x[1]xi128> return } // ----- // CHECK-LABEL: za_q // CHECK-SAME: attributes {arm_sme.tiles_in_use = 65535 : i32} func.func @za_q() { // CHECK-NEXT: tile_id = 0 %za0_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 1 %za1_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 2 %za2_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 3 %za3_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 4 %za4_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 5 %za5_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 6 %za6_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 7 %za7_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 8 %za8_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 9 %za9_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 10 %za10_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 11 %za11_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 12 %za12_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 13 %za13_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 14 %za14_q = arm_sme.get_tile : vector<[1]x[1]xi128> // CHECK-NEXT: tile_id = 15 %za15_q = arm_sme.get_tile : vector<[1]x[1]xi128> return } // ----- func.func @za_q__out_of_tiles() { %za0_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za1_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za2_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za3_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za4_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za5_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za6_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za7_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za8_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za9_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za10_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za11_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za12_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za13_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za14_q = arm_sme.get_tile : vector<[1]x[1]xi128> %za15_q = arm_sme.get_tile : vector<[1]x[1]xi128> // expected-warning @below {{failed to allocate SME virtual tile to operation, all tile operations will go through memory, expect degraded performance}} %next_tile = arm_sme.get_tile : vector<[1]x[1]xi128> return }