; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2 ; Test i128 atomicrmw operations. ; ; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z15 | FileCheck %s ; ; Test expansion of AtomicRMW instructions, which assume a natural alignment. ; Note that the multiple regmoves inside the CDSG loops hopefully will go away ; when the new i128 support is added. ; Check register exchange. define i128 @atomicrmw_xchg(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_xchg: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v1, 0(%r4), 3 ; CHECK-NEXT: vl %v0, 0(%r3), 4 ; CHECK-NEXT: vlgvg %r1, %v1, 1 ; CHECK-NEXT: vlgvg %r0, %v1, 0 ; CHECK-NEXT: .LBB0_1: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vlgvg %r5, %v0, 1 ; CHECK-NEXT: vlgvg %r4, %v0, 0 ; CHECK-NEXT: cdsg %r4, %r0, 0(%r3) ; CHECK-NEXT: vlvgp %v0, %r4, %r5 ; CHECK-NEXT: jl .LBB0_1 ; CHECK-NEXT: # %bb.2: # %atomicrmw.end ; CHECK-NEXT: vst %v0, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw xchg ptr %src, i128 %b seq_cst ret i128 %res } ; Check addition of a variable. define i128 @atomicrmw_add(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_add: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: .LBB1_1: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vaq %v2, %v1, %v0 ; CHECK-NEXT: vlgvg %r1, %v2, 1 ; CHECK-NEXT: vlgvg %r0, %v2, 0 ; CHECK-NEXT: vlgvg %r5, %v1, 1 ; CHECK-NEXT: vlgvg %r4, %v1, 0 ; CHECK-NEXT: cdsg %r4, %r0, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r4, %r5 ; CHECK-NEXT: jl .LBB1_1 ; CHECK-NEXT: # %bb.2: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw add ptr %src, i128 %b seq_cst ret i128 %res } ; Check subtraction of a variable. define i128 @atomicrmw_sub(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_sub: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: .LBB2_1: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vsq %v2, %v1, %v0 ; CHECK-NEXT: vlgvg %r1, %v2, 1 ; CHECK-NEXT: vlgvg %r0, %v2, 0 ; CHECK-NEXT: vlgvg %r5, %v1, 1 ; CHECK-NEXT: vlgvg %r4, %v1, 0 ; CHECK-NEXT: cdsg %r4, %r0, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r4, %r5 ; CHECK-NEXT: jl .LBB2_1 ; CHECK-NEXT: # %bb.2: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw sub ptr %src, i128 %b seq_cst ret i128 %res } ; Check AND of a variable. define i128 @atomicrmw_and(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_and: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: .LBB3_1: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vn %v2, %v1, %v0 ; CHECK-NEXT: vlgvg %r1, %v2, 1 ; CHECK-NEXT: vlgvg %r0, %v2, 0 ; CHECK-NEXT: vlgvg %r5, %v1, 1 ; CHECK-NEXT: vlgvg %r4, %v1, 0 ; CHECK-NEXT: cdsg %r4, %r0, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r4, %r5 ; CHECK-NEXT: jl .LBB3_1 ; CHECK-NEXT: # %bb.2: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw and ptr %src, i128 %b seq_cst ret i128 %res } ; Check NAND of a variable. define i128 @atomicrmw_nand(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_nand: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: .LBB4_1: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vlgvg %r1, %v1, 1 ; CHECK-NEXT: vlgvg %r0, %v1, 0 ; CHECK-NEXT: vnn %v1, %v1, %v0 ; CHECK-NEXT: vlgvg %r5, %v1, 1 ; CHECK-NEXT: vlgvg %r4, %v1, 0 ; CHECK-NEXT: cdsg %r0, %r4, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r0, %r1 ; CHECK-NEXT: jl .LBB4_1 ; CHECK-NEXT: # %bb.2: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw nand ptr %src, i128 %b seq_cst ret i128 %res } ; Check OR of a variable. define i128 @atomicrmw_or(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_or: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: .LBB5_1: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vo %v2, %v1, %v0 ; CHECK-NEXT: vlgvg %r1, %v2, 1 ; CHECK-NEXT: vlgvg %r0, %v2, 0 ; CHECK-NEXT: vlgvg %r5, %v1, 1 ; CHECK-NEXT: vlgvg %r4, %v1, 0 ; CHECK-NEXT: cdsg %r4, %r0, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r4, %r5 ; CHECK-NEXT: jl .LBB5_1 ; CHECK-NEXT: # %bb.2: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw or ptr %src, i128 %b seq_cst ret i128 %res } ; Check XOR of a variable. define i128 @atomicrmw_xor(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_xor: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: .LBB6_1: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vx %v2, %v1, %v0 ; CHECK-NEXT: vlgvg %r1, %v2, 1 ; CHECK-NEXT: vlgvg %r0, %v2, 0 ; CHECK-NEXT: vlgvg %r5, %v1, 1 ; CHECK-NEXT: vlgvg %r4, %v1, 0 ; CHECK-NEXT: cdsg %r4, %r0, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r4, %r5 ; CHECK-NEXT: jl .LBB6_1 ; CHECK-NEXT: # %bb.2: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw xor ptr %src, i128 %b seq_cst ret i128 %res } ; Check signed minimum. define i128 @atomicrmw_min(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_min: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: j .LBB7_2 ; CHECK-NEXT: .LBB7_1: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB7_2 Depth=1 ; CHECK-NEXT: vlgvg %r1, %v1, 1 ; CHECK-NEXT: vlgvg %r0, %v1, 0 ; CHECK-NEXT: vlgvg %r5, %v2, 1 ; CHECK-NEXT: vlgvg %r4, %v2, 0 ; CHECK-NEXT: cdsg %r0, %r4, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r0, %r1 ; CHECK-NEXT: je .LBB7_6 ; CHECK-NEXT: .LBB7_2: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vecg %v0, %v1 ; CHECK-NEXT: jlh .LBB7_4 ; CHECK-NEXT: # %bb.3: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB7_2 Depth=1 ; CHECK-NEXT: vchlgs %v2, %v1, %v0 ; CHECK-NEXT: .LBB7_4: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB7_2 Depth=1 ; CHECK-NEXT: vlr %v2, %v1 ; CHECK-NEXT: jnl .LBB7_1 ; CHECK-NEXT: # %bb.5: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB7_2 Depth=1 ; CHECK-NEXT: vlr %v2, %v0 ; CHECK-NEXT: j .LBB7_1 ; CHECK-NEXT: .LBB7_6: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw min ptr %src, i128 %b seq_cst ret i128 %res } ; Check signed maximum. define i128 @atomicrmw_max(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_max: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: j .LBB8_2 ; CHECK-NEXT: .LBB8_1: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB8_2 Depth=1 ; CHECK-NEXT: vlgvg %r1, %v1, 1 ; CHECK-NEXT: vlgvg %r0, %v1, 0 ; CHECK-NEXT: vlgvg %r5, %v2, 1 ; CHECK-NEXT: vlgvg %r4, %v2, 0 ; CHECK-NEXT: cdsg %r0, %r4, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r0, %r1 ; CHECK-NEXT: je .LBB8_6 ; CHECK-NEXT: .LBB8_2: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: vecg %v0, %v1 ; CHECK-NEXT: jlh .LBB8_4 ; CHECK-NEXT: # %bb.3: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB8_2 Depth=1 ; CHECK-NEXT: vchlgs %v2, %v1, %v0 ; CHECK-NEXT: .LBB8_4: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB8_2 Depth=1 ; CHECK-NEXT: vlr %v2, %v1 ; CHECK-NEXT: jl .LBB8_1 ; CHECK-NEXT: # %bb.5: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB8_2 Depth=1 ; CHECK-NEXT: vlr %v2, %v0 ; CHECK-NEXT: j .LBB8_1 ; CHECK-NEXT: .LBB8_6: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw max ptr %src, i128 %b seq_cst ret i128 %res } ; Check unsigned minimum. define i128 @atomicrmw_umin(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_umin: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: j .LBB9_2 ; CHECK-NEXT: .LBB9_1: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB9_2 Depth=1 ; CHECK-NEXT: vlgvg %r1, %v1, 1 ; CHECK-NEXT: vlgvg %r0, %v1, 0 ; CHECK-NEXT: vlgvg %r5, %v2, 1 ; CHECK-NEXT: vlgvg %r4, %v2, 0 ; CHECK-NEXT: cdsg %r0, %r4, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r0, %r1 ; CHECK-NEXT: je .LBB9_6 ; CHECK-NEXT: .LBB9_2: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: veclg %v0, %v1 ; CHECK-NEXT: jlh .LBB9_4 ; CHECK-NEXT: # %bb.3: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB9_2 Depth=1 ; CHECK-NEXT: vchlgs %v2, %v1, %v0 ; CHECK-NEXT: .LBB9_4: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB9_2 Depth=1 ; CHECK-NEXT: vlr %v2, %v1 ; CHECK-NEXT: jnl .LBB9_1 ; CHECK-NEXT: # %bb.5: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB9_2 Depth=1 ; CHECK-NEXT: vlr %v2, %v0 ; CHECK-NEXT: j .LBB9_1 ; CHECK-NEXT: .LBB9_6: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw umin ptr %src, i128 %b seq_cst ret i128 %res } ; Check unsigned maximum. define i128 @atomicrmw_umax(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_umax: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v1, 0(%r3), 4 ; CHECK-NEXT: j .LBB10_2 ; CHECK-NEXT: .LBB10_1: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB10_2 Depth=1 ; CHECK-NEXT: vlgvg %r1, %v1, 1 ; CHECK-NEXT: vlgvg %r0, %v1, 0 ; CHECK-NEXT: vlgvg %r5, %v2, 1 ; CHECK-NEXT: vlgvg %r4, %v2, 0 ; CHECK-NEXT: cdsg %r0, %r4, 0(%r3) ; CHECK-NEXT: vlvgp %v1, %r0, %r1 ; CHECK-NEXT: je .LBB10_6 ; CHECK-NEXT: .LBB10_2: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: veclg %v0, %v1 ; CHECK-NEXT: jlh .LBB10_4 ; CHECK-NEXT: # %bb.3: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB10_2 Depth=1 ; CHECK-NEXT: vchlgs %v2, %v1, %v0 ; CHECK-NEXT: .LBB10_4: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB10_2 Depth=1 ; CHECK-NEXT: vlr %v2, %v1 ; CHECK-NEXT: jl .LBB10_1 ; CHECK-NEXT: # %bb.5: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB10_2 Depth=1 ; CHECK-NEXT: vlr %v2, %v0 ; CHECK-NEXT: j .LBB10_1 ; CHECK-NEXT: .LBB10_6: # %atomicrmw.end ; CHECK-NEXT: vst %v1, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw umax ptr %src, i128 %b seq_cst ret i128 %res } ; Check increment with wraparound. define i128 @atomicrmw_uinc_wrap(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_uinc_wrap: ; CHECK: # %bb.0: ; CHECK-NEXT: larl %r1, .LCPI11_0 ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v2, 0(%r3), 4 ; CHECK-NEXT: vl %v1, 0(%r1), 3 ; CHECK-NEXT: j .LBB11_2 ; CHECK-NEXT: .LBB11_1: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB11_2 Depth=1 ; CHECK-NEXT: vlgvg %r1, %v2, 1 ; CHECK-NEXT: vlgvg %r0, %v2, 0 ; CHECK-NEXT: vlgvg %r5, %v3, 1 ; CHECK-NEXT: vlgvg %r4, %v3, 0 ; CHECK-NEXT: cdsg %r0, %r4, 0(%r3) ; CHECK-NEXT: vlvgp %v2, %r0, %r1 ; CHECK-NEXT: je .LBB11_6 ; CHECK-NEXT: .LBB11_2: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: veclg %v2, %v0 ; CHECK-NEXT: jlh .LBB11_4 ; CHECK-NEXT: # %bb.3: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB11_2 Depth=1 ; CHECK-NEXT: vchlgs %v3, %v0, %v2 ; CHECK-NEXT: .LBB11_4: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB11_2 Depth=1 ; CHECK-NEXT: vgbm %v3, 0 ; CHECK-NEXT: jnl .LBB11_1 ; CHECK-NEXT: # %bb.5: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB11_2 Depth=1 ; CHECK-NEXT: vaq %v3, %v2, %v1 ; CHECK-NEXT: j .LBB11_1 ; CHECK-NEXT: .LBB11_6: # %atomicrmw.end ; CHECK-NEXT: vst %v2, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw uinc_wrap ptr %src, i128 %b seq_cst ret i128 %res } ; Check decrement with wraparound. define i128 @atomicrmw_udec_wrap(ptr %src, i128 %b) { ; CHECK-LABEL: atomicrmw_udec_wrap: ; CHECK: # %bb.0: ; CHECK-NEXT: vl %v0, 0(%r4), 3 ; CHECK-NEXT: vl %v3, 0(%r3), 4 ; CHECK-NEXT: vgbm %v1, 65535 ; CHECK-NEXT: vgbm %v2, 0 ; CHECK-NEXT: j .LBB12_2 ; CHECK-NEXT: .LBB12_1: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1 ; CHECK-NEXT: vlgvg %r1, %v3, 1 ; CHECK-NEXT: vlgvg %r0, %v3, 0 ; CHECK-NEXT: vlgvg %r5, %v4, 1 ; CHECK-NEXT: vlgvg %r4, %v4, 0 ; CHECK-NEXT: cdsg %r0, %r4, 0(%r3) ; CHECK-NEXT: vlvgp %v3, %r0, %r1 ; CHECK-NEXT: je .LBB12_8 ; CHECK-NEXT: .LBB12_2: # %atomicrmw.start ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: veclg %v0, %v3 ; CHECK-NEXT: jlh .LBB12_4 ; CHECK-NEXT: # %bb.3: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1 ; CHECK-NEXT: vchlgs %v4, %v3, %v0 ; CHECK-NEXT: .LBB12_4: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1 ; CHECK-NEXT: vlr %v5, %v0 ; CHECK-NEXT: jl .LBB12_6 ; CHECK-NEXT: # %bb.5: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1 ; CHECK-NEXT: vaq %v5, %v3, %v1 ; CHECK-NEXT: .LBB12_6: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1 ; CHECK-NEXT: vceqgs %v4, %v3, %v2 ; CHECK-NEXT: vlr %v4, %v0 ; CHECK-NEXT: je .LBB12_1 ; CHECK-NEXT: # %bb.7: # %atomicrmw.start ; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1 ; CHECK-NEXT: vlr %v4, %v5 ; CHECK-NEXT: j .LBB12_1 ; CHECK-NEXT: .LBB12_8: # %atomicrmw.end ; CHECK-NEXT: vst %v3, 0(%r2), 3 ; CHECK-NEXT: br %r14 %res = atomicrmw udec_wrap ptr %src, i128 %b seq_cst ret i128 %res }