; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 ; RUN: llc < %s -mtriple=nvptx64 | FileCheck %s ; Fold: srl (or (x, shl(zext(y),c1)),c1) -> or(srl(x,c1), zext(y)) ; c1 <= leadingzeros(zext(y)) define i64 @test_or(i64 %x, i32 %y) { ; CHECK-LABEL: test_or( ; CHECK: { ; CHECK-NEXT: .reg .b64 %rd<5>; ; CHECK-EMPTY: ; CHECK-NEXT: // %bb.0: ; CHECK-NEXT: ld.param.b64 %rd1, [test_or_param_0]; ; CHECK-NEXT: ld.param.b32 %rd2, [test_or_param_1]; ; CHECK-NEXT: shr.u64 %rd3, %rd1, 5; ; CHECK-NEXT: or.b64 %rd4, %rd3, %rd2; ; CHECK-NEXT: st.param.b64 [func_retval0], %rd4; ; CHECK-NEXT: ret; %ext = zext i32 %y to i64 %shl = shl i64 %ext, 5 %or = or i64 %x, %shl %srl = lshr i64 %or, 5 ret i64 %srl } ; Fold: srl (xor (x, shl(zext(y),c1)),c1) -> xor(srl(x,c1), zext(y)) ; c1 <= leadingzeros(zext(y)) define i64 @test_xor(i64 %x, i32 %y) { ; CHECK-LABEL: test_xor( ; CHECK: { ; CHECK-NEXT: .reg .b64 %rd<5>; ; CHECK-EMPTY: ; CHECK-NEXT: // %bb.0: ; CHECK-NEXT: ld.param.b64 %rd1, [test_xor_param_0]; ; CHECK-NEXT: ld.param.b32 %rd2, [test_xor_param_1]; ; CHECK-NEXT: shr.u64 %rd3, %rd1, 5; ; CHECK-NEXT: xor.b64 %rd4, %rd3, %rd2; ; CHECK-NEXT: st.param.b64 [func_retval0], %rd4; ; CHECK-NEXT: ret; %ext = zext i32 %y to i64 %shl = shl i64 %ext, 5 %or = xor i64 %x, %shl %srl = lshr i64 %or, 5 ret i64 %srl } ; Fold: srl (and (x, shl(zext(y),c1)),c1) -> and(srl(x,c1), zext(y)) ; c1 <= leadingzeros(zext(y)) define i64 @test_and(i64 %x, i32 %y) { ; CHECK-LABEL: test_and( ; CHECK: { ; CHECK-NEXT: .reg .b64 %rd<5>; ; CHECK-EMPTY: ; CHECK-NEXT: // %bb.0: ; CHECK-NEXT: ld.param.b64 %rd1, [test_and_param_0]; ; CHECK-NEXT: ld.param.b32 %rd2, [test_and_param_1]; ; CHECK-NEXT: shr.u64 %rd3, %rd1, 5; ; CHECK-NEXT: and.b64 %rd4, %rd3, %rd2; ; CHECK-NEXT: st.param.b64 [func_retval0], %rd4; ; CHECK-NEXT: ret; %ext = zext i32 %y to i64 %shl = shl i64 %ext, 5 %or = and i64 %x, %shl %srl = lshr i64 %or, 5 ret i64 %srl } ; Fold: srl (or (x, shl(zext(y),c1)),c1) -> or(srl(x,c1), zext(y)) ; c1 <= leadingzeros(zext(y)) ; x, y - vectors define <2 x i16> @test_vec(<2 x i16> %x, <2 x i8> %y) { ; CHECK-LABEL: test_vec( ; CHECK: { ; CHECK-NEXT: .reg .b16 %rs<7>; ; CHECK-NEXT: .reg .b32 %r<4>; ; CHECK-EMPTY: ; CHECK-NEXT: // %bb.0: ; CHECK-NEXT: ld.param.v2.b16 {%rs1, %rs2}, [test_vec_param_0]; ; CHECK-NEXT: ld.param.v2.b8 {%rs3, %rs4}, [test_vec_param_1]; ; CHECK-NEXT: mov.b32 %r1, {%rs3, %rs4}; ; CHECK-NEXT: shr.u16 %rs5, %rs2, 5; ; CHECK-NEXT: shr.u16 %rs6, %rs1, 5; ; CHECK-NEXT: mov.b32 %r2, {%rs6, %rs5}; ; CHECK-NEXT: or.b32 %r3, %r2, %r1; ; CHECK-NEXT: st.param.b32 [func_retval0], %r3; ; CHECK-NEXT: ret; %ext = zext <2 x i8> %y to <2 x i16> %shl = shl <2 x i16> %ext, splat(i16 5) %or = or <2 x i16> %x, %shl %srl = lshr <2 x i16> %or, splat(i16 5) ret <2 x i16> %srl } ; Do not fold: srl (or (x, shl(zext(y),c1)),c1) -> or(srl(x,c1), zext(y)) ; Reason: c1 > leadingzeros(zext(y)). define i64 @test_negative_c(i64 %x, i32 %y) { ; CHECK-LABEL: test_negative_c( ; CHECK: { ; CHECK-NEXT: .reg .b64 %rd<6>; ; CHECK-EMPTY: ; CHECK-NEXT: // %bb.0: ; CHECK-NEXT: ld.param.b64 %rd1, [test_negative_c_param_0]; ; CHECK-NEXT: ld.param.b32 %rd2, [test_negative_c_param_1]; ; CHECK-NEXT: shl.b64 %rd3, %rd2, 33; ; CHECK-NEXT: or.b64 %rd4, %rd1, %rd3; ; CHECK-NEXT: shr.u64 %rd5, %rd4, 33; ; CHECK-NEXT: st.param.b64 [func_retval0], %rd5; ; CHECK-NEXT: ret; %ext = zext i32 %y to i64 %shl = shl i64 %ext, 33 %or = or i64 %x, %shl %srl = lshr i64 %or, 33 ret i64 %srl } declare void @use(i64) ; Do not fold: srl (or (x, shl(zext(y),c1)),c1) -> or(srl(x,c1), zext(y)) ; Reason: multiple usage of "or" define i64 @test_negative_use_lop(i64 %x, i32 %y) { ; CHECK-LABEL: test_negative_use_lop( ; CHECK: { ; CHECK-NEXT: .reg .b32 %r<2>; ; CHECK-NEXT: .reg .b64 %rd<5>; ; CHECK-EMPTY: ; CHECK-NEXT: // %bb.0: ; CHECK-NEXT: ld.param.b64 %rd1, [test_negative_use_lop_param_0]; ; CHECK-NEXT: ld.param.b32 %r1, [test_negative_use_lop_param_1]; ; CHECK-NEXT: mul.wide.u32 %rd2, %r1, 32; ; CHECK-NEXT: or.b64 %rd3, %rd1, %rd2; ; CHECK-NEXT: shr.u64 %rd4, %rd3, 5; ; CHECK-NEXT: { // callseq 0, 0 ; CHECK-NEXT: .param .b64 param0; ; CHECK-NEXT: st.param.b64 [param0], %rd3; ; CHECK-NEXT: call.uni use, (param0); ; CHECK-NEXT: } // callseq 0 ; CHECK-NEXT: st.param.b64 [func_retval0], %rd4; ; CHECK-NEXT: ret; %ext = zext i32 %y to i64 %shl = shl i64 %ext, 5 %or = or i64 %x, %shl %srl = lshr i64 %or, 5 call void @use(i64 %or) ret i64 %srl } ; Do not fold: srl (or (x, shl(zext(y),c1)),c1) -> or(srl(x,c1), zext(y)) ; Reason: multiple usage of "shl" define i64 @test_negative_use_shl(i64 %x, i32 %y) { ; CHECK-LABEL: test_negative_use_shl( ; CHECK: { ; CHECK-NEXT: .reg .b32 %r<2>; ; CHECK-NEXT: .reg .b64 %rd<5>; ; CHECK-EMPTY: ; CHECK-NEXT: // %bb.0: ; CHECK-NEXT: ld.param.b64 %rd1, [test_negative_use_shl_param_0]; ; CHECK-NEXT: ld.param.b32 %r1, [test_negative_use_shl_param_1]; ; CHECK-NEXT: mul.wide.u32 %rd2, %r1, 32; ; CHECK-NEXT: or.b64 %rd3, %rd1, %rd2; ; CHECK-NEXT: shr.u64 %rd4, %rd3, 5; ; CHECK-NEXT: { // callseq 1, 0 ; CHECK-NEXT: .param .b64 param0; ; CHECK-NEXT: st.param.b64 [param0], %rd2; ; CHECK-NEXT: call.uni use, (param0); ; CHECK-NEXT: } // callseq 1 ; CHECK-NEXT: st.param.b64 [func_retval0], %rd4; ; CHECK-NEXT: ret; %ext = zext i32 %y to i64 %shl = shl i64 %ext, 5 %or = or i64 %x, %shl %srl = lshr i64 %or, 5 call void @use(i64 %shl) ret i64 %srl }