; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown | FileCheck %s --check-prefix=X86
; RUN: llc < %s -mtriple=x86_64-unknown | FileCheck %s --check-prefix=X64

; Shift i64 integers on 32-bit target

; shl of an i64 by a zero-extended i8 amount. The i686 expectations pair
; shll with shldl and then branch on `testb $32, %cl` to patch up amounts
; with bit 5 set; the x86_64 expectations use a single shlq.
define i64 @test1(i64 %X, i8 %C) nounwind {
; X86-LABEL: test1:
; X86:       # %bb.0:
; X86-NEXT:    pushl %esi
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %esi
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl %esi, %eax
; X86-NEXT:    shll %cl, %eax
; X86-NEXT:    shldl %cl, %esi, %edx
; X86-NEXT:    testb $32, %cl
; X86-NEXT:    je .LBB0_2
; X86-NEXT:  # %bb.1:
; X86-NEXT:    movl %eax, %edx
; X86-NEXT:    xorl %eax, %eax
; X86-NEXT:  .LBB0_2:
; X86-NEXT:    popl %esi
; X86-NEXT:    retl
;
; X64-LABEL: test1:
; X64:       # %bb.0:
; X64-NEXT:    movl %esi, %ecx
; X64-NEXT:    movq %rdi, %rax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shlq %cl, %rax
; X64-NEXT:    retq
  %shift.upgrd.1 = zext i8 %C to i64 ; <i64> [#uses=1]
  %Y = shl i64 %X, %shift.upgrd.1 ; <i64> [#uses=1]
  ret i64 %Y
}

; ashr of an i64 by a zero-extended i8 amount. The i686 expectations pair
; sarl with shrdl; the `testb $32` fix-up path fills the high half with
; `sarl $31`. The x86_64 expectations use a single sarq.
define i64 @test2(i64 %X, i8 %C) nounwind {
; X86-LABEL: test2:
; X86:       # %bb.0:
; X86-NEXT:    pushl %esi
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl {{[0-9]+}}(%esp), %esi
; X86-NEXT:    movl %esi, %edx
; X86-NEXT:    sarl %cl, %edx
; X86-NEXT:    shrdl %cl, %esi, %eax
; X86-NEXT:    testb $32, %cl
; X86-NEXT:    je .LBB1_2
; X86-NEXT:  # %bb.1:
; X86-NEXT:    sarl $31, %esi
; X86-NEXT:    movl %edx, %eax
; X86-NEXT:    movl %esi, %edx
; X86-NEXT:  .LBB1_2:
; X86-NEXT:    popl %esi
; X86-NEXT:    retl
;
; X64-LABEL: test2:
; X64:       # %bb.0:
; X64-NEXT:    movl %esi, %ecx
; X64-NEXT:    movq %rdi, %rax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    sarq %cl, %rax
; X64-NEXT:    retq
  %shift.upgrd.2 = zext i8 %C to i64 ; <i64> [#uses=1]
  %Y = ashr i64 %X, %shift.upgrd.2 ; <i64> [#uses=1]
  ret i64 %Y
}

; lshr of an i64 by a zero-extended i8 amount. The i686 expectations pair
; shrl with shrdl; the `testb $32` fix-up path zeroes the high half with
; xorl. The x86_64 expectations use a single shrq.
define i64 @test3(i64 %X, i8 %C) nounwind {
; X86-LABEL: test3:
; X86:       # %bb.0:
; X86-NEXT:    pushl %esi
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl {{[0-9]+}}(%esp), %esi
; X86-NEXT:    movl %esi, %edx
; X86-NEXT:    shrl %cl, %edx
; X86-NEXT:    shrdl %cl, %esi, %eax
; X86-NEXT:    testb $32, %cl
; X86-NEXT:    je .LBB2_2
; X86-NEXT:  # %bb.1:
; X86-NEXT:    movl %edx, %eax
; X86-NEXT:    xorl %edx, %edx
; X86-NEXT:  .LBB2_2:
; X86-NEXT:    popl %esi
; X86-NEXT:    retl
;
; X64-LABEL: test3:
; X64:       # %bb.0:
; X64-NEXT:    movl %esi, %ecx
; X64-NEXT:    movq %rdi, %rax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrq %cl, %rax
; X64-NEXT:    retq
  %shift.upgrd.3 = zext i8 %C to i64 ; <i64> [#uses=1]
  %Y = lshr i64 %X, %shift.upgrd.3 ; <i64> [#uses=1]
  ret i64 %Y
}

; Combine 2xi32/2xi16 shifts into SHLD

; (%A << %C) | (%B >> (32 - %C)) with an i8 amount; both targets are
; expected to emit a single shldl.
define i32 @test4(i32 %A, i32 %B, i8 %C) nounwind {
; X86-LABEL: test4:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shldl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test4:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shldl %cl, %esi, %eax
; X64-NEXT:    retq
  %shift.upgrd.4 = zext i8 %C to i32 ; <i32> [#uses=1]
  %X = shl i32 %A, %shift.upgrd.4 ; <i32> [#uses=1]
  %Cv = sub i8 32, %C ; <i8> [#uses=1]
  %shift.upgrd.5 = zext i8 %Cv to i32 ; <i32> [#uses=1]
  %Y = lshr i32 %B, %shift.upgrd.5 ; <i32> [#uses=1]
  %Z = or i32 %Y, %X ; <i32> [#uses=1]
  ret i32 %Z
}

; i16 variant of test4: (%A << %C) | (%B >> (16 - %C)). The expected output
; is a shldw whose count is first masked with `andb $15`.
define i16 @test5(i16 %A, i16 %B, i8 %C) nounwind {
; X86-LABEL: test5:
; X86:       # %bb.0:
; X86-NEXT:    movzwl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    andb $15, %cl
; X86-NEXT:    shldw %cl, %dx, %ax
; X86-NEXT:    retl
;
; X64-LABEL: test5:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    andb $15, %cl
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shldw %cl, %si, %ax
; X64-NEXT:    # kill: def $ax killed $ax killed $eax
; X64-NEXT:    retq
  %shift.upgrd.6 = zext i8 %C to i16 ; <i16> [#uses=1]
  %X = shl i16 %A, %shift.upgrd.6 ; <i16> [#uses=1]
  %Cv = sub i8 16, %C ; <i8> [#uses=1]
  %shift.upgrd.7 = zext i8 %Cv to i16 ; <i16> [#uses=1]
  %Y = lshr i16 %B, %shift.upgrd.7 ; <i16> [#uses=1]
  %Z = or i16 %Y, %X ; <i16> [#uses=1]
  ret i16 %Z
}

; Combine 2xi32/2xi16 shifts into SHRD

; (%A >> %C) | (%B << (32 - %C)) with an i8 amount; both targets are
; expected to emit a single shrdl.
define i32 @test6(i32 %A, i32 %B, i8 %C) nounwind {
; X86-LABEL: test6:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shrdl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test6:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrdl %cl, %esi, %eax
; X64-NEXT:    retq
  %shift.upgrd.4 = zext i8 %C to i32 ; <i32> [#uses=1]
  %X = lshr i32 %A, %shift.upgrd.4 ; <i32> [#uses=1]
  %Cv = sub i8 32, %C ; <i8> [#uses=1]
  %shift.upgrd.5 = zext i8 %Cv to i32 ; <i32> [#uses=1]
  %Y = shl i32 %B, %shift.upgrd.5 ; <i32> [#uses=1]
  %Z = or i32 %Y, %X ; <i32> [#uses=1]
  ret i32 %Z
}

; i16 variant of test6: (%A >> %C) | (%B << (16 - %C)). The expected output
; is a shrdw whose count is first masked with `andb $15`.
define i16 @test7(i16 %A, i16 %B, i8 %C) nounwind {
; X86-LABEL: test7:
; X86:       # %bb.0:
; X86-NEXT:    movzwl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    andb $15, %cl
; X86-NEXT:    shrdw %cl, %dx, %ax
; X86-NEXT:    retl
;
; X64-LABEL: test7:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    andb $15, %cl
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrdw %cl, %si, %ax
; X64-NEXT:    # kill: def $ax killed $ax killed $eax
; X64-NEXT:    retq
  %shift.upgrd.6 = zext i8 %C to i16 ; <i16> [#uses=1]
  %X = lshr i16 %A, %shift.upgrd.6 ; <i16> [#uses=1]
  %Cv = sub i8 16, %C ; <i8> [#uses=1]
  %shift.upgrd.7 = zext i8 %Cv to i16 ; <i16> [#uses=1]
  %Y = shl i16 %B, %shift.upgrd.7 ; <i16> [#uses=1]
  %Z = or i16 %Y, %X ; <i16> [#uses=1]
  ret i16 %Z
}

; Shift i64 integers on 32-bit target by shift value less than 32 (PR14593)

; shl of an i64 by (%bits & 31). Because the amount is masked below 32, the
; i686 expectations contain shll + shldl with no `testb $32` fix-up branch.
define i64 @test8(i64 %val, i32 %bits) nounwind {
; X86-LABEL: test8:
; X86:       # %bb.0:
; X86-NEXT:    pushl %esi
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %esi
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl %esi, %eax
; X86-NEXT:    shll %cl, %eax
; X86-NEXT:    shldl %cl, %esi, %edx
; X86-NEXT:    popl %esi
; X86-NEXT:    retl
;
; X64-LABEL: test8:
; X64:       # %bb.0:
; X64-NEXT:    movl %esi, %ecx
; X64-NEXT:    movq %rdi, %rax
; X64-NEXT:    andb $31, %cl
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shlq %cl, %rax
; X64-NEXT:    retq
  %and = and i32 %bits, 31
  %sh_prom = zext i32 %and to i64
  %shl = shl i64 %val, %sh_prom
  ret i64 %shl
}

; ashr of an i64 by (%bits & 31). The i686 expectations are a branch-free
; shrdl + sarl pair.
define i64 @test9(i64 %val, i32 %bits) nounwind {
; X86-LABEL: test9:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    shrdl %cl, %edx, %eax
; X86-NEXT:    sarl %cl, %edx
; X86-NEXT:    retl
;
; X64-LABEL: test9:
; X64:       # %bb.0:
; X64-NEXT:    movl %esi, %ecx
; X64-NEXT:    movq %rdi, %rax
; X64-NEXT:    andb $31, %cl
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    sarq %cl, %rax
; X64-NEXT:    retq
  %and = and i32 %bits, 31
  %sh_prom = zext i32 %and to i64
  %ashr = ashr i64 %val, %sh_prom
  ret i64 %ashr
}

; lshr of an i64 by (%bits & 31). The i686 expectations are a branch-free
; shrdl + shrl pair.
define i64 @test10(i64 %val, i32 %bits) nounwind {
; X86-LABEL: test10:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    shrdl %cl, %edx, %eax
; X86-NEXT:    shrl %cl, %edx
; X86-NEXT:    retl
;
; X64-LABEL: test10:
; X64:       # %bb.0:
; X64-NEXT:    movl %esi, %ecx
; X64-NEXT:    movq %rdi, %rax
; X64-NEXT:    andb $31, %cl
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrq %cl, %rax
; X64-NEXT:    retq
  %and = and i32 %bits, 31
  %sh_prom = zext i32 %and to i64
  %lshr = lshr i64 %val, %sh_prom
  ret i64 %lshr
}

; SHLD/SHRD manual shifts

; (%hi << n) | (%lo >> (32 - n)) with n = %bits & 31; expected to become a
; single shldl (the explicit mask does not appear in the expected output).
define i32 @test11(i32 %hi, i32 %lo, i32 %bits) nounwind {
; X86-LABEL: test11:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shldl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test11:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shldl %cl, %esi, %eax
; X64-NEXT:    retq
  %and = and i32 %bits, 31
  %and32 = sub i32 32, %and
  %sh_lo = lshr i32 %lo, %and32
  %sh_hi = shl i32 %hi, %and
  %sh = or i32 %sh_lo, %sh_hi
  ret i32 %sh
}

; (%hi << (32 - n)) | (%lo >> n) with n = %bits & 31; expected to become a
; single shrdl.
define i32 @test12(i32 %hi, i32 %lo, i32 %bits) nounwind {
; X86-LABEL: test12:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shrdl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test12:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %esi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrdl %cl, %edi, %eax
; X64-NEXT:    retq
  %and = and i32 %bits, 31
  %and32 = sub i32 32, %and
  %sh_lo = shl i32 %hi, %and32
  %sh_hi = lshr i32 %lo, %and
  %sh = or i32 %sh_lo, %sh_hi
  ret i32 %sh
}

; Same shape as test11 but without masking %bits: the inverse amount is
; `32 - %bits`. Expected to become a single shldl.
define i32 @test13(i32 %hi, i32 %lo, i32 %bits) nounwind {
; X86-LABEL: test13:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shldl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test13:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shldl %cl, %esi, %eax
; X64-NEXT:    retq
  %bits32 = sub i32 32, %bits
  %sh_lo = lshr i32 %lo, %bits32
  %sh_hi = shl i32 %hi, %bits
  %sh = or i32 %sh_lo, %sh_hi
  ret i32 %sh
}

; Same shape as test12 but without masking %bits: the inverse amount is
; `32 - %bits`. Expected to become a single shrdl.
define i32 @test14(i32 %hi, i32 %lo, i32 %bits) nounwind {
; X86-LABEL: test14:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shrdl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test14:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %esi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrdl %cl, %edi, %eax
; X64-NEXT:    retq
  %bits32 = sub i32 32, %bits
  %sh_lo = shl i32 %hi, %bits32
  %sh_hi = lshr i32 %lo, %bits
  %sh = or i32 %sh_lo, %sh_hi
  ret i32 %sh
}

; Inverse amount written as `%bits xor 31` applied to %lo pre-shifted right
; by one: (%hi << %bits) | ((%lo >> 1) >> (%bits ^ 31)). Expected to become
; a single shldl.
define i32 @test15(i32 %hi, i32 %lo, i32 %bits) nounwind {
; X86-LABEL: test15:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shldl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test15:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shldl %cl, %esi, %eax
; X64-NEXT:    retq
  %bits32 = xor i32 %bits, 31
  %lo2 = lshr i32 %lo, 1
  %sh_lo = lshr i32 %lo2, %bits32
  %sh_hi = shl i32 %hi, %bits
  %sh = or i32 %sh_lo, %sh_hi
  ret i32 %sh
}

; Right-shift counterpart of test15:
; (%hi >> %bits) | ((%lo << 1) << (%bits ^ 31)). Expected to become a single
; shrdl.
define i32 @test16(i32 %hi, i32 %lo, i32 %bits) nounwind {
; X86-LABEL: test16:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shrdl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test16:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrdl %cl, %esi, %eax
; X64-NEXT:    retq
  %bits32 = xor i32 %bits, 31
  %lo2 = shl i32 %lo, 1
  %sh_lo = shl i32 %lo2, %bits32
  %sh_hi = lshr i32 %hi, %bits
  %sh = or i32 %sh_lo, %sh_hi
  ret i32 %sh
}

; Same as test16 except the pre-shift of %lo by one is spelled
; `add %lo, %lo` instead of `shl %lo, 1`. Expected to become a single shrdl.
define i32 @test17(i32 %hi, i32 %lo, i32 %bits) nounwind {
; X86-LABEL: test17:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shrdl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test17:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrdl %cl, %esi, %eax
; X64-NEXT:    retq
  %bits32 = xor i32 %bits, 31
  %lo2 = add i32 %lo, %lo
  %sh_lo = shl i32 %lo2, %bits32
  %sh_hi = lshr i32 %hi, %bits
  %sh = or i32 %sh_lo, %sh_hi
  ret i32 %sh
}

; Like test11, but the shift amounts are computed in i8 (trunc, mask with
; 31, subtract from 32) and zero-extended back to i32 before shifting.
; Expected to become a single shldl.
; NOTE(review): the `64` suffix in %tand64/%and64 is only a name; the value
; is `32 - (%bits & 31)`.
define i32 @test18(i32 %hi, i32 %lo, i32 %bits) nounwind {
; X86-LABEL: test18:
; X86:       # %bb.0:
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    shldl %cl, %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test18:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shldl %cl, %esi, %eax
; X64-NEXT:    retq
  %tbits = trunc i32 %bits to i8
  %tand = and i8 %tbits, 31
  %tand64 = sub i8 32, %tand
  %and = zext i8 %tand to i32
  %and64 = zext i8 %tand64 to i32
  %sh_lo = lshr i32 %lo, %and64
  %sh_hi = shl i32 %hi, %and
  %sh = or i32 %sh_lo, %sh_hi
  ret i32 %sh
}

; These are not valid shld/shrd patterns. When the shift amount modulo
; the bitwidth is zero, the result should be an OR of both operands not a
; shift.

; Computes (%0 << (%2 & 31)) | (%1 >> ((0 - %2) & 31)). When %2 is a
; multiple of 32 both shift amounts are zero and the result is %0 | %1, so
; this must stay as separate shifts: the expected output is
; shll / negb / shrl / orl on both targets, with no shldl.
define i32 @not_shld_i32(i32, i32, i32) {
; X86-LABEL: not_shld_i32:
; X86:       # %bb.0:
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    shll %cl, %edx
; X86-NEXT:    negb %cl
; X86-NEXT:    shrl %cl, %eax
; X86-NEXT:    orl %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: not_shld_i32:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %esi, %eax
; X64-NEXT:    shll %cl, %edi
; X64-NEXT:    negb %cl
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shrl %cl, %eax
; X64-NEXT:    orl %edi, %eax
; X64-NEXT:    retq
  %4 = and i32 %2, 31
  %5 = shl i32 %0, %4
  %6 = sub i32 0, %2
  %7 = and i32 %6, 31
  %8 = lshr i32 %1, %7
  %9 = or i32 %5, %8
  ret i32 %9
}

; Mirror of not_shld_i32 with the shift directions swapped:
; (%0 >> (%2 & 31)) | (%1 << ((0 - %2) & 31)). When %2 is a multiple of 32
; the result is %0 | %1, so the expected output is shrl / negb / shll / orl
; on both targets, with no shrdl.
define i32 @not_shrd_i32(i32, i32, i32) {
; X86-LABEL: not_shrd_i32:
; X86:       # %bb.0:
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movzbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT:    movl {{[0-9]+}}(%esp), %edx
; X86-NEXT:    shrl %cl, %edx
; X86-NEXT:    negb %cl
; X86-NEXT:    shll %cl, %eax
; X86-NEXT:    orl %edx, %eax
; X86-NEXT:    retl
;
; X64-LABEL: not_shrd_i32:
; X64:       # %bb.0:
; X64-NEXT:    movl %edx, %ecx
; X64-NEXT:    movl %esi, %eax
; X64-NEXT:    shrl %cl, %edi
; X64-NEXT:    negb %cl
; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
; X64-NEXT:    shll %cl, %eax
; X64-NEXT:    orl %edi, %eax
; X64-NEXT:    retq
  %4 = and i32 %2, 31
  %5 = lshr i32 %0, %4
  %6 = sub i32 0, %2
  %7 = and i32 %6, 31
  %8 = shl i32 %1, %7
  %9 = or i32 %5, %8
  ret i32 %9
}