; uniformshift.ll - vector shifts whose amount is one scalar splatted to all lanes.
; RUN: llc -mtriple=x86_64-apple-darwin -mattr=+sse2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s
; RUN: opt -mtriple=x86_64-apple-darwin -mattr=+sse2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s

; @shl - shift every i32 lane of %vector left by the single run-time amount
; %scalar. The amount is first splatted into a <4 x i32> so that all lanes
; carry the same shift count.
define <4 x i32> @shl(<4 x i32> %vector, i32 %scalar) {
  ; Cost-model expectation: the vector shl is priced at 1.
  ; SSE2: 'shl'
  ; SSE2: cost of 1 {{.*}} shl
  ; Codegen expectation: the scalar is moved into an XMM register and the
  ; whole shift is a single pslld.
  ; SSE2-CODEGEN: movd  %edi, %xmm1
  ; SSE2-CODEGEN: pslld %xmm1, %xmm0

  ; Place the amount in lane 0, then replicate lane 0 into every lane with an
  ; all-zero shuffle mask.
  %amt.lane0 = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %amt.splat = shufflevector <4 x i32> %amt.lane0, <4 x i32> undef, <4 x i32> zeroinitializer
  %shifted = shl <4 x i32> %vector, %amt.splat
  ret <4 x i32> %shifted
}

; @ashr - arithmetic right shift of every i32 lane of %vector by the single
; run-time amount %scalar, which is splatted into a <4 x i32> beforehand.
define <4 x i32> @ashr(<4 x i32> %vector, i32 %scalar) {
  ; Cost-model expectation: the vector ashr is priced at 1.
  ; SSE2: 'ashr'
  ; SSE2: cost of 1 {{.*}} ashr
  ; Codegen expectation: the scalar is moved into an XMM register and the
  ; whole shift is a single psrad.
  ; SSE2-CODEGEN: movd  %edi, %xmm1
  ; SSE2-CODEGEN: psrad %xmm1, %xmm0

  ; Build the uniform count: write lane 0, then broadcast lane 0 using an
  ; all-zero shuffle mask.
  %count.elt = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %count.vec = shufflevector <4 x i32> %count.elt, <4 x i32> undef, <4 x i32> zeroinitializer
  %result = ashr <4 x i32> %vector, %count.vec
  ret <4 x i32> %result
}

; @lshr - logical right shift of every i32 lane of %vector by the single
; run-time amount %scalar, which is splatted into a <4 x i32> beforehand.
define <4 x i32> @lshr(<4 x i32> %vector, i32 %scalar) {
  ; Cost-model expectation: the vector lshr is priced at 1.
  ; SSE2: 'lshr'
  ; SSE2: cost of 1 {{.*}} lshr
  ; Codegen expectation: the scalar is moved into an XMM register and the
  ; whole shift is a single psrld.
  ; SSE2-CODEGEN: movd  %edi, %xmm1
  ; SSE2-CODEGEN: psrld %xmm1, %xmm0

  ; Seed lane 0 with the count, then copy lane 0 to all four lanes via an
  ; all-zero shuffle mask.
  %bits.elt = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %bits.vec = shufflevector <4 x i32> %bits.elt, <4 x i32> undef, <4 x i32> zeroinitializer
  %out = lshr <4 x i32> %vector, %bits.vec
  ret <4 x i32> %out
}