; RUN: llc < %s -march=x86 -mattr=+sse2                | not grep punpck
; RUN: llc < %s -march=x86 -mattr=+sse2                |     grep pshufd

define i32 @t() nounwind {
entry:
	%a = alloca <4 x i32>		; <<4 x i32>*> [#uses=2]
	%b = alloca <4 x i32>		; <<4 x i32>*> [#uses=5]
	store volatile <4 x i32> < i32 0, i32 1, i32 2, i32 3 >, <4 x i32>* %a
	%tmp = load <4 x i32>* %a		; <<4 x i32>> [#uses=1]
	store <4 x i32> %tmp, <4 x i32>* %b
	%tmp1 = load <4 x i32>* %b		; <<4 x i32>> [#uses=1]
	%tmp2 = load <4 x i32>* %b		; <<4 x i32>> [#uses=1]
	%punpckldq = shufflevector <4 x i32> %tmp1, <4 x i32> %tmp2, <4 x i32> < i32 0, i32 4, i32 1, i32 5 >		; <<4 x i32>> [#uses=1]
	store <4 x i32> %punpckldq, <4 x i32>* %b
	%tmp3 = load <4 x i32>* %b		; <<4 x i32>> [#uses=1]
	%result = extractelement <4 x i32> %tmp3, i32 0		; <i32> [#uses=1]
	ret i32 %result
}