; RUN: llvm-as < %s > %t1
; RUN: not llc -march=x86-64 -mattr=-sse < %t1 2> %t2
; RUN: grep "SSE register return with SSE disabled" %t2
; RUN: llc -march=x86-64 < %t1 | grep xmm
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128"
target triple = "x86_64-unknown-linux-gnu"
@f = external global float		; <float*> [#uses=4]
@d = external global double		; <double*> [#uses=4]

define void @test() nounwind {
entry:
	%0 = load float* @f, align 4		; <float> [#uses=1]
	%1 = tail call float @foo1(float %0) nounwind		; <float> [#uses=1]
	store float %1, float* @f, align 4
	%2 = load double* @d, align 8		; <double> [#uses=1]
	%3 = tail call double @foo2(double %2) nounwind		; <double> [#uses=1]
	store double %3, double* @d, align 8
	%4 = load float* @f, align 4		; <float> [#uses=1]
	%5 = tail call float @foo3(float %4) nounwind		; <float> [#uses=1]
	store float %5, float* @f, align 4
	%6 = load double* @d, align 8		; <double> [#uses=1]
	%7 = tail call double @foo4(double %6) nounwind		; <double> [#uses=1]
	store double %7, double* @d, align 8
	ret void
}

declare float @foo1(float)

declare double @foo2(double)

declare float @foo3(float)

declare double @foo4(double)