; This tests some of the subtleties of Phi lowering.  In particular,
; it tests that it does the right thing when it tries to enable
; compare/branch fusing.

; RUN: %p2i -i %s --filetype=obj --disassemble --args -O2 --phi-edge-split=0 \
; RUN:   | FileCheck %s
; RUN: %p2i -i %s --filetype=obj --disassemble --args -O2 --phi-edge-split=1 \
; RUN:   | FileCheck --check-prefix=SPLIT %s

define internal i32 @testPhi1(i32 %arg) {
entry:
  %cmp1 = icmp sgt i32 %arg, 0
  br i1 %cmp1, label %next, label %target
next:
  br label %target
target:
  %merge = phi i1 [ %cmp1, %entry ], [ false, %next ]
  %result = zext i1 %merge to i32
  ret i32 %result
}
; Test that compare/branch fusing does not happen, and Phi lowering is
; put in the right place.
; CHECK-LABEL: testPhi1
; CHECK: cmp {{.*}},0x0
; CHECK: setg
; CHECK: mov [[PHI:.*]],
; CHECK: cmp {{.*}},0x0
; CHECK: je
; CHECK: mov [[PHI]],0x0
; CHECK: movzx {{.*}},[[PHI]]

define internal i32 @testPhi2(i32 %arg) {
entry:
  %cmp1 = icmp sgt i32 %arg, 0
  br i1 %cmp1, label %next, label %target
next:
  br label %target
target:
  %merge = phi i32 [ 12345, %entry ], [ 54321, %next ]
  ret i32 %merge
}
; Test that compare/branch fusing and Phi lowering happens as expected.
; CHECK-LABEL: testPhi2
; CHECK: mov {{.*}},0x3039
; CHECK: cmp {{.*}},0x0
; CHECK-NEXT: jle
; CHECK: mov [[PHI:.*]],0xd431
; CHECK: mov {{.*}},[[PHI]]

; Test that address mode inference doesn't extend past
; multi-definition, non-SSA Phi temporaries.
define internal i32 @testPhi3(i32 %arg) {
entry:
  br label %body
body:
  %merge = phi i32 [ %arg, %entry ], [ %elt, %body ]
  %interior = add i32 %merge, 1000
  ; Trick to make a basic block local copy of interior for
  ; addressing mode optimization.
  %interior__4 = add i32 %interior, 0
  %__4 = inttoptr i32 %interior__4 to i32*
  %elt = load i32, i32* %__4, align 1
  %cmp = icmp eq i32 %elt, 0
  br i1 %cmp, label %exit, label %body
exit:
  ; Same trick (making a basic block local copy).
  %interior__6 = add i32 %interior, 0
  %__6 = inttoptr i32 %interior__6 to i32*
  store i32 %arg, i32* %__6, align 1
  ret i32 %arg
}
; I can't figure out how to reliably test this for correctness, so I
; will just include patterns for the entire current O2 sequence.  This
; may need to be changed when meaningful optimizations are added.
; The key is to avoid the "bad" pattern like this:
;
; testPhi3:
; .LtestPhi3$entry:
;         mov     eax, DWORD PTR [esp+4]
;         mov     ecx, eax
; .LtestPhi3$body:
;         mov     ecx, DWORD PTR [ecx+1000]
;         cmp     ecx, 0
;         jne     .LtestPhi3$body
; .LtestPhi3$exit:
;         mov     DWORD PTR [ecx+1000], eax
;         ret
;
; This is bad because the final store address is supposed to be the
; same as the load address in the loop, but it has clearly been
; over-optimized into a null pointer dereference.

; CHECK-LABEL: testPhi3
; CHECK: push [[EBX:.*]]
; CHECK: mov [[EAX:.*]],DWORD PTR [esp
; CHECK: mov [[ECX:.*]],[[EAX]]
;;; start of loop body
; CHECK: mov [[EDX:.*]],[[ECX]]
; CHECK: mov {{.*}},DWORD PTR [{{.*}}+0x3e8]
; CHECK: cmp {{.*}},0x0
; CHECK: jne
;;; start of epilog
; CHECK: mov DWORD PTR {{.}}[[EDX]]+0x3e8],
; CHECK: pop [[EBX]]

; Test of "advanced phi lowering" with undef phi arg (integer vector).
define internal <4 x i32> @test_split_undef_int_vec(<4 x i32> %arg, i32 %cond) {
entry:
  %cmp = icmp eq i32 %cond, 0
  br i1 %cmp, label %eq, label %exit
eq:
  br label %exit
exit:
  %merge = phi <4 x i32> [ %arg, %entry ], [ undef, %eq ]
  ret <4 x i32> %merge
}
; SPLIT-LABEL: test_split_undef_int_vec
; SPLIT: pxor

; Test of "advanced phi lowering" with undef phi arg (float vector).
define internal <4 x float> @test_split_undef_float_vec(<4 x float> %arg, i32 %cond) {
entry:
  %cmp = icmp eq i32 %cond, 0
  br i1 %cmp, label %eq, label %exit
eq:
  br label %exit
exit:
  %merge = phi <4 x float> [ %arg, %entry ], [ undef, %eq ]
  ret <4 x float> %merge
}
; SPLIT-LABEL: test_split_undef_float_vec
; SPLIT: pxor

; Test of "advanced phi lowering" with undef phi arg (integer scalar).
define internal i32 @test_split_undef_int_scalar(i32 %arg, i32 %cond) {
entry:
  %cmp = icmp eq i32 %cond, 0
  br i1 %cmp, label %eq, label %exit
eq:
  br label %exit
exit:
  %merge = phi i32 [ %arg, %entry ], [ undef, %eq ]
  ret i32 %merge
}
; SPLIT-LABEL: test_split_undef_int_scalar
; SPLIT: mov {{.*}},0x0

; Test of "advanced phi lowering" with undef phi arg (float scalar).
define internal float @test_split_undef_float_scalar(float %arg, i32 %cond) {
entry:
  %cmp = icmp eq i32 %cond, 0
  br i1 %cmp, label %eq, label %exit
eq:
  br label %exit
exit:
  %merge = phi float [ %arg, %entry ], [ undef, %eq ]
  ret float %merge
}
; SPLIT-LABEL: test_split_undef_float_scalar
; SPLIT: movss {{.*}},DWORD PTR