regbank-select.mir 5.93 KB
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -mtriple=aarch64-apple-darwin -run-pass=regbankselect -verify-machineinstrs %s -o - | FileCheck %s

...
---
name:            select_f32
alignment:       4
legalized:       true
tracksRegLiveness: true
machineFunctionInfo: {}
body:             |
  bb.0:
    liveins: $s0, $s1, $w0

    ; CHECK-LABEL: name: select_f32
    ; CHECK: liveins: $s0, $s1, $w0
    ; CHECK: [[COPY:%[0-9]+]]:gpr(s32) = COPY $w0
    ; CHECK: [[TRUNC:%[0-9]+]]:gpr(s1) = G_TRUNC [[COPY]](s32)
    ; CHECK: [[COPY1:%[0-9]+]]:fpr(s32) = COPY $s0
    ; CHECK: [[COPY2:%[0-9]+]]:fpr(s32) = COPY $s1
    ; CHECK: [[SELECT:%[0-9]+]]:fpr(s32) = G_SELECT [[TRUNC]](s1), [[COPY1]], [[COPY2]]
    ; CHECK: $s0 = COPY [[SELECT]](s32)
    ; CHECK: RET_ReallyLR implicit $s0
    %3:_(s32) = COPY $w0
    %0:_(s1) = G_TRUNC %3(s32)
    %1:_(s32) = COPY $s0
    %2:_(s32) = COPY $s1
    %4:_(s32) = G_SELECT %0(s1), %1, %2
    $s0 = COPY %4(s32)
    RET_ReallyLR implicit $s0

...
---
name:            select_f64
alignment:       4
legalized:       true
tracksRegLiveness: true
machineFunctionInfo: {}
body:             |
  bb.0:
    liveins: $d0, $d1, $w0

    ; CHECK-LABEL: name: select_f64
    ; CHECK: liveins: $d0, $d1, $w0
    ; CHECK: [[COPY:%[0-9]+]]:gpr(s32) = COPY $w0
    ; CHECK: [[TRUNC:%[0-9]+]]:gpr(s1) = G_TRUNC [[COPY]](s32)
    ; CHECK: [[COPY1:%[0-9]+]]:fpr(s64) = COPY $d0
    ; CHECK: [[COPY2:%[0-9]+]]:fpr(s64) = COPY $d1
    ; CHECK: [[SELECT:%[0-9]+]]:fpr(s64) = G_SELECT [[TRUNC]](s1), [[COPY1]], [[COPY2]]
    ; CHECK: $d0 = COPY [[SELECT]](s64)
    ; CHECK: RET_ReallyLR implicit $d0
    %3:_(s32) = COPY $w0
    %0:_(s1) = G_TRUNC %3(s32)
    %1:_(s64) = COPY $d0
    %2:_(s64) = COPY $d1
    %4:_(s64) = G_SELECT %0(s1), %1, %2
    $d0 = COPY %4(s64)
    RET_ReallyLR implicit $d0

...
---
name:            two_fpr_inputs_gpr_output
alignment:       4
legalized:       true
tracksRegLiveness: true
machineFunctionInfo: {}
body:             |
  bb.0:
    liveins: $d0, $d1, $w0
    ; CHECK-LABEL: name: two_fpr_inputs_gpr_output
    ; CHECK: liveins: $d0, $d1, $w0
    ; CHECK: [[COPY:%[0-9]+]]:gpr(s32) = COPY $w0
    ; CHECK: [[TRUNC:%[0-9]+]]:gpr(s1) = G_TRUNC [[COPY]](s32)
    ; CHECK: [[COPY1:%[0-9]+]]:fpr(s64) = COPY $d0
    ; CHECK: [[COPY2:%[0-9]+]]:fpr(s64) = COPY $d1
    ; CHECK: [[SELECT:%[0-9]+]]:fpr(s64) = G_SELECT [[TRUNC]](s1), [[COPY1]], [[COPY2]]
    ; CHECK: $x0 = COPY [[SELECT]](s64)
    ; CHECK: RET_ReallyLR implicit $x0

    ; Verify that the G_SELECT only has FPRs.
    ; The only difference between fcsel and csel are the register banks. So,
    ; if we have two FPR inputs and a GPR output, we should do a floating point
    ; select anyway. This will cost one copy for the output, but that's less
    ; than doing two to put the inputs on GPRs.

    %3:_(s32) = COPY $w0
    %0:_(s1) = G_TRUNC %3(s32)
    %1:_(s64) = COPY $d0
    %2:_(s64) = COPY $d1
    %4:_(s64) = G_SELECT %0(s1), %1, %2
    $x0 = COPY %4(s64)
    RET_ReallyLR implicit $x0

...
---
name:            one_fpr_input_fpr_output
alignment:       4
legalized:       true
tracksRegLiveness: true
machineFunctionInfo: {}
body:             |
  bb.0:
    liveins: $d0, $x1, $w0
    ; CHECK-LABEL: name: one_fpr_input_fpr_output
    ; CHECK: liveins: $d0, $x1, $w0
    ; CHECK: [[COPY:%[0-9]+]]:gpr(s32) = COPY $w0
    ; CHECK: [[TRUNC:%[0-9]+]]:gpr(s1) = G_TRUNC [[COPY]](s32)
    ; CHECK: [[COPY1:%[0-9]+]]:fpr(s64) = COPY $d0
    ; CHECK: [[COPY2:%[0-9]+]]:gpr(s64) = COPY $x1
    ; CHECK: [[COPY3:%[0-9]+]]:fpr(s64) = COPY [[COPY2]](s64)
    ; CHECK: [[SELECT:%[0-9]+]]:fpr(s64) = G_SELECT [[TRUNC]](s1), [[COPY1]], [[COPY3]]
    ; CHECK: $d0 = COPY [[SELECT]](s64)
    ; CHECK: RET_ReallyLR implicit $d0

    ; Same idea as the above test. If the output is an FPR, and one of the
    ; inputs is an FPR, then it's fewer copies to just do a FCSEL.

    %3:_(s32) = COPY $w0
    %0:_(s1) = G_TRUNC %3(s32)
    %1:_(s64) = COPY $d0
    %2:_(s64) = COPY $x1
    %4:_(s64) = G_SELECT %0(s1), %1, %2
    $d0 = COPY %4(s64)
    RET_ReallyLR implicit $d0

...
---
name:            one_fpr_input_gpr_output
alignment:       4
legalized:       true
tracksRegLiveness: true
machineFunctionInfo: {}
body:             |
  bb.0:
    liveins: $d0, $x1, $w0
    ; CHECK-LABEL: name: one_fpr_input_gpr_output
    ; CHECK: liveins: $d0, $x1, $w0
    ; CHECK: [[COPY:%[0-9]+]]:gpr(s32) = COPY $w0
    ; CHECK: [[TRUNC:%[0-9]+]]:gpr(s1) = G_TRUNC [[COPY]](s32)
    ; CHECK: [[COPY1:%[0-9]+]]:fpr(s64) = COPY $d0
    ; CHECK: [[COPY2:%[0-9]+]]:gpr(s64) = COPY $x1
    ; CHECK: [[COPY3:%[0-9]+]]:gpr(s64) = COPY [[COPY1]](s64)
    ; CHECK: [[SELECT:%[0-9]+]]:gpr(s64) = G_SELECT [[TRUNC]](s1), [[COPY3]], [[COPY2]]
    ; CHECK: $x0 = COPY [[SELECT]](s64)
    ; CHECK: RET_ReallyLR implicit $x0

    ; Now we have more GPR registers on the G_SELECT. It's cheaper here to put
    ; everything on GPR.

    %3:_(s32) = COPY $w0
    %0:_(s1) = G_TRUNC %3(s32)
    %1:_(s64) = COPY $d0
    %2:_(s64) = COPY $x1
    %4:_(s64) = G_SELECT %0(s1), %1, %2
    $x0 = COPY %4(s64)
    RET_ReallyLR implicit $x0

...
---
name:            two_gpr_input_fpr_output
alignment:       4
legalized:       true
tracksRegLiveness: true
machineFunctionInfo: {}
body:             |
  bb.0:
    liveins: $x0, $x1, $w0
    ; CHECK-LABEL: name: two_gpr_input_fpr_output
    ; CHECK: liveins: $x0, $x1, $w0
    ; CHECK: [[COPY:%[0-9]+]]:gpr(s32) = COPY $w0
    ; CHECK: [[TRUNC:%[0-9]+]]:gpr(s1) = G_TRUNC [[COPY]](s32)
    ; CHECK: [[COPY1:%[0-9]+]]:gpr(s64) = COPY $x0
    ; CHECK: [[COPY2:%[0-9]+]]:gpr(s64) = COPY $x1
    ; CHECK: [[SELECT:%[0-9]+]]:gpr(s64) = G_SELECT [[TRUNC]](s1), [[COPY1]], [[COPY2]]
    ; CHECK: $d0 = COPY [[SELECT]](s64)
    ; CHECK: RET_ReallyLR implicit $d0

    ; Same as above. The G_SELECT should get all GPRS.

    %3:_(s32) = COPY $w0
    %0:_(s1) = G_TRUNC %3(s32)
    %1:_(s64) = COPY $x0
    %2:_(s64) = COPY $x1
    %4:_(s64) = G_SELECT %0(s1), %1, %2
    $d0 = COPY %4(s64)
    RET_ReallyLR implicit $d0