test/CodeGen/RISCV/split-offsets.ll

   1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
   2 ; RUN: llc -mtriple=riscv32 -verify-machineinstrs < %s \
   3 ; RUN:   | FileCheck %s -check-prefix=RV32I
   4 ; RUN: llc -mtriple=riscv64 -verify-machineinstrs < %s \
   5 ; RUN:   | FileCheck %s -check-prefix=RV64I
   6
   7 ; Check that memory accesses to array elements with large offsets have those
   8 ; offsets split into a base offset, plus a smaller offset that is folded into
   9 ; the memory operation. We should also only compute that base offset once,
  10 ; since it can be shared for all memory operations in this test.
  11 define void @test1([65536 x i32]** %sp, [65536 x i32]* %t, i32 %n) {
  12 ; RV32I-LABEL: test1:
  13 ; RV32I:       # %bb.0: # %entry
  14 ; RV32I-NEXT:    lw a0, 0(a0)
  15 ; RV32I-NEXT:    lui a2, 20
  16 ; RV32I-NEXT:    addi a2, a2, -1920
  17 ; RV32I-NEXT:    add a1, a1, a2
  18 ; RV32I-NEXT:    add a0, a0, a2
  19 ; RV32I-NEXT:    addi a2, zero, 2
  20 ; RV32I-NEXT:    sw a2, 0(a0)
  21 ; RV32I-NEXT:    addi a3, zero, 1
  22 ; RV32I-NEXT:    sw a3, 4(a0)
  23 ; RV32I-NEXT:    sw a3, 0(a1)
  24 ; RV32I-NEXT:    sw a2, 4(a1)
  25 ; RV32I-NEXT:    .cfi_def_cfa_offset 0
  26 ; RV32I-NEXT:    ret
  27 ;
  28 ; RV64I-LABEL: test1:
  29 ; RV64I:       # %bb.0: # %entry
  30 ; RV64I-NEXT:    ld a0, 0(a0)
  31 ; RV64I-NEXT:    lui a2, 20
  32 ; RV64I-NEXT:    addiw a2, a2, -1920
  33 ; RV64I-NEXT:    add a1, a1, a2
  34 ; RV64I-NEXT:    add a0, a0, a2
  35 ; RV64I-NEXT:    addi a2, zero, 2
  36 ; RV64I-NEXT:    sw a2, 0(a0)
  37 ; RV64I-NEXT:    addi a3, zero, 1
  38 ; RV64I-NEXT:    sw a3, 4(a0)
  39 ; RV64I-NEXT:    sw a3, 0(a1)
  40 ; RV64I-NEXT:    sw a2, 4(a1)
  41 ; RV64I-NEXT:    .cfi_def_cfa_offset 0
  42 ; RV64I-NEXT:    ret
  43 entry: ; Straight-line case: all four GEPs and all four stores live in the entry block.
  44   %s = load [65536 x i32]*, [65536 x i32]** %sp ; %s = array pointer read through %sp
  45   %gep0 = getelementptr [65536 x i32], [65536 x i32]* %s, i64 0, i32 20000 ; element 20000 of *%s: byte offset 20000 * 4 = 80000, which the checks build once as lui 20 + addi/addiw -1920 (81920 - 1920)
  46   %gep1 = getelementptr [65536 x i32], [65536 x i32]* %s, i64 0, i32 20001 ; element 20001 of *%s: byte offset 80004, i.e. the shared 80000 base plus 4
  47   %gep2 = getelementptr [65536 x i32], [65536 x i32]* %t, i64 0, i32 20000 ; element 20000 of *%t: same 80000 offset as %gep0, applied to the second array
  48   %gep3 = getelementptr [65536 x i32], [65536 x i32]* %t, i64 0, i32 20001 ; element 20001 of *%t: same 80004 offset as %gep1
  49   store i32 2, i32* %gep0 ; expected as a store with immediate 0 off (%s + 80000)
  50   store i32 1, i32* %gep1 ; expected as a store with immediate 4 off the same base register
  51   store i32 1, i32* %gep2 ; expected as a store with immediate 0 off (%t + 80000)
  52   store i32 2, i32* %gep3 ; expected as a store with immediate 4 off the same base register
  53   ret void
  54 }
  55
  56 ; Same check as test1, but with the GEPs in a non-entry block (the loop header).
  57 define void @test2([65536 x i32]** %sp, [65536 x i32]* %t, i32 %n) {
  58 ; RV32I-LABEL: test2:
  59 ; RV32I:       # %bb.0: # %entry
  60 ; RV32I-NEXT:    mv a3, zero
  61 ; RV32I-NEXT:    lw a4, 0(a0)
  62 ; RV32I-NEXT:    lui a0, 20
  63 ; RV32I-NEXT:    addi a5, a0, -1920
  64 ; RV32I-NEXT:    add a0, a1, a5
  65 ; RV32I-NEXT:    add a1, a4, a5
  66 ; RV32I-NEXT:    bge a3, a2, .LBB1_2
  67 ; RV32I-NEXT:  .LBB1_1: # %while_body
  68 ; RV32I-NEXT:    # =>This Inner Loop Header: Depth=1
  69 ; RV32I-NEXT:    addi a4, a3, 1
  70 ; RV32I-NEXT:    sw a4, 0(a1)
  71 ; RV32I-NEXT:    sw a3, 4(a1)
  72 ; RV32I-NEXT:    sw a4, 0(a0)
  73 ; RV32I-NEXT:    sw a3, 4(a0)
  74 ; RV32I-NEXT:    mv a3, a4
  75 ; RV32I-NEXT:    blt a3, a2, .LBB1_1
  76 ; RV32I-NEXT:  .LBB1_2: # %while_end
  77 ; RV32I-NEXT:    .cfi_def_cfa_offset 0
  78 ; RV32I-NEXT:    ret
  79 ;
  80 ; RV64I-LABEL: test2:
  81 ; RV64I:       # %bb.0: # %entry
  82 ; RV64I-NEXT:    mv a3, zero
  83 ; RV64I-NEXT:    ld a4, 0(a0)
  84 ; RV64I-NEXT:    lui a0, 20
  85 ; RV64I-NEXT:    addiw a5, a0, -1920
  86 ; RV64I-NEXT:    add a0, a1, a5
  87 ; RV64I-NEXT:    add a1, a4, a5
  88 ; RV64I-NEXT:    sext.w a2, a2
  89 ; RV64I-NEXT:    sext.w a4, a3
  90 ; RV64I-NEXT:    bge a4, a2, .LBB1_2
  91 ; RV64I-NEXT:  .LBB1_1: # %while_body
  92 ; RV64I-NEXT:    # =>This Inner Loop Header: Depth=1
  93 ; RV64I-NEXT:    addi a4, a3, 1
  94 ; RV64I-NEXT:    sw a4, 0(a1)
  95 ; RV64I-NEXT:    sw a3, 4(a1)
  96 ; RV64I-NEXT:    sw a4, 0(a0)
  97 ; RV64I-NEXT:    sw a3, 4(a0)
  98 ; RV64I-NEXT:    mv a3, a4
  99 ; RV64I-NEXT:    sext.w a4, a3
 100 ; RV64I-NEXT:    blt a4, a2, .LBB1_1
 101 ; RV64I-NEXT:  .LBB1_2: # %while_end
 102 ; RV64I-NEXT:    .cfi_def_cfa_offset 0
 103 ; RV64I-NEXT:    ret
 104 entry:
 105   %s = load [65536 x i32]*, [65536 x i32]** %sp ; %s = array pointer read through %sp, loaded once before the loop
 106   br label %while_cond
 107 while_cond: ; Loop header: the GEPs live here, not in the entry block.
 108   %phi = phi i32 [ 0, %entry ], [ %i, %while_body ] ; loop counter: 0 on entry, %i when arriving from while_body
 109   %gep0 = getelementptr [65536 x i32], [65536 x i32]* %s, i64 0, i32 20000 ; element 20000 of *%s: byte offset 20000 * 4 = 80000; the checks build it before the loop (lui 20 + addi/addiw -1920)
 110   %gep1 = getelementptr [65536 x i32], [65536 x i32]* %s, i64 0, i32 20001 ; element 20001 of *%s: byte offset 80004
 111   %gep2 = getelementptr [65536 x i32], [65536 x i32]* %t, i64 0, i32 20000 ; element 20000 of *%t: same 80000 offset as %gep0
 112   %gep3 = getelementptr [65536 x i32], [65536 x i32]* %t, i64 0, i32 20001 ; element 20001 of *%t: same 80004 offset as %gep1
 113   %cmp = icmp slt i32 %phi, %n ; signed test: %phi < %n
 114   br i1 %cmp, label %while_body, label %while_end ; run the body while the test holds, otherwise leave the loop
 115 while_body:
 116   %i = add i32 %phi, 1 ; next counter value, fed back into %phi
 117   %j = add i32 %phi, 2 ; NOTE(review): %j has no uses in this function; it looks dead, confirm before removing
 118   store i32 %i, i32* %gep0 ; expected as a store with immediate 0 off (%s + 80000)
 119   store i32 %phi, i32* %gep1 ; expected as a store with immediate 4 off the same base register
 120   store i32 %i, i32* %gep2 ; expected as a store with immediate 0 off (%t + 80000)
 121   store i32 %phi, i32* %gep3 ; expected as a store with immediate 4 off the same base register
 122   br label %while_cond ; back edge to the loop header
 123 while_end:
 124   ret void
 125 }
 126