|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5 |
| 2 | +; RUN: opt -passes=sandbox-vectorizer -sbvec-vec-reg-bits=1024 -sbvec-allow-non-pow2 -sbvec-passes="seed-collection<tr-save,bottom-up-vec,tr-accept>" --sbvec-stop-at=0 %s -S | FileCheck %s --check-prefix=STOPAT0 |
| 3 | +; RUN: opt -passes=sandbox-vectorizer -sbvec-vec-reg-bits=1024 -sbvec-allow-non-pow2 -sbvec-passes="seed-collection<tr-save,bottom-up-vec,tr-accept>" --sbvec-stop-at=1 %s -S | FileCheck %s --check-prefix=STOPAT1 |
| 4 | +; RUN: opt -passes=sandbox-vectorizer -sbvec-vec-reg-bits=1024 -sbvec-allow-non-pow2 -sbvec-passes="seed-collection<tr-save,bottom-up-vec,tr-accept>" --sbvec-stop-at=2 %s -S | FileCheck %s --check-prefix=STOPAT2 |
| 5 | + |
| 6 | +define void @widen(ptr %ptrA, ptr %ptrB) { |
| 7 | +; STOPAT0-LABEL: define void @widen( |
| 8 | +; STOPAT0-SAME: ptr [[PTRA:%.*]], ptr [[PTRB:%.*]]) { |
| 9 | +; STOPAT0-NEXT: [[PTRA0:%.*]] = getelementptr float, ptr [[PTRA]], i32 0 |
| 10 | +; STOPAT0-NEXT: [[PTRA1:%.*]] = getelementptr float, ptr [[PTRA]], i32 1 |
| 11 | +; STOPAT0-NEXT: [[LDA0:%.*]] = load float, ptr [[PTRA0]], align 4 |
| 12 | +; STOPAT0-NEXT: [[LDA1:%.*]] = load float, ptr [[PTRA1]], align 4 |
| 13 | +; STOPAT0-NEXT: store float [[LDA0]], ptr [[PTRA0]], align 4 |
| 14 | +; STOPAT0-NEXT: store float [[LDA1]], ptr [[PTRA1]], align 4 |
| 15 | +; STOPAT0-NEXT: [[PTRB0:%.*]] = getelementptr float, ptr [[PTRB]], i32 0 |
| 16 | +; STOPAT0-NEXT: [[PTRB1:%.*]] = getelementptr float, ptr [[PTRB]], i32 1 |
| 17 | +; STOPAT0-NEXT: [[LDB0:%.*]] = load float, ptr [[PTRB0]], align 4 |
| 18 | +; STOPAT0-NEXT: [[LDB1:%.*]] = load float, ptr [[PTRB1]], align 4 |
| 19 | +; STOPAT0-NEXT: store float [[LDB0]], ptr [[PTRB0]], align 4 |
| 20 | +; STOPAT0-NEXT: store float [[LDB1]], ptr [[PTRB1]], align 4 |
| 21 | +; STOPAT0-NEXT: ret void |
| 22 | +; |
| 23 | +; STOPAT1-LABEL: define void @widen( |
| 24 | +; STOPAT1-SAME: ptr [[PTRA:%.*]], ptr [[PTRB:%.*]]) { |
| 25 | +; STOPAT1-NEXT: [[PTRA0:%.*]] = getelementptr float, ptr [[PTRA]], i32 0 |
| 26 | +; STOPAT1-NEXT: [[VECL:%.*]] = load <2 x float>, ptr [[PTRA0]], align 4 |
| 27 | +; STOPAT1-NEXT: store <2 x float> [[VECL]], ptr [[PTRA0]], align 4 |
| 28 | +; STOPAT1-NEXT: [[PTRB0:%.*]] = getelementptr float, ptr [[PTRB]], i32 0 |
| 29 | +; STOPAT1-NEXT: [[PTRB1:%.*]] = getelementptr float, ptr [[PTRB]], i32 1 |
| 30 | +; STOPAT1-NEXT: [[LDB0:%.*]] = load float, ptr [[PTRB0]], align 4 |
| 31 | +; STOPAT1-NEXT: [[LDB1:%.*]] = load float, ptr [[PTRB1]], align 4 |
| 32 | +; STOPAT1-NEXT: store float [[LDB0]], ptr [[PTRB0]], align 4 |
| 33 | +; STOPAT1-NEXT: store float [[LDB1]], ptr [[PTRB1]], align 4 |
| 34 | +; STOPAT1-NEXT: ret void |
| 35 | +; |
| 36 | +; STOPAT2-LABEL: define void @widen( |
| 37 | +; STOPAT2-SAME: ptr [[PTRA:%.*]], ptr [[PTRB:%.*]]) { |
| 38 | +; STOPAT2-NEXT: [[PTRA0:%.*]] = getelementptr float, ptr [[PTRA]], i32 0 |
| 39 | +; STOPAT2-NEXT: [[VECL:%.*]] = load <2 x float>, ptr [[PTRA0]], align 4 |
| 40 | +; STOPAT2-NEXT: store <2 x float> [[VECL]], ptr [[PTRA0]], align 4 |
| 41 | +; STOPAT2-NEXT: [[PTRB0:%.*]] = getelementptr float, ptr [[PTRB]], i32 0 |
| 42 | +; STOPAT2-NEXT: [[VECL1:%.*]] = load <2 x float>, ptr [[PTRB0]], align 4 |
| 43 | +; STOPAT2-NEXT: store <2 x float> [[VECL1]], ptr [[PTRB0]], align 4 |
| 44 | +; STOPAT2-NEXT: ret void |
| 45 | +; |
| 46 | + %ptrA0 = getelementptr float, ptr %ptrA, i32 0 |
| 47 | + %ptrA1 = getelementptr float, ptr %ptrA, i32 1 |
| 48 | + %ldA0 = load float, ptr %ptrA0 |
| 49 | + %ldA1 = load float, ptr %ptrA1 |
| 50 | + store float %ldA0, ptr %ptrA0 |
| 51 | + store float %ldA1, ptr %ptrA1 |
| 52 | + |
| 53 | + %ptrB0 = getelementptr float, ptr %ptrB, i32 0 |
| 54 | + %ptrB1 = getelementptr float, ptr %ptrB, i32 1 |
| 55 | + %ldB0 = load float, ptr %ptrB0 |
| 56 | + %ldB1 = load float, ptr %ptrB1 |
| 57 | + store float %ldB0, ptr %ptrB0 |
| 58 | + store float %ldB1, ptr %ptrB1 |
| 59 | + |
| 60 | + ret void |
| 61 | +} |
0 commit comments