| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py |
| ; RUN: opt -vector-combine -S %s | FileCheck %s |
| |
| target triple = "arm64-apple-darwin" |
| |
| define void @load_extract_insert_store_const_idx(<225 x double>* %A) { |
| ; CHECK-LABEL: @load_extract_insert_store_const_idx( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[LV:%.*]] = load <225 x double>, <225 x double>* [[A:%.*]], align 8 |
| ; CHECK-NEXT: [[EXT_0:%.*]] = extractelement <225 x double> [[LV]], i64 0 |
| ; CHECK-NEXT: [[MUL:%.*]] = fmul double 2.000000e+01, [[EXT_0]] |
| ; CHECK-NEXT: [[EXT_1:%.*]] = extractelement <225 x double> [[LV]], i64 1 |
| ; CHECK-NEXT: [[SUB:%.*]] = fsub double [[EXT_1]], [[MUL]] |
| ; CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds <225 x double>, <225 x double>* [[A]], i64 0, i64 1 |
| ; CHECK-NEXT: store double [[SUB]], double* [[TMP0]], align 8 |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| %lv = load <225 x double>, <225 x double>* %A, align 8 |
| %ext.0 = extractelement <225 x double> %lv, i64 0 |
| %mul = fmul double 20.0, %ext.0 |
| %ext.1 = extractelement <225 x double> %lv, i64 1 |
| %sub = fsub double %ext.1, %mul |
| %ins = insertelement <225 x double> %lv, double %sub, i64 1 |
| store <225 x double> %ins, <225 x double>* %A, align 8 |
| ret void |
| } |
| |
| define void @load_extract_insert_store_var_idx_assume_valid(i64 %idx.1, i64 %idx.2, <225 x double>* %A) { |
| ; CHECK-LABEL: @load_extract_insert_store_var_idx_assume_valid( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[CMP_1:%.*]] = icmp ult i64 [[IDX_1:%.*]], 225 |
| ; CHECK-NEXT: call void @llvm.assume(i1 [[CMP_1]]) |
| ; CHECK-NEXT: [[CMP_2:%.*]] = icmp ult i64 [[IDX_2:%.*]], 225 |
| ; CHECK-NEXT: call void @llvm.assume(i1 [[CMP_2]]) |
| ; CHECK-NEXT: [[LV:%.*]] = load <225 x double>, <225 x double>* [[A:%.*]], align 8 |
| ; CHECK-NEXT: [[EXT_0:%.*]] = extractelement <225 x double> [[LV]], i64 [[IDX_1]] |
| ; CHECK-NEXT: [[MUL:%.*]] = fmul double 2.000000e+01, [[EXT_0]] |
| ; CHECK-NEXT: [[EXT_1:%.*]] = extractelement <225 x double> [[LV]], i64 [[IDX_2]] |
| ; CHECK-NEXT: [[SUB:%.*]] = fsub double [[EXT_1]], [[MUL]] |
| ; CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds <225 x double>, <225 x double>* [[A]], i64 0, i64 [[IDX_1]] |
| ; CHECK-NEXT: store double [[SUB]], double* [[TMP0]], align 8 |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| %cmp.1 = icmp ult i64 %idx.1, 225 |
| call void @llvm.assume(i1 %cmp.1) |
| %cmp.2 = icmp ult i64 %idx.2, 225 |
| call void @llvm.assume(i1 %cmp.2) |
| |
| %lv = load <225 x double>, <225 x double>* %A, align 8 |
| %ext.0 = extractelement <225 x double> %lv, i64 %idx.1 |
| %mul = fmul double 20.0, %ext.0 |
| %ext.1 = extractelement <225 x double> %lv, i64 %idx.2 |
| %sub = fsub double %ext.1, %mul |
| %ins = insertelement <225 x double> %lv, double %sub, i64 %idx.1 |
| store <225 x double> %ins, <225 x double>* %A, align 8 |
| ret void |
| } |
| |
| |
| define void @load_extract_insert_store_var_idx_no_assume_valid(i64 %idx.1, i64 %idx.2, <225 x double>* %A) { |
| ; CHECK-LABEL: @load_extract_insert_store_var_idx_no_assume_valid( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[LV:%.*]] = load <225 x double>, <225 x double>* [[A:%.*]], align 8 |
| ; CHECK-NEXT: [[EXT_0:%.*]] = extractelement <225 x double> [[LV]], i64 [[IDX_1:%.*]] |
| ; CHECK-NEXT: [[MUL:%.*]] = fmul double 2.000000e+01, [[EXT_0]] |
| ; CHECK-NEXT: [[EXT_1:%.*]] = extractelement <225 x double> [[LV]], i64 [[IDX_2:%.*]] |
| ; CHECK-NEXT: [[SUB:%.*]] = fsub double [[EXT_1]], [[MUL]] |
| ; CHECK-NEXT: [[INS:%.*]] = insertelement <225 x double> [[LV]], double [[SUB]], i64 [[IDX_1]] |
| ; CHECK-NEXT: store <225 x double> [[INS]], <225 x double>* [[A]], align 8 |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| %lv = load <225 x double>, <225 x double>* %A, align 8 |
| %ext.0 = extractelement <225 x double> %lv, i64 %idx.1 |
| %mul = fmul double 20.0, %ext.0 |
| %ext.1 = extractelement <225 x double> %lv, i64 %idx.2 |
| %sub = fsub double %ext.1, %mul |
| %ins = insertelement <225 x double> %lv, double %sub, i64 %idx.1 |
| store <225 x double> %ins, <225 x double>* %A, align 8 |
| ret void |
| } |
| |
| declare void @llvm.assume(i1) |