; RUN: opt -licm -mtriple aarch64-linux-gnu -mattr=+sve -S < %s | FileCheck %s

; Loop-invariant code motion tests for scalable-vector (SVE) memory operations.
; Every function below contains a memory read whose address operands do not
; change inside the loop; the FileCheck directives require that the read is
; absent from the entry block and still present in for.body, i.e. that LICM
; leaves it where it is.

; A <vscale x 2 x i64> load from a loop-invariant pointer. The pointer is
; covered by an invariant.start of a fixed 16 bytes, while the loaded type's
; size scales with vscale.
; NOTE(review): presumably the load must stay in the loop because its size is
; not known to fit inside the 16 invariant bytes (and the loop also stores
; through %out) - confirm against the LICM / alias-analysis implementation.
define void @no_hoist_load1_nxv2i64(<vscale x 2 x i64>* %out, i8* %in8, i32 %n) {
; CHECK-LABEL: @no_hoist_load1_nxv2i64(
; CHECK: entry:
; CHECK-NOT: load
; CHECK: for.body:
; CHECK: load
entry:
  ; Guard: the loop body is entered only when %n is non-zero.
  %cmp0 = icmp ugt i32 %n, 0
  %invst = call {}* @llvm.invariant.start.p0i8(i64 16, i8* %in8)
  %in = bitcast i8* %in8 to <vscale x 2 x i64>*
  br i1 %cmp0, label %for.body, label %for.end

for.body:
  %i = phi i32 [0, %entry], [%inc, %for.body]
  %i2 = zext i32 %i to i64
  %ptr = getelementptr <vscale x 2 x i64>, <vscale x 2 x i64>* %out, i64 %i2
  ; Address %in is defined in the entry block and never changes in the loop.
  %val = load <vscale x 2 x i64>, <vscale x 2 x i64>* %in, align 16
  store <vscale x 2 x i64> %val, <vscale x 2 x i64>* %ptr, align 16
  %inc = add nuw nsw i32 %i, 1
  %cmp = icmp ult i32 %inc, %n
  br i1 %cmp, label %for.body, label %for.end

for.end:
  ret void
}

; An SVE gather intrinsic whose operands (%pred, %ptr_vec, constant 0) are all
; loop-invariant, in a loop that also stores through %out_ptr.
; NOTE(review): presumably the gather must stay in the loop because the store
; may write memory that the gather reads - confirm.
define void @no_hoist_gather(<vscale x 2 x i32>* %out_ptr, <vscale x 2 x i32>* %in_ptr, <vscale x 2 x i64> %ptr_vec, i64 %n, <vscale x 2 x i1> %pred) {
; CHECK-LABEL: @no_hoist_gather(
; CHECK: entry:
; CHECK-NOT: llvm.aarch64.sve.ld1.gather.scalar.offset
; CHECK: for.body:
; CHECK: llvm.aarch64.sve.ld1.gather.scalar.offset
entry:
  br label %for.body

for.body:
  %i = phi i64 [0, %entry], [%inc, %for.body]
  %gather = call <vscale x 2 x i32> @llvm.aarch64.sve.ld1.gather.scalar.offset.nxv2i32.nxv2i64(<vscale x 2 x i1> %pred, <vscale x 2 x i64> %ptr_vec, i64 0)
  %in_ptr_gep = getelementptr <vscale x 2 x i32>, <vscale x 2 x i32>* %in_ptr, i64 %i
  %in_ptr_load = load <vscale x 2 x i32>, <vscale x 2 x i32>* %in_ptr_gep, align 8
  %sum = add <vscale x 2 x i32> %gather, %in_ptr_load
  %out_ptr_gep = getelementptr <vscale x 2 x i32>, <vscale x 2 x i32>* %out_ptr, i64 %i
  store <vscale x 2 x i32> %sum, <vscale x 2 x i32>* %out_ptr_gep, align 8
  %inc = add nuw nsw i64 %i, 1
  %cmp = icmp ult i64 %inc, %n
  br i1 %cmp, label %for.body, label %for.end

for.end:
  ret void
}

; A plain scalable-vector load from the loop-invariant pointer %in_ptr, in a
; loop whose only other memory operation is an SVE scatter intrinsic call.
; NOTE(review): presumably the load must stay in the loop because the scatter
; may write memory that the load reads - confirm. %out_ptr is unused here.
define void @no_hoist_scatter(<vscale x 2 x i32>* %out_ptr, <vscale x 2 x i32>* %in_ptr, <vscale x 2 x i64> %ptr_vec, i64 %n, <vscale x 2 x i1> %pred) {
; CHECK-LABEL: @no_hoist_scatter(
; CHECK: entry:
; CHECK-NOT: load
; CHECK: for.body:
; CHECK: load
entry:
  br label %for.body

for.body:
  %i = phi i64 [0, %entry], [%inc, %for.body]
  %in_ptr_load = load <vscale x 2 x i32>, <vscale x 2 x i32>* %in_ptr, align 8
  ; The induction variable is passed as the scatter's scalar offset operand.
  call void @llvm.aarch64.sve.st1.scatter.scalar.offset.nxv2i32.nxv2i64(<vscale x 2 x i32> %in_ptr_load, <vscale x 2 x i1> %pred, <vscale x 2 x i64> %ptr_vec, i64 %i)
  %inc = add nuw nsw i64 %i, 1
  %cmp = icmp ult i64 %inc, %n
  br i1 %cmp, label %for.body, label %for.end

for.end:
  ret void
}

; Intrinsic declarations used by the tests above.
declare {}* @llvm.invariant.start.p0i8(i64, i8* nocapture) nounwind readonly

declare void @llvm.aarch64.sve.st1.scatter.scalar.offset.nxv2i32.nxv2i64(<vscale x 2 x i32>, <vscale x 2 x i1>, <vscale x 2 x i64>, i64)

declare <vscale x 2 x i32> @llvm.aarch64.sve.ld1.gather.scalar.offset.nxv2i32.nxv2i64(<vscale x 2 x i1>, <vscale x 2 x i64>, i64)