Fix GEP lowering overflow issues

YuriPlyakhin · igcbot · commit 314d922f43b6 · 2025-06-25T01:53:03.000+02:00
This change prevents GEP simplification from using indexes that are
potentially negative and are then zero-extended to 64 bits, because
zero-extending a negative value may turn it into a large positive one.
diff --git a/IGC/Compiler/CISACodeGen/GenIRLowering.cpp b/IGC/Compiler/CISACodeGen/GenIRLowering.cpp
@@ -1,6 +1,6 @@
 /*========================== begin_copyright_notice ============================
 
-Copyright (C) 2017-2021 Intel Corporation
+Copyright (C) 2017-2025 Intel Corporation
 
 SPDX-License-Identifier: MIT
 
@@ -441,6 +441,9 @@ bool GEPLowering::simplifyGEP(BasicBlock &BB) const {
         auto *Idx = GEP->getOperand(1);
         if (auto *ZExt = dyn_cast<ZExtInst>(Idx)) {
             Idx = ZExt->getOperand(0);
+            auto *Op = dyn_cast<OverflowingBinaryOperator>(Idx);
+            if (Op && !Op->hasNoUnsignedWrap())
+              continue;
         } else if (auto *SExt = dyn_cast<SExtInst>(Idx)) {
             Idx = SExt->getOperand(0);
             Operator* Opr = dyn_cast<Operator>(Idx);
diff --git a/IGC/Compiler/tests/GEPLowering/gep_simplification-typed-pointers.ll b/IGC/Compiler/tests/GEPLowering/gep_simplification-typed-pointers.ll
@@ -1,6 +1,6 @@
 ;=========================== begin_copyright_notice ============================
 ;
-; Copyright (C) 2022-2024 Intel Corporation
+; Copyright (C) 2022-2025 Intel Corporation
 ;
 ; SPDX-License-Identifier: MIT
 ;
@@ -36,21 +36,21 @@ define spir_kernel void @test_gep(i32 addrspace(1)* %dst, i32 addrspace(1)* %src
 case1:
   %simdLaneId16 = call i16 @llvm.genx.GenISA.simdLaneId()
   %simdLaneId = zext i16 %simdLaneId16 to i32
-  %idbase1 = add nsw i32 %Offset32, %simdLaneId
+  %idbase1 = add nsw nuw i32 %Offset32, %simdLaneId
   %id1.1 = zext i32 %idbase1 to i64
   %addr1.1 = getelementptr inbounds i32, i32 addrspace(1)* %src, i64 %id1.1
   %res1.0 = load i32, i32 addrspace(1)* %addr1.1, align 4
-  %add11.1 = add nsw i32 %idbase1, 4
+  %add11.1 = add nsw nuw i32 %idbase1, 4
   %id1.2 = zext i32 %add11.1 to i64
   %addr1.2 = getelementptr inbounds i32, i32 addrspace(1)* %src, i64 %id1.2
   %res1.1 = load i32, i32 addrspace(1)* %addr1.2, align 4
   %sum1.0 = add nsw i32 %res1.0, %res1.1
-  %add11.2 = add nsw i32 %idbase1, 8
+  %add11.2 = add nsw nuw i32 %idbase1, 8
   %id1.3 = zext i32 %add11.2 to i64
   %addr1.3 = getelementptr inbounds i32, i32 addrspace(1)* %src, i64 %id1.3
   %res1.2 = load i32, i32 addrspace(1)* %addr1.3, align 4
   %sum1.1 = add nsw i32 %sum1.0, %res1.2
-  %add11.3 = add nsw i32 %idbase1, 12
+  %add11.3 = add nsw nuw i32 %idbase1, 12
   %id1.4 = zext i32 %add11.3 to i64
   %addr1.4 = getelementptr inbounds i32, i32 addrspace(1)* %src, i64 %id1.4
   %res1.3 = load i32, i32 addrspace(1)* %addr1.4, align 4
diff --git a/IGC/Compiler/tests/GEPLowering/gep_simplification.ll b/IGC/Compiler/tests/GEPLowering/gep_simplification.ll
@@ -1,6 +1,6 @@
 ;=========================== begin_copyright_notice ============================
 ;
-; Copyright (C) 2022-2024 Intel Corporation
+; Copyright (C) 2022-2025 Intel Corporation
 ;
 ; SPDX-License-Identifier: MIT
 ;
@@ -36,21 +36,21 @@ define spir_kernel void @test_gep(i32 addrspace(1)* %dst, i32 addrspace(1)* %src
 case1:
   %simdLaneId16 = call i16 @llvm.genx.GenISA.simdLaneId()
   %simdLaneId = zext i16 %simdLaneId16 to i32
-  %idbase1 = add nsw i32 %Offset32, %simdLaneId
+  %idbase1 = add nsw nuw i32 %Offset32, %simdLaneId
   %id1.1 = zext i32 %idbase1 to i64
   %addr1.1 = getelementptr inbounds i32, i32 addrspace(1)* %src, i64 %id1.1
   %res1.0 = load i32, i32 addrspace(1)* %addr1.1, align 4
-  %add11.1 = add nsw i32 %idbase1, 4
+  %add11.1 = add nsw nuw i32 %idbase1, 4
   %id1.2 = zext i32 %add11.1 to i64
   %addr1.2 = getelementptr inbounds i32, i32 addrspace(1)* %src, i64 %id1.2
   %res1.1 = load i32, i32 addrspace(1)* %addr1.2, align 4
   %sum1.0 = add nsw i32 %res1.0, %res1.1
-  %add11.2 = add nsw i32 %idbase1, 8
+  %add11.2 = add nsw nuw i32 %idbase1, 8
   %id1.3 = zext i32 %add11.2 to i64
   %addr1.3 = getelementptr inbounds i32, i32 addrspace(1)* %src, i64 %id1.3
   %res1.2 = load i32, i32 addrspace(1)* %addr1.3, align 4
   %sum1.1 = add nsw i32 %sum1.0, %res1.2
-  %add11.3 = add nsw i32 %idbase1, 12
+  %add11.3 = add nsw nuw i32 %idbase1, 12
   %id1.4 = zext i32 %add11.3 to i64
   %addr1.4 = getelementptr inbounds i32, i32 addrspace(1)* %src, i64 %id1.4
   %res1.3 = load i32, i32 addrspace(1)* %addr1.4, align 4
diff --git a/IGC/Compiler/tests/GEPLowering/unsigned-overflow.ll b/IGC/Compiler/tests/GEPLowering/unsigned-overflow.ll
@@ -0,0 +1,74 @@
+;=========================== begin_copyright_notice ============================
+;
+; Copyright (C) 2025 Intel Corporation
+;
+; SPDX-License-Identifier: MIT
+;
+;============================ end_copyright_notice =============================
+;
+; ------------------------------------------------
+; REQUIRES: llvm-14-plus
+; RUN: igc_opt --opaque-pointers --igc-gep-lowering -S < %s 2>&1 | FileCheck %s
+; ------------------------------------------------
+; GEPLowering - verify that address arithmetic based on the first GEP index is
+;               not applied when the GEP index can be negative, because zext of
+;               a negative index may turn it into a large positive value
+; ------------------------------------------------
+
+define spir_func void @test_gep_overflow(ptr addrspace(1) %src, i32 %conv13) {
+; CHECK-LABEL: @test_gep_overflow(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    [[SUB:%.*]] = add nsw i32 [[CONV13:%.*]], -2
+; CHECK-NEXT:    [[IDX_EXT19:%.*]] = zext i32 [[SUB]] to i64
+; CHECK-NEXT:    [[TMP0:%.*]] = ptrtoint ptr addrspace(1) [[SRC:%.*]] to i64
+; CHECK-NEXT:    [[TMP1:%.*]] = shl i64 [[IDX_EXT19]], 2
+; CHECK-NEXT:    [[TMP2:%.*]] = add i64 [[TMP0]], [[TMP1]]
+; CHECK-NEXT:    [[TMP3:%.*]] = inttoptr i64 [[TMP2]] to ptr addrspace(1)
+; CHECK-NEXT:    [[SUB22:%.*]] = add nsw i32 [[CONV13]], -1
+; CHECK-NEXT:    [[IDX_EXT35:%.*]] = zext i32 [[SUB22]] to i64
+; CHECK-NEXT:    [[TMP4:%.*]] = ptrtoint ptr addrspace(1) [[SRC]] to i64
+; CHECK-NEXT:    [[TMP5:%.*]] = shl i64 [[IDX_EXT35]], 2
+; CHECK-NEXT:    [[TMP6:%.*]] = add i64 [[TMP4]], [[TMP5]]
+; CHECK-NEXT:    [[TMP7:%.*]] = inttoptr i64 [[TMP6]] to ptr addrspace(1)
+; CHECK-NEXT:    ret void
+;
+entry:
+  %sub = add nsw i32 %conv13, -2
+  %idx.ext19 = zext i32 %sub to i64
+  %add.ptr20 = getelementptr inbounds float, ptr addrspace(1) %src, i64 %idx.ext19
+  %sub22 = add nsw i32 %conv13, -1
+  %idx.ext35 = zext i32 %sub22 to i64
+  %add.ptr36 = getelementptr inbounds float, ptr addrspace(1) %src, i64 %idx.ext35
+  ret void
+}
+
+define spir_func void @test_gep_no_overflow(ptr addrspace(1) %src, i32 %conv13) {
+; CHECK-LABEL: @test_gep_no_overflow(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    [[SUB:%.*]] = add nuw nsw i32 [[CONV13:%.*]], -2
+; CHECK-NEXT:    [[IDX_EXT19:%.*]] = zext i32 [[SUB]] to i64
+; CHECK-NEXT:    [[TMP0:%.*]] = ptrtoint ptr addrspace(1) [[SRC:%.*]] to i64
+; CHECK-NEXT:    [[TMP1:%.*]] = shl i64 [[IDX_EXT19]], 2
+; CHECK-NEXT:    [[TMP2:%.*]] = add i64 [[TMP0]], [[TMP1]]
+; CHECK-NEXT:    [[TMP3:%.*]] = inttoptr i64 [[TMP2]] to ptr addrspace(1)
+; CHECK-NEXT:    [[TMP4:%.*]] = add i64 [[TMP2]], 4
+; CHECK-NEXT:    [[TMP5:%.*]] = inttoptr i64 [[TMP4]] to ptr addrspace(1)
+; CHECK-NEXT:    ret void
+;
+entry:
+  %sub = add nsw nuw i32 %conv13, -2
+  %idx.ext19 = zext i32 %sub to i64
+  %add.ptr20 = getelementptr inbounds float, ptr addrspace(1) %src, i64 %idx.ext19
+  %sub22 = add nsw nuw i32 %conv13, -1
+  %idx.ext35 = zext i32 %sub22 to i64
+  %add.ptr36 = getelementptr inbounds float, ptr addrspace(1) %src, i64 %idx.ext35
+  ret void
+}
+
+!igc.functions = !{!0, !4}
+
+!0 = !{ptr @test_gep_overflow, !1}
+!1 = !{!2, !3}
+!2 = !{!"function_type", i32 0}
+!3 = !{!"implicit_arg_desc"}
+!4 = !{ptr @test_gep_no_overflow, !1}