Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions src/coreclr/jit/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -97,6 +97,7 @@ set( JIT_SOURCES
asyncanalysis.cpp
bitset.cpp
block.cpp
boundscheckcoalesce.cpp
buildstring.cpp
codegencommon.cpp
codegenlinear.cpp
Expand Down
241 changes: 241 additions & 0 deletions src/coreclr/jit/boundscheckcoalesce.cpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,241 @@
// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.

//
// Bounds Check Coalescing
//
// Within a single block, when multiple GT_BOUNDS_CHECK nodes share the same
// length VN and use constant indices, only the bounds check with the largest
// constant index is actually needed. This pass finds such groups and
// strengthens the FIRST bounds check in the group by replacing its constant
// index with the maximum constant index in the group. Forward assertion prop
// then drops the now-redundant later bounds checks.
//
// Example: `a[0] + a[1] + a[2] + a[3]` produces four bounds checks with
// indices 0, 1, 2, 3 and the same length. We rewrite the first BC's index
// to 3; forward assertion prop then drops the other three as redundant.
//
// Safety:
// * Strengthening is sound: if the new (stronger) check passes, all the
// original (weaker) checks would have passed too. If it fails, one of
// the original checks would have failed too -- both throw the same
// IndexOutOfRangeException.
// * We only coalesce bounds checks that are not separated by side effects
// that could change observable exception ordering: calls, any other
// potentially-throwing node (div/mod, checked arithmetic, faulting
// indirections / null checks, etc.), `GTF_ORDER_SIDEEFF` (e.g. volatile
// loads), heap-visible stores, and stores to locals that are live across
// an exception handler reachable from this block. Other bounds checks
// between members of the group are not barriers (they only throw IOOB,
// the same exception type our strengthened check throws).
// * We require all candidates in the group to have the same length VN
// and constant non-negative indices. The first BC's index must itself
// be a constant so it can be mutated in place.
//
// This phase runs before PHASE_ASSERTION_PROP_MAIN so that the existing
// forward direction of assertion prop sees the strengthened first BC and
// drops the redundant followers.
//

#include "jitpch.h"

#ifdef _MSC_VER
#pragma hdrstop
#endif

namespace
{
// BoundsCheckCandidate: bookkeeping for one bounds check recorded by the
// coalescing pass. The pass keeps one of these per group head and updates
// m_offset as followers with larger constant indices are encountered.
struct BoundsCheckCandidate
{
    GenTreeBoundsChk* m_bc;           // the bounds check node itself
    Statement*        m_stmt;         // statement that contains m_bc
    ValueNum          m_lenVN;        // value number recorded for the checked length
    int               m_offset;       // constant index; raised to the group's running maximum
    int               m_barrierCount; // number of barriers seen in the block before m_bc

    BoundsCheckCandidate(
        GenTreeBoundsChk* boundsCheck, Statement* owningStmt, ValueNum lengthVN, int constIndex, int barriersBefore)
        : m_bc(boundsCheck)
        , m_stmt(owningStmt)
        , m_lenVN(lengthVN)
        , m_offset(constIndex)
        , m_barrierCount(barriersBefore)
    {
    }
};

//------------------------------------------------------------------------
// IsSideEffectBarrier: check if a node blocks bounds check coalescing
//
// Arguments:
//    comp            - compiler instance (used for OperMayThrow and local descriptors)
//    node            - node to classify
//    blockHasEHSuccs - whether the block containing `node` may have EH successors
//
// Returns:
//    true if a node may have a side effect that should prevent us from
//    reordering an earlier bounds-check failure across it.
//
// Notes:
//    Bounds checks whose throw kind is SCK_RNGCHK_FAIL are not barriers: that
//    is the only kind the coalescer strengthens, so reordering one range-check
//    failure ahead of another raises the same kind of exception.
//
//    Bounds checks with any other throw kind ARE barriers. They raise a
//    different exception than the strengthened check would, so moving a
//    range-check failure in front of them could change which exception the
//    program observes.
//
//    Stores to tracked locals that are not live across any exception handler
//    reachable from this block are not barriers: they cannot be observed if a
//    bounds-check failure is reordered to before them.
//
bool IsSideEffectBarrier(Compiler* comp, GenTree* node, bool blockHasEHSuccs)
{
    if (node->IsCall())
    {
        return true;
    }

    if (node->OperIs(GT_BOUNDS_CHECK))
    {
        // Only range-check failures are interchangeable with the check we
        // strengthen; every other throw kind must keep its relative order.
        return node->AsBoundsChk()->gtThrowKind != SCK_RNGCHK_FAIL;
    }

    // Any other potentially-throwing node, or a node with an explicit ordering
    // constraint, pins the exception order.
    if (node->OperMayThrow(comp))
    {
        return true;
    }

    if ((node->gtFlags & GTF_ORDER_SIDEEFF) != 0)
    {
        return true;
    }

    if (node->OperIsStore())
    {
        // Non-local stores are always treated as barriers.
        if (!node->OperIsLocalStore())
        {
            return true;
        }

        // With no EH successors, no handler reachable from this block can
        // observe the local's value after the exception.
        if (!blockHasEHSuccs)
        {
            return false;
        }

        // Otherwise the store matters if a handler may read the local.
        // Untracked locals are treated conservatively as barriers.
        LclVarDsc const* const dsc = comp->lvaGetDesc(node->AsLclVarCommon());
        return !dsc->lvTracked || dsc->lvLiveInOutOfHndlr;
    }

    return false;
}
} // namespace

//------------------------------------------------------------------------
// optBoundsCheckCoalesce: Coalesce bounds checks within each block.
//
// Returns:
//    MODIFIED_EVERYTHING if at least one bounds check index was rewritten,
//    MODIFIED_NOTHING otherwise.
//
// Notes:
//    For every block, bounds checks with a constant non-negative index are
//    grouped by (number of barriers seen so far, length VN). The first check
//    of each group is the "head"; later members only raise the head's
//    recorded maximum index. After the block has been scanned, each head
//    whose maximum exceeds its own index has that index constant rewritten
//    in place to the maximum.
//
//    NOTE(review): only the index constant's VN pair is refreshed after the
//    rewrite; the VN of the bounds check node itself is left untouched here.
//    Confirm that later phases tolerate this.
//
PhaseStatus Compiler::optBoundsCheckCoalesce()
{
    if (!doesMethodHaveBoundsChecks())
    {
        JITDUMP("Method has no bounds checks\n");
        return PhaseStatus::MODIFIED_NOTHING;
    }

    // Grouping is keyed on value numbers; do nothing if SSA was never built
    // (presumably no usable VNs exist in that case).
    if (fgSsaPassesCompleted == 0)
    {
        return PhaseStatus::MODIFIED_NOTHING;
    }

    // Maps a packed (barrier count, length VN) key to the position of that
    // group's head inside `heads`.
    typedef JitHashTable<UINT64, JitLargePrimitiveKeyFuncs<UINT64>, int> HeadIndexMap;

    bool          anyStrengthened = false;
    CompAllocator scratchAlloc(getAllocator(CMK_AssertionProp));

    // Scratch containers shared by all blocks; they are emptied at the top of
    // each block iteration. Only group heads are stored; followers are folded
    // into their head's running maximum and then forgotten.
    ArrayStack<BoundsCheckCandidate> heads(scratchAlloc);
    HeadIndexMap                     headIndexByKey(scratchAlloc);

    for (BasicBlock* const block : Blocks())
    {
        heads.Reset();
        headIndexByKey.RemoveAll();

        bool const hasEHSuccs   = block->HasPotentialEHSuccs(this);
        int        barriersSeen = 0;

        for (Statement* const stmt : block->Statements())
        {
            for (GenTree* const node : stmt->TreeList())
            {
                // A barrier starts a new "epoch": checks on opposite sides of
                // it get different keys and therefore never share a group.
                if (IsSideEffectBarrier(this, node, hasEHSuccs))
                {
                    barriersSeen++;
                    continue;
                }

                if (!node->OperIs(GT_BOUNDS_CHECK))
                {
                    continue;
                }

                GenTreeBoundsChk* const check = node->AsBoundsChk();

                // Only range-check failures with a 32-bit constant index qualify.
                if ((check->gtThrowKind != SCK_RNGCHK_FAIL) || !check->GetIndex()->IsIntCnsFitsInI32())
                {
                    continue;
                }

                int const constIndex = static_cast<int>(check->GetIndex()->AsIntCon()->IconValue());
                if (constIndex < 0)
                {
                    continue;
                }

                ValueNum const lengthVN = vnStore->VNConservativeNormalValue(check->GetArrayLength()->gtVNPair);
                if (lengthVN == ValueNumStore::NoVN)
                {
                    continue;
                }

                // Barrier count in the high 32 bits, length VN in the low 32 bits.
                UINT64 const groupKey =
                    (static_cast<UINT64>(static_cast<UINT32>(barriersSeen)) << 32) | static_cast<UINT32>(lengthVN);

                int headPos = -1;
                if (headIndexByKey.Lookup(groupKey, &headPos))
                {
                    // Follower: fold its index into the head's running maximum.
                    // Once the head is strengthened, forward assertion prop is
                    // expected to remove this check.
                    BoundsCheckCandidate& groupHead = heads.BottomRef(headPos);
                    JITDUMP("BC coalesce in " FMT_BB ": [%06u] (offset %d) is redundant given [%06u]\n", block->bbNum,
                            dspTreeID(check), constIndex, dspTreeID(groupHead.m_bc));
                    if (groupHead.m_offset < constIndex)
                    {
                        groupHead.m_offset = constIndex;
                    }
                }
                else
                {
                    // First check seen for this key: it becomes the group head
                    // and is retained so it can be strengthened after the scan.
                    int const newHeadPos = heads.Height();
                    heads.Emplace(check, stmt, lengthVN, constIndex, barriersSeen);
                    headIndexByKey.Set(groupKey, newHeadPos);
                }
            }
        }

        // Rewrite every head that ended up with a larger recorded index than
        // the one it currently carries. Heads whose maximum is their own index
        // are left alone.
        int const headCount = heads.Height();
        for (int pos = 0; pos < headCount; pos++)
        {
            BoundsCheckCandidate& groupHead  = heads.BottomRef(pos);
            GenTreeIntCon* const  indexConst = groupHead.m_bc->GetIndex()->AsIntCon();
            int const             oldIndex   = static_cast<int>(indexConst->IconValue());

            if (groupHead.m_offset != oldIndex)
            {
                JITDUMP("BC coalesce in " FMT_BB ": strengthen [%06u] offset %d -> %d (lenVN " FMT_VN ")\n",
                        block->bbNum, dspTreeID(groupHead.m_bc), oldIndex, groupHead.m_offset, groupHead.m_lenVN);

                // Mutate the constant in place and keep its VN consistent with
                // the new value.
                indexConst->SetIconValue(groupHead.m_offset);
                indexConst->gtVNPair.SetBoth(vnStore->VNForIntCon(groupHead.m_offset));
                anyStrengthened = true;
            }
        }
    }

    if (anyStrengthened)
    {
        return PhaseStatus::MODIFIED_EVERYTHING;
    }

    return PhaseStatus::MODIFIED_NOTHING;
}
4 changes: 4 additions & 0 deletions src/coreclr/jit/compiler.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -4807,6 +4807,10 @@ void Compiler::compCompile(void** methodCodePtr, uint32_t* methodCodeSize, JitFl

if (doAssertionProp)
{
// Coalesce groups of constant-indexed bounds checks.
//
DoPhase(this, PHASE_BOUNDS_CHECK_COALESCE, &Compiler::optBoundsCheckCoalesce);
Comment thread
AndyAyersMS marked this conversation as resolved.

// Assertion propagation
//
DoPhase(this, PHASE_ASSERTION_PROP_MAIN, &Compiler::optAssertionPropMain);
Expand Down
1 change: 1 addition & 0 deletions src/coreclr/jit/compiler.h
Original file line number Diff line number Diff line change
Expand Up @@ -7281,6 +7281,7 @@ class Compiler

PhaseStatus optCloneLoops();
PhaseStatus optRangeCheckCloning();
PhaseStatus optBoundsCheckCoalesce();
void optCloneLoop(FlowGraphNaturalLoop* loop, LoopCloneContext* context);
PhaseStatus optUnrollLoops(); // Unrolls loops (needs to have cost info)
bool optTryUnrollLoop(FlowGraphNaturalLoop* loop, bool* changedIR);
Expand Down
1 change: 1 addition & 0 deletions src/coreclr/jit/compphases.h
Original file line number Diff line number Diff line change
Expand Up @@ -102,6 +102,7 @@ CompPhaseNameMacro(PHASE_OPTIMIZE_VALNUM_CSES, "Optimize Valnum CSEs",
CompPhaseNameMacro(PHASE_VN_COPY_PROP, "VN based copy prop", false, -1, false)
CompPhaseNameMacro(PHASE_VN_BASED_INTRINSIC_EXPAND, "VN based intrinsic expansion", false, -1, false)
CompPhaseNameMacro(PHASE_OPTIMIZE_BRANCHES, "Redundant branch opts", false, -1, false)
CompPhaseNameMacro(PHASE_BOUNDS_CHECK_COALESCE, "Coalesce bounds checks", false, -1, false)
CompPhaseNameMacro(PHASE_ASSERTION_PROP_MAIN, "Assertion prop", false, -1, false)
CompPhaseNameMacro(PHASE_RANGE_CHECK_CLONING, "Clone blocks with range checks", false, -1, false)
CompPhaseNameMacro(PHASE_IF_CONVERSION, "If conversion", false, -1, false)
Expand Down
108 changes: 108 additions & 0 deletions src/tests/JIT/opt/RangeChecks/ElidedBoundsChecks.cs
Original file line number Diff line number Diff line change
Expand Up @@ -95,6 +95,74 @@ static bool TryStripFirstChar(ref ReadOnlySpan<char> span, char value)
return false;
}

// Sums a[0]..a[3] in one expression, reading the constant indices in
// increasing order. Every access targets the same array, so the largest
// index (3) is the one that decides whether any access is out of range.
// NoInlining keeps the method body compiled on its own.
[MethodImpl(MethodImplOptions.NoInlining)]
static int Sum4Increasing(int[] a) => a[0] + a[1] + a[2] + a[3];

// Same shape as the array version above it, but indexing a ReadOnlySpan<int>:
// four constant-index reads (0..3) of the same span in one expression.
[MethodImpl(MethodImplOptions.NoInlining)]
static int Sum4Span(ReadOnlySpan<int> s) => s[0] + s[1] + s[2] + s[3];

// Four constant-index reads of the same array where the first access (a[2])
// is neither the smallest nor the largest index; the largest index (3) is
// read second.
[MethodImpl(MethodImplOptions.NoInlining)]
static int Sum4MixedOrder(int[] a) => a[2] + a[3] + a[0] + a[1];

// Reads a[3], performs an integer division by `divisor`, then reads a[5].
// The division sits between the two array accesses and can throw on its own.
[MethodImpl(MethodImplOptions.NoInlining)]
static int DivBetweenBCs(int[] a, int divisor)
{
// The divide must not be reordered with a[5]: when divisor == 0 we
// must observe DivideByZeroException, not IndexOutOfRangeException.
int x = a[3];
int y = 100 / divisor;
return x + y + a[5];
}

// Reads a[3], dereferences `b` via b.Length, then reads a[5]. The access to
// `b` sits between the two accesses to `a` and can throw on its own.
[MethodImpl(MethodImplOptions.NoInlining)]
static int NreBetweenBCs(int[] a, int[] b)
{
// First touch of b may throw NRE; that must not be reordered with
// a[5]: when b == null we must observe NullReferenceException.
int x = a[3];
int y = b.Length;
return x + y + a[5];
}

// Reads a[3] and a[5] inside a try block with a store to local `x` between
// them. The catch handler returns `x`, so the value of `x` at the moment
// the IndexOutOfRangeException is raised is observable by the caller.
[MethodImpl(MethodImplOptions.NoInlining)]
static int LocalLiveInCatch(int[] a)
{
// The store `x = 99` is between two BCs in a try block whose local is
// live in the catch. It must act as a barrier: if a[3]'s BC were
// strengthened to index 5 (i.e. to require Length >= 6), the IOOB would
// fire before x=99 and the catch would observe x == -1 instead of 99.
int x = -1;
try
{
int t = a[3];
x = 99;
return t + a[5];
}
catch (IndexOutOfRangeException)
{
return x;
}
}

// Receives the value of `x` as seen by the finally block in LocalLiveInFinally.
static int s_finallyObserved;

// Reads a[3] and a[5] inside a try block with a store to local `x` between
// them. The finally block copies `x` into s_finallyObserved, so the value of
// `x` at the moment an exception leaves the try is observable afterwards.
[MethodImpl(MethodImplOptions.NoInlining)]
static int LocalLiveInFinally(int[] a)
{
// Same idea, but the local is live into a finally rather than a catch.
int x = -1;
try
{
int t = a[3];
x = 99;
return t + a[5];
}
finally
{
// Publish what the handler sees so the caller can check it.
s_finallyObserved = x;
}
}

[Fact]
public static int TestEntryPoint()
{
Expand Down Expand Up @@ -139,6 +207,46 @@ public static int TestEntryPoint()
if (TryStripFirstChar(ref chars, 'h') != false)
return 0;

// Bounds-check coalescing: 4 constant indices, same length VN.
int[] arr4 = new int[] { 10, 20, 30, 40 };
if (Sum4Increasing(arr4) != 100)
return 0;
if (Sum4Span(arr4) != 100)
return 0;
if (Sum4MixedOrder(arr4) != 100)
return 0;

// Short array: must throw IndexOutOfRangeException.
Assert.Throws<IndexOutOfRangeException>(() => Sum4Increasing(new int[3]));
Assert.Throws<IndexOutOfRangeException>(() => Sum4MixedOrder(new int[3]));

// Exception ordering must be preserved across non-IOOB throwers.
int[] arr6 = new int[] { 1, 2, 3, 4, 5, 6 };
if (DivBetweenBCs(arr6, 5) != (arr6[3] + 100 / 5 + arr6[5]))
return 0;

// divisor == 0 with a too short for a[5]: must be DivideByZero, not IOOB.
Assert.Throws<DivideByZeroException>(() => DivBetweenBCs(new int[4], 0));

// b == null with a too short for a[5]: must be NRE, not IOOB.
Assert.Throws<NullReferenceException>(() => NreBetweenBCs(new int[4], null));

// Local live in catch handler: a[3]'s BC must not be strengthened to
// a[5] across the `x = 99` store, otherwise the catch would see -1.
if (LocalLiveInCatch(new int[4]) != 99)
return 0;

// Local live in finally: same constraint, observed via static field.
s_finallyObserved = 0;
try
{
LocalLiveInFinally(new int[4]);
return 0;
}
catch (IndexOutOfRangeException) { }
if (s_finallyObserved != 99)
return 0;

return 100;
}
}
Loading