Enzyme/CacheUtility_8h_source.html

//===- CacheUtility.h - Caching values in the forward pass for later use

//---===//

//

//                             Enzyme Project

//

// Part of the Enzyme Project, under the Apache License v2.0 with LLVM

// Exceptions. See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

// If using this code in an academic setting, please cite the following:

// @incollection{enzymeNeurips,

// title = {Instead of Rewriting Foreign Code for Machine Learning,

//          Automatically Synthesize Fast Gradients},

// author = {Moses, William S. and Churavy, Valentin},

// booktitle = {Advances in Neural Information Processing Systems 33},

// year = {2020},

// note = {To appear in},

// }

//

//===----------------------------------------------------------------------===//

//

// This file declares a base helper class CacheUtility that manages the cache

// of values from the forward pass for later use.

//

//===----------------------------------------------------------------------===//


#ifndef ENZYME_CACHE_UTILITY_H

#define ENZYME_CACHE_UTILITY_H


#include <llvm/Config/llvm-config.h>

#if LLVM_VERSION_MAJOR >= 16

#define private public

#include "llvm/Analysis/ScalarEvolution.h"

#include "llvm/Transforms/Utils/ScalarEvolutionExpander.h"

#undef private

#else

#include "SCEV/ScalarEvolution.h"

#include "SCEV/ScalarEvolutionExpander.h"

#endif


#include "llvm/ADT/STLExtras.h"

#include "llvm/ADT/SmallPtrSet.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/IR/Instructions.h"


#include "llvm/Analysis/AssumptionCache.h"

#include "llvm/Analysis/TargetLibraryInfo.h"

#include "llvm/IR/Dominators.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Transforms/Utils/ValueMapper.h"


#include "FunctionUtils.h"

#include "MustExitScalarEvolution.h"


extern "C" {

/// Pack 8 bools together in a single byte

extern llvm::cl::opt<bool> EfficientBoolCache;


extern llvm::cl::opt<bool> EnzymeZeroCache;

}


/// Container for all loop information to synthesize gradients


struct LoopContext {

  /// Canonical induction variable of the loop

  llvm::AssertingVH<llvm::PHINode> var;


  /// Increment of the induction

  llvm::AssertingVH<llvm::Instruction> incvar;


  /// Allocation of induction variable of reverse pass

  llvm::AssertingVH<llvm::AllocaInst> antivaralloc;


  /// Header of this loop

  llvm::BasicBlock *header;


  /// Preheader of this loop

  llvm::BasicBlock *preheader;


  /// Whether this loop has a statically analyzable number of iterations

  bool dynamic;


  /// limit is last value of a canonical induction variable

  /// iters is number of times loop is run (thus iters = limit + 1)

  AssertingReplacingVH maxLimit;


  AssertingReplacingVH trueLimit;


  /// An offset to add to the index when getting the cache pointer.

  AssertingReplacingVH offset;


  /// An overriding allocation limit size.

  AssertingReplacingVH allocLimit;


  /// All blocks this loop exits too

  llvm::SmallPtrSet<llvm::BasicBlock *, 8> exitBlocks;


  /// Parent loop of this loop

  llvm::Loop *parent;

};


static inline bool operator==(const LoopContext &lhs, const LoopContext &rhs) {

  return lhs.parent == rhs.parent;

}


/// Modes of potential unwraps


enum class UnwrapMode {

  // It is already known that it is legal to fully unwrap

  // this instruction. This means unwrap this instruction,

  // its operands, etc. However, this will stop at known

  // cached available from a tape.

  LegalFullUnwrap,

  // Unlike LegalFullUnwrap, this will unwrap through a tape

  LegalFullUnwrapNoTapeReplace,

  // Attempt to fully unwrap this, looking up whenever it

  // is not legal to unwrap

  AttemptFullUnwrapWithLookup,

  // Attempt to fully unwrap this

  AttemptFullUnwrap,

  // Unwrap the current instruction but not its operand

  AttemptSingleUnwrap,

};


static inline llvm::raw_ostream &operator<<(llvm::raw_ostream &os,

                                            UnwrapMode mode) {

  switch (mode) {

  case UnwrapMode::LegalFullUnwrap:

    os << "LegalFullUnwrap";

    break;

  case UnwrapMode::LegalFullUnwrapNoTapeReplace:

    os << "LegalFullUnwrapNoTapeReplace";

    break;

  case UnwrapMode::AttemptFullUnwrapWithLookup:

    os << "AttemptFullUnwrapWithLookup";

    break;

  case UnwrapMode::AttemptFullUnwrap:

    os << "AttemptFullUnwrap";

    break;

  case UnwrapMode::AttemptSingleUnwrap:

    os << "AttemptSingleUnwrap";

    break;

  }

  return os;

}


class CacheUtility {

public:

  /// The function whose instructions we are caching

  llvm::Function *const newFunc;


  /// Various analysis results of newFunc

  llvm::TargetLibraryInfo &TLI;

  llvm::DominatorTree DT;


protected:

  llvm::LoopInfo LI;

  llvm::AssumptionCache AC;

  MustExitScalarEvolution SE;


public:

  // Helper basicblock where all new allocations will be added to

  // This includes allocations for cache variables

  llvm::BasicBlock *inversionAllocs;


protected:


  CacheUtility(llvm::TargetLibraryInfo &TLI, llvm::Function *newFunc)

      : newFunc(newFunc), TLI(TLI), DT(*newFunc), LI(DT), AC(*newFunc),

        SE(*newFunc, TLI, AC, DT, LI) {

    inversionAllocs = llvm::BasicBlock::Create(newFunc->getContext(),

                                               "allocsForInversion", newFunc);

  }


public:

  virtual ~CacheUtility();


protected:

  /// Map of Loop to requisite loop information needed for AD (forward/reverse

  /// induction/etc)

  std::map<llvm::Loop *, LoopContext> loopContexts;


public:

  /// Given a BasicBlock BB in newFunc, set loopContext to the relevant

  /// contained loop and return true. If BB is not in a loop, return false

  bool getContext(llvm::BasicBlock *BB, LoopContext &loopContext,

                  bool ReverseLimit);

  /// Return whether the given instruction is used as necessary as part of a

  /// loop context This includes as the canonical induction variable or

  /// increment


  bool isInstructionUsedInLoopInduction(llvm::Instruction &I) {

    for (auto &context : loopContexts) {

      if (context.second.var == &I || context.second.incvar == &I ||

          context.second.maxLimit == &I || context.second.trueLimit == &I) {

        return true;

      }

    }

    return false;

  }


  llvm::AllocaInst *getDynamicLoopLimit(llvm::Loop *L,

                                        bool ReverseLimit = true);


  /// Print out all currently cached values


  void dumpScope() {

    llvm::errs() << "scope:\n";

    for (auto a : scopeMap) {

      llvm::errs() << "   scopeMap[" << *a.first << "] = " << *a.second.first

                   << " ctx:" << a.second.second.Block->getName() << "\n";

    }

    llvm::errs() << "end scope\n";

  }


  unsigned getCacheAlignment(unsigned bsize) const {

    if ((bsize & (bsize - 1)) == 0) {

      if (bsize > 8)

        return 8;

      else

        return bsize;

    } else if (bsize > 0 && bsize % 8 == 0) {

      return 8;

    } else if (bsize > 0 && bsize % 4 == 0) {

      return 4;

    } else if (bsize > 0 && bsize % 2 == 0) {

      return 2;

    } else

      return 1;

  }


  /// Erase this instruction both from LLVM modules and any local

  /// data-structures

  virtual void erase(llvm::Instruction *I);

  /// Replace this instruction both in LLVM modules and any local

  /// data-structures

  virtual void replaceAWithB(llvm::Value *A, llvm::Value *B,

                             bool storeInCache = false);


  // Context information to request calculation of loop limit information


  struct LimitContext {

    // Whether the limit needs to be accessible for a reverse pass

    bool ReverseLimit;


    // A block inside of the loop, defining the location

    llvm::BasicBlock *Block;

    // Instead of getting the actual limits, return a limit of one

    bool ForceSingleIteration;


    LimitContext(bool ReverseLimit, llvm::BasicBlock *Block,

                 bool ForceSingleIteration = false)

        : ReverseLimit(ReverseLimit), Block(Block),

          ForceSingleIteration(ForceSingleIteration) {}


  };


  /// Given a LimitContext ctx, representing a location inside a loop nest,

  /// break each of the loops up into chunks of loops where each chunk's number

  /// of iterations can be computed at the chunk preheader. Every dynamic loop

  /// defines the start of a chunk. SubLimitType is a vector of chunk objects.

  /// More specifically it is a vector of { # iters in a Chunk (sublimit), Chunk

  /// } Each chunk object is a vector of loops contained within the chunk. For

  /// every loop, this returns pair of the LoopContext and the limit of that

  /// loop Both the vector of Chunks and vector of Loops within a Chunk go from

  /// innermost loop to outermost loop.

  typedef llvm::SmallVector<std::pair<

                                /*sublimit*/ llvm::Value *,

                                /*loop limits*/ llvm::SmallVector<

                                    std::pair<LoopContext, llvm::Value *>, 4>>,

                            0>

      SubLimitType;

  SubLimitType getSubLimits(bool inForwardPass, llvm::IRBuilder<> *RB,

                            LimitContext ctx, llvm::Value *extraSize = nullptr);


private:

  /// Internal data structure used by getSubLimit to avoid computing the same

  /// loop limit multiple times if possible. Map's a desired limitMinus1 (see

  /// getSubLimits) and the block the true limit requested to the value of the

  /// limit accessible at that block

  llvm::ValueMap<llvm::Value *,

                 std::map<llvm::BasicBlock *, llvm::WeakTrackingVH>>

      LimitCache;

  /// Internal data structure used by getSubLimit to avoid computing the

  /// cumulative loop limit multiple times if possible. Map's a desired pair of

  /// operands to be multiplied (see getSubLimits) and the block the cumulative

  /// limit requested to the value of the limit accessible at that block This

  /// cache is also shared with computeIndexOfChunk

  std::map<std::tuple<llvm::Value *, llvm::Value *, llvm::BasicBlock *>,

           llvm::Value *>

      SizeCache;


  /// Given a loop context, compute the corresponding index into said loop at

  /// the IRBuilder<>

  llvm::Value *computeIndexOfChunk(

      bool inForwardPass, llvm::IRBuilder<> &v,

      llvm::ArrayRef<std::pair<LoopContext, llvm::Value *>> containedloops,

      const llvm::ValueToValueMapTy &available);


private:

  /// Given a cache allocation and an index denoting how many Chunks deep the

  /// allocation is being indexed into, return the invariant metadata describing

  /// used to describe loads/stores to the indexed pointer

  /// Note that the cache allocation should either be an allocainst (if in

  /// fwd/both) or an extraction from the tape

  std::map<std::pair<llvm::Value *, int>, llvm::MDNode *>

      CachePointerInvariantGroups;

  /// Given a value being cached, return the invariant metadata of any

  /// loads/stores to memory storing that value

  std::map<llvm::Value *, llvm::MDNode *> ValueInvariantGroups;


protected:

  /// A map of values being cached to their underlying allocation/limit context

  std::map<llvm::Value *,

           std::pair<llvm::AssertingVH<llvm::AllocaInst>, LimitContext>>

      scopeMap;


  /// A map of allocations to a vector of instruction used to create by the

  /// allocation Keeping track of these values is useful for deallocation. This

  /// is stored as a vector explicitly to order theses instructions in such a

  /// way that they can be erased by iterating in reverse order.

  std::map<llvm::AllocaInst *,

           llvm::SmallVector<llvm::AssertingVH<llvm::Instruction>, 4>>

      scopeInstructions;


  /// A map of allocations to a set of instructions which free memory as part of

  /// the cache.

  std::map<llvm::AllocaInst *, std::set<llvm::AssertingVH<llvm::CallInst>>>

      scopeFrees;


  /// A map of allocations to a set of instructions which allocate memory as

  /// part of the cache

  std::map<llvm::AllocaInst *,

           llvm::SmallVector<llvm::AssertingVH<llvm::CallInst>, 4>>

      scopeAllocs;


  /// Perform the final load from the cache, applying requisite invariant

  /// group and alignment

  llvm::Value *loadFromCachePointer(llvm::Type *T, llvm::IRBuilder<> &BuilderM,

                                    llvm::Value *cptr, llvm::Value *cache);


public:

  /// Create a cache of Type T at the given LimitContext. If allocateInternal is

  /// set this will allocate the requesite memory. If extraSize is set,

  /// allocations will be a factor of extraSize larger

  llvm::AllocaInst *createCacheForScope(LimitContext ctx, llvm::Type *T,

                                        llvm::StringRef name, bool shouldFree,

                                        bool allocateInternal = true,

                                        llvm::Value *extraSize = nullptr);


  /// High-level utility to "unwrap" an instruction at a new location specified

  /// by BuilderM. Depending on the mode, it will either just unwrap this

  /// instruction, all of its instructions operands, and optionally lookup

  /// values when it is not legal to unwrap. If a value cannot be unwrap'd at a

  /// given location, this will null. This high-level utility should be

  /// implemented based off the low-level caching infrastructure provided in

  /// this class.

  virtual llvm::Value *

  unwrapM(llvm::Value *const val, llvm::IRBuilder<> &BuilderM,

          const llvm::ValueToValueMapTy &available, UnwrapMode mode,

          llvm::BasicBlock *scope = nullptr, bool permitCache = true) = 0;


  /// High-level utility to get the value an instruction at a new location

  /// specified by BuilderM. Unlike unwrap, this function can never fail --

  /// falling back to creating a cache if necessary. This function is

  /// prepopulated with a set of values that are already known to be available

  /// and may contain optimizations for getting the value in more efficient ways

  /// (e.g. unwrap'ing when legal, looking up equivalent values, etc). This

  /// high-level utility should be implemented based off the low-level caching

  /// infrastructure provided in this class.

  virtual llvm::Value *

  lookupM(llvm::Value *val, llvm::IRBuilder<> &BuilderM,

          const llvm::ValueToValueMapTy &incoming_availalble =

              llvm::ValueToValueMapTy(),

          bool tryLegalityCheck = true, llvm::BasicBlock *scope = nullptr) = 0;


  virtual bool assumeDynamicLoopOfSizeOne(llvm::Loop *L) const = 0;


  /// If an allocation is requested to be freed, this subclass will be called to

  /// chose how and where to free it. It is by default not implemented, falling

  /// back to an error. Subclasses who want to free memory should implement this

  /// function.


  virtual llvm::CallInst *freeCache(llvm::BasicBlock *forwardPreheader,

                                    const SubLimitType &antimap, int i,

                                    llvm::AllocaInst *alloc, llvm::Type *myType,

                                    llvm::ConstantInt *byteSizeOfType,

                                    llvm::Value *storeInto,

                                    llvm::MDNode *InvariantMD) {

    assert(0 && "freeing cache not handled in this scenario");

    llvm_unreachable("freeing cache not handled in this scenario");

  }


  /// Given an allocation defined at a particular ctx, store the value val

  /// in the cache at the location defined in the given builder

  void storeInstructionInCache(LimitContext ctx, llvm::IRBuilder<> &BuilderM,

                               llvm::Value *val, llvm::AllocaInst *cache,

                               llvm::MDNode *TBAA = nullptr);


  /// Given an allocation defined at a particular ctx, store the instruction

  /// in the cache right after the instruction is executed

  void storeInstructionInCache(LimitContext ctx, llvm::Instruction *inst,

                               llvm::AllocaInst *cache,

                               llvm::MDNode *TBAA = nullptr);


  /// Given an allocation specified by the LimitContext ctx and cache, compute a

  /// pointer that can hold the underlying type being cached. This value should

  /// be computed at BuilderM. Optionally, instructions needed to generate this

  /// pointer can be stored in scopeInstructions

  llvm::Value *getCachePointer(llvm::Type *T, bool inForwardPass,

                               llvm::IRBuilder<> &BuilderM, LimitContext ctx,

                               llvm::Value *cache, bool storeInInstructionsMap,

                               const llvm::ValueToValueMapTy &available,

                               llvm::Value *extraSize);


  /// Given an allocation specified by the LimitContext ctx and cache, lookup

  /// the underlying cached value.

  llvm::Value *lookupValueFromCache(llvm::Type *T, bool inForwardPass,

                                    llvm::IRBuilder<> &BuilderM,

                                    LimitContext ctx, llvm::Value *cache,

                                    bool isi1,

                                    const llvm::ValueToValueMapTy &available,

                                    llvm::Value *extraSize = nullptr,

                                    llvm::Value *extraOffset = nullptr);


protected:

  // List of values loaded from the cache

  llvm::SmallPtrSet<llvm::LoadInst *, 10> CacheLookups;

};


// Create a new canonical induction variable of Type Ty for Loop L

// Return the variable and the increment instruction

std::pair<llvm::PHINode *, llvm::Instruction *>

InsertNewCanonicalIV(llvm::Loop *L, llvm::Type *Ty,

                     const llvm::Twine &Name = "iv");


// Attempt to rewrite all phinode's in the loop in terms of the

// induction variable

void RemoveRedundantIVs(

    llvm::BasicBlock *Header, llvm::PHINode *CanonicalIV,

    llvm::Instruction *Increment, MustExitScalarEvolution &SE,

    llvm::function_ref<void(llvm::Instruction *, llvm::Value *)> replacer,

    llvm::function_ref<void(llvm::Instruction *)> eraser);

#endif

InsertNewCanonicalIV
std::pair< llvm::PHINode *, llvm::Instruction * > InsertNewCanonicalIV(llvm::Loop *L, llvm::Type *Ty, const llvm::Twine &Name="iv")

EnzymeZeroCache
llvm::cl::opt< bool > EnzymeZeroCache

EfficientBoolCache
llvm::cl::opt< bool > EfficientBoolCache
Pack 8 bools together in a single byte.

UnwrapMode
UnwrapMode
Modes of potential unwraps.
Definition CacheUtility.h:105

UnwrapMode::LegalFullUnwrap
@ LegalFullUnwrap

UnwrapMode::AttemptSingleUnwrap
@ AttemptSingleUnwrap

UnwrapMode::AttemptFullUnwrap
@ AttemptFullUnwrap

UnwrapMode::LegalFullUnwrapNoTapeReplace
@ LegalFullUnwrapNoTapeReplace

UnwrapMode::AttemptFullUnwrapWithLookup
@ AttemptFullUnwrapWithLookup

RemoveRedundantIVs
void RemoveRedundantIVs(llvm::BasicBlock *Header, llvm::PHINode *CanonicalIV, llvm::Instruction *Increment, MustExitScalarEvolution &SE, llvm::function_ref< void(llvm::Instruction *, llvm::Value *)> replacer, llvm::function_ref< void(llvm::Instruction *)> eraser)

operator<<
static llvm::raw_ostream & operator<<(llvm::raw_ostream &os, UnwrapMode mode)
Definition CacheUtility.h:122

operator==
static bool operator==(const LoopContext &lhs, const LoopContext &rhs)
Definition CacheUtility.h:100

FunctionUtils.h

MustExitScalarEvolution.h

AssertingReplacingVH
Definition Utils.h:1219

CacheUtility
Definition CacheUtility.h:144

CacheUtility::newFunc
llvm::Function *const newFunc
The function whose instructions we are caching.
Definition CacheUtility.h:147

CacheUtility::SE
MustExitScalarEvolution SE
Definition CacheUtility.h:156

CacheUtility::unwrapM
virtual llvm::Value * unwrapM(llvm::Value *const val, llvm::IRBuilder<> &BuilderM, const llvm::ValueToValueMapTy &available, UnwrapMode mode, llvm::BasicBlock *scope=nullptr, bool permitCache=true)=0
High-level utility to "unwrap" an instruction at a new location specified by BuilderM.

CacheUtility::freeCache
virtual llvm::CallInst * freeCache(llvm::BasicBlock *forwardPreheader, const SubLimitType &antimap, int i, llvm::AllocaInst *alloc, llvm::Type *myType, llvm::ConstantInt *byteSizeOfType, llvm::Value *storeInto, llvm::MDNode *InvariantMD)
If an allocation is requested to be freed, this subclass will be called to chose how and where to fre...
Definition CacheUtility.h:375

CacheUtility::scopeAllocs
std::map< llvm::AllocaInst *, llvm::SmallVector< llvm::AssertingVH< llvm::CallInst >, 4 > > scopeAllocs
A map of allocations to a set of instructions which allocate memory as part of the cache.
Definition CacheUtility.h:327

CacheUtility::createCacheForScope
llvm::AllocaInst * createCacheForScope(LimitContext ctx, llvm::Type *T, llvm::StringRef name, bool shouldFree, bool allocateInternal=true, llvm::Value *extraSize=nullptr)
Create a cache of Type T at the given LimitContext.
Definition CacheUtility.cpp:789

CacheUtility::erase
virtual void erase(llvm::Instruction *I)
Erase this instruction both from LLVM modules and any local data-structures.
Definition CacheUtility.cpp:55

CacheUtility::CacheUtility
CacheUtility(llvm::TargetLibraryInfo &TLI, llvm::Function *newFunc)
Definition CacheUtility.h:164

CacheUtility::getCachePointer
llvm::Value * getCachePointer(llvm::Type *T, bool inForwardPass, llvm::IRBuilder<> &BuilderM, LimitContext ctx, llvm::Value *cache, bool storeInInstructionsMap, const llvm::ValueToValueMapTy &available, llvm::Value *extraSize)
Given an allocation specified by the LimitContext ctx and cache, compute a pointer that can hold the ...
Definition CacheUtility.cpp:1481

CacheUtility::lookupValueFromCache
llvm::Value * lookupValueFromCache(llvm::Type *T, bool inForwardPass, llvm::IRBuilder<> &BuilderM, LimitContext ctx, llvm::Value *cache, bool isi1, const llvm::ValueToValueMapTy &available, llvm::Value *extraSize=nullptr, llvm::Value *extraOffset=nullptr)
Given an allocation specified by the LimitContext ctx and cache, lookup the underlying cached value.
Definition CacheUtility.cpp:1614

CacheUtility::getContext
bool getContext(llvm::BasicBlock *BB, LoopContext &loopContext, bool ReverseLimit)
Given a BasicBlock BB in newFunc, set loopContext to the relevant contained loop and return true.
Definition CacheUtility.cpp:496

CacheUtility::loadFromCachePointer
llvm::Value * loadFromCachePointer(llvm::Type *T, llvm::IRBuilder<> &BuilderM, llvm::Value *cptr, llvm::Value *cache)
Perform the final load from the cache, applying requisite invariant group and alignment.
Definition CacheUtility.cpp:1586

CacheUtility::scopeFrees
std::map< llvm::AllocaInst *, std::set< llvm::AssertingVH< llvm::CallInst > > > scopeFrees
A map of allocations to a set of instructions which free memory as part of the cache.
Definition CacheUtility.h:321

CacheUtility::~CacheUtility
virtual ~CacheUtility()
Definition CacheUtility.cpp:52

CacheUtility::dumpScope
void dumpScope()
Print out all currently cached values.
Definition CacheUtility.h:201

CacheUtility::DT
llvm::DominatorTree DT
Definition CacheUtility.h:151

CacheUtility::TLI
llvm::TargetLibraryInfo & TLI
Various analysis results of newFunc.
Definition CacheUtility.h:150

CacheUtility::LI
llvm::LoopInfo LI
Definition CacheUtility.h:154

CacheUtility::loopContexts
std::map< llvm::Loop *, LoopContext > loopContexts
Map of Loop to requisite loop information needed for AD (forward/reverse induction/etc)
Definition CacheUtility.h:177

CacheUtility::scopeInstructions
std::map< llvm::AllocaInst *, llvm::SmallVector< llvm::AssertingVH< llvm::Instruction >, 4 > > scopeInstructions
A map of allocations to a vector of instruction used to create by the allocation Keeping track of the...
Definition CacheUtility.h:316

CacheUtility::inversionAllocs
llvm::BasicBlock * inversionAllocs
Definition CacheUtility.h:161

CacheUtility::scopeMap
std::map< llvm::Value *, std::pair< llvm::AssertingVH< llvm::AllocaInst >, LimitContext > > scopeMap
A map of values being cached to their underlying allocation/limit context.
Definition CacheUtility.h:308

CacheUtility::SubLimitType
llvm::SmallVector< std::pair< llvm::Value *, llvm::SmallVector< std::pair< LoopContext, llvm::Value * >, 4 > >, 0 > SubLimitType
Given a LimitContext ctx, representing a location inside a loop nest, break each of the loops up into...
Definition CacheUtility.h:264

CacheUtility::replaceAWithB
virtual void replaceAWithB(llvm::Value *A, llvm::Value *B, bool storeInCache=false)
Replace this instruction both in LLVM modules and any local data-structures.
Definition CacheUtility.cpp:91

CacheUtility::getCacheAlignment
unsigned getCacheAlignment(unsigned bsize) const
Definition CacheUtility.h:210

CacheUtility::getDynamicLoopLimit
llvm::AllocaInst * getDynamicLoopLimit(llvm::Loop *L, bool ReverseLimit=true)
Definition CacheUtility.cpp:463

CacheUtility::CacheLookups
llvm::SmallPtrSet< llvm::LoadInst *, 10 > CacheLookups
Definition CacheUtility.h:419

CacheUtility::getSubLimits
SubLimitType getSubLimits(bool inForwardPass, llvm::IRBuilder<> *RB, LimitContext ctx, llvm::Value *extraSize=nullptr)
Given a LimitContext ctx, representing a location inside a loop nest, break each of the loops up into...
Definition CacheUtility.cpp:1109

CacheUtility::storeInstructionInCache
void storeInstructionInCache(LimitContext ctx, llvm::IRBuilder<> &BuilderM, llvm::Value *val, llvm::AllocaInst *cache, llvm::MDNode *TBAA=nullptr)
Given an allocation defined at a particular ctx, store the value val in the cache at the location def...

CacheUtility::isInstructionUsedInLoopInduction
bool isInstructionUsedInLoopInduction(llvm::Instruction &I)
Return whether the given instruction is used as necessary as part of a loop context This includes as ...
Definition CacheUtility.h:187

CacheUtility::AC
llvm::AssumptionCache AC
Definition CacheUtility.h:155

CacheUtility::lookupM
virtual llvm::Value * lookupM(llvm::Value *val, llvm::IRBuilder<> &BuilderM, const llvm::ValueToValueMapTy &incoming_availalble=llvm::ValueToValueMapTy(), bool tryLegalityCheck=true, llvm::BasicBlock *scope=nullptr)=0
High-level utility to get the value an instruction at a new location specified by BuilderM.

CacheUtility::assumeDynamicLoopOfSizeOne
virtual bool assumeDynamicLoopOfSizeOne(llvm::Loop *L) const =0

MustExitScalarEvolution
Definition MustExitScalarEvolution.h:44

CacheUtility::LimitContext
Definition CacheUtility.h:235

CacheUtility::LimitContext::LimitContext
LimitContext(bool ReverseLimit, llvm::BasicBlock *Block, bool ForceSingleIteration=false)
Definition CacheUtility.h:244

CacheUtility::LimitContext::ForceSingleIteration
bool ForceSingleIteration
Definition CacheUtility.h:242

CacheUtility::LimitContext::Block
llvm::BasicBlock * Block
Definition CacheUtility.h:240

CacheUtility::LimitContext::ReverseLimit
bool ReverseLimit
Definition CacheUtility.h:237

LoopContext
Container for all loop information to synthesize gradients.
Definition CacheUtility.h:63

LoopContext::parent
llvm::Loop * parent
Parent loop of this loop.
Definition CacheUtility.h:98

LoopContext::header
llvm::BasicBlock * header
Header of this loop.
Definition CacheUtility.h:74

LoopContext::incvar
llvm::AssertingVH< llvm::Instruction > incvar
Increment of the induction.
Definition CacheUtility.h:68

LoopContext::dynamic
bool dynamic
Whether this loop has a statically analyzable number of iterations.
Definition CacheUtility.h:80

LoopContext::exitBlocks
llvm::SmallPtrSet< llvm::BasicBlock *, 8 > exitBlocks
All blocks this loop exits too.
Definition CacheUtility.h:95

LoopContext::antivaralloc
llvm::AssertingVH< llvm::AllocaInst > antivaralloc
Allocation of induction variable of reverse pass.
Definition CacheUtility.h:71

LoopContext::var
llvm::AssertingVH< llvm::PHINode > var
Canonical induction variable of the loop.
Definition CacheUtility.h:65

LoopContext::offset
AssertingReplacingVH offset
An offset to add to the index when getting the cache pointer.
Definition CacheUtility.h:89

LoopContext::preheader
llvm::BasicBlock * preheader
Preheader of this loop.
Definition CacheUtility.h:77

LoopContext::maxLimit
AssertingReplacingVH maxLimit
limit is last value of a canonical induction variable iters is number of times loop is run (thus iter...
Definition CacheUtility.h:84

LoopContext::allocLimit
AssertingReplacingVH allocLimit
An overriding allocation limit size.
Definition CacheUtility.h:92

LoopContext::trueLimit
AssertingReplacingVH trueLimit
Definition CacheUtility.h:86