From 7b1d63e4065823b7dbef3001dcd602142d22b50e Mon Sep 17 00:00:00 2001 From: Akash Kothari <akashk4@tyler.cs.illinois.edu> Date: Mon, 13 Jan 2020 08:15:00 -0600 Subject: [PATCH] Deprecating __visc__node in GenVISC --- hpvm/include/GenVISC/GenVISC.h | 3 - hpvm/lib/Transforms/GenVISC/GenVISC.cpp | 743 +----------------------- 2 files changed, 1 insertion(+), 745 deletions(-) diff --git a/hpvm/include/GenVISC/GenVISC.h b/hpvm/include/GenVISC/GenVISC.h index ef1ca3469c..585af33953 100644 --- a/hpvm/include/GenVISC/GenVISC.h +++ b/hpvm/include/GenVISC/GenVISC.h @@ -44,9 +44,6 @@ public: // Functions virtual bool runOnModule(Module &M); - void generateTest(CallInst* CI); - Function* genKernel(Function* KernelFunction, StructType* RetTy); - void genHost(CallInst*, Function*, unsigned, unsigned, unsigned, unsigned, StructType*); }; } // End of namespace diff --git a/hpvm/lib/Transforms/GenVISC/GenVISC.cpp b/hpvm/lib/Transforms/GenVISC/GenVISC.cpp index e19f084992..9cce997f34 100644 --- a/hpvm/lib/Transforms/GenVISC/GenVISC.cpp +++ b/hpvm/lib/Transforms/GenVISC/GenVISC.cpp @@ -154,7 +154,6 @@ IS_VISC_CALL(cos) IS_VISC_CALL(init) -IS_VISC_CALL(node) IS_VISC_CALL(cleanup) IS_VISC_CALL(wait) IS_VISC_CALL(trackMemory) @@ -170,48 +169,6 @@ static unsigned getNumericValue(Value* V) { return cast<ConstantInt>(V)->getZExtValue(); } - - -// Add <numArgs> to the argument list of Function <F>. The names for these arguments -// should be put in the string array <names>. Ideally the length of <names> -// array should be numArgs. But, even when the length is not numArgs the -// arguments would be added correctly. The names however would not be as -// intuitive. -static Function* addArgs(Function* F, unsigned numArgs, std::string names[]) { - if(numArgs == 0) return F; // Return if no arguments are to be added. - - // Create the argument type list with added argument types - std::vector<Type*> ArgTypes; - for(Function::const_arg_iterator ai = F->arg_begin(), ae = F->arg_end(); - ai != ae; ++ai) { - ArgTypes.push_back(ai->getType()); - } - // Adding new arguments to the function argument list, would not change the - // function type. We need to change the type of this function to reflect the - // added arguments - for(unsigned i = 0; i < numArgs; ++i) { -// ArgTypes.push_back(Type::getInt32Ty(F->getContext())); - ArgTypes.push_back(Type::getInt64Ty(F->getContext())); - } - FunctionType* newFT = FunctionType::get(F->getReturnType(), ArgTypes, F->isVarArg()); - - // Change the function type - Function* newF = cloneFunction(F, newFT, false); - - // Add names to the extra arguments to the Function argument list - unsigned numOldArgs = F->getFunctionType()->getNumParams(); - for(Function::arg_iterator ai = newF->arg_begin(), ae = newF->arg_end(); - ai != ae; ++ai) { - if (ai->getArgNo() < numOldArgs) - continue; - ai->setName(names[(ai->getArgNo() - numOldArgs) % names->size()]); - } - - replaceNodeFunctionInIR(*F->getParent(), F, newF); - return newF; -} - - // Take the __visc__return instruction and generate code for combining the // values being returned into a struct and returning it. // The first operand is the number of returned values @@ -255,130 +212,6 @@ static Value* genCodeForReturn(CallInst* CI) { return IV; } -// The visc launch intrinsic requires all the input parameters to the kernel -// function be placed in contiguous memory and pointer to that input be passed -// as the second argument to the launch intrinsic. This generates code to bring -// together all the input and dimension arguments in one packed struct -// <InStruct>. First pack the arguments to the kernel function and then add the -// dimension arguments depending on the hierarchy of DFG user wants to generate. -static void marshallArguments(unsigned levels, unsigned numArgs, unsigned argOffset, unsigned numDims, unsigned dimOffset, Value* InStruct, CallInst* CI, Function* KernelF) { - DEBUG(errs() << "Kernel Function = " << KernelF->getName() << "\n"); - - // Get module context and i32 0 constant, as they would be frequently used in - // this function. - LLVMContext& Ctx = CI->getParent()->getContext(); - Constant* IntZero = ConstantInt::get(Type::getInt32Ty(Ctx), 0); - - // Find the arguments to be passed to kernel function and pack them in a - // struct. Specifically first generate a GEP instruction to find the correct - // memory location in InStruct and then generate Store instruction to store - // the argument in that location. - Function::arg_iterator ai = KernelF->arg_begin(); - Function::arg_iterator ae = KernelF->arg_end(); - - for(unsigned i = 0; i < numArgs && ai != ae; i++, ai++) { - Value* arg = CI->getArgOperand(i+argOffset); - DEBUG(errs() << "Argument: " << ai->getName() << "\n"); - DEBUG(errs() << "Passing: " << *arg << "\n"); - // Create constant int (i) - Constant* Int_i = ConstantInt::get(Type::getInt32Ty(Ctx), i); - // Get Element pointer instruction - Value* GEPIndices[] = { IntZero, Int_i }; - GetElementPtrInst* GEP = GetElementPtrInst::Create(nullptr, InStruct, - ArrayRef<Value*>(GEPIndices, 2), - InStruct->getName()+"."+ai->getName(), - CI); - // Store instruction - if(GEP->getType()->getPointerElementType() != arg->getType()) { - // Arguments type might not match with the kernel function definition - // One reason might be because of default argument promotions, where all - // arguments of type float are always promoted to double and types char, - // short int are promoted to int. - // LLVM 4.0 also promotes pointers to i8*. In case both are pointer types, - // we just issue a warning and cast it to appropriate type - if(arg->getType() == Type::getDoubleTy(Ctx)) { - DEBUG(errs() << "Cast from " << *arg->getType() << " To " << - *GEP->getType()->getPointerElementType() << "\n"); - CastInst* CastI = BitCastInst::CreateFPCast(arg, - GEP->getType()->getPointerElementType(), GEP->getName()+".cast", - CI); - new StoreInst(CastI, GEP, CI); - } else if (arg->getType() == Type::getInt32Ty(Ctx)) { - CastInst* CastI = BitCastInst::CreateIntegerCast(arg, - GEP->getType()->getPointerElementType(), false, - GEP->getName()+".cast", CI); - new StoreInst(CastI, GEP, CI); - } else if (arg->getType()->isPointerTy() && GEP->getType()->getPointerElementType()->isPointerTy()) { - errs() << "WARNING: Argument type mismatch between kernel and __visc__node call. Forcing cast\n"; - CastInst* CastI = CastInst::CreatePointerCast(arg, - GEP->getType()->getPointerElementType(), GEP->getName()+".cast", - CI); - new StoreInst(CastI, GEP, CI); - } else { - errs() << "Error: Mismatch in argument types\n"; - errs() << "__visc__node call: " << *CI << "\n"; - errs() << "Argument: " << *arg << "\n"; - errs() << "Expected: " << *ai << "\n"; - llvm_unreachable("Mismatch in argument types of kernel function and __visc__node call"); - } - } else { - new StoreInst(arg, GEP, CI); - } - } - - // Based on the hierarchy of the DFG we want, we need to pass the dimension - // for each level. The number of dimensions we need to pass to the launch - // intrinsic is the product of the number of levels and dimesions at each - // level. - // Marshall dim arguments - DEBUG(errs() << *CI << "\n"); - std::string names[] = {"dimX", "dimY", "dimZ"}; - for(unsigned i=0; i< numDims*levels; i++) { - Value* arg = CI->getArgOperand(i+dimOffset); - DEBUG(errs() << "Passing: " << *arg << "\n"); - // Create constant int (i) - Constant* Int_i = ConstantInt::get(Type::getInt32Ty(Ctx), i+numArgs); - // Get Element pointer instruction - Value* GEPIndices[] = { IntZero, Int_i }; - GetElementPtrInst* GEP = GetElementPtrInst::Create(nullptr, InStruct, - ArrayRef<Value*>(GEPIndices, 2), - InStruct->getName()+"."+names[i%numDims]+Twine(i/levels), - CI); - // Store instruction - DEBUG(errs() << *arg << " " << *GEP << "\n"); - StoreInst* SI = new StoreInst(arg, GEP, CI); - DEBUG(errs() << *SI << "\n"); - - } -} - -// Returns vector of all wait instructions, waiting on the passed graphID value -static std::vector<CallInst*>* getWaitList(Value* GraphID) { - DEBUG(errs() << "Getting Uses of: " << *GraphID << "\n"); - std::vector<CallInst*>* WaitList = new std::vector<CallInst*>(); - // It must have been loaded from memory somewhere - for(Value::user_iterator ui = GraphID->user_begin(), - ue = GraphID->user_end(); ui!=ue; ++ui) { - if(CallInst* waitI = dyn_cast<CallInst>(*ui)) { - DEBUG(errs() << "Use: " << *waitI << "\n"); - assert(isVISCCall_wait(waitI) - && "GraphID can only be used by __visc__wait call"); - WaitList->push_back(waitI); - } - //else if (PHINode* PN = dyn_cast<PHINode>(*ui)){ - //errs() << "Found PhiNode use of graphID\n"; - //std::vector<CallInst*>* phiWaitList = getWaitList(PN); - //WaitList->insert(WaitList->end(), phiWaitList->begin(), phiWaitList->end()); - //free(phiWaitList); - //} - else { - DEBUG(errs() << *(*ui) << "\n"); - llvm_unreachable("Error: Operation on Graph ID not supported!\n"); - } - } - return WaitList; -} - // Analyse the attribute call for this function. Add the in and out // attributes to pointer parameters. static void handleVISCAttributes(Function* F, CallInst* CI) { @@ -420,380 +253,6 @@ static void handleVISCAttributes(Function* F, CallInst* CI) { DEBUG(errs() << "Kernel after adding In/Out VISC attributes:\n" << *F << "\n"); } -// Recursively generate internal nodes for all the levels. Node at each level -// will create the appropriate instances of the child node at that level using -// the visc createNode intrinsic, and pass on the remaining dimensions to the -// child node. -static Function* genInternalNode(Function* KernelF, unsigned level, - unsigned numArgs, unsigned numDims, unsigned dimOffset, CallInst* CI) { - // Create new function with the same type - Module* module = KernelF->getParent(); - Function* ChildNodeF; - - // Recursively generate node for lower level - if(level > 1) { - ChildNodeF = genInternalNode(KernelF, level-1, numArgs, numDims, dimOffset, CI); - addHint(ChildNodeF, getPreferredTarget(KernelF)); -// Internal nodes always get a CPU hint. If code geneation for them is not -// needed and can be skipped, this is handled by the accelerator backends -// addHint(ChildNodeF, visc::CPU_TARGET); - } else { - ChildNodeF = KernelF; - } - - // Generate Internal node for current level - Function* InternalF = Function::Create(ChildNodeF->getFunctionType(), - ChildNodeF->getLinkage(), - KernelF->getName()+"Internal_level"+Twine(level), - module); - // Create a basic block in this function - BasicBlock *BB = BasicBlock::Create(InternalF->getContext(), "entry", InternalF); - ReturnInst* RI = ReturnInst::Create(InternalF->getContext(), - UndefValue::get(InternalF->getReturnType()), BB); - // Copy correct attributes - InternalF->setAttributes(ChildNodeF->getAttributes()); - // Loop over the arguments, copying the names of arguments over. - Function::arg_iterator dest_iterator = InternalF->arg_begin(); - for (Function::const_arg_iterator i = ChildNodeF->arg_begin(), e = ChildNodeF->arg_end(); - i != e; ++i, ++dest_iterator) { - DEBUG(errs() << "Copying argument: " << i->getName() << "\n"); - dest_iterator->setName(i->getName()); // Copy the name over... - DEBUG(errs() << "New Argument: " << *dest_iterator << "\n"); - } - - // Add extra dimesnion arguments - std::string dimNames[] = {"dimX", "dimY", "dimZ"}; - DEBUG(errs() << "Adding extra args to function Function:\n" << *InternalF << "\n"); - InternalF = addArgs(InternalF, numDims, dimNames); - // update RI - RI = cast<ReturnInst>(InternalF->getEntryBlock().getTerminator()); - DEBUG(errs() << "After Adding extra args to function Function:\n" << *InternalF << "\n"); - - // Insert createNode intrinsic - // First generate constant expression to bitcast the function pointer to - // internal node to i8* - Value* NodeF = ConstantExpr::getPointerCast(ChildNodeF, Type::getInt8PtrTy(module->getContext())); - - // Use args vectors to get the arguments for visc createNode - // intrinsic - std::vector<Value*> args; - - // Push the i8* pointer to internal node into the args vector - args.push_back(NodeF); - - // Traverse the argument list of internal node function in reverse to get the - // dimesnions to be used to create instances of child node at this level - Function::arg_iterator ai = InternalF->arg_end(); - for(unsigned i=0; i<numDims; i++, ai--); - DEBUG(errs() << "Iterator at: " << *ai << "\n"); - - // ai now points to the first dimension argument to be passed to the - // createNode intrinsic. Follow it to push the dim argument into - // the args vector - for(unsigned i=0; i < numDims; i++, ai++) { - args.push_back(&*ai); - } - - // Based on the number of dimensions choose the appropriate visc createNode - // intrinsic - DEBUG(errs() << "Number of dims = " << numDims << "\n"); - Intrinsic::ID createNodeXD; - switch(numDims) { - case 0: - createNodeXD = Intrinsic::visc_createNode; - break; - case 1: - createNodeXD = Intrinsic::visc_createNode1D; - break; - case 2: - createNodeXD = Intrinsic::visc_createNode2D; - break; - case 3: - createNodeXD = Intrinsic::visc_createNode3D; - break; - default: - llvm_unreachable("Invalid number of dimensions!"); - break; - }; - - // Generate the visc createNode intrinsic, using the args vector as parameter - Function* CreateNodeF = Intrinsic::getDeclaration(module, createNodeXD); - DEBUG(errs() << "Function chosen:\n" << *CreateNodeF << "\n"); - CallInst *CreateNodeCall = CallInst::Create(CreateNodeF, args, ChildNodeF->getName()+".node", RI); - DEBUG(errs() << "Generate call: " << *CreateNodeCall << "\n"); - - // Generate Bind intrinsics - Function* bindInputF = Intrinsic::getDeclaration(module, Intrinsic::visc_bind_input); - DEBUG(errs() << "Generating input binding:\n" << *bindInputF << "\n"); - for(unsigned i=0; i < ChildNodeF->arg_size(); i++) { - std::vector<Value*> bindArgs; - bindArgs.push_back(CreateNodeCall); - bindArgs.push_back(ConstantInt::get(Type::getInt32Ty(module->getContext()), i)); - bindArgs.push_back(ConstantInt::get(Type::getInt32Ty(module->getContext()), i)); - bindArgs.push_back(ConstantInt::getFalse(module->getContext())); - CallInst* bindInputCall = CallInst::Create(bindInputF, bindArgs, "", RI); - DEBUG(errs() << *bindInputCall << "\n"); - } - - // Print the generated internal node for debugging - DEBUG(errs() << "Generated Function:\n" << *InternalF << "\n"); - - return InternalF; -} - -// Change the OpenCL query function calls with visc intrinsics in function F. -static void replaceOpenCLCallsWithVISCIntrinsics(Function *F) { - Module* module = F->getParent(); - std::vector<CallInst *> IItoRemove; - - // Get first instruction - inst_iterator i = inst_begin(F); - Instruction *FI = &(*i); - - // Insert getNode intrinsic - Intrinsic::ID getNodeID = Intrinsic::visc_getNode; - Function* GetNodeF = Intrinsic::getDeclaration(module, getNodeID); - std::vector<Value*> args; - CallInst *GetNodeCall = CallInst::Create(GetNodeF, args, F->getName()+".node", FI); - DEBUG(errs() << "Generate getNode intrinsic: " << *GetNodeCall << "\n"); - - // Insert getParentNode intrinsic - Intrinsic::ID getParentNodeID = Intrinsic::visc_getParentNode; - Function* GetParentNodeF = Intrinsic::getDeclaration(module, getParentNodeID); - args.push_back(GetNodeCall); - CallInst *GetParentNodeCall = CallInst::Create(GetParentNodeF, args, F->getName()+".parentNode", FI); - DEBUG(errs() << "Generate getParentNode intrinsic: " << *GetParentNodeCall << "\n"); - - // Iterate through all instructions - for (inst_iterator i = inst_begin(F), e = inst_end(F); i != e; ++i) { - Instruction *I = &(*i); - CallInst *CI; - - // Find OpenCL function calls - if ((CI = dyn_cast<CallInst>(I))) { - if ((CI->getCalledValue()->stripPointerCasts()->getName()).equals("get_global_id")) { - DEBUG(errs() << "Found get_global_id call: " << *CI << "\n"); - CallSite OpenCLCallSite(CI); - Value *arg0 = OpenCLCallSite.getArgument(0); - // Find the intrinsic function to be called - unsigned dim = getNumericValue(arg0); - Intrinsic::ID getNodeInstanceID; - Intrinsic::ID getNumNodeInstancesID; - switch (dim) { - case 0: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_x; - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_x; - break; - case 1: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_y; - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_y; - break; - case 2: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_z; - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_z; - break; - default: - assert(false && "Invalid dimension from valid OpenCL source!"); - break; - } - - - // Creating getNodeInstanceID intrinsic for parent node - ArrayRef<Value *> Args0(GetParentNodeCall); - Function* GetNodeInstanceIDF = Intrinsic::getDeclaration(module, getNodeInstanceID); - CallInst* ParentIDIntrinsic = CallInst::Create(GetNodeInstanceIDF, Args0, "", CI); - - // Creating getNumNodeInstances intrinsic for this node - ArrayRef<Value *> Args1(GetNodeCall); - Function* GetNumNodeInstancesF = Intrinsic::getDeclaration(module, getNumNodeInstancesID); - CallInst* InstancesIntrinsic = CallInst::Create(GetNumNodeInstancesF, Args1, "", CI); - // Creating mul instruction - BinaryOperator* MulInst = BinaryOperator::Create(Instruction::Mul, - ParentIDIntrinsic, - InstancesIntrinsic, - "", CI); - // Creating getNodeInstanceID intrinsic for this node - CallInst* LocalIDIntrinsic = CallInst::Create(GetNodeInstanceIDF, Args1, "", CI); - // Creating add instruction - BinaryOperator* AddInst = BinaryOperator::Create(Instruction::Add, - MulInst, - LocalIDIntrinsic, - "", CI); - CI->replaceAllUsesWith(AddInst); - IItoRemove.push_back(CI); - } - if ((CI->getCalledValue()->stripPointerCasts()->getName()).equals("get_local_id")) { - DEBUG(errs() << "Found get_local_id call: " << *CI << "\n"); - // Value *arg0 = CI->getOperand(0); - CallSite OpenCLCallSite(CI); - Value *arg0 = OpenCLCallSite.getArgument(0); - - // Argument of the function to be called - ArrayRef<Value *> Args(GetNodeCall); - - // Find the intrinsic function to be called - unsigned dim = getNumericValue(arg0); - Intrinsic::ID getNodeInstanceID; - switch (dim) { - case 0: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_x; - break; - case 1: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_y; - break; - case 2: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_z; - break; - default: - assert(false && "Invalid dimension from valid OpenCL source!"); - break; - } - Function* GetNodeInstanceIDF = Intrinsic::getDeclaration(module, getNodeInstanceID); - CallInst* VI = CallInst::Create(GetNodeInstanceIDF, Args, "", CI); - CI->replaceAllUsesWith(VI); - IItoRemove.push_back(CI); - } - if ((CI->getCalledValue()->stripPointerCasts()->getName()).equals("get_group_id")) { - DEBUG(errs() << "Found get_group_id call: " << *CI << "\n"); - // Value *arg0 = CI->getOperand(0); - CallSite OpenCLCallSite(CI); - Value *arg0 = OpenCLCallSite.getArgument(0); - - // Argument of the function to be called - ArrayRef<Value *> Args(GetParentNodeCall); - - // Find the intrinsic function to be called - unsigned dim = getNumericValue(arg0); - Intrinsic::ID getNodeInstanceID; - switch (dim) { - case 0: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_x; - break; - case 1: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_y; - break; - case 2: - getNodeInstanceID = Intrinsic::visc_getNodeInstanceID_z; - break; - default: - assert(false && "Invalid dimension from valid OpenCL source!"); - break; - } - Function* GetNodeInstanceIDF = Intrinsic::getDeclaration(module, getNodeInstanceID); - CallInst* VI = CallInst::Create(GetNodeInstanceIDF, Args, "", CI); - CI->replaceAllUsesWith(VI); - IItoRemove.push_back(CI); - } - if ((CI->getCalledValue()->stripPointerCasts()->getName()).equals("get_global_size")) { - DEBUG(errs() << "Found get_global_size call: " << *CI << "\n"); - CallSite OpenCLCallSite(CI); - Value *arg0 = OpenCLCallSite.getArgument(0); - // Find the intrinsic function to be called - unsigned dim = getNumericValue(arg0); - Intrinsic::ID getNumNodeInstancesID; - switch (dim) { - case 0: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_x; - break; - case 1: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_y; - break; - case 2: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_z; - break; - default: - assert(false && "Invalid dimension from valid OpenCL source!"); - break; - } - - - // Creating getNumNodeInstances intrinsic for parent node - ArrayRef<Value *> Args0(GetParentNodeCall); - Function* GetNumNodeInstancesF = Intrinsic::getDeclaration(module, getNumNodeInstancesID); - CallInst* ParentInstancesIntrinsic = CallInst::Create(GetNumNodeInstancesF, Args0, "", CI); - // Creating getNumNodeInstances intrinsic for this node - ArrayRef<Value *> Args1(GetNodeCall); - CallInst* InstancesIntrinsic = CallInst::Create(GetNumNodeInstancesF, Args1, "", CI); - // Creating mul instruction - BinaryOperator* MulInst = BinaryOperator::Create(Instruction::Mul, - ParentInstancesIntrinsic, - InstancesIntrinsic, - "", CI); - CI->replaceAllUsesWith(MulInst); - IItoRemove.push_back(CI); - - } - if ((CI->getCalledValue()->stripPointerCasts()->getName()).equals("get_local_size")) { - DEBUG(errs() << "Found get_local_size call: " << *CI << "\n"); - CallSite OpenCLCallSite(CI); - Value *arg0 = OpenCLCallSite.getArgument(0); - - // Argument of the function to be called - ArrayRef<Value *> Args(GetNodeCall); - - // Find the intrinsic function to be called - unsigned dim = getNumericValue(arg0); - Intrinsic::ID getNumNodeInstancesID; - switch (dim) { - case 0: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_x; - break; - case 1: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_y; - break; - case 2: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_z; - break; - default: - assert(false && "Invalid dimension from valid OpenCL source!"); - break; - } - Function* GetNumNodeInstancesF = Intrinsic::getDeclaration(module, getNumNodeInstancesID); - CallInst* VI = CallInst::Create(GetNumNodeInstancesF, Args, "", CI); - CI->replaceAllUsesWith(VI); - IItoRemove.push_back(CI); - } - if ((CI->getCalledValue()->stripPointerCasts()->getName()).equals("get_num_groups")) { - DEBUG(errs() << "Found get_num_groups call: " << *CI << "\n"); - CallSite OpenCLCallSite(CI); - Value *arg0 = OpenCLCallSite.getArgument(0); - - // Argument of the function to be called - ArrayRef<Value *> Args(GetParentNodeCall); - - // Find the intrinsic function to be called - unsigned dim = getNumericValue(arg0); - Intrinsic::ID getNumNodeInstancesID; - switch (dim) { - case 0: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_x; - break; - case 1: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_y; - break; - case 2: - getNumNodeInstancesID = Intrinsic::visc_getNumNodeInstances_z; - break; - default: - assert(false && "Invalid dimension from valid OpenCL source!"); - break; - } - Function* GetNumNodeInstancesF = Intrinsic::getDeclaration(module, getNumNodeInstancesID); - CallInst* VI = CallInst::Create(GetNumNodeInstancesF, Args, "", CI); - CI->replaceAllUsesWith(VI); - IItoRemove.push_back(CI); - } - } - } - -//for (std::vector<CallInst *>::reverse_iterator ri = IItoRemove.rbegin(), - // re = IItoRemove.rend(); ri != re; ++ri) - for (CallInst *CI : reverse(IItoRemove)) - CI->eraseFromParent(); - -} - - // Public Functions of GenVISC pass bool GenVISC::runOnModule(Module &M) { errs() << "\nGENVISC PASS\n"; @@ -879,16 +338,7 @@ bool GenVISC::runOnModule(Module &M) { CallInst* CI = cast<CallInst>(I); LLVMContext& Ctx = CI->getContext(); - // If __visc__node call found, generate the test case - - if(isVISCCall_node(I)) { - errs() << "Found visc node call in Function: " << f->getName() << "\n"; - assert(CI->getNumArgOperands() >= 5 - && "__visc__node call should have atleast 5 arguments!"); - generateTest(CI); - // Place this call in the list of instructions to be erased. - toBeErased.push_back(CI); - } + if(isVISCCall_init(I)) { ReplaceCallWithIntrinsic(I, Intrinsic::visc_init, &toBeErased); } @@ -1343,197 +793,6 @@ Value* GenVISC::getStringPointer(const Twine& S, Instruction* IB, const Twine& N return SPtr; } - - -// Generate the test case using the dummy __visc__node call CI -// First parse the arguments to find the kernel function, num of levels, -// dimensions, arguments, inputs and outputs. Pass this information to genKernel -// and genInternalNode functions to generate the test case. -void GenVISC::generateTest(CallInst* CI) { - // Parse the dummy function call here - LLVMContext& Ctx = CI->getParent()->getContext(); - - unsigned offset = 1; // argument at offset 1 is the number of dimensions - // Find number of arguments - assert(CI->getNumArgOperands() > offset - && "Too few arguments for __visc__node call!"); - unsigned levels = getNumericValue(CI->getArgOperand(offset)); - errs() << "\tNum of levels = " << levels << "\n"; - - // Find number of dimensions - offset += 1; - assert(CI->getNumArgOperands() > offset - && "Too few arguments for __visc__node call!"); - unsigned numDims = getNumericValue(CI->getOperand(offset)); - errs() << "\tNum of dimensions = " << numDims << "\n"; - - - // Find number of arguments - offset += numDims*levels + 1; // skip the dimesnions - assert(CI->getNumArgOperands() > offset - && "Too few arguments for __visc__node call!"); - unsigned numArgs = getNumericValue(CI->getArgOperand(offset)); - errs() << "\tNum of kernel arguments = " << numArgs << "\n"; - - // Find number of outputs - offset += numArgs + 1; // skip the kernel arguments - assert(CI->getNumArgOperands() > offset - && "Too few arguments for __visc__node call!"); - unsigned numOutputs = getNumericValue(CI->getArgOperand(offset)); - errs() << "\tNum of kernel outputs = " << numOutputs << "\n"; - - // Find return struct type - assert(numOutputs == 0 && "Not handled case where number of outputs is non-zero!"); - // This is always zero. One should look at the number of struct elements of - // kernel function - StructType* RetTy = StructType::create(Ctx, None, "rtype"); - - Function* KernelF = genKernel(cast<Function>(CI->getArgOperand(0)->stripPointerCasts()), RetTy); - genHost(CI, KernelF, levels, numDims, numArgs, numOutputs, RetTy); -} - - - -// Make all the required changes to the kernel function. This would include -// changing the function signature by adding any extra arguments required. -// Changing the return type. Changing all the OpenCL query intrinsics with the -// visc intrinsics. -Function* GenVISC::genKernel(Function* KernelF, StructType* RetTy) { - // Make changes to kernel here - DEBUG(errs() << "Modifying Node Function: " << KernelF->getName() << "\n"); - - // Find dummy __visc__attribute call in this function and add visc attributes - // in/out to pointer arguments - for (inst_iterator i = inst_begin(KernelF), e = inst_end(KernelF); i != e; ++i) { - Instruction *I = &(*i); - if(isVISCCall_attributes(I)) { - handleVISCAttributes(KernelF, cast<CallInst>(I)); - //I->eraseFromParent(); - break; - } - } - - // Change arguments and types - // Create the argument type list with added argument types - //Function::ArgumentListType& argList = KernelF->getArgumentList(); - std::vector<Type*> argTypes; - // Insert an i32 argument after every pointer argument. However adding an - // argument does not change the attribute list of function and so the - // arguments need to be shifted accordingly. - //bool shiftAttr = false; - for(Function::arg_iterator ai = KernelF->arg_begin(), ae = KernelF->arg_end(); - ai != ae; ++ai) { - - argTypes.push_back(ai->getType()); - if(ai->getType()->isPointerTy()) { - // If it is a pointer argument, add an i64 type next - argTypes.push_back(Type::getInt64Ty(KernelF->getContext())); - } - - } - // Adding new arguments to the function argument list, would not change the - // function type. We need to change the type of this function to reflect the - // added arguments - FunctionType* newFT = FunctionType::get(RetTy, argTypes, KernelF->isVarArg()); - - // Change the function type - SmallVector<ReturnInst*, 8> Returns; - Function* newKernelF = cloneFunction(KernelF, newFT, true, &Returns); - DEBUG(errs() << *newKernelF << "\n"); - - // Replace ret void instruction with ret %RetTy undef - for(auto RI: Returns) { - DEBUG(errs() << "Found return inst: "<< *RI << "\n"); - ReturnInst* newRI = ReturnInst::Create(KernelF->getContext(), UndefValue::get(RetTy)); - ReplaceInstWithInst(RI, newRI); - } - - replaceNodeFunctionInIR(*KernelF->getParent(), KernelF, newKernelF); - // Replace opencl query intrinsics with visc query intrinsics - replaceOpenCLCallsWithVISCIntrinsics(newKernelF); - return newKernelF; -} - -// Generate the code replacing the dummy __visc__node call with visc launch -// intrinsic and also generate the internal nodes required at each level -// depending on the hierarchy of DFG needed. This would also involve marhsalling -// all the input arguments to the kernel function in memory. Replaceing CI with -// launch intrinsic, and all the dummy __visc__wait calls with the visc wait -// intrinsic. -void GenVISC::genHost(CallInst* CI, Function* KernelF, unsigned levels, unsigned numDims, unsigned numArgs, unsigned numOutputs, StructType* RetTy) { - // Make host code changes here - DEBUG(errs() << "Modifying Host code for __visc__node call site: " << *CI << "\n"); - DEBUG(errs() << "Kernel Function: " << KernelF->getName() << "\n"); - LLVMContext& Ctx = CI->getParent()->getContext(); - - // Create a root funtion which has this as internal node - Function* Root = genInternalNode(KernelF, levels, numArgs, numDims, 3, CI); - - // Add hint to compile root for CPU. This is always true. - addHint(Root, visc::CPU_TARGET); - - // Generate argument struct type (All arguments followed by return struct type) - std::vector<Type*> ArgList; - unsigned offset = numDims*levels + 2 + 1 + 1; - for(Function::arg_iterator ai=KernelF->arg_begin(), ae=KernelF->arg_end(); - ai!=ae; ai++) { - Type* Ty = ai->getType(); - ArgList.push_back(Ty); - } - // Add the dimesnions arguments - for(unsigned i=0; i<numDims*levels; i++) { -// ArgList.push_back(Type::getInt32Ty(Ctx)); - ArgList.push_back(Type::getInt64Ty(Ctx)); - } - ArgList.push_back(RetTy); - StructType* ArgStructTy = StructType::create(ArgList, "struct.arg", true); - DEBUG(errs() << *ArgStructTy << "\n"); - - switchToTimer(visc_TimerID_ARG_PACK, CI); - // Insert alloca inst for this argument struct type - AllocaInst* AI = new AllocaInst(ArgStructTy, 0, "in.addr", CI); - - // Marshall all input arguments and dimension arguments into argument struct - // type - marshallArguments(levels, numArgs, offset, numDims, 3, AI, CI, KernelF); - - // Type cast argument struct to i8* - CastInst* BI = BitCastInst::CreatePointerCast(AI, - Type::getInt8PtrTy(Ctx), - "args", - CI); - - switchToTimer(visc_TimerID_NONE, CI); - - // Bitcast Root function to i8* - Constant* Root_i8ptr = ConstantExpr::getPointerCast(Root, Type::getInt8PtrTy(Ctx)); - // Replace CI with launch call to a Root function - Function* LaunchF = Intrinsic::getDeclaration(Root->getParent(), Intrinsic::visc_launch); - DEBUG(errs() << "Intrinsic for launch: " << *LaunchF << "\n"); - - Value* LaunchInstArgs[] = {Root_i8ptr, BI, ConstantInt::getFalse(Ctx)}; - CallInst* LaunchInst = CallInst::Create(LaunchF, - ArrayRef<Value*>(LaunchInstArgs,3), - "graph"+Root->getName(), CI); - //ReplaceInstWithInst(LI, LaunchInst); - - DEBUG(errs() << *LaunchInst << "\n"); - // Add wait call - // Replace all wait instructions with visc wait intrinsic instructions - Function* WaitF = Intrinsic::getDeclaration(Root->getParent(), Intrinsic::visc_wait); - std::vector<CallInst*>* WaitList = getWaitList(CI); - for(unsigned i=0; i < WaitList->size(); ++i) { - CallInst* waitCall = WaitList->at(i); - CallInst* waitInst = CallInst::Create(WaitF, - ArrayRef<Value*>(LaunchInst), - "", CI); - DEBUG(errs() << *waitInst << "\n"); - waitCall->eraseFromParent(); - } - - // Get result (optional) -} - void GenVISC::initializeTimerSet(Instruction* InsertBefore) { Value* TimerSetAddr; StoreInst* SI; -- GitLab