140 lines
4.6 KiB
C++
140 lines
4.6 KiB
C++
//===- OCL20To12.cpp - Transform OCL 2.0 builtins to OCL 1.2 builtins -----===//
|
|
//
|
|
// The LLVM/SPIRV Translator
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
// Copyright (c) 2014 Advanced Micro Devices, Inc. All rights reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a
|
|
// copy of this software and associated documentation files (the "Software"),
|
|
// to deal with the Software without restriction, including without limitation
|
|
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
// and/or sell copies of the Software, and to permit persons to whom the
|
|
// Software is furnished to do so, subject to the following conditions:
|
|
//
|
|
// Redistributions of source code must retain the above copyright notice,
|
|
// this list of conditions and the following disclaimers.
|
|
// Redistributions in binary form must reproduce the above copyright notice,
|
|
// this list of conditions and the following disclaimers in the documentation
|
|
// and/or other materials provided with the distribution.
|
|
// Neither the names of Advanced Micro Devices, Inc., nor the names of its
|
|
// contributors may be used to endorse or promote products derived from this
|
|
// Software without specific prior written permission.
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS WITH
|
|
// THE SOFTWARE.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file implements transform OCL 2.0 builtins to OCL 1.2 builtins.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
#define DEBUG_TYPE "ocl20to12"
|
|
|
|
#include "SPIRVInternal.h"
|
|
#include "OCLUtil.h"
|
|
#include "llvm/ADT/StringSwitch.h"
|
|
#include "llvm/IR/InstVisitor.h"
|
|
#include "llvm/IR/Instructions.h"
|
|
#include "llvm/IR/IRBuilder.h"
|
|
#include "llvm/IR/Verifier.h"
|
|
#include "llvm/Pass.h"
|
|
#include "llvm/PassSupport.h"
|
|
#include "llvm/Support/Debug.h"
|
|
#include "llvm/Support/ErrorHandling.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
|
|
using namespace llvm;
|
|
using namespace SPIRV;
|
|
using namespace OCLUtil;
|
|
|
|
namespace SPIRV {
|
|
class OCL20To12: public ModulePass,
|
|
public InstVisitor<OCL20To12> {
|
|
public:
|
|
OCL20To12():ModulePass(ID), M(nullptr), Ctx(nullptr) {
|
|
initializeOCL20To12Pass(*PassRegistry::getPassRegistry());
|
|
}
|
|
virtual bool runOnModule(Module &M);
|
|
virtual void visitCallInst(CallInst &CI);
|
|
|
|
/// Transform atomic_work_item_fence to mem_fence.
|
|
/// atomic_work_item_fence(flag, relaxed, work_group) =>
|
|
/// mem_fence(flag)
|
|
void visitCallAtomicWorkItemFence(CallInst *CI);
|
|
|
|
static char ID;
|
|
private:
|
|
Module *M;
|
|
LLVMContext *Ctx;
|
|
};
|
|
|
|
char OCL20To12::ID = 0;
|
|
|
|
bool
|
|
OCL20To12::runOnModule(Module& Module) {
|
|
M = &Module;
|
|
if (getOCLVersion(M) >= kOCLVer::CL20)
|
|
return false;
|
|
|
|
Ctx = &M->getContext();
|
|
visit(*M);
|
|
|
|
DEBUG(dbgs() << "After OCL20To12:\n" << *M);
|
|
|
|
std::string Err;
|
|
raw_string_ostream ErrorOS(Err);
|
|
if (verifyModule(*M, &ErrorOS)){
|
|
DEBUG(errs() << "Fails to verify module: " << ErrorOS.str());
|
|
}
|
|
return true;
|
|
}
|
|
|
|
void
|
|
OCL20To12::visitCallInst(CallInst& CI) {
|
|
DEBUG(dbgs() << "[visistCallInst] " << CI << '\n');
|
|
auto F = CI.getCalledFunction();
|
|
if (!F)
|
|
return;
|
|
|
|
auto MangledName = F->getName();
|
|
std::string DemangledName;
|
|
if (!oclIsBuiltin(MangledName, &DemangledName))
|
|
return;
|
|
DEBUG(dbgs() << "DemangledName = " << DemangledName.c_str() << '\n');
|
|
|
|
if (DemangledName == kOCLBuiltinName::AtomicWorkItemFence) {
|
|
visitCallAtomicWorkItemFence(&CI);
|
|
return;
|
|
}
|
|
}
|
|
|
|
void OCL20To12::visitCallAtomicWorkItemFence(CallInst* CI) {
|
|
auto Lit = getAtomicWorkItemFenceLiterals(CI);
|
|
if (std::get<1>(Lit) != OCLLegacyAtomicMemOrder ||
|
|
std::get<2>(Lit) != OCLLegacyAtomicMemScope)
|
|
report_fatal_error("OCL 2.0 builtin atomic_work_item_fence used in 1.2",
|
|
false);
|
|
|
|
AttributeSet Attrs = CI->getCalledFunction()->getAttributes();
|
|
mutateCallInstOCL(M, CI, [=](CallInst *, std::vector<Value *> &Args){
|
|
Args.resize(1);
|
|
Args[0] = getInt32(M, std::get<0>(Lit));
|
|
return kOCLBuiltinName::MemFence;
|
|
}, &Attrs);
|
|
}
|
|
|
|
}
|
|
|
|
INITIALIZE_PASS(OCL20To12, "ocl20to12",
|
|
"Translate OCL 2.0 builtins to OCL 1.2 builtins", false, false)
|
|
|
|
ModulePass *llvm::createOCL20To12() {
|
|
return new OCL20To12();
|
|
}
|