blob: 1331cfc2ec4d21b8159ac780ba2d4af526181ad0 [file] [log] [blame]
//===- OCL20To12.cpp - Transform OCL 2.0 builtins to OCL 1.2 builtins -----===//
//
// The LLVM/SPIRV Translator
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
// Copyright (c) 2014 Advanced Micro Devices, Inc. All rights reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a
// copy of this software and associated documentation files (the "Software"),
// to deal with the Software without restriction, including without limitation
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
// and/or sell copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following conditions:
//
// Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimers.
// Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimers in the documentation
// and/or other materials provided with the distribution.
// Neither the names of Advanced Micro Devices, Inc., nor the names of its
// contributors may be used to endorse or promote products derived from this
// Software without specific prior written permission.
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS WITH
// THE SOFTWARE.
//
//===----------------------------------------------------------------------===//
//
// This file implements the transformation of OCL 2.0 builtins into OCL 1.2
// builtins.
//
//===----------------------------------------------------------------------===//
#define DEBUG_TYPE "ocl20to12"
#include "SPIRVInternal.h"
#include "OCLUtil.h"
#include "llvm/ADT/StringSwitch.h"
#include "llvm/IR/InstVisitor.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/Verifier.h"
#include "llvm/Pass.h"
#include "llvm/PassSupport.h"
#include "llvm/Support/Debug.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/raw_ostream.h"
using namespace llvm;
using namespace SPIRV;
using namespace OCLUtil;
namespace SPIRV {
/// Module pass that rewrites OCL 2.0 builtin calls into OCL 1.2 builtin calls.
///
/// The pass is both a ModulePass and an InstVisitor over itself: runOnModule
/// visits the module and visitCallInst receives the call instructions.
class OCL20To12 : public ModulePass, public InstVisitor<OCL20To12> {
public:
  /// Builds the pass and runs initializeOCL20To12Pass against the global
  /// pass registry.
  OCL20To12() : ModulePass(ID), M(nullptr), Ctx(nullptr) {
    initializeOCL20To12Pass(*PassRegistry::getPassRegistry());
  }

  /// Pass entry point. Marked `override` so the compiler rejects any drift
  /// from the ModulePass signature instead of silently hiding the base method.
  ///
  /// \param M module to transform.
  /// \returns false when the module is left alone because its OCL version is
  ///          at least CL20; true otherwise.
  bool runOnModule(Module &M) override;

  /// Visitor callback for call instructions; forwards calls to the
  /// atomic_work_item_fence builtin to visitCallAtomicWorkItemFence.
  virtual void visitCallInst(CallInst &CI);

  /// Transform atomic_work_item_fence to mem_fence.
  ///   atomic_work_item_fence(flag, relaxed, work_group) =>
  ///       mem_fence(flag)
  void visitCallAtomicWorkItemFence(CallInst *CI);

  /// Pass identifier handed to the ModulePass constructor.
  static char ID;

private:
  /// Module currently being processed; assigned at the start of runOnModule.
  Module *M;
  /// Context of the module in M; assigned in runOnModule before visiting.
  LLVMContext *Ctx;
};
// Out-of-class definition of the static pass identifier that the OCL20To12
// constructor passes to ModulePass.
char OCL20To12::ID = 0;
/// Runs the OCL 2.0 -> OCL 1.2 builtin rewrite over \p Module.
///
/// A module whose OCL version is at least CL20 is skipped and reported as
/// unchanged. Any other module is visited instruction by instruction, then
/// checked with the IR verifier; a verifier failure is only reported through
/// the debug stream and does not alter the return value.
///
/// \returns false if the module was skipped, true otherwise.
bool OCL20To12::runOnModule(Module &Module) {
  M = &Module;

  const bool AlreadyCL20OrNewer = getOCLVersion(M) >= kOCLVer::CL20;
  if (AlreadyCL20OrNewer)
    return false;

  Ctx = &M->getContext();
  visit(*M);
  DEBUG(dbgs() << "After OCL20To12:\n" << *M);

  // Gather verifier diagnostics in a string so they can be emitted in one go.
  std::string VerifierLog;
  raw_string_ostream VerifierOS(VerifierLog);
  const bool IsBroken = verifyModule(*M, &VerifierOS);
  if (IsBroken) {
    DEBUG(errs() << "Fails to verify module: " << VerifierOS.str());
  }

  return true;
}
/// Examines a single call instruction and hands it to the matching rewrite.
///
/// Calls without a directly known callee, and callees that oclIsBuiltin does
/// not recognise, are ignored. Of the recognised builtins only
/// atomic_work_item_fence is rewritten.
void OCL20To12::visitCallInst(CallInst &CI) {
  DEBUG(dbgs() << "[visistCallInst] " << CI << '\n');

  auto *Callee = CI.getCalledFunction();
  if (Callee == nullptr)
    return; // Nothing to inspect when the call has no direct callee.

  auto CalleeName = Callee->getName();
  std::string DemangledName;
  const bool IsOCLBuiltin = oclIsBuiltin(CalleeName, &DemangledName);
  if (!IsOCLBuiltin)
    return;

  DEBUG(dbgs() << "DemangledName = " << DemangledName.c_str() << '\n');

  if (DemangledName == kOCLBuiltinName::AtomicWorkItemFence)
    visitCallAtomicWorkItemFence(&CI);
}
/// Rewrites a call to atomic_work_item_fence into a call to mem_fence:
///   atomic_work_item_fence(flag, relaxed, work_group) => mem_fence(flag)
///
/// The literals of the call are read with getAtomicWorkItemFenceLiterals.
/// If the memory order or memory scope differs from the legacy values
/// (OCLLegacyAtomicMemOrder / OCLLegacyAtomicMemScope), a fatal error is
/// reported. Otherwise the argument list is cut down to the flag alone and
/// the callee's attribute set is passed along to mutateCallInstOCL.
///
/// \param CI the atomic_work_item_fence call; its called function is
///           dereferenced without a null check.
void OCL20To12::visitCallAtomicWorkItemFence(CallInst *CI) {
  const auto Literals = getAtomicWorkItemFenceLiterals(CI);

  const bool OrderIsLegacy = std::get<1>(Literals) == OCLLegacyAtomicMemOrder;
  const bool ScopeIsLegacy = std::get<2>(Literals) == OCLLegacyAtomicMemScope;
  if (!(OrderIsLegacy && ScopeIsLegacy))
    report_fatal_error("OCL 2.0 builtin atomic_work_item_fence used in 1.2",
                       false);

  AttributeSet Attrs = CI->getCalledFunction()->getAttributes();

  // Only the flag literal survives as an argument of the new call.
  const auto FenceFlag = std::get<0>(Literals);
  auto ToMemFence = [=](CallInst *, std::vector<Value *> &Args) {
    Args.resize(1);
    Args[0] = getInt32(M, FenceFlag);
    return kOCLBuiltinName::MemFence;
  };
  mutateCallInstOCL(M, CI, ToMemFence, &Attrs);
}
}
// Declares the pass to LLVM's pass infrastructure under the argument name
// "ocl20to12" with the description string below.
// NOTE(review): this macro presumably provides the initializeOCL20To12Pass
// function called from the OCL20To12 constructor, and the two trailing `false`
// arguments are presumably the "CFG only" and "is analysis" flags — confirm
// against llvm/PassSupport.h.
INITIALIZE_PASS(OCL20To12, "ocl20to12",
"Translate OCL 2.0 builtins to OCL 1.2 builtins", false, false)
/// Factory for the OCL 2.0 -> OCL 1.2 builtin rewriting pass.
///
/// \returns a heap-allocated OCL20To12 instance as a ModulePass pointer.
/// NOTE(review): ownership is presumably taken over by whichever pass manager
/// the result is added to — confirm at the call sites.
ModulePass *llvm::createOCL20To12() {
  ModulePass *Pass = new OCL20To12();
  return Pass;
}