C++程序  |  141行  |  4.63 KB

//===- OCL20To12.cpp - Transform OCL 2.0 builtins to OCL 1.2 builtins -----===//
//
//                     The LLVM/SPIRV Translator
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
// Copyright (c) 2014 Advanced Micro Devices, Inc. All rights reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a
// copy of this software and associated documentation files (the "Software"),
// to deal with the Software without restriction, including without limitation
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
// and/or sell copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following conditions:
//
// Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimers.
// Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimers in the documentation
// and/or other materials provided with the distribution.
// Neither the names of Advanced Micro Devices, Inc., nor the names of its
// contributors may be used to endorse or promote products derived from this
// Software without specific prior written permission.
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS WITH
// THE SOFTWARE.
//
//===----------------------------------------------------------------------===//
//
// This file implements transform OCL 2.0 builtins to OCL 1.2 builtins.
//
//===----------------------------------------------------------------------===//
#define DEBUG_TYPE "ocl20to12"

#include "SPIRVInternal.h"
#include "OCLUtil.h"
#include "llvm/ADT/StringSwitch.h"
#include "llvm/IR/InstVisitor.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/Verifier.h"
#include "llvm/Pass.h"
#include "llvm/PassSupport.h"
#include "llvm/Support/Debug.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/raw_ostream.h"

using namespace llvm;
using namespace SPIRV;
using namespace OCLUtil;

namespace SPIRV {
class OCL20To12: public ModulePass,
  public InstVisitor<OCL20To12> {
public:
  OCL20To12():ModulePass(ID), M(nullptr), Ctx(nullptr) {
    initializeOCL20To12Pass(*PassRegistry::getPassRegistry());
  }
  virtual bool runOnModule(Module &M);
  virtual void visitCallInst(CallInst &CI);

  /// Transform atomic_work_item_fence to mem_fence.
  ///   atomic_work_item_fence(flag, relaxed, work_group) =>
  ///       mem_fence(flag)
  void visitCallAtomicWorkItemFence(CallInst *CI);

  static char ID;
private:
  Module *M;
  LLVMContext *Ctx;
};

char OCL20To12::ID = 0;

bool
OCL20To12::runOnModule(Module& Module) {
  M = &Module;
  if (getOCLVersion(M) >= kOCLVer::CL20)
    return false;

  Ctx = &M->getContext();
  visit(*M);

  DEBUG(dbgs() << "After OCL20To12:\n" << *M);

  std::string Err;
  raw_string_ostream ErrorOS(Err);
  if (verifyModule(*M, &ErrorOS)){
    DEBUG(errs() << "Fails to verify module: " << ErrorOS.str());
  }
  return true;
}

void
OCL20To12::visitCallInst(CallInst& CI) {
  DEBUG(dbgs() << "[visistCallInst] " << CI << '\n');
  auto F = CI.getCalledFunction();
  if (!F)
    return;

  auto MangledName = F->getName();
  std::string DemangledName;
  if (!oclIsBuiltin(MangledName, &DemangledName))
    return;
  DEBUG(dbgs() << "DemangledName = " << DemangledName.c_str() << '\n');

  if (DemangledName == kOCLBuiltinName::AtomicWorkItemFence) {
    visitCallAtomicWorkItemFence(&CI);
    return;
  }
}

void OCL20To12::visitCallAtomicWorkItemFence(CallInst* CI) {
  auto Lit = getAtomicWorkItemFenceLiterals(CI);
  if (std::get<1>(Lit) != OCLLegacyAtomicMemOrder ||
      std::get<2>(Lit) != OCLLegacyAtomicMemScope)
    report_fatal_error("OCL 2.0 builtin atomic_work_item_fence used in 1.2",
        false);

  AttributeSet Attrs = CI->getCalledFunction()->getAttributes();
  mutateCallInstOCL(M, CI, [=](CallInst *, std::vector<Value *> &Args){
    Args.resize(1);
    Args[0] = getInt32(M, std::get<0>(Lit));
    return kOCLBuiltinName::MemFence;
  }, &Attrs);
}

}

INITIALIZE_PASS(OCL20To12, "ocl20to12",
    "Translate OCL 2.0 builtins to OCL 1.2 builtins", false, false)

ModulePass *llvm::createOCL20To12() {
  return new OCL20To12();
}