all of the features in the current working draft of the upcoming C++ standard, provisionally named C++1y. The code generator's performance is greatly increased, and the loop auto-vectorizer is now enabled at -Os and -O2 in addition to -O3. The PowerPC backend has made several major improvements to code generation quality and compile time, and the X86, SPARC, ARM32, AArch64 and SystemZ backends have all seen major feature work. Release notes for llvm and clang can be found here: <http://llvm.org/releases/3.4/docs/ReleaseNotes.html> <http://llvm.org/releases/3.4/tools/clang/docs/ReleaseNotes.html> MFC after: 1 month
56 lines
1.8 KiB
C++
56 lines
1.8 KiB
C++
//===----- CGCUDARuntime.cpp - Interface to CUDA Runtimes -----------------===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This provides an abstract class for CUDA code generation. Concrete
|
|
// subclasses of this implement code generation for specific CUDA
|
|
// runtime libraries.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "CGCUDARuntime.h"
|
|
#include "CGCall.h"
|
|
#include "CodeGenFunction.h"
|
|
#include "clang/AST/Decl.h"
|
|
#include "clang/AST/ExprCXX.h"
|
|
|
|
using namespace clang;
|
|
using namespace CodeGen;
|
|
|
|
// Out-of-line destructor definition; it performs no work of its own.
CGCUDARuntime::~CGCUDARuntime() {
}
|
|
|
|
/// Emit the code for a CUDA kernel call expression.
///
/// The launch configuration expression (E->getConfig()) is emitted as a
/// conditional branch whose two targets are "kcall.end" and
/// "kcall.configok", passed in that order. The call to the kernel itself is
/// emitted inside "kcall.configok", which then branches to "kcall.end".
///
/// \param CGF          The function code generator used for all emission.
/// \param E            The kernel call expression being lowered.
/// \param ReturnValue  Return slot forwarded unchanged to EmitCall.
/// \returns Always RValue::get(0); the result of the emitted call is not
///          propagated to the caller.
RValue CGCUDARuntime::EmitCUDAKernelCallExpr(CodeGenFunction &CGF,
                                             const CUDAKernelCallExpr *E,
                                             ReturnValueSlot ReturnValue) {
  // Find the declaration being called when the callee is an implicit cast
  // directly wrapping a DeclRefExpr; in every other case it stays null.
  // This only inspects the AST, so it is done before any IR is emitted.
  const Decl *KernelDecl = 0;
  const ImplicitCastExpr *Cast = dyn_cast<ImplicitCastExpr>(E->getCallee());
  if (Cast)
    if (const DeclRefExpr *Ref = dyn_cast<DeclRefExpr>(Cast->getSubExpr()))
      KernelDecl = Ref->getDecl();

  llvm::BasicBlock *LaunchBB = CGF.createBasicBlock("kcall.configok");
  llvm::BasicBlock *EndBB = CGF.createBasicBlock("kcall.end");

  // NOTE(review): the end block is passed first and the launch block second,
  // so presumably a true configuration result skips the launch -- confirm
  // against EmitBranchOnBoolExpr's (true, false) parameter order.
  CodeGenFunction::ConditionalEvaluation CondEval(CGF);
  CGF.EmitBranchOnBoolExpr(E->getConfig(), EndBB, LaunchBB);

  // Everything emitted between begin() and end() is conditionally evaluated.
  CondEval.begin(CGF);
  CGF.EmitBlock(LaunchBB);

  llvm::Value *KernelFn = CGF.EmitScalarExpr(E->getCallee());
  CGF.EmitCall(E->getCallee()->getType(), KernelFn, E->getLocStart(),
               ReturnValue, E->arg_begin(), E->arg_end(), KernelDecl);
  CGF.EmitBranch(EndBB);

  CGF.EmitBlock(EndBB);
  CondEval.end(CGF);

  return RValue::get(0);
}
|