//===-- PTXAsmPrinter.cpp - PTX LLVM assembly writer ----------------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This file contains a printer that converts from our internal representation // of machine-dependent LLVM code to PTX assembly language. // //===----------------------------------------------------------------------===// #define DEBUG_TYPE "ptx-asm-printer" #include "PTX.h" #include "PTXAsmPrinter.h" #include "PTXMachineFunctionInfo.h" #include "PTXParamManager.h" #include "PTXRegisterInfo.h" #include "PTXTargetMachine.h" #include "llvm/Argument.h" #include "llvm/DerivedTypes.h" #include "llvm/Function.h" #include "llvm/Module.h" #include "llvm/ADT/SmallString.h" #include "llvm/ADT/Twine.h" #include "llvm/Analysis/DebugInfo.h" #include "llvm/CodeGen/AsmPrinter.h" #include "llvm/CodeGen/MachineFrameInfo.h" #include "llvm/CodeGen/MachineInstr.h" #include "llvm/CodeGen/MachineRegisterInfo.h" #include "llvm/MC/MCContext.h" #include "llvm/MC/MCExpr.h" #include "llvm/MC/MCInst.h" #include "llvm/MC/MCStreamer.h" #include "llvm/MC/MCSymbol.h" #include "llvm/Target/Mangler.h" #include "llvm/Target/TargetLoweringObjectFile.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/Debug.h" #include "llvm/Support/ErrorHandling.h" #include "llvm/Support/MathExtras.h" #include "llvm/Support/Path.h" #include "llvm/Support/TargetRegistry.h" #include "llvm/Support/raw_ostream.h" using namespace llvm; static const char PARAM_PREFIX[] = "__param_"; static const char RETURN_PREFIX[] = "__ret_"; static const char *getRegisterTypeName(unsigned RegType) { switch (RegType) { default: llvm_unreachable("Unknown register type"); case PTXRegisterType::Pred: return ".pred"; case PTXRegisterType::B16: return ".b16"; case PTXRegisterType::B32: return ".b32"; case PTXRegisterType::B64: return ".b64"; case PTXRegisterType::F32: return ".f32"; case PTXRegisterType::F64: return ".f64"; } } static const char *getStateSpaceName(unsigned addressSpace) { switch (addressSpace) { default: llvm_unreachable("Unknown state space"); case PTXStateSpace::Global: return "global"; case PTXStateSpace::Constant: return "const"; case PTXStateSpace::Local: return "local"; case PTXStateSpace::Parameter: return "param"; case PTXStateSpace::Shared: return "shared"; } return NULL; } static const char *getTypeName(Type* type) { while (true) { switch (type->getTypeID()) { default: llvm_unreachable("Unknown type"); case Type::FloatTyID: return ".f32"; case Type::DoubleTyID: return ".f64"; case Type::IntegerTyID: switch (type->getPrimitiveSizeInBits()) { default: llvm_unreachable("Unknown integer bit-width"); case 16: return ".u16"; case 32: return ".u32"; case 64: return ".u64"; } case Type::ArrayTyID: case Type::PointerTyID: type = dyn_cast(type)->getElementType(); break; } } return NULL; } bool PTXAsmPrinter::doFinalization(Module &M) { // XXX Temproarily remove global variables so that doFinalization() will not // emit them again (global variables are emitted at beginning). Module::GlobalListType &global_list = M.getGlobalList(); int i, n = global_list.size(); GlobalVariable **gv_array = new GlobalVariable* [n]; // first, back-up GlobalVariable in gv_array i = 0; for (Module::global_iterator I = global_list.begin(), E = global_list.end(); I != E; ++I) gv_array[i++] = &*I; // second, empty global_list while (!global_list.empty()) global_list.remove(global_list.begin()); // call doFinalization bool ret = AsmPrinter::doFinalization(M); // now we restore global variables for (i = 0; i < n; i ++) global_list.insert(global_list.end(), gv_array[i]); delete[] gv_array; return ret; } void PTXAsmPrinter::EmitStartOfAsmFile(Module &M) { const PTXSubtarget& ST = TM.getSubtarget(); // Emit the PTX .version and .target attributes OutStreamer.EmitRawText(Twine("\t.version ") + ST.getPTXVersionString()); OutStreamer.EmitRawText(Twine("\t.target ") + ST.getTargetString() + (ST.supportsDouble() ? "" : ", map_f64_to_f32")); // .address_size directive is optional, but it must immediately follow // the .target directive if present within a module if (ST.supportsPTX23()) { const char *addrSize = ST.is64Bit() ? "64" : "32"; OutStreamer.EmitRawText(Twine("\t.address_size ") + addrSize); } OutStreamer.AddBlankLine(); // Define any .file directives DebugInfoFinder DbgFinder; DbgFinder.processModule(M); for (DebugInfoFinder::iterator I = DbgFinder.compile_unit_begin(), E = DbgFinder.compile_unit_end(); I != E; ++I) { DICompileUnit DIUnit(*I); StringRef FN = DIUnit.getFilename(); StringRef Dir = DIUnit.getDirectory(); GetOrCreateSourceID(FN, Dir); } OutStreamer.AddBlankLine(); // declare external functions for (Module::const_iterator i = M.begin(), e = M.end(); i != e; ++i) EmitFunctionDeclaration(i); // declare global variables for (Module::const_global_iterator i = M.global_begin(), e = M.global_end(); i != e; ++i) EmitVariableDeclaration(i); } void PTXAsmPrinter::EmitFunctionBodyStart() { OutStreamer.EmitRawText(Twine("{")); const PTXMachineFunctionInfo *MFI = MF->getInfo(); const PTXParamManager &PM = MFI->getParamManager(); // Print register definitions SmallString<128> regDefs; raw_svector_ostream os(regDefs); unsigned numRegs; // pred numRegs = MFI->countRegisters(PTXRegisterType::Pred, PTXRegisterSpace::Reg); if(numRegs > 0) os << "\t.reg .pred %p<" << numRegs << ">;\n"; // i16 numRegs = MFI->countRegisters(PTXRegisterType::B16, PTXRegisterSpace::Reg); if(numRegs > 0) os << "\t.reg .b16 %rh<" << numRegs << ">;\n"; // i32 numRegs = MFI->countRegisters(PTXRegisterType::B32, PTXRegisterSpace::Reg); if(numRegs > 0) os << "\t.reg .b32 %r<" << numRegs << ">;\n"; // i64 numRegs = MFI->countRegisters(PTXRegisterType::B64, PTXRegisterSpace::Reg); if(numRegs > 0) os << "\t.reg .b64 %rd<" << numRegs << ">;\n"; // f32 numRegs = MFI->countRegisters(PTXRegisterType::F32, PTXRegisterSpace::Reg); if(numRegs > 0) os << "\t.reg .f32 %f<" << numRegs << ">;\n"; // f64 numRegs = MFI->countRegisters(PTXRegisterType::F64, PTXRegisterSpace::Reg); if(numRegs > 0) os << "\t.reg .f64 %fd<" << numRegs << ">;\n"; // Local params for (PTXParamManager::param_iterator i = PM.local_begin(), e = PM.local_end(); i != e; ++i) os << "\t.param .b" << PM.getParamSize(*i) << ' ' << PM.getParamName(*i) << ";\n"; OutStreamer.EmitRawText(os.str()); const MachineFrameInfo* FrameInfo = MF->getFrameInfo(); DEBUG(dbgs() << "Have " << FrameInfo->getNumObjects() << " frame object(s)\n"); for (unsigned i = 0, e = FrameInfo->getNumObjects(); i != e; ++i) { DEBUG(dbgs() << "Size of object: " << FrameInfo->getObjectSize(i) << "\n"); if (FrameInfo->getObjectSize(i) > 0) { OutStreamer.EmitRawText("\t.local .align " + Twine(FrameInfo->getObjectAlignment(i)) + " .b8 __local" + Twine(i) + "[" + Twine(FrameInfo->getObjectSize(i)) + "];"); } } //unsigned Index = 1; // Print parameter passing params //for (PTXMachineFunctionInfo::param_iterator // i = MFI->paramBegin(), e = MFI->paramEnd(); i != e; ++i) { // std::string def = "\t.param .b"; // def += utostr(*i); // def += " __ret_"; // def += utostr(Index); // Index++; // def += ";"; // OutStreamer.EmitRawText(Twine(def)); //} } void PTXAsmPrinter::EmitFunctionBodyEnd() { OutStreamer.EmitRawText(Twine("}")); } void PTXAsmPrinter::EmitInstruction(const MachineInstr *MI) { MCInst TmpInst; LowerPTXMachineInstrToMCInst(MI, TmpInst, *this); OutStreamer.EmitInstruction(TmpInst); } void PTXAsmPrinter::EmitVariableDeclaration(const GlobalVariable *gv) { // Check to see if this is a special global used by LLVM, if so, emit it. if (EmitSpecialLLVMGlobal(gv)) return; MCSymbol *gvsym = Mang->getSymbol(gv); assert(gvsym->isUndefined() && "Cannot define a symbol twice!"); SmallString<128> decl; raw_svector_ostream os(decl); // check if it is defined in some other translation unit if (gv->isDeclaration()) os << ".extern "; // state space: e.g., .global os << '.' << getStateSpaceName(gv->getType()->getAddressSpace()) << ' '; // alignment (optional) unsigned alignment = gv->getAlignment(); if (alignment != 0) os << ".align " << gv->getAlignment() << ' '; if (PointerType::classof(gv->getType())) { PointerType* pointerTy = dyn_cast(gv->getType()); Type* elementTy = pointerTy->getElementType(); if (elementTy->isArrayTy()) { assert(elementTy->isArrayTy() && "Only pointers to arrays are supported"); ArrayType* arrayTy = dyn_cast(elementTy); elementTy = arrayTy->getElementType(); unsigned numElements = arrayTy->getNumElements(); while (elementTy->isArrayTy()) { arrayTy = dyn_cast(elementTy); elementTy = arrayTy->getElementType(); numElements *= arrayTy->getNumElements(); } // FIXME: isPrimitiveType() == false for i16? assert(elementTy->isSingleValueType() && "Non-primitive types are not handled"); // Find the size of the element in bits unsigned elementSize = elementTy->getPrimitiveSizeInBits(); os << ".b" << elementSize << ' ' << gvsym->getName() << '[' << numElements << ']'; } else { os << ".b8" << gvsym->getName() << "[]"; } // handle string constants (assume ConstantArray means string) if (gv->hasInitializer()) { const Constant *C = gv->getInitializer(); if (const ConstantArray *CA = dyn_cast(C)) { os << " = {"; for (unsigned i = 0, e = C->getNumOperands(); i != e; ++i) { if (i > 0) os << ','; os << "0x"; os.write_hex(cast(CA->getOperand(i))->getZExtValue()); } os << '}'; } } } else { // Note: this is currently the fall-through case and most likely generates // incorrect code. os << getTypeName(gv->getType()) << ' ' << gvsym->getName(); if (isa(gv->getType()) || isa(gv->getType())) os << "[]"; } os << ';'; OutStreamer.EmitRawText(os.str()); OutStreamer.AddBlankLine(); } void PTXAsmPrinter::EmitFunctionEntryLabel() { // The function label could have already been emitted if two symbols end up // conflicting due to asm renaming. Detect this and emit an error. if (!CurrentFnSym->isUndefined()) { report_fatal_error("'" + Twine(CurrentFnSym->getName()) + "' label emitted multiple times to assembly file"); return; } const PTXMachineFunctionInfo *MFI = MF->getInfo(); const PTXParamManager &PM = MFI->getParamManager(); const bool isKernel = MFI->isKernel(); const PTXSubtarget& ST = TM.getSubtarget(); SmallString<128> decl; raw_svector_ostream os(decl); os << (isKernel ? ".entry" : ".func"); if (!isKernel) { os << " ("; if (ST.useParamSpaceForDeviceArgs()) { for (PTXParamManager::param_iterator i = PM.ret_begin(), e = PM.ret_end(), b = i; i != e; ++i) { if (i != b) os << ", "; os << ".param .b" << PM.getParamSize(*i) << ' ' << PM.getParamName(*i); } } else { for (PTXMachineFunctionInfo::reg_iterator i = MFI->retreg_begin(), e = MFI->retreg_end(), b = i; i != e; ++i) { if (i != b) os << ", "; os << ".reg " << getRegisterTypeName(MFI->getRegisterType(*i)) << ' ' << MFI->getRegisterName(*i); } } os << ')'; } // Print function name os << ' ' << CurrentFnSym->getName() << " ("; const Function *F = MF->getFunction(); // Print parameters if (isKernel || ST.useParamSpaceForDeviceArgs()) { /*for (PTXParamManager::param_iterator i = PM.arg_begin(), e = PM.arg_end(), b = i; i != e; ++i) { if (i != b) os << ", "; os << ".param .b" << PM.getParamSize(*i) << ' ' << PM.getParamName(*i); }*/ int Counter = 1; for (Function::const_arg_iterator i = F->arg_begin(), e = F->arg_end(), b = i; i != e; ++i) { if (i != b) os << ", "; const Type *ArgType = (*i).getType(); os << ".param .b"; if (ArgType->isPointerTy()) { if (ST.is64Bit()) os << "64"; else os << "32"; } else { os << ArgType->getPrimitiveSizeInBits(); } if (ArgType->isPointerTy() && ST.emitPtrAttribute()) { const PointerType *PtrType = dyn_cast(ArgType); os << " .ptr"; switch (PtrType->getAddressSpace()) { default: llvm_unreachable("Unknown address space in argument"); case PTXStateSpace::Global: os << " .global"; break; case PTXStateSpace::Shared: os << " .shared"; break; } } os << " __param_" << Counter++; } } else { for (PTXMachineFunctionInfo::reg_iterator i = MFI->argreg_begin(), e = MFI->argreg_end(), b = i; i != e; ++i) { if (i != b) os << ", "; os << ".reg " << getRegisterTypeName(MFI->getRegisterType(*i)) << ' ' << MFI->getRegisterName(*i); } } os << ')'; OutStreamer.EmitRawText(os.str()); } void PTXAsmPrinter::EmitFunctionDeclaration(const Function* func) { const PTXSubtarget& ST = TM.getSubtarget(); std::string decl = ""; // hard-coded emission of extern vprintf function if (func->getName() == "printf" || func->getName() == "puts") { decl += ".extern .func (.param .b32 __param_1) vprintf (.param .b"; if (ST.is64Bit()) decl += "64"; else decl += "32"; decl += " __param_2, .param .b"; if (ST.is64Bit()) decl += "64"; else decl += "32"; decl += " __param_3)\n"; } OutStreamer.EmitRawText(Twine(decl)); } unsigned PTXAsmPrinter::GetOrCreateSourceID(StringRef FileName, StringRef DirName) { // If FE did not provide a file name, then assume stdin. if (FileName.empty()) return GetOrCreateSourceID("", StringRef()); // MCStream expects full path name as filename. if (!DirName.empty() && !sys::path::is_absolute(FileName)) { SmallString<128> FullPathName = DirName; sys::path::append(FullPathName, FileName); // Here FullPathName will be copied into StringMap by GetOrCreateSourceID. return GetOrCreateSourceID(StringRef(FullPathName), StringRef()); } StringMapEntry &Entry = SourceIdMap.GetOrCreateValue(FileName); if (Entry.getValue()) return Entry.getValue(); unsigned SrcId = SourceIdMap.size(); Entry.setValue(SrcId); // Print out a .file directive to specify files for .loc directives. OutStreamer.EmitDwarfFileDirective(SrcId, "", Entry.getKey()); return SrcId; } MCOperand PTXAsmPrinter::GetSymbolRef(const MachineOperand &MO, const MCSymbol *Symbol) { const MCExpr *Expr; Expr = MCSymbolRefExpr::Create(Symbol, MCSymbolRefExpr::VK_None, OutContext); return MCOperand::CreateExpr(Expr); } MCOperand PTXAsmPrinter::lowerOperand(const MachineOperand &MO) { MCOperand MCOp; const PTXMachineFunctionInfo *MFI = MF->getInfo(); unsigned EncodedReg; switch (MO.getType()) { default: llvm_unreachable("Unknown operand type"); case MachineOperand::MO_Register: if (MO.getReg() > 0) { // Encode the register EncodedReg = MFI->getEncodedRegister(MO.getReg()); } else { EncodedReg = 0; } MCOp = MCOperand::CreateReg(EncodedReg); break; case MachineOperand::MO_Immediate: MCOp = MCOperand::CreateImm(MO.getImm()); break; case MachineOperand::MO_MachineBasicBlock: MCOp = MCOperand::CreateExpr(MCSymbolRefExpr::Create( MO.getMBB()->getSymbol(), OutContext)); break; case MachineOperand::MO_GlobalAddress: MCOp = GetSymbolRef(MO, Mang->getSymbol(MO.getGlobal())); break; case MachineOperand::MO_ExternalSymbol: MCOp = GetSymbolRef(MO, GetExternalSymbolSymbol(MO.getSymbolName())); break; case MachineOperand::MO_FPImmediate: APFloat Val = MO.getFPImm()->getValueAPF(); bool ignored; Val.convert(APFloat::IEEEdouble, APFloat::rmTowardZero, &ignored); MCOp = MCOperand::CreateFPImm(Val.convertToDouble()); break; } return MCOp; } // Force static initialization. extern "C" void LLVMInitializePTXAsmPrinter() { RegisterAsmPrinter X(ThePTX32Target); RegisterAsmPrinter Y(ThePTX64Target); }