| //===-- PTXAsmPrinter.cpp - PTX LLVM assembly writer ----------------------===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file contains a printer that converts from our internal representation |
| // of machine-dependent LLVM code to PTX assembly language. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #define DEBUG_TYPE "ptx-asm-printer" |
| |
| #include "PTX.h" |
| #include "PTXAsmPrinter.h" |
| #include "PTXMachineFunctionInfo.h" |
| #include "PTXParamManager.h" |
| #include "PTXRegisterInfo.h" |
| #include "PTXTargetMachine.h" |
| #include "llvm/Argument.h" |
| #include "llvm/DerivedTypes.h" |
| #include "llvm/Function.h" |
| #include "llvm/Module.h" |
| #include "llvm/ADT/SmallString.h" |
| #include "llvm/ADT/StringExtras.h" |
| #include "llvm/ADT/Twine.h" |
| #include "llvm/Analysis/DebugInfo.h" |
| #include "llvm/CodeGen/AsmPrinter.h" |
| #include "llvm/CodeGen/MachineFrameInfo.h" |
| #include "llvm/CodeGen/MachineInstr.h" |
| #include "llvm/CodeGen/MachineRegisterInfo.h" |
| #include "llvm/MC/MCContext.h" |
| #include "llvm/MC/MCExpr.h" |
| #include "llvm/MC/MCInst.h" |
| #include "llvm/MC/MCStreamer.h" |
| #include "llvm/MC/MCSymbol.h" |
| #include "llvm/Target/Mangler.h" |
| #include "llvm/Target/TargetLoweringObjectFile.h" |
| #include "llvm/Support/CommandLine.h" |
| #include "llvm/Support/Debug.h" |
| #include "llvm/Support/ErrorHandling.h" |
| #include "llvm/Support/MathExtras.h" |
| #include "llvm/Support/Path.h" |
| #include "llvm/Support/TargetRegistry.h" |
| #include "llvm/Support/raw_ostream.h" |
| |
| using namespace llvm; |
| |
| static const char PARAM_PREFIX[] = "__param_"; |
| static const char RETURN_PREFIX[] = "__ret_"; |
| |
| static const char *getRegisterTypeName(unsigned RegNo, |
| const MachineRegisterInfo& MRI) { |
| const TargetRegisterClass *TRC = MRI.getRegClass(RegNo); |
| |
| #define TEST_REGCLS(cls, clsstr) \ |
| if (PTX::cls ## RegisterClass == TRC) return # clsstr; |
| |
| TEST_REGCLS(RegPred, pred); |
| TEST_REGCLS(RegI16, b16); |
| TEST_REGCLS(RegI32, b32); |
| TEST_REGCLS(RegI64, b64); |
| TEST_REGCLS(RegF32, b32); |
| TEST_REGCLS(RegF64, b64); |
| #undef TEST_REGCLS |
| |
| llvm_unreachable("Not in any register class!"); |
| return NULL; |
| } |
| |
| static const char *getStateSpaceName(unsigned addressSpace) { |
| switch (addressSpace) { |
| default: llvm_unreachable("Unknown state space"); |
| case PTXStateSpace::Global: return "global"; |
| case PTXStateSpace::Constant: return "const"; |
| case PTXStateSpace::Local: return "local"; |
| case PTXStateSpace::Parameter: return "param"; |
| case PTXStateSpace::Shared: return "shared"; |
| } |
| return NULL; |
| } |
| |
| static const char *getTypeName(Type* type) { |
| while (true) { |
| switch (type->getTypeID()) { |
| default: llvm_unreachable("Unknown type"); |
| case Type::FloatTyID: return ".f32"; |
| case Type::DoubleTyID: return ".f64"; |
| case Type::IntegerTyID: |
| switch (type->getPrimitiveSizeInBits()) { |
| default: llvm_unreachable("Unknown integer bit-width"); |
| case 16: return ".u16"; |
| case 32: return ".u32"; |
| case 64: return ".u64"; |
| } |
| case Type::ArrayTyID: |
| case Type::PointerTyID: |
| type = dyn_cast<SequentialType>(type)->getElementType(); |
| break; |
| } |
| } |
| return NULL; |
| } |
| |
| bool PTXAsmPrinter::doFinalization(Module &M) { |
| // XXX Temproarily remove global variables so that doFinalization() will not |
| // emit them again (global variables are emitted at beginning). |
| |
| Module::GlobalListType &global_list = M.getGlobalList(); |
| int i, n = global_list.size(); |
| GlobalVariable **gv_array = new GlobalVariable* [n]; |
| |
| // first, back-up GlobalVariable in gv_array |
| i = 0; |
| for (Module::global_iterator I = global_list.begin(), E = global_list.end(); |
| I != E; ++I) |
| gv_array[i++] = &*I; |
| |
| // second, empty global_list |
| while (!global_list.empty()) |
| global_list.remove(global_list.begin()); |
| |
| // call doFinalization |
| bool ret = AsmPrinter::doFinalization(M); |
| |
| // now we restore global variables |
| for (i = 0; i < n; i ++) |
| global_list.insert(global_list.end(), gv_array[i]); |
| |
| delete[] gv_array; |
| return ret; |
| } |
| |
| void PTXAsmPrinter::EmitStartOfAsmFile(Module &M) |
| { |
| const PTXSubtarget& ST = TM.getSubtarget<PTXSubtarget>(); |
| |
| // Emit the PTX .version and .target attributes |
| OutStreamer.EmitRawText(Twine("\t.version " + ST.getPTXVersionString())); |
| OutStreamer.EmitRawText(Twine("\t.target " + ST.getTargetString() + |
| (ST.supportsDouble() ? "" |
| : ", map_f64_to_f32"))); |
| // .address_size directive is optional, but it must immediately follow |
| // the .target directive if present within a module |
| if (ST.supportsPTX23()) { |
| std::string addrSize = ST.is64Bit() ? "64" : "32"; |
| OutStreamer.EmitRawText(Twine("\t.address_size " + addrSize)); |
| } |
| |
| OutStreamer.AddBlankLine(); |
| |
| // Define any .file directives |
| DebugInfoFinder DbgFinder; |
| DbgFinder.processModule(M); |
| |
| for (DebugInfoFinder::iterator I = DbgFinder.compile_unit_begin(), |
| E = DbgFinder.compile_unit_end(); I != E; ++I) { |
| DICompileUnit DIUnit(*I); |
| StringRef FN = DIUnit.getFilename(); |
| StringRef Dir = DIUnit.getDirectory(); |
| GetOrCreateSourceID(FN, Dir); |
| } |
| |
| OutStreamer.AddBlankLine(); |
| |
| // declare global variables |
| for (Module::const_global_iterator i = M.global_begin(), e = M.global_end(); |
| i != e; ++i) |
| EmitVariableDeclaration(i); |
| } |
| |
| void PTXAsmPrinter::EmitFunctionBodyStart() { |
| OutStreamer.EmitRawText(Twine("{")); |
| |
| const PTXMachineFunctionInfo *MFI = MF->getInfo<PTXMachineFunctionInfo>(); |
| const PTXParamManager &PM = MFI->getParamManager(); |
| |
| // Print register definitions |
| std::string regDefs; |
| unsigned numRegs; |
| |
| // pred |
| numRegs = MFI->getNumRegistersForClass(PTX::RegPredRegisterClass); |
| if(numRegs > 0) { |
| regDefs += "\t.reg .pred %p<"; |
| regDefs += utostr(numRegs); |
| regDefs += ">;\n"; |
| } |
| |
| // i16 |
| numRegs = MFI->getNumRegistersForClass(PTX::RegI16RegisterClass); |
| if(numRegs > 0) { |
| regDefs += "\t.reg .b16 %rh<"; |
| regDefs += utostr(numRegs); |
| regDefs += ">;\n"; |
| } |
| |
| // i32 |
| numRegs = MFI->getNumRegistersForClass(PTX::RegI32RegisterClass); |
| if(numRegs > 0) { |
| regDefs += "\t.reg .b32 %r<"; |
| regDefs += utostr(numRegs); |
| regDefs += ">;\n"; |
| } |
| |
| // i64 |
| numRegs = MFI->getNumRegistersForClass(PTX::RegI64RegisterClass); |
| if(numRegs > 0) { |
| regDefs += "\t.reg .b64 %rd<"; |
| regDefs += utostr(numRegs); |
| regDefs += ">;\n"; |
| } |
| |
| // f32 |
| numRegs = MFI->getNumRegistersForClass(PTX::RegF32RegisterClass); |
| if(numRegs > 0) { |
| regDefs += "\t.reg .f32 %f<"; |
| regDefs += utostr(numRegs); |
| regDefs += ">;\n"; |
| } |
| |
| // f64 |
| numRegs = MFI->getNumRegistersForClass(PTX::RegF64RegisterClass); |
| if(numRegs > 0) { |
| regDefs += "\t.reg .f64 %fd<"; |
| regDefs += utostr(numRegs); |
| regDefs += ">;\n"; |
| } |
| |
| // Local params |
| for (PTXParamManager::param_iterator i = PM.local_begin(), e = PM.local_end(); |
| i != e; ++i) { |
| regDefs += "\t.param .b"; |
| regDefs += utostr(PM.getParamSize(*i)); |
| regDefs += " "; |
| regDefs += PM.getParamName(*i); |
| regDefs += ";\n"; |
| } |
| |
| OutStreamer.EmitRawText(Twine(regDefs)); |
| |
| |
| const MachineFrameInfo* FrameInfo = MF->getFrameInfo(); |
| DEBUG(dbgs() << "Have " << FrameInfo->getNumObjects() |
| << " frame object(s)\n"); |
| for (unsigned i = 0, e = FrameInfo->getNumObjects(); i != e; ++i) { |
| DEBUG(dbgs() << "Size of object: " << FrameInfo->getObjectSize(i) << "\n"); |
| if (FrameInfo->getObjectSize(i) > 0) { |
| std::string def = "\t.local .align "; |
| def += utostr(FrameInfo->getObjectAlignment(i)); |
| def += " .b8"; |
| def += " __local"; |
| def += utostr(i); |
| def += "["; |
| def += utostr(FrameInfo->getObjectSize(i)); // Convert to bits |
| def += "]"; |
| def += ";"; |
| OutStreamer.EmitRawText(Twine(def)); |
| } |
| } |
| |
| //unsigned Index = 1; |
| // Print parameter passing params |
| //for (PTXMachineFunctionInfo::param_iterator |
| // i = MFI->paramBegin(), e = MFI->paramEnd(); i != e; ++i) { |
| // std::string def = "\t.param .b"; |
| // def += utostr(*i); |
| // def += " __ret_"; |
| // def += utostr(Index); |
| // Index++; |
| // def += ";"; |
| // OutStreamer.EmitRawText(Twine(def)); |
| //} |
| } |
| |
| void PTXAsmPrinter::EmitFunctionBodyEnd() { |
| OutStreamer.EmitRawText(Twine("}")); |
| } |
| |
| void PTXAsmPrinter::EmitInstruction(const MachineInstr *MI) { |
| MCInst TmpInst; |
| LowerPTXMachineInstrToMCInst(MI, TmpInst, *this); |
| OutStreamer.EmitInstruction(TmpInst); |
| } |
| |
| void PTXAsmPrinter::EmitVariableDeclaration(const GlobalVariable *gv) { |
| // Check to see if this is a special global used by LLVM, if so, emit it. |
| if (EmitSpecialLLVMGlobal(gv)) |
| return; |
| |
| MCSymbol *gvsym = Mang->getSymbol(gv); |
| |
| assert(gvsym->isUndefined() && "Cannot define a symbol twice!"); |
| |
| std::string decl; |
| |
| // check if it is defined in some other translation unit |
| if (gv->isDeclaration()) |
| decl += ".extern "; |
| |
| // state space: e.g., .global |
| decl += "."; |
| decl += getStateSpaceName(gv->getType()->getAddressSpace()); |
| decl += " "; |
| |
| // alignment (optional) |
| unsigned alignment = gv->getAlignment(); |
| if (alignment != 0) { |
| decl += ".align "; |
| decl += utostr(gv->getAlignment()); |
| decl += " "; |
| } |
| |
| |
| if (PointerType::classof(gv->getType())) { |
| PointerType* pointerTy = dyn_cast<PointerType>(gv->getType()); |
| Type* elementTy = pointerTy->getElementType(); |
| |
| decl += ".b8 "; |
| decl += gvsym->getName(); |
| decl += "["; |
| |
| if (elementTy->isArrayTy()) |
| { |
| assert(elementTy->isArrayTy() && "Only pointers to arrays are supported"); |
| |
| ArrayType* arrayTy = dyn_cast<ArrayType>(elementTy); |
| elementTy = arrayTy->getElementType(); |
| |
| unsigned numElements = arrayTy->getNumElements(); |
| |
| while (elementTy->isArrayTy()) { |
| |
| arrayTy = dyn_cast<ArrayType>(elementTy); |
| elementTy = arrayTy->getElementType(); |
| |
| numElements *= arrayTy->getNumElements(); |
| } |
| |
| // FIXME: isPrimitiveType() == false for i16? |
| assert(elementTy->isSingleValueType() && |
| "Non-primitive types are not handled"); |
| |
| // Compute the size of the array, in bytes. |
| uint64_t arraySize = (elementTy->getPrimitiveSizeInBits() >> 3) |
| * numElements; |
| |
| decl += utostr(arraySize); |
| } |
| |
| decl += "]"; |
| |
| // handle string constants (assume ConstantArray means string) |
| |
| if (gv->hasInitializer()) |
| { |
| const Constant *C = gv->getInitializer(); |
| if (const ConstantArray *CA = dyn_cast<ConstantArray>(C)) |
| { |
| decl += " = {"; |
| |
| for (unsigned i = 0, e = C->getNumOperands(); i != e; ++i) |
| { |
| if (i > 0) decl += ","; |
| |
| decl += "0x" + |
| utohexstr(cast<ConstantInt>(CA->getOperand(i))->getZExtValue()); |
| } |
| |
| decl += "}"; |
| } |
| } |
| } |
| else { |
| // Note: this is currently the fall-through case and most likely generates |
| // incorrect code. |
| decl += getTypeName(gv->getType()); |
| decl += " "; |
| |
| decl += gvsym->getName(); |
| |
| if (ArrayType::classof(gv->getType()) || |
| PointerType::classof(gv->getType())) |
| decl += "[]"; |
| } |
| |
| decl += ";"; |
| |
| OutStreamer.EmitRawText(Twine(decl)); |
| |
| OutStreamer.AddBlankLine(); |
| } |
| |
| void PTXAsmPrinter::EmitFunctionEntryLabel() { |
| // The function label could have already been emitted if two symbols end up |
| // conflicting due to asm renaming. Detect this and emit an error. |
| if (!CurrentFnSym->isUndefined()) { |
| report_fatal_error("'" + Twine(CurrentFnSym->getName()) + |
| "' label emitted multiple times to assembly file"); |
| return; |
| } |
| |
| const PTXMachineFunctionInfo *MFI = MF->getInfo<PTXMachineFunctionInfo>(); |
| const PTXParamManager &PM = MFI->getParamManager(); |
| const bool isKernel = MFI->isKernel(); |
| const PTXSubtarget& ST = TM.getSubtarget<PTXSubtarget>(); |
| const MachineRegisterInfo& MRI = MF->getRegInfo(); |
| |
| std::string decl = isKernel ? ".entry" : ".func"; |
| |
| if (!isKernel) { |
| decl += " ("; |
| if (ST.useParamSpaceForDeviceArgs()) { |
| for (PTXParamManager::param_iterator i = PM.ret_begin(), e = PM.ret_end(), |
| b = i; i != e; ++i) { |
| if (i != b) { |
| decl += ", "; |
| } |
| |
| decl += ".param .b"; |
| decl += utostr(PM.getParamSize(*i)); |
| decl += " "; |
| decl += PM.getParamName(*i); |
| } |
| } else { |
| for (PTXMachineFunctionInfo::reg_iterator |
| i = MFI->retreg_begin(), e = MFI->retreg_end(), b = i; |
| i != e; ++i) { |
| if (i != b) { |
| decl += ", "; |
| } |
| decl += ".reg ."; |
| decl += getRegisterTypeName(*i, MRI); |
| decl += " "; |
| decl += MFI->getRegisterName(*i); |
| } |
| } |
| decl += ")"; |
| } |
| |
| // Print function name |
| decl += " "; |
| decl += CurrentFnSym->getName().str(); |
| |
| decl += " ("; |
| |
| const Function *F = MF->getFunction(); |
| |
| // Print parameters |
| if (isKernel || ST.useParamSpaceForDeviceArgs()) { |
| /*for (PTXParamManager::param_iterator i = PM.arg_begin(), e = PM.arg_end(), |
| b = i; i != e; ++i) { |
| if (i != b) { |
| decl += ", "; |
| } |
| |
| decl += ".param .b"; |
| decl += utostr(PM.getParamSize(*i)); |
| decl += " "; |
| decl += PM.getParamName(*i); |
| }*/ |
| int Counter = 1; |
| for (Function::const_arg_iterator i = F->arg_begin(), e = F->arg_end(), |
| b = i; i != e; ++i) { |
| if (i != b) |
| decl += ", "; |
| const Type *ArgType = (*i).getType(); |
| decl += ".param .b"; |
| if (ArgType->isPointerTy()) { |
| if (ST.is64Bit()) |
| decl += "64"; |
| else |
| decl += "32"; |
| } else { |
| decl += utostr(ArgType->getPrimitiveSizeInBits()); |
| } |
| if (ArgType->isPointerTy() && ST.emitPtrAttribute()) { |
| const PointerType *PtrType = dyn_cast<const PointerType>(ArgType); |
| decl += " .ptr"; |
| switch (PtrType->getAddressSpace()) { |
| default: |
| llvm_unreachable("Unknown address space in argument"); |
| case PTXStateSpace::Global: |
| decl += " .global"; |
| break; |
| case PTXStateSpace::Shared: |
| decl += " .shared"; |
| break; |
| } |
| } |
| decl += " __param_"; |
| decl += utostr(Counter++); |
| } |
| } else { |
| for (PTXMachineFunctionInfo::reg_iterator |
| i = MFI->argreg_begin(), e = MFI->argreg_end(), b = i; |
| i != e; ++i) { |
| if (i != b) { |
| decl += ", "; |
| } |
| |
| decl += ".reg ."; |
| decl += getRegisterTypeName(*i, MRI); |
| decl += " "; |
| decl += MFI->getRegisterName(*i); |
| } |
| } |
| decl += ")"; |
| |
| OutStreamer.EmitRawText(Twine(decl)); |
| } |
| |
| unsigned PTXAsmPrinter::GetOrCreateSourceID(StringRef FileName, |
| StringRef DirName) { |
| // If FE did not provide a file name, then assume stdin. |
| if (FileName.empty()) |
| return GetOrCreateSourceID("<stdin>", StringRef()); |
| |
| // MCStream expects full path name as filename. |
| if (!DirName.empty() && !sys::path::is_absolute(FileName)) { |
| SmallString<128> FullPathName = DirName; |
| sys::path::append(FullPathName, FileName); |
| // Here FullPathName will be copied into StringMap by GetOrCreateSourceID. |
| return GetOrCreateSourceID(StringRef(FullPathName), StringRef()); |
| } |
| |
| StringMapEntry<unsigned> &Entry = SourceIdMap.GetOrCreateValue(FileName); |
| if (Entry.getValue()) |
| return Entry.getValue(); |
| |
| unsigned SrcId = SourceIdMap.size(); |
| Entry.setValue(SrcId); |
| |
| // Print out a .file directive to specify files for .loc directives. |
| OutStreamer.EmitDwarfFileDirective(SrcId, Entry.getKey()); |
| |
| return SrcId; |
| } |
| |
| MCOperand PTXAsmPrinter::GetSymbolRef(const MachineOperand &MO, |
| const MCSymbol *Symbol) { |
| const MCExpr *Expr; |
| Expr = MCSymbolRefExpr::Create(Symbol, MCSymbolRefExpr::VK_None, OutContext); |
| return MCOperand::CreateExpr(Expr); |
| } |
| |
| MCOperand PTXAsmPrinter::lowerOperand(const MachineOperand &MO) { |
| MCOperand MCOp; |
| const PTXMachineFunctionInfo *MFI = MF->getInfo<PTXMachineFunctionInfo>(); |
| const MCExpr *Expr; |
| const char *RegSymbolName; |
| switch (MO.getType()) { |
| default: |
| llvm_unreachable("Unknown operand type"); |
| case MachineOperand::MO_Register: |
| // We create register operands as symbols, since the PTXInstPrinter class |
| // has no way to map virtual registers back to a name without some ugly |
| // hacks. |
| // FIXME: Figure out a better way to handle virtual register naming. |
| RegSymbolName = MFI->getRegisterName(MO.getReg()); |
| Expr = MCSymbolRefExpr::Create(RegSymbolName, MCSymbolRefExpr::VK_None, |
| OutContext); |
| MCOp = MCOperand::CreateExpr(Expr); |
| break; |
| case MachineOperand::MO_Immediate: |
| MCOp = MCOperand::CreateImm(MO.getImm()); |
| break; |
| case MachineOperand::MO_MachineBasicBlock: |
| MCOp = MCOperand::CreateExpr(MCSymbolRefExpr::Create( |
| MO.getMBB()->getSymbol(), OutContext)); |
| break; |
| case MachineOperand::MO_GlobalAddress: |
| MCOp = GetSymbolRef(MO, Mang->getSymbol(MO.getGlobal())); |
| break; |
| case MachineOperand::MO_ExternalSymbol: |
| MCOp = GetSymbolRef(MO, GetExternalSymbolSymbol(MO.getSymbolName())); |
| break; |
| case MachineOperand::MO_FPImmediate: |
| APFloat Val = MO.getFPImm()->getValueAPF(); |
| bool ignored; |
| Val.convert(APFloat::IEEEdouble, APFloat::rmTowardZero, &ignored); |
| MCOp = MCOperand::CreateFPImm(Val.convertToDouble()); |
| break; |
| } |
| |
| return MCOp; |
| } |
| |
| // Force static initialization. |
| extern "C" void LLVMInitializePTXAsmPrinter() { |
| RegisterAsmPrinter<PTXAsmPrinter> X(ThePTX32Target); |
| RegisterAsmPrinter<PTXAsmPrinter> Y(ThePTX64Target); |
| } |
| |