// radeon_llvm_emit.cpp revision 509ddb0a0414cfc83102c463da542d95d83eabad
1a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard/* 2a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Copyright 2011 Advanced Micro Devices, Inc. 3a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 4a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Permission is hereby granted, free of charge, to any person obtaining a 5a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * copy of this software and associated documentation files (the "Software"), 6a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * to deal in the Software without restriction, including without limitation 7a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * and/or sell copies of the Software, and to permit persons to whom the 9a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Software is furnished to do so, subject to the following conditions: 10a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 11a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * The above copyright notice and this permission notice (including the next 12a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * paragraph) shall be included in all copies or substantial portions of the 13a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Software. 14a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 15a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL 18a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * SOFTWARE. 22a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 23a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Authors: Tom Stellard <thomas.stellard@amd.com> 24a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 25a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard */ 26509ddb0a0414cfc83102c463da542d95d83eabadTom Stellard#include "radeon_llvm_emit.h" 27a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 28a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/LLVMContext.h> 29a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Module.h> 30a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/PassManager.h> 31a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/ADT/Triple.h> 32a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/FormattedStream.h> 33a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/Host.h> 34a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/IRReader.h> 35a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/SourceMgr.h> 36a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/TargetRegistry.h> 37a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/TargetSelect.h> 38a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Target/TargetData.h> 39a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Target/TargetMachine.h> 
40a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 41a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Transforms/Scalar.h> 42a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 43a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm-c/Target.h> 44a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 45a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <iostream> 46a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <stdlib.h> 47a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <stdio.h> 48a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 49a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardusing namespace llvm; 50a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 51a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#ifndef EXTERNAL_LLVM 52a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardextern "C" { 53a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 54a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardvoid LLVMInitializeAMDILTargetMC(void); 55a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardvoid LLVMInitializeAMDILTarget(void); 56a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardvoid LLVMInitializeAMDILTargetInfo(void); 57a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard} 58a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#endif 59a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 60a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard/** 61a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Compile an LLVM module to machine code. 62a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 63a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * @param bytes This function allocates memory for the byte stream, it is the 64a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * caller's responsibility to free it. 
65a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard */ 66a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardextern "C" unsigned 67a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardradeon_llvm_compile(LLVMModuleRef M, unsigned char ** bytes, 68a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard unsigned * byte_count, const char * gpu_family, 69a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard unsigned dump) { 70a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 71a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard Triple AMDGPUTriple(sys::getDefaultTargetTriple()); 72a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 73a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#ifdef EXTERNAL_LLVM 74a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard /* XXX: Can we just initialize the AMDGPU target here? */ 75a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard InitializeAllTargets(); 76a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard InitializeAllTargetMCs(); 77a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#else 78a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard LLVMInitializeAMDILTargetInfo(); 79a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard LLVMInitializeAMDILTarget(); 80a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard LLVMInitializeAMDILTargetMC(); 81a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#endif 82a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::string err; 83a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard const Target * AMDGPUTarget = TargetRegistry::lookupTarget("r600", err); 84a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard fprintf(stderr, "%s\n", err.c_str()); 85a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard if(!AMDGPUTarget) { 86a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard fprintf(stderr, "Can't find target\n"); 87a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard return 1; 88a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard } 89a75c6163e605f35b14f26930dd9227e4f337ec9eTom 
Stellard 90a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard Triple::ArchType Arch = Triple::getArchTypeForLLVMName("r600"); 91a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard if (Arch == Triple::UnknownArch) { 92a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard fprintf(stderr, "Unknown Arch\n"); 93a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard } 94a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard AMDGPUTriple.setArch(Arch); 95a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 96a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard Module * mod = unwrap(M); 97a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::string FS = gpu_family; 98a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard TargetOptions TO; 99a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 100a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::auto_ptr<TargetMachine> tm(AMDGPUTarget->createTargetMachine( 101a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard AMDGPUTriple.getTriple(), gpu_family, "" /* Features */, 102a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard TO, Reloc::Default, CodeModel::Default, 103a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard CodeGenOpt::Default 104a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard )); 105a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard TargetMachine &AMDGPUTargetMachine = *tm.get(); 106a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard /* XXX: Use TargetMachine.Options in 3.0 */ 107a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard if (dump) { 108a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard mod->dump(); 109a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard } 110a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard PassManager PM; 111a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard PM.add(new TargetData(*AMDGPUTargetMachine.getTargetData())); 112a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard PM.add(createPromoteMemoryToRegisterPass()); 
113a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard AMDGPUTargetMachine.setAsmVerbosityDefault(true); 114a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 115a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::string CodeString; 116a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard raw_string_ostream oStream(CodeString); 117a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard formatted_raw_ostream out(oStream); 118a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 119a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard /* Optional extra paramater true / false to disable verify */ 120a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard if (AMDGPUTargetMachine.addPassesToEmitFile(PM, out, TargetMachine::CGFT_AssemblyFile, 121a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard true)){ 122a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard fprintf(stderr, "AddingPasses failed.\n"); 123a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard return 1; 124a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard } 125a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard PM.run(*mod); 126a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 127a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard out.flush(); 128a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::string &data = oStream.str(); 129a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 130a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *bytes = (unsigned char*)malloc(data.length() * sizeof(unsigned char)); 131a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard memcpy(*bytes, data.c_str(), data.length() * sizeof(unsigned char)); 132a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *byte_count = data.length(); 133a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 134a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard return 0; 135a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard} 136