1a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard/* 2a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Copyright 2011 Advanced Micro Devices, Inc. 3a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 4a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Permission is hereby granted, free of charge, to any person obtaining a 5a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * copy of this software and associated documentation files (the "Software"), 6a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * to deal in the Software without restriction, including without limitation 7a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * and/or sell copies of the Software, and to permit persons to whom the 9a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Software is furnished to do so, subject to the following conditions: 10a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 11a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * The above copyright notice and this permission notice (including the next 12a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * paragraph) shall be included in all copies or substantial portions of the 13a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Software. 14a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 15a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * SOFTWARE. 22a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 23a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Authors: Tom Stellard <thomas.stellard@amd.com> 24a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 25a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard */ 26509ddb0a0414cfc83102c463da542d95d83eabadTom Stellard#include "radeon_llvm_emit.h" 27a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 28a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/LLVMContext.h> 29a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Module.h> 30a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/PassManager.h> 31a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/ADT/Triple.h> 32a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/FormattedStream.h> 33a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/Host.h> 34a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/IRReader.h> 35a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/SourceMgr.h> 36a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/TargetRegistry.h> 37a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/TargetSelect.h> 38926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich#include <llvm/Support/Threading.h> 39a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Target/TargetData.h> 40a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Target/TargetMachine.h> 41a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 42a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Transforms/Scalar.h> 43a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 44a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm-c/Target.h> 45a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 46a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <iostream> 47a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <stdlib.h> 48a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <stdio.h> 49a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 50a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardusing namespace llvm; 51a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 52a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#ifndef EXTERNAL_LLVM 53a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardextern "C" { 54a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 55235318a578b3d7772a60590c7e76791ed6d1a78eTom Stellardvoid LLVMInitializeAMDGPUAsmPrinter(void); 5649fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellardvoid LLVMInitializeAMDGPUTargetMC(void); 5749fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellardvoid LLVMInitializeAMDGPUTarget(void); 5849fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellardvoid LLVMInitializeAMDGPUTargetInfo(void); 59a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard} 60a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#endif 61a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 62926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlichnamespace { 63926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich 64926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlichclass LLVMEnsureMultithreaded { 65926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlichpublic: 66926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich LLVMEnsureMultithreaded() 67926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich { 68926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich llvm_start_multithreaded(); 69926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich } 70926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich}; 71926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich 72926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlichstatic LLVMEnsureMultithreaded lLVMEnsureMultithreaded; 73926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich 74926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich} 75926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich 76a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard/** 77a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Compile an LLVM module to machine code. 78a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * 79a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * @param bytes This function allocates memory for the byte stream, it is the 80a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * caller's responsibility to free it. 81a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard */ 82a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardextern "C" unsigned 83a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardradeon_llvm_compile(LLVMModuleRef M, unsigned char ** bytes, 84a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard unsigned * byte_count, const char * gpu_family, 85a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard unsigned dump) { 86a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 87a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard Triple AMDGPUTriple(sys::getDefaultTargetTriple()); 88a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 89a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#ifdef EXTERNAL_LLVM 90a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard /* XXX: Can we just initialize the AMDGPU target here? */ 91a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard InitializeAllTargets(); 92a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard InitializeAllTargetMCs(); 93a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#else 9449fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellard LLVMInitializeAMDGPUTargetInfo(); 9549fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellard LLVMInitializeAMDGPUTarget(); 9649fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellard LLVMInitializeAMDGPUTargetMC(); 97235318a578b3d7772a60590c7e76791ed6d1a78eTom Stellard LLVMInitializeAMDGPUAsmPrinter(); 98a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#endif 99a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::string err; 100a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard const Target * AMDGPUTarget = TargetRegistry::lookupTarget("r600", err); 101a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard if(!AMDGPUTarget) { 102d7f9b6ce13dcfc4f1d7c84c121d66606f8d05f7bTom Stellard fprintf(stderr, "Can't find target: %s\n", err.c_str()); 103a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard return 1; 104a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard } 105a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 106a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard Triple::ArchType Arch = Triple::getArchTypeForLLVMName("r600"); 107a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard if (Arch == Triple::UnknownArch) { 108a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard fprintf(stderr, "Unknown Arch\n"); 109a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard } 110a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard AMDGPUTriple.setArch(Arch); 111a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 112a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard Module * mod = unwrap(M); 113c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard std::string FS; 114a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard TargetOptions TO; 115a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 116c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard if (dump) { 117c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard mod->dump(); 118c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard FS += "+DumpCode"; 119c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard } 120c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard 121a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::auto_ptr<TargetMachine> tm(AMDGPUTarget->createTargetMachine( 122c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard AMDGPUTriple.getTriple(), gpu_family, FS, 123a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard TO, Reloc::Default, CodeModel::Default, 124a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard CodeGenOpt::Default 125a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard )); 126a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard TargetMachine &AMDGPUTargetMachine = *tm.get(); 127a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard PassManager PM; 128a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard PM.add(new TargetData(*AMDGPUTargetMachine.getTargetData())); 129a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard PM.add(createPromoteMemoryToRegisterPass()); 130a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard AMDGPUTargetMachine.setAsmVerbosityDefault(true); 131a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 132a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::string CodeString; 133a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard raw_string_ostream oStream(CodeString); 134a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard formatted_raw_ostream out(oStream); 135a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 136a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard /* Optional extra paramater true / false to disable verify */ 137235318a578b3d7772a60590c7e76791ed6d1a78eTom Stellard if (AMDGPUTargetMachine.addPassesToEmitFile(PM, out, TargetMachine::CGFT_ObjectFile, 138a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard true)){ 139a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard fprintf(stderr, "AddingPasses failed.\n"); 140a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard return 1; 141a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard } 142a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard PM.run(*mod); 143a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 144a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard out.flush(); 145a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard std::string &data = oStream.str(); 146a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 147a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *bytes = (unsigned char*)malloc(data.length() * sizeof(unsigned char)); 148a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard memcpy(*bytes, data.c_str(), data.length() * sizeof(unsigned char)); 149a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *byte_count = data.length(); 150a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard 151a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard return 0; 152a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard} 153