radeon_llvm_emit.cpp revision 509ddb0a0414cfc83102c463da542d95d83eabad
1a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard/*
2a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Copyright 2011 Advanced Micro Devices, Inc.
3a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
4a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Permission is hereby granted, free of charge, to any person obtaining a
5a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * copy of this software and associated documentation files (the "Software"),
6a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * to deal in the Software without restriction, including without limitation
7a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * and/or sell copies of the Software, and to permit persons to whom the
9a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Software is furnished to do so, subject to the following conditions:
10a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
11a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * The above copyright notice and this permission notice (including the next
12a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * paragraph) shall be included in all copies or substantial portions of the
13a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Software.
14a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
15a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * SOFTWARE.
22a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
23a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Authors: Tom Stellard <thomas.stellard@amd.com>
24a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
25a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard */
26509ddb0a0414cfc83102c463da542d95d83eabadTom Stellard#include "radeon_llvm_emit.h"
27a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
28a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/LLVMContext.h>
29a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Module.h>
30a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/PassManager.h>
31a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/ADT/Triple.h>
32a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/FormattedStream.h>
33a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/Host.h>
34a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/IRReader.h>
35a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/SourceMgr.h>
36a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/TargetRegistry.h>
37a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/TargetSelect.h>
38a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Target/TargetData.h>
39a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Target/TargetMachine.h>
40a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
41a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Transforms/Scalar.h>
42a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
43a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm-c/Target.h>
44a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
45a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <iostream>
46a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <stdlib.h>
47a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <stdio.h>
48a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
49a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardusing namespace llvm;
50a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
#ifndef EXTERNAL_LLVM
/* Hand-written C-linkage prototypes for the AMDIL target's initialization
 * entry points, only needed when EXTERNAL_LLVM is not defined.  They are
 * listed in the order radeon_llvm_compile() invokes them. */
extern "C" void LLVMInitializeAMDILTargetInfo(void);
extern "C" void LLVMInitializeAMDILTarget(void);
extern "C" void LLVMInitializeAMDILTargetMC(void);
#endif
59a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
60a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard/**
61a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Compile an LLVM module to machine code.
62a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
63a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * @param bytes This function allocates memory for the byte stream, it is the
64a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * caller's responsibility to free it.
65a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard */
66a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardextern "C" unsigned
67a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardradeon_llvm_compile(LLVMModuleRef M, unsigned char ** bytes,
68a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                 unsigned * byte_count, const char * gpu_family,
69a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                 unsigned dump) {
70a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
71a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   Triple AMDGPUTriple(sys::getDefaultTargetTriple());
72a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
73a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#ifdef EXTERNAL_LLVM
74a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   /* XXX: Can we just initialize the AMDGPU target here? */
75a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   InitializeAllTargets();
76a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   InitializeAllTargetMCs();
77a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#else
78a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   LLVMInitializeAMDILTargetInfo();
79a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   LLVMInitializeAMDILTarget();
80a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   LLVMInitializeAMDILTargetMC();
81a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#endif
82a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::string err;
83a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   const Target * AMDGPUTarget = TargetRegistry::lookupTarget("r600", err);
84a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   fprintf(stderr, "%s\n", err.c_str());
85a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   if(!AMDGPUTarget) {
86a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      fprintf(stderr, "Can't find target\n");
87a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      return 1;
88a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   }
89a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
90a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   Triple::ArchType Arch = Triple::getArchTypeForLLVMName("r600");
91a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   if (Arch == Triple::UnknownArch) {
92a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      fprintf(stderr, "Unknown Arch\n");
93a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   }
94a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   AMDGPUTriple.setArch(Arch);
95a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
96a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   Module * mod = unwrap(M);
97a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::string FS = gpu_family;
98a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   TargetOptions TO;
99a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
100a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::auto_ptr<TargetMachine> tm(AMDGPUTarget->createTargetMachine(
101a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                     AMDGPUTriple.getTriple(), gpu_family, "" /* Features */,
102a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                     TO, Reloc::Default, CodeModel::Default,
103a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                     CodeGenOpt::Default
104a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                     ));
105a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   TargetMachine &AMDGPUTargetMachine = *tm.get();
106a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   /* XXX: Use TargetMachine.Options in 3.0 */
107a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   if (dump) {
108a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      mod->dump();
109a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   }
110a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   PassManager PM;
111a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   PM.add(new TargetData(*AMDGPUTargetMachine.getTargetData()));
112a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   PM.add(createPromoteMemoryToRegisterPass());
113a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   AMDGPUTargetMachine.setAsmVerbosityDefault(true);
114a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
115a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::string CodeString;
116a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   raw_string_ostream oStream(CodeString);
117a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   formatted_raw_ostream out(oStream);
118a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
119a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   /* Optional extra paramater true / false to disable verify */
120a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   if (AMDGPUTargetMachine.addPassesToEmitFile(PM, out, TargetMachine::CGFT_AssemblyFile,
121a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                                               true)){
122a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      fprintf(stderr, "AddingPasses failed.\n");
123a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      return 1;
124a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   }
125a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   PM.run(*mod);
126a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
127a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   out.flush();
128a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::string &data = oStream.str();
129a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
130a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   *bytes = (unsigned char*)malloc(data.length() * sizeof(unsigned char));
131a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   memcpy(*bytes, data.c_str(), data.length() * sizeof(unsigned char));
132a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   *byte_count = data.length();
133a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
134a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   return 0;
135a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard}
136