1a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard/*
2a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Copyright 2011 Advanced Micro Devices, Inc.
3a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
4a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Permission is hereby granted, free of charge, to any person obtaining a
5a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * copy of this software and associated documentation files (the "Software"),
6a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * to deal in the Software without restriction, including without limitation
7a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * and/or sell copies of the Software, and to permit persons to whom the
9a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Software is furnished to do so, subject to the following conditions:
10a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
11a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * The above copyright notice and this permission notice (including the next
12a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * paragraph) shall be included in all copies or substantial portions of the
13a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Software.
14a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
15a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * SOFTWARE.
22a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
23a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Authors: Tom Stellard <thomas.stellard@amd.com>
24a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
25a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard */
26509ddb0a0414cfc83102c463da542d95d83eabadTom Stellard#include "radeon_llvm_emit.h"
27a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
28a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/LLVMContext.h>
29a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Module.h>
30a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/PassManager.h>
31a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/ADT/Triple.h>
32a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/FormattedStream.h>
33a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/Host.h>
34a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/IRReader.h>
35a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/SourceMgr.h>
36a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/TargetRegistry.h>
37a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Support/TargetSelect.h>
38926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich#include <llvm/Support/Threading.h>
39a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Target/TargetData.h>
40a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Target/TargetMachine.h>
41a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
42a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm/Transforms/Scalar.h>
43a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
44a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <llvm-c/Target.h>
45a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
46a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <iostream>
47a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <stdlib.h>
48a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#include <stdio.h>
49a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
50a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardusing namespace llvm;
51a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
#ifndef EXTERNAL_LLVM
/* Forward declarations (C linkage) of the AMDGPU target initializers.
 * They are only declared when EXTERNAL_LLVM is not defined, which is the
 * same configuration in which radeon_llvm_compile() calls them directly. */
extern "C" void LLVMInitializeAMDGPUTargetInfo(void);
extern "C" void LLVMInitializeAMDGPUTarget(void);
extern "C" void LLVMInitializeAMDGPUTargetMC(void);
extern "C" void LLVMInitializeAMDGPUAsmPrinter(void);
#endif
61a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
62926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlichnamespace {
63926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich
64926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlichclass LLVMEnsureMultithreaded {
65926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlichpublic:
66926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich   LLVMEnsureMultithreaded()
67926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich   {
68926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich      llvm_start_multithreaded();
69926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich   }
70926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich};
71926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich
72926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlichstatic LLVMEnsureMultithreaded lLVMEnsureMultithreaded;
73926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich
74926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich}
75926a4a922f9a5ec397cb3d316dd915b00b39c54dMathias Fröhlich
76a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard/**
77a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * Compile an LLVM module to machine code.
78a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard *
79a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * @param bytes This function allocates memory for the byte stream, it is the
80a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard * caller's responsibility to free it.
81a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard */
82a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardextern "C" unsigned
83a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellardradeon_llvm_compile(LLVMModuleRef M, unsigned char ** bytes,
84a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                 unsigned * byte_count, const char * gpu_family,
85a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                 unsigned dump) {
86a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
87a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   Triple AMDGPUTriple(sys::getDefaultTargetTriple());
88a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
89a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#ifdef EXTERNAL_LLVM
90a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   /* XXX: Can we just initialize the AMDGPU target here? */
91a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   InitializeAllTargets();
92a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   InitializeAllTargetMCs();
93a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#else
9449fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellard   LLVMInitializeAMDGPUTargetInfo();
9549fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellard   LLVMInitializeAMDGPUTarget();
9649fb99bd131a4ed89e6f55cf360f67618acafec4Tom Stellard   LLVMInitializeAMDGPUTargetMC();
97235318a578b3d7772a60590c7e76791ed6d1a78eTom Stellard   LLVMInitializeAMDGPUAsmPrinter();
98a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard#endif
99a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::string err;
100a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   const Target * AMDGPUTarget = TargetRegistry::lookupTarget("r600", err);
101a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   if(!AMDGPUTarget) {
102d7f9b6ce13dcfc4f1d7c84c121d66606f8d05f7bTom Stellard      fprintf(stderr, "Can't find target: %s\n", err.c_str());
103a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      return 1;
104a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   }
105a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
106a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   Triple::ArchType Arch = Triple::getArchTypeForLLVMName("r600");
107a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   if (Arch == Triple::UnknownArch) {
108a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      fprintf(stderr, "Unknown Arch\n");
109a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   }
110a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   AMDGPUTriple.setArch(Arch);
111a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
112a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   Module * mod = unwrap(M);
113c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard   std::string FS;
114a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   TargetOptions TO;
115a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
116c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard   if (dump) {
117c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard      mod->dump();
118c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard      FS += "+DumpCode";
119c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard   }
120c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard
121a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::auto_ptr<TargetMachine> tm(AMDGPUTarget->createTargetMachine(
122c8fb30abf1131072c855f2539db6455fac65dcb0Tom Stellard                     AMDGPUTriple.getTriple(), gpu_family, FS,
123a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                     TO, Reloc::Default, CodeModel::Default,
124a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                     CodeGenOpt::Default
125a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                     ));
126a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   TargetMachine &AMDGPUTargetMachine = *tm.get();
127a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   PassManager PM;
128a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   PM.add(new TargetData(*AMDGPUTargetMachine.getTargetData()));
129a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   PM.add(createPromoteMemoryToRegisterPass());
130a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   AMDGPUTargetMachine.setAsmVerbosityDefault(true);
131a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
132a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::string CodeString;
133a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   raw_string_ostream oStream(CodeString);
134a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   formatted_raw_ostream out(oStream);
135a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
136a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   /* Optional extra paramater true / false to disable verify */
137235318a578b3d7772a60590c7e76791ed6d1a78eTom Stellard   if (AMDGPUTargetMachine.addPassesToEmitFile(PM, out, TargetMachine::CGFT_ObjectFile,
138a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard                                               true)){
139a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      fprintf(stderr, "AddingPasses failed.\n");
140a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard      return 1;
141a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   }
142a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   PM.run(*mod);
143a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
144a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   out.flush();
145a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   std::string &data = oStream.str();
146a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
147a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   *bytes = (unsigned char*)malloc(data.length() * sizeof(unsigned char));
148a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   memcpy(*bytes, data.c_str(), data.length() * sizeof(unsigned char));
149a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   *byte_count = data.length();
150a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard
151a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard   return 0;
152a75c6163e605f35b14f26930dd9227e4f337ec9eTom Stellard}
153