/*
 * Copyright 2011 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors: Tom Stellard <thomas.stellard@amd.com>
 *
 */
#include "radeon_llvm_emit.h"

#include <llvm/LLVMContext.h>
#include <llvm/Module.h>
#include <llvm/PassManager.h>
#include <llvm/ADT/Triple.h>
#include <llvm/Support/FormattedStream.h>
#include <llvm/Support/Host.h>
#include <llvm/Support/IRReader.h>
#include <llvm/Support/SourceMgr.h>
#include <llvm/Support/TargetRegistry.h>
#include <llvm/Support/TargetSelect.h>
#include <llvm/Support/Threading.h>
#include <llvm/Target/TargetData.h>
#include <llvm/Target/TargetMachine.h>

#include <llvm/Transforms/Scalar.h>

#include <llvm-c/Target.h>

#include <iostream>
#include <memory>
#include <string>
#include <stdlib.h>
#include <stdio.h>
#include <string.h>

using namespace llvm;

#ifndef EXTERNAL_LLVM
/*
 * Hand-written C declarations of the AMDGPU target initializers, used only
 * when EXTERNAL_LLVM is not defined.  They are listed in the order in which
 * radeon_llvm_compile() calls them.
 * NOTE(review): presumably no included header declares these for the
 * in-tree backend -- confirm before removing.
 */
extern "C" {

void LLVMInitializeAMDGPUTargetInfo(void);
void LLVMInitializeAMDGPUTarget(void);
void LLVMInitializeAMDGPUTargetMC(void);
void LLVMInitializeAMDGPUAsmPrinter(void);

}
#endif

62f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgnamespace {
63f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
64f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgclass LLVMEnsureMultithreaded {
65f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgpublic:
66f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMEnsureMultithreaded()
67f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   {
68f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      llvm_start_multithreaded();
69f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
70f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org};
71f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
72f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgstatic LLVMEnsureMultithreaded lLVMEnsureMultithreaded;
73f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
74f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
75f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
76f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/**
77f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Compile an LLVM module to machine code.
78f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
79f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * @param bytes This function allocates memory for the byte stream, it is the
80f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * caller's responsibility to free it.
81f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org */
82f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgextern "C" unsigned
83f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgradeon_llvm_compile(LLVMModuleRef M, unsigned char ** bytes,
84f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                 unsigned * byte_count, const char * gpu_family,
85f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                 unsigned dump) {
86f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
87f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   Triple AMDGPUTriple(sys::getDefaultTargetTriple());
88f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
89f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#ifdef EXTERNAL_LLVM
90f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   /* XXX: Can we just initialize the AMDGPU target here? */
91f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   InitializeAllTargets();
92f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   InitializeAllTargetMCs();
93f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#else
94f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMInitializeAMDGPUTargetInfo();
95f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMInitializeAMDGPUTarget();
96f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMInitializeAMDGPUTargetMC();
97f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMInitializeAMDGPUAsmPrinter();
98f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#endif
99f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   std::string err;
100f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   const Target * AMDGPUTarget = TargetRegistry::lookupTarget("r600", err);
101f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   if(!AMDGPUTarget) {
102f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      fprintf(stderr, "Can't find target: %s\n", err.c_str());
103f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      return 1;
104f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
105f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
106f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   Triple::ArchType Arch = Triple::getArchTypeForLLVMName("r600");
107f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   if (Arch == Triple::UnknownArch) {
108f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      fprintf(stderr, "Unknown Arch\n");
109f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
110f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   AMDGPUTriple.setArch(Arch);
111f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
112f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   Module * mod = unwrap(M);
113f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   std::string FS;
114f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   TargetOptions TO;
115f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
116f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   if (dump) {
117f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      mod->dump();
118f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      FS += "+DumpCode";
119f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
120f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
121f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   std::auto_ptr<TargetMachine> tm(AMDGPUTarget->createTargetMachine(
122f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                     AMDGPUTriple.getTriple(), gpu_family, FS,
123f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                     TO, Reloc::Default, CodeModel::Default,
124f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                     CodeGenOpt::Default
125f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                     ));
126f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   TargetMachine &AMDGPUTargetMachine = *tm.get();
127f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   PassManager PM;
128f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   PM.add(new TargetData(*AMDGPUTargetMachine.getTargetData()));
129f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   PM.add(createPromoteMemoryToRegisterPass());
130f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   AMDGPUTargetMachine.setAsmVerbosityDefault(true);
131f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
132f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   std::string CodeString;
133f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   raw_string_ostream oStream(CodeString);
134f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   formatted_raw_ostream out(oStream);
135f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
136f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   /* Optional extra paramater true / false to disable verify */
137f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   if (AMDGPUTargetMachine.addPassesToEmitFile(PM, out, TargetMachine::CGFT_ObjectFile,
138f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                               true)){
139f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      fprintf(stderr, "AddingPasses failed.\n");
140f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      return 1;
141f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
142f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   PM.run(*mod);
143f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
144f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   out.flush();
145f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   std::string &data = oStream.str();
146f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
147f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   *bytes = (unsigned char*)malloc(data.length() * sizeof(unsigned char));
148f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   memcpy(*bytes, data.c_str(), data.length() * sizeof(unsigned char));
149f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   *byte_count = data.length();
150f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
151f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return 0;
152f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
153