16974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard/*
26974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Copyright 2014 Advanced Micro Devices, Inc.
36974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard *
46974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Permission is hereby granted, free of charge, to any person obtaining a
56974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * copy of this software and associated documentation files (the "Software"),
66974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * to deal in the Software without restriction, including without limitation
76974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * the rights to use, copy, modify, merge, publish, distribute, sublicense,
86974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * and/or sell copies of the Software, and to permit persons to whom the
96974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Software is furnished to do so, subject to the following conditions:
106974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard *
116974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * The above copyright notice and this permission notice (including the next
126974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * paragraph) shall be included in all copies or substantial portions of the
136974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Software.
146974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard *
156974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
166974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
176974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
186974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
196974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
206974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
216974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * SOFTWARE.
226974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard *
236974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Authors: Tom Stellard <thomas.stellard@amd.com>
246974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard *
256974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard */
266974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
276974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include "radeon_elf_util.h"
286974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include "r600_pipe_common.h"
296974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
306974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include "util/u_memory.h"
316974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
326974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include <gelf.h>
336974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include <libelf.h>
346974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include <stdio.h>
356974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
36e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellardstatic void parse_symbol_table(Elf_Data *symbol_table_data,
37e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard				const GElf_Shdr *symbol_table_header,
38e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard				struct radeon_shader_binary *binary)
39e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard{
40e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	GElf_Sym symbol;
41e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	unsigned i = 0;
42e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	unsigned symbol_count =
43e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		symbol_table_header->sh_size / symbol_table_header->sh_entsize;
44e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard
45e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	/* We are over allocating this list, because symbol_count gives the
46e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 	 * total number of symbols, and we will only be filling the list
47e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 	 * with offsets of global symbols.  The memory savings from
48e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 	 * allocating the correct size of this list will be small, and
49e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 	 * I don't think it is worth the cost of pre-computing the number
50e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 	 * of global symbols.
51e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 	 */
52e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	binary->global_symbol_offsets = CALLOC(symbol_count, sizeof(uint64_t));
53e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard
54e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	while (gelf_getsym(symbol_table_data, i++, &symbol)) {
55e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		unsigned i;
56dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		if (GELF_ST_BIND(symbol.st_info) != STB_GLOBAL ||
57dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		    symbol.st_shndx == 0 /* Undefined symbol */) {
58e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			continue;
59e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		}
60e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard
61e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		binary->global_symbol_offsets[binary->global_symbol_count] =
62e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard					symbol.st_value;
63e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard
64e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		/* Sort the list using bubble sort.  This list will usually
65e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		 * be small. */
66e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		for (i = binary->global_symbol_count; i > 0; --i) {
67e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			uint64_t lhs = binary->global_symbol_offsets[i - 1];
68e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			uint64_t rhs = binary->global_symbol_offsets[i];
69e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			if (lhs < rhs) {
70e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard				break;
71e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			}
72e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			binary->global_symbol_offsets[i] = lhs;
73e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			binary->global_symbol_offsets[i - 1] = rhs;
74e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		}
75e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		++binary->global_symbol_count;
76e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	}
77e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard}
78e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard
79dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellardstatic void parse_relocs(Elf *elf, Elf_Data *relocs, Elf_Data *symbols,
80dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard			unsigned symbol_sh_link,
81dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard			struct radeon_shader_binary *binary)
82dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard{
83dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard	unsigned i;
84dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard
85dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard	if (!relocs || !symbols || !binary->reloc_count) {
86dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		return;
87dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard	}
88dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard	binary->relocs = CALLOC(binary->reloc_count,
89dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard			sizeof(struct radeon_shader_reloc));
90dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard	for (i = 0; i < binary->reloc_count; i++) {
91dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		GElf_Sym symbol;
92dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		GElf_Rel rel;
93dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		char *symbol_name;
94dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		struct radeon_shader_reloc *reloc = &binary->relocs[i];
95dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard
96dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		gelf_getrel(relocs, i, &rel);
97dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		gelf_getsym(symbols, GELF_R_SYM(rel.r_info), &symbol);
98dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		symbol_name = elf_strptr(elf, symbol_sh_link, symbol.st_name);
99dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard
100dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		reloc->offset = rel.r_offset;
10150ac2612d08f2425972dde42e32a71fdce70cebdMarek Olšák		strncpy(reloc->name, symbol_name, sizeof(reloc->name)-1);
10250ac2612d08f2425972dde42e32a71fdce70cebdMarek Olšák		reloc->name[sizeof(reloc->name)-1] = 0;
103dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard	}
104dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard}
105dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard
1066974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellardvoid radeon_elf_read(const char *elf_data, unsigned elf_size,
1077dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák		     struct radeon_shader_binary *binary)
1086974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard{
1096974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	char *elf_buffer;
1106974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	Elf *elf;
1116974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	Elf_Scn *section = NULL;
112dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard	Elf_Data *symbols = NULL, *relocs = NULL;
1136974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	size_t section_str_index;
114f5ac5e20b16d17b0adda6d856829dd0cf997f7dcMarek Olšák	unsigned symbol_sh_link = 0;
1156974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
1166974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	/* One of the libelf implementations
1176974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	 * (http://www.mr511.de/software/english.htm) requires calling
1186974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	 * elf_version() before elf_memory().
1196974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	 */
1206974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	elf_version(EV_CURRENT);
1216974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	elf_buffer = MALLOC(elf_size);
1226974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	memcpy(elf_buffer, elf_data, elf_size);
1236974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
1246974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	elf = elf_memory(elf_buffer, elf_size);
1256974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
1266974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	elf_getshdrstrndx(elf, &section_str_index);
1276974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
1286974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	while ((section = elf_nextscn(elf, section))) {
1296974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		const char *name;
1306974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		Elf_Data *section_data = NULL;
1316974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		GElf_Shdr section_header;
1326974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		if (gelf_getshdr(section, &section_header) != &section_header) {
1336974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			fprintf(stderr, "Failed to read ELF section header\n");
1346974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			return;
1356974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		}
1366974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		name = elf_strptr(elf, section_str_index, section_header.sh_name);
1376974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		if (!strcmp(name, ".text")) {
1386974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			section_data = elf_getdata(section, section_data);
1396974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			binary->code_size = section_data->d_size;
1406974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			binary->code = MALLOC(binary->code_size * sizeof(unsigned char));
1416974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			memcpy(binary->code, section_data->d_buf, binary->code_size);
1426974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		} else if (!strcmp(name, ".AMDGPU.config")) {
1436974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			section_data = elf_getdata(section, section_data);
1446974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			binary->config_size = section_data->d_size;
1456974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			binary->config = MALLOC(binary->config_size * sizeof(unsigned char));
1466974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			memcpy(binary->config, section_data->d_buf, binary->config_size);
1477dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák		} else if (!strcmp(name, ".AMDGPU.disasm")) {
1487dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák			/* Always read disassembly if it's available. */
1496974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard			section_data = elf_getdata(section, section_data);
1507dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák			binary->disasm_string = strndup(section_data->d_buf,
1517dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák							section_data->d_size);
1529ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard		} else if (!strncmp(name, ".rodata", 7)) {
1539ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard			section_data = elf_getdata(section, section_data);
1549ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard			binary->rodata_size = section_data->d_size;
1559ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard			binary->rodata = MALLOC(binary->rodata_size * sizeof(unsigned char));
1569ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard			memcpy(binary->rodata, section_data->d_buf, binary->rodata_size);
157e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		} else if (!strncmp(name, ".symtab", 7)) {
158dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard			symbols = elf_getdata(section, section_data);
159dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard			symbol_sh_link = section_header.sh_link;
160dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard			parse_symbol_table(symbols, &section_header, binary);
161dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard		} else if (!strcmp(name, ".rel.text")) {
162dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard			relocs = elf_getdata(section, section_data);
163dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard			binary->reloc_count = section_header.sh_size /
164dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard					section_header.sh_entsize;
1656974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		}
1666974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	}
1676974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard
168dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard	parse_relocs(elf, relocs, symbols, symbol_sh_link, binary);
169dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard
1706974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	if (elf){
1716974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard		elf_end(elf);
1726974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	}
1736974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard	FREE(elf_buffer);
174e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard
175e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	/* Cache the config size per symbol */
176e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	if (binary->global_symbol_count) {
177e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		binary->config_size_per_symbol =
178e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			binary->config_size / binary->global_symbol_count;
179e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	} else {
180e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		binary->global_symbol_count = 1;
181e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		binary->config_size_per_symbol = binary->config_size;
182e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	}
183e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard}
184e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard
185e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellardconst unsigned char *radeon_shader_binary_config_start(
186e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	const struct radeon_shader_binary *binary,
187e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	uint64_t symbol_offset)
188e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard{
189e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	unsigned i;
190e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	for (i = 0; i < binary->global_symbol_count; ++i) {
191e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		if (binary->global_symbol_offsets[i] == symbol_offset) {
192e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			unsigned offset = i * binary->config_size_per_symbol;
193e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard			return binary->config + offset;
194e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard		}
195e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	}
196e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard	return binary->config;
1976974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard}
198