16974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard/* 26974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Copyright 2014 Advanced Micro Devices, Inc. 36974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * 46974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Permission is hereby granted, free of charge, to any person obtaining a 56974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * copy of this software and associated documentation files (the "Software"), 66974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * to deal in the Software without restriction, including without limitation 76974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * the rights to use, copy, modify, merge, publish, distribute, sublicense, 86974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * and/or sell copies of the Software, and to permit persons to whom the 96974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Software is furnished to do so, subject to the following conditions: 106974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * 116974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * The above copyright notice and this permission notice (including the next 126974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * paragraph) shall be included in all copies or substantial portions of the 136974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Software. 146974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * 156974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 166974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 176974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 186974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 196974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 206974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 216974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * SOFTWARE. 226974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * 236974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * Authors: Tom Stellard <thomas.stellard@amd.com> 246974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * 256974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard */ 266974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 276974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include "radeon_elf_util.h" 286974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include "r600_pipe_common.h" 296974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 306974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include "util/u_memory.h" 316974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 326974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include <gelf.h> 336974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include <libelf.h> 346974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard#include <stdio.h> 356974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 36e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellardstatic void parse_symbol_table(Elf_Data *symbol_table_data, 37e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard const GElf_Shdr *symbol_table_header, 38e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard struct radeon_shader_binary *binary) 39e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard{ 40e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard GElf_Sym symbol; 41e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard unsigned i = 0; 42e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard unsigned symbol_count = 43e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard symbol_table_header->sh_size / symbol_table_header->sh_entsize; 44e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 45e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard /* We are over allocating this list, because symbol_count gives the 46e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard * total number of symbols, and we will only be filling the list 47e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard * with offsets of global symbols. The memory savings from 48e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard * allocating the correct size of this list will be small, and 49e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard * I don't think it is worth the cost of pre-computing the number 50e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard * of global symbols. 51e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard */ 52e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard binary->global_symbol_offsets = CALLOC(symbol_count, sizeof(uint64_t)); 53e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 54e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard while (gelf_getsym(symbol_table_data, i++, &symbol)) { 55e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard unsigned i; 56dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard if (GELF_ST_BIND(symbol.st_info) != STB_GLOBAL || 57dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard symbol.st_shndx == 0 /* Undefined symbol */) { 58e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard continue; 59e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } 60e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 61e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard binary->global_symbol_offsets[binary->global_symbol_count] = 62e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard symbol.st_value; 63e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 64e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard /* Sort the list using bubble sort. This list will usually 65e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard * be small. */ 66e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard for (i = binary->global_symbol_count; i > 0; --i) { 67e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard uint64_t lhs = binary->global_symbol_offsets[i - 1]; 68e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard uint64_t rhs = binary->global_symbol_offsets[i]; 69e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard if (lhs < rhs) { 70e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard break; 71e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } 72e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard binary->global_symbol_offsets[i] = lhs; 73e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard binary->global_symbol_offsets[i - 1] = rhs; 74e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } 75e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard ++binary->global_symbol_count; 76e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } 77e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard} 78e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 79dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellardstatic void parse_relocs(Elf *elf, Elf_Data *relocs, Elf_Data *symbols, 80dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard unsigned symbol_sh_link, 81dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard struct radeon_shader_binary *binary) 82dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard{ 83dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard unsigned i; 84dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard 85dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard if (!relocs || !symbols || !binary->reloc_count) { 86dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard return; 87dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard } 88dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard binary->relocs = CALLOC(binary->reloc_count, 89dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard sizeof(struct radeon_shader_reloc)); 90dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard for (i = 0; i < binary->reloc_count; i++) { 91dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard GElf_Sym symbol; 92dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard GElf_Rel rel; 93dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard char *symbol_name; 94dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard struct radeon_shader_reloc *reloc = &binary->relocs[i]; 95dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard 96dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard gelf_getrel(relocs, i, &rel); 97dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard gelf_getsym(symbols, GELF_R_SYM(rel.r_info), &symbol); 98dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard symbol_name = elf_strptr(elf, symbol_sh_link, symbol.st_name); 99dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard 100dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard reloc->offset = rel.r_offset; 10150ac2612d08f2425972dde42e32a71fdce70cebdMarek Olšák strncpy(reloc->name, symbol_name, sizeof(reloc->name)-1); 10250ac2612d08f2425972dde42e32a71fdce70cebdMarek Olšák reloc->name[sizeof(reloc->name)-1] = 0; 103dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard } 104dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard} 105dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard 1066974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellardvoid radeon_elf_read(const char *elf_data, unsigned elf_size, 1077dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák struct radeon_shader_binary *binary) 1086974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard{ 1096974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard char *elf_buffer; 1106974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard Elf *elf; 1116974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard Elf_Scn *section = NULL; 112dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard Elf_Data *symbols = NULL, *relocs = NULL; 1136974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard size_t section_str_index; 114f5ac5e20b16d17b0adda6d856829dd0cf997f7dcMarek Olšák unsigned symbol_sh_link = 0; 1156974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 1166974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard /* One of the libelf implementations 1176974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * (http://www.mr511.de/software/english.htm) requires calling 1186974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard * elf_version() before elf_memory(). 1196974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard */ 1206974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard elf_version(EV_CURRENT); 1216974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard elf_buffer = MALLOC(elf_size); 1226974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard memcpy(elf_buffer, elf_data, elf_size); 1236974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 1246974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard elf = elf_memory(elf_buffer, elf_size); 1256974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 1266974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard elf_getshdrstrndx(elf, §ion_str_index); 1276974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 1286974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard while ((section = elf_nextscn(elf, section))) { 1296974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard const char *name; 1306974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard Elf_Data *section_data = NULL; 1316974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard GElf_Shdr section_header; 1326974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard if (gelf_getshdr(section, §ion_header) != §ion_header) { 1336974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard fprintf(stderr, "Failed to read ELF section header\n"); 1346974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard return; 1356974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard } 1366974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard name = elf_strptr(elf, section_str_index, section_header.sh_name); 1376974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard if (!strcmp(name, ".text")) { 1386974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard section_data = elf_getdata(section, section_data); 1396974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard binary->code_size = section_data->d_size; 1406974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard binary->code = MALLOC(binary->code_size * sizeof(unsigned char)); 1416974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard memcpy(binary->code, section_data->d_buf, binary->code_size); 1426974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard } else if (!strcmp(name, ".AMDGPU.config")) { 1436974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard section_data = elf_getdata(section, section_data); 1446974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard binary->config_size = section_data->d_size; 1456974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard binary->config = MALLOC(binary->config_size * sizeof(unsigned char)); 1466974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard memcpy(binary->config, section_data->d_buf, binary->config_size); 1477dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák } else if (!strcmp(name, ".AMDGPU.disasm")) { 1487dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák /* Always read disassembly if it's available. */ 1496974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard section_data = elf_getdata(section, section_data); 1507dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák binary->disasm_string = strndup(section_data->d_buf, 1517dd1f45bc41c4a936b0ff84400840524bb9f8871Marek Olšák section_data->d_size); 1529ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard } else if (!strncmp(name, ".rodata", 7)) { 1539ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard section_data = elf_getdata(section, section_data); 1549ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard binary->rodata_size = section_data->d_size; 1559ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard binary->rodata = MALLOC(binary->rodata_size * sizeof(unsigned char)); 1569ba3105e0a4b186d6b1ee4c23886a3c4cd0a3543Tom Stellard memcpy(binary->rodata, section_data->d_buf, binary->rodata_size); 157e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } else if (!strncmp(name, ".symtab", 7)) { 158dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard symbols = elf_getdata(section, section_data); 159dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard symbol_sh_link = section_header.sh_link; 160dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard parse_symbol_table(symbols, §ion_header, binary); 161dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard } else if (!strcmp(name, ".rel.text")) { 162dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard relocs = elf_getdata(section, section_data); 163dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard binary->reloc_count = section_header.sh_size / 164dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard section_header.sh_entsize; 1656974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard } 1666974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard } 1676974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard 168dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard parse_relocs(elf, relocs, symbols, symbol_sh_link, binary); 169dfdaf3eb7edac939f5d1a32db2968944852b28faTom Stellard 1706974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard if (elf){ 1716974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard elf_end(elf); 1726974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard } 1736974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard FREE(elf_buffer); 174e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 175e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard /* Cache the config size per symbol */ 176e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard if (binary->global_symbol_count) { 177e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard binary->config_size_per_symbol = 178e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard binary->config_size / binary->global_symbol_count; 179e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } else { 180e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard binary->global_symbol_count = 1; 181e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard binary->config_size_per_symbol = binary->config_size; 182e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } 183e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard} 184e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard 185e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellardconst unsigned char *radeon_shader_binary_config_start( 186e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard const struct radeon_shader_binary *binary, 187e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard uint64_t symbol_offset) 188e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard{ 189e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard unsigned i; 190e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard for (i = 0; i < binary->global_symbol_count; ++i) { 191e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard if (binary->global_symbol_offsets[i] == symbol_offset) { 192e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard unsigned offset = i * binary->config_size_per_symbol; 193e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard return binary->config + offset; 194e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } 195e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard } 196e91735a641b71bc2bccabd0c779a626fa412b314Tom Stellard return binary->config; 1976974eb907600b9d0176d3158ff0fd30ac3e56a55Tom Stellard} 198