target_x86.cc revision 35e1e6ad4b50f1adbe9f93fe467766f042491896
1efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* 2efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Copyright (C) 2012 The Android Open Source Project 3efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * 4efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Licensed under the Apache License, Version 2.0 (the "License"); 5efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * you may not use this file except in compliance with the License. 6efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * You may obtain a copy of the License at 7efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * 8efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * http://www.apache.org/licenses/LICENSE-2.0 9efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * 10efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Unless required by applicable law or agreed to in writing, software 11efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * distributed under the License is distributed on an "AS IS" BASIS, 12efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * See the License for the specific language governing permissions and 14efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * limitations under the License. 15efc6369224b036a1fb77849f7ae65b3492c832c0buzbee */ 16efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 17f3e2cc4a38389aa75eb8ee3973a535254bf1c8d2Nicolas Geoffray#include <string> 18f3e2cc4a38389aa75eb8ee3973a535254bf1c8d2Nicolas Geoffray#include <inttypes.h> 19f3e2cc4a38389aa75eb8ee3973a535254bf1c8d2Nicolas Geoffray 2002031b185b4653e6c72e21f7a51238b903f6d638buzbee#include "codegen_x86.h" 217940e44f4517de5e2634a7e07d58d0fb26160513Brian Carlstrom#include "dex/compiler_internals.h" 227940e44f4517de5e2634a7e07d58d0fb26160513Brian Carlstrom#include "dex/quick/mir_to_lir-inl.h" 23b5860fb459f1ed71f39d8a87b45bee6727d79fe8buzbee#include "dex/reg_storage_eq.h" 24e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell#include "mirror/array.h" 25e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell#include "mirror/string.h" 26641ce0371c2f0dc95d26be02d8366124c8b66653Brian Carlstrom#include "x86_lir.h" 27efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 28efc6369224b036a1fb77849f7ae65b3492c832c0buzbeenamespace art { 29efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 30089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_regs_arr_32[] = { 319ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rAX, rs_rCX, rs_rDX, rs_rBX, rs_rX86_SP_32, rs_rBP, rs_rSI, rs_rDI, 329ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 33089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_regs_arr_64[] = { 3476af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko rs_rAX, rs_rCX, rs_rDX, rs_rBX, rs_rX86_SP_32, rs_rBP, rs_rSI, rs_rDI, 35091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_r8, rs_r9, rs_r10, rs_r11, rs_r12, rs_r13, rs_r14, rs_r15 36efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 37089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_regs_arr_64q[] = { 380999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko rs_r0q, rs_r1q, rs_r2q, rs_r3q, rs_rX86_SP_64, rs_r5q, rs_r6q, rs_r7q, 39a20468c004264592f309a548fc71ba62a69b8742Dmitry Petrochenko rs_r8q, rs_r9q, rs_r10q, rs_r11q, rs_r12q, rs_r13q, rs_r14q, rs_r15q 400999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko}; 41089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage sp_regs_arr_32[] = { 429ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, 439ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 44089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage sp_regs_arr_64[] = { 45091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, 46091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_fr8, rs_fr9, rs_fr10, rs_fr11, rs_fr12, rs_fr13, rs_fr14, rs_fr15 47efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 48089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage dp_regs_arr_32[] = { 499ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, 509ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 51089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage dp_regs_arr_64[] = { 52091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, 53091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_dr8, rs_dr9, rs_dr10, rs_dr11, rs_dr12, rs_dr13, rs_dr14, rs_dr15 54efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 55c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovstatic constexpr RegStorage xp_regs_arr_32[] = { 56c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_xr0, rs_xr1, rs_xr2, rs_xr3, rs_xr4, rs_xr5, rs_xr6, rs_xr7, 57c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov}; 58c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovstatic constexpr RegStorage xp_regs_arr_64[] = { 59c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_xr0, rs_xr1, rs_xr2, rs_xr3, rs_xr4, rs_xr5, rs_xr6, rs_xr7, 60c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_xr8, rs_xr9, rs_xr10, rs_xr11, rs_xr12, rs_xr13, rs_xr14, rs_xr15 61c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov}; 62089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage reserved_regs_arr_32[] = {rs_rX86_SP_32}; 6376af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenkostatic constexpr RegStorage reserved_regs_arr_64[] = {rs_rX86_SP_32}; 64089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage reserved_regs_arr_64q[] = {rs_rX86_SP_64}; 65089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_temps_arr_32[] = {rs_rAX, rs_rCX, rs_rDX, rs_rBX}; 66089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_temps_arr_64[] = { 679ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rAX, rs_rCX, rs_rDX, rs_rSI, rs_rDI, 689ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_r8, rs_r9, rs_r10, rs_r11 699ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 70c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 71c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// How to add register to be available for promotion: 72c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 1) Remove register from array defining temp 73c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 2) Update ClobberCallerSave 74c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 3) Update JNI compiler ABI: 75c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 3.1) add reg in JniCallingConvention method 76c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 3.2) update CoreSpillMask/FpSpillMask 77c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 4) Update entrypoints 78c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 4.1) Update constants in asm_support_x86_64.h for new frame size 79c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 4.2) Remove entry in SmashCallerSaves 80c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 4.3) Update jni_entrypoints to spill/unspill new callee save reg 81c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 4.4) Update quick_entrypoints to spill/unspill new callee save reg 82c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 5) Update runtime ABI 83c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 5.1) Update quick_method_frame_info with new required spills 84c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 5.2) Update QuickArgumentVisitor with new offsets to gprs and xmms 85c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// Note that you cannot use register corresponding to incoming args 86c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// according to ABI and QCG needs one additional XMM temp for 87c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// bulk copy in preparation to call. 88089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_temps_arr_64q[] = { 890999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko rs_r0q, rs_r1q, rs_r2q, rs_r6q, rs_r7q, 900999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko rs_r8q, rs_r9q, rs_r10q, rs_r11q 910999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko}; 92089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage sp_temps_arr_32[] = { 939ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, 949ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 95089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage sp_temps_arr_64[] = { 96091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, 97c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_fr8, rs_fr9, rs_fr10, rs_fr11 98091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee}; 99089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage dp_temps_arr_32[] = { 1009ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, 1019ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 102089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage dp_temps_arr_64[] = { 103091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, 104c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_dr8, rs_dr9, rs_dr10, rs_dr11 105091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee}; 106091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee 107089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage xp_temps_arr_32[] = { 108fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell rs_xr0, rs_xr1, rs_xr2, rs_xr3, rs_xr4, rs_xr5, rs_xr6, rs_xr7, 109fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell}; 110089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage xp_temps_arr_64[] = { 111fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell rs_xr0, rs_xr1, rs_xr2, rs_xr3, rs_xr4, rs_xr5, rs_xr6, rs_xr7, 112c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_xr8, rs_xr9, rs_xr10, rs_xr11 113fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell}; 114fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 115089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> empty_pool; 116089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_regs_32(core_regs_arr_32); 117089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_regs_64(core_regs_arr_64); 118089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_regs_64q(core_regs_arr_64q); 119089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> sp_regs_32(sp_regs_arr_32); 120089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> sp_regs_64(sp_regs_arr_64); 121089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> dp_regs_32(dp_regs_arr_32); 122089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> dp_regs_64(dp_regs_arr_64); 123c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovstatic constexpr ArrayRef<const RegStorage> xp_regs_32(xp_regs_arr_32); 124c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovstatic constexpr ArrayRef<const RegStorage> xp_regs_64(xp_regs_arr_64); 125089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> reserved_regs_32(reserved_regs_arr_32); 126089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> reserved_regs_64(reserved_regs_arr_64); 127089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> reserved_regs_64q(reserved_regs_arr_64q); 128089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_temps_32(core_temps_arr_32); 129089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_temps_64(core_temps_arr_64); 130089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_temps_64q(core_temps_arr_64q); 131089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> sp_temps_32(sp_temps_arr_32); 132089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> sp_temps_64(sp_temps_arr_64); 133089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> dp_temps_32(dp_temps_arr_32); 134089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> dp_temps_64(dp_temps_arr_64); 135089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Marko 136089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> xp_temps_32(xp_temps_arr_32); 137089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> xp_temps_64(xp_temps_arr_64); 138fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1399ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_SP; 1409ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 1419ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_ARG0; 1429ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_ARG1; 1439ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_ARG2; 1449ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_ARG3; 14558994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_ARG4; 14658994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_ARG5; 1479ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_FARG0; 1489ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_FARG1; 1499ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_FARG2; 1509ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_FARG3; 15158994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_FARG4; 15258994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_FARG5; 15358994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_FARG6; 15458994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_FARG7; 1559ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_RET0; 1569ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_RET1; 1579ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_INVOKE_TGT; 1589ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_COUNT; 1599ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 1609ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_ARG0; 1619ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_ARG1; 1629ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_ARG2; 1639ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_ARG3; 16458994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_ARG4; 16558994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_ARG5; 1669ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_FARG0; 1679ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_FARG1; 1689ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_FARG2; 1699ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_FARG3; 17058994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_FARG4; 17158994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_FARG5; 17258994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_FARG6; 17358994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_FARG7; 1749ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_RET0; 1759ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_RET1; 1769ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_INVOKE_TGT; 1779ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_COUNT; 178efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 1792ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::LocCReturn() { 18000e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee return x86_loc_c_return; 181efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 182efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 183a0cd2d701f29e0bc6275f1b13c0edfd4ec391879buzbeeRegLocation X86Mir2Lir::LocCReturnRef() { 184a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu return cu_->target64 ? x86_64_loc_c_return_ref : x86_loc_c_return_ref; 185a0cd2d701f29e0bc6275f1b13c0edfd4ec391879buzbee} 186a0cd2d701f29e0bc6275f1b13c0edfd4ec391879buzbee 1872ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::LocCReturnWide() { 188dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina return cu_->target64 ? x86_64_loc_c_return_wide : x86_loc_c_return_wide; 189efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 190efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 1912ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::LocCReturnFloat() { 19200e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee return x86_loc_c_return_float; 193efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 194efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 1952ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::LocCReturnDouble() { 19600e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee return x86_loc_c_return_double; 197efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 198efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 199a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu// Return a target-dependent special register for 32-bit. 200a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying FuRegStorage X86Mir2Lir::TargetReg32(SpecialTargetRegister reg) { 201091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee RegStorage res_reg = RegStorage::InvalidReg(); 202efc6369224b036a1fb77849f7ae65b3492c832c0buzbee switch (reg) { 203091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kSelf: res_reg = RegStorage::InvalidReg(); break; 204091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kSuspend: res_reg = RegStorage::InvalidReg(); break; 205091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kLr: res_reg = RegStorage::InvalidReg(); break; 206091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kPc: res_reg = RegStorage::InvalidReg(); break; 207ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe case kSp: res_reg = rs_rX86_SP_32; break; // This must be the concrete one, as _SP is target- 208ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe // specific size. 209091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kArg0: res_reg = rs_rX86_ARG0; break; 210091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kArg1: res_reg = rs_rX86_ARG1; break; 211091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kArg2: res_reg = rs_rX86_ARG2; break; 212091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kArg3: res_reg = rs_rX86_ARG3; break; 21358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kArg4: res_reg = rs_rX86_ARG4; break; 21458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kArg5: res_reg = rs_rX86_ARG5; break; 215091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kFArg0: res_reg = rs_rX86_FARG0; break; 216091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kFArg1: res_reg = rs_rX86_FARG1; break; 217091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kFArg2: res_reg = rs_rX86_FARG2; break; 218091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kFArg3: res_reg = rs_rX86_FARG3; break; 21958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kFArg4: res_reg = rs_rX86_FARG4; break; 22058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kFArg5: res_reg = rs_rX86_FARG5; break; 22158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kFArg6: res_reg = rs_rX86_FARG6; break; 22258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kFArg7: res_reg = rs_rX86_FARG7; break; 223091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kRet0: res_reg = rs_rX86_RET0; break; 224091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kRet1: res_reg = rs_rX86_RET1; break; 225091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kInvokeTgt: res_reg = rs_rX86_INVOKE_TGT; break; 226091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kHiddenArg: res_reg = rs_rAX; break; 227dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina case kHiddenFpArg: DCHECK(!cu_->target64); res_reg = rs_fr0; break; 228091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kCount: res_reg = rs_rX86_COUNT; break; 22958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko default: res_reg = RegStorage::InvalidReg(); 230091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee } 231091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee return res_reg; 232efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 233efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 234a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying FuRegStorage X86Mir2Lir::TargetReg(SpecialTargetRegister reg) { 235a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu LOG(FATAL) << "Do not use this function!!!"; 236a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu return RegStorage::InvalidReg(); 237a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu} 238a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu 239efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* 240efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Decode the register id. 241efc6369224b036a1fb77849f7ae65b3492c832c0buzbee */ 2428dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir MarkoResourceMask X86Mir2Lir::GetRegMaskCommon(const RegStorage& reg) const { 2438dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko /* Double registers in x86 are just a single FP register. This is always just a single bit. */ 2448dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko return ResourceMask::Bit( 2458dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko /* FP register starts at bit position 16 */ 2468dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ((reg.IsFloat() || reg.StorageSize() > 8) ? kX86FPReg0 : 0) + reg.GetRegNum()); 2478dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko} 2488dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko 2498dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir MarkoResourceMask X86Mir2Lir::GetPCUseDefEncoding() const { 2508dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko return kEncodeNone; 251efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 252efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 2538dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Markovoid X86Mir2Lir::SetupTargetResourceMasks(LIR* lir, uint64_t flags, 2548dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ResourceMask* use_mask, ResourceMask* def_mask) { 2556a58cb16d803c9a7b3a75ccac8be19dd9d4e520dDmitry Petrochenko DCHECK(cu_->instruction_set == kX86 || cu_->instruction_set == kX86_64); 256b48819db07f9a0992a72173380c24249d7fc648abuzbee DCHECK(!lir->flags.use_def_invalid); 257efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 258efc6369224b036a1fb77849f7ae65b3492c832c0buzbee // X86-specific resource map setup here. 259efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_USE_SP) { 2608dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko use_mask->SetBit(kX86RegSP); 261efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 262efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 263efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_DEF_SP) { 2648dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko def_mask->SetBit(kX86RegSP); 265efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 266efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 267efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_DEFA) { 2688dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(def_mask, rs_rAX.GetReg()); 269efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 270efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 271efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_DEFD) { 2728dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(def_mask, rs_rDX.GetReg()); 273efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 274efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_USEA) { 2758dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rAX.GetReg()); 276efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 277efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 278efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_USEC) { 2798dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rCX.GetReg()); 280efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 281efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 282efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_USED) { 2838dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rDX.GetReg()); 284efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 28570b797d998f2a28e39f7d6ffc8a07c9cbc47da14Vladimir Marko 28670b797d998f2a28e39f7d6ffc8a07c9cbc47da14Vladimir Marko if (flags & REG_USEB) { 2878dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rBX.GetReg()); 28870b797d998f2a28e39f7d6ffc8a07c9cbc47da14Vladimir Marko } 2894028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 2904028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Fixup hard to describe instruction: Uses rAX, rCX, rDI; sets rDI. 2914028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (lir->opcode == kX86RepneScasw) { 2928dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rAX.GetReg()); 2938dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rCX.GetReg()); 2948dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rDI.GetReg()); 2958dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(def_mask, rs_rDI.GetReg()); 2964028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 297e90501da0222717d75c126ebf89569db3976927eSerguei Katkov 298e90501da0222717d75c126ebf89569db3976927eSerguei Katkov if (flags & USE_FP_STACK) { 2998dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko use_mask->SetBit(kX86FPStack); 3008dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko def_mask->SetBit(kX86FPStack); 301e90501da0222717d75c126ebf89569db3976927eSerguei Katkov } 302efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 303efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 304efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* For dumping instructions */ 305efc6369224b036a1fb77849f7ae65b3492c832c0buzbeestatic const char* x86RegName[] = { 306efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", 307efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15" 308efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 309efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 310efc6369224b036a1fb77849f7ae65b3492c832c0buzbeestatic const char* x86CondName[] = { 311efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "O", 312efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NO", 313efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "B/NAE/C", 314efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NB/AE/NC", 315efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "Z/EQ", 316efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NZ/NE", 317efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "BE/NA", 318efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NBE/A", 319efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "S", 320efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NS", 321efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "P/PE", 322efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NP/PO", 323efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "L/NGE", 324efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NL/GE", 325efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "LE/NG", 326efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NLE/G" 327efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 328efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 329efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* 330efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Interpret a format string and build a string no longer than size 331efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * See format key in Assemble.cc. 332efc6369224b036a1fb77849f7ae65b3492c832c0buzbee */ 3331fd3346740dfb7f47be9922312b68a4227fada96buzbeestd::string X86Mir2Lir::BuildInsnString(const char *fmt, LIR *lir, unsigned char* base_addr) { 334efc6369224b036a1fb77849f7ae65b3492c832c0buzbee std::string buf; 335efc6369224b036a1fb77849f7ae65b3492c832c0buzbee size_t i = 0; 336efc6369224b036a1fb77849f7ae65b3492c832c0buzbee size_t fmt_len = strlen(fmt); 337efc6369224b036a1fb77849f7ae65b3492c832c0buzbee while (i < fmt_len) { 338efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (fmt[i] != '!') { 339efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += fmt[i]; 340efc6369224b036a1fb77849f7ae65b3492c832c0buzbee i++; 341efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } else { 342efc6369224b036a1fb77849f7ae65b3492c832c0buzbee i++; 343efc6369224b036a1fb77849f7ae65b3492c832c0buzbee DCHECK_LT(i, fmt_len); 344efc6369224b036a1fb77849f7ae65b3492c832c0buzbee char operand_number_ch = fmt[i]; 345efc6369224b036a1fb77849f7ae65b3492c832c0buzbee i++; 346efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (operand_number_ch == '!') { 347efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += "!"; 348efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } else { 349efc6369224b036a1fb77849f7ae65b3492c832c0buzbee int operand_number = operand_number_ch - '0'; 350efc6369224b036a1fb77849f7ae65b3492c832c0buzbee DCHECK_LT(operand_number, 6); // Expect upto 6 LIR operands. 351efc6369224b036a1fb77849f7ae65b3492c832c0buzbee DCHECK_LT(i, fmt_len); 352efc6369224b036a1fb77849f7ae65b3492c832c0buzbee int operand = lir->operands[operand_number]; 353efc6369224b036a1fb77849f7ae65b3492c832c0buzbee switch (fmt[i]) { 354efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 'c': 355efc6369224b036a1fb77849f7ae65b3492c832c0buzbee DCHECK_LT(static_cast<size_t>(operand), sizeof(x86CondName)); 356efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += x86CondName[operand]; 357efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 358efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 'd': 359efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += StringPrintf("%d", operand); 360efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 3615192cbb12856b12620dc346758605baaa1469cedYixin Shou case 'q': { 3625192cbb12856b12620dc346758605baaa1469cedYixin Shou int64_t value = static_cast<int64_t>(static_cast<int64_t>(operand) << 32 | 3635192cbb12856b12620dc346758605baaa1469cedYixin Shou static_cast<uint32_t>(lir->operands[operand_number+1])); 3645192cbb12856b12620dc346758605baaa1469cedYixin Shou buf +=StringPrintf("%" PRId64, value); 3655192cbb12856b12620dc346758605baaa1469cedYixin Shou } 366efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 'p': { 3670d82948094d9a198e01aa95f64012bdedd5b6fc9buzbee EmbeddedData *tab_rec = reinterpret_cast<EmbeddedData*>(UnwrapPointer(operand)); 368fa57c47f1b72916371a9c2d5c1389219bce655b4buzbee buf += StringPrintf("0x%08x", tab_rec->offset); 369efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 370efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 371efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 'r': 372091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee if (RegStorage::IsFloat(operand)) { 373091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee int fp_reg = RegStorage::RegNum(operand); 374efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += StringPrintf("xmm%d", fp_reg); 375efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } else { 376091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee int reg_num = RegStorage::RegNum(operand); 377091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee DCHECK_LT(static_cast<size_t>(reg_num), sizeof(x86RegName)); 378091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee buf += x86RegName[reg_num]; 379efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 380efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 381efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 't': 382107c31e598b649a8bb8d959d6a0377937e63e624Ian Rogers buf += StringPrintf("0x%08" PRIxPTR " (L%p)", 383107c31e598b649a8bb8d959d6a0377937e63e624Ian Rogers reinterpret_cast<uintptr_t>(base_addr) + lir->offset + operand, 384107c31e598b649a8bb8d959d6a0377937e63e624Ian Rogers lir->target); 385efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 386efc6369224b036a1fb77849f7ae65b3492c832c0buzbee default: 387efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += StringPrintf("DecodeError '%c'", fmt[i]); 388efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 389efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 390efc6369224b036a1fb77849f7ae65b3492c832c0buzbee i++; 391efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 392efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 393efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 394efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return buf; 395efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 396efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 3978dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Markovoid X86Mir2Lir::DumpResourceMask(LIR *x86LIR, const ResourceMask& mask, const char *prefix) { 398efc6369224b036a1fb77849f7ae65b3492c832c0buzbee char buf[256]; 399efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf[0] = 0; 400efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 4018dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.Equals(kEncodeAll)) { 402efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcpy(buf, "all"); 403efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } else { 404efc6369224b036a1fb77849f7ae65b3492c832c0buzbee char num[8]; 405efc6369224b036a1fb77849f7ae65b3492c832c0buzbee int i; 406efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 407efc6369224b036a1fb77849f7ae65b3492c832c0buzbee for (i = 0; i < kX86RegEnd; i++) { 4088dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(i)) { 409988e6ea9ac66edf1e205851df9bb53de3f3763f3Ian Rogers snprintf(num, arraysize(num), "%d ", i); 410efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, num); 411efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 412efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 413efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 4148dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(ResourceMask::kCCode)) { 415efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, "cc "); 416efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 417efc6369224b036a1fb77849f7ae65b3492c832c0buzbee /* Memory bits */ 4188dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (x86LIR && (mask.HasBit(ResourceMask::kDalvikReg))) { 419988e6ea9ac66edf1e205851df9bb53de3f3763f3Ian Rogers snprintf(buf + strlen(buf), arraysize(buf) - strlen(buf), "dr%d%s", 420988e6ea9ac66edf1e205851df9bb53de3f3763f3Ian Rogers DECODE_ALIAS_INFO_REG(x86LIR->flags.alias_info), 421988e6ea9ac66edf1e205851df9bb53de3f3763f3Ian Rogers (DECODE_ALIAS_INFO_WIDE(x86LIR->flags.alias_info)) ? "(+1)" : ""); 422efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 4238dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(ResourceMask::kLiteral)) { 424efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, "lit "); 425efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 426efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 4278dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(ResourceMask::kHeapRef)) { 428efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, "heap "); 429efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 4308dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(ResourceMask::kMustNotAlias)) { 431efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, "noalias "); 432efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 433efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 434efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (buf[0]) { 435efc6369224b036a1fb77849f7ae65b3492c832c0buzbee LOG(INFO) << prefix << ": " << buf; 436efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 437efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 43802031b185b4653e6c72e21f7a51238b903f6d638buzbee 4391fd3346740dfb7f47be9922312b68a4227fada96buzbeevoid X86Mir2Lir::AdjustSpillMask() { 440efc6369224b036a1fb77849f7ae65b3492c832c0buzbee // Adjustment for LR spilling, x86 has no LR so nothing to do here 441091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee core_spill_mask_ |= (1 << rs_rRET.GetRegNum()); 4421fd3346740dfb7f47be9922312b68a4227fada96buzbee num_core_spills_++; 443efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 444efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 445e87f9b5185379c8cf8392d65a63e7bf7e51b97e7Mark MendellRegStorage X86Mir2Lir::AllocateByteRegister() { 4467e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu RegStorage reg = AllocTypedTemp(false, kCoreReg); 447dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) { 4487e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu DCHECK_LT(reg.GetRegNum(), rs_rX86_SP.GetRegNum()); 4497e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu } 4507e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu return reg; 4517e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu} 4527e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu 45360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan BanerjiRegStorage X86Mir2Lir::Get128BitRegister(RegStorage reg) { 45460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return GetRegInfo(reg)->FindMatchingView(RegisterInfo::k128SoloStorageMask)->GetReg(); 45560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 45660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 4577e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fubool X86Mir2Lir::IsByteRegister(RegStorage reg) { 458dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina return cu_->target64 || reg.GetRegNum() < rs_rX86_SP.GetRegNum(); 459e87f9b5185379c8cf8392d65a63e7bf7e51b97e7Mark Mendell} 460e87f9b5185379c8cf8392d65a63e7bf7e51b97e7Mark Mendell 461efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* Clobber all regs that might be used by an external C call */ 46231c2aac7137b69d5622eea09597500731fbee2efVladimir Markovoid X86Mir2Lir::ClobberCallerSave() { 463dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 464c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rAX); 465c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rCX); 466c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rDX); 467c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rSI); 468c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rDI); 469c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 47035ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_r8); 47135ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_r9); 47235ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_r10); 47335ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_r11); 47435ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu 47535ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_fr8); 47635ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_fr9); 47735ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_fr10); 47835ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_fr11); 479c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } else { 480c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rAX); 481c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rCX); 482c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rDX); 483c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rBX); 48435ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu } 485c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 486c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr0); 487c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr1); 488c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr2); 489c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr3); 490c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr4); 491c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr5); 492c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr6); 493c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr7); 494efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 495efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 4961fd3346740dfb7f47be9922312b68a4227fada96buzbeeRegLocation X86Mir2Lir::GetReturnWideAlt() { 49752a77fc135f0e0df57ee24641c3f5ae415ff7bd6buzbee RegLocation res = LocCReturnWide(); 498091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee DCHECK(res.reg.GetLowReg() == rs_rAX.GetReg()); 499091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee DCHECK(res.reg.GetHighReg() == rs_rDX.GetReg()); 500091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee Clobber(rs_rAX); 501091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee Clobber(rs_rDX); 502091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee MarkInUse(rs_rAX); 503091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee MarkInUse(rs_rDX); 504091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee MarkWide(res.reg); 505efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return res; 506efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 507efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 5082ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::GetReturnAlt() { 50952a77fc135f0e0df57ee24641c3f5ae415ff7bd6buzbee RegLocation res = LocCReturn(); 510091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee res.reg.SetReg(rs_rDX.GetReg()); 511091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee Clobber(rs_rDX); 512091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee MarkInUse(rs_rDX); 513efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return res; 514efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 515efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 516efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* To be used when explicitly managing register use */ 5172ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromvoid X86Mir2Lir::LockCallTemps() { 518091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee LockTemp(rs_rX86_ARG0); 519091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee LockTemp(rs_rX86_ARG1); 520091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee LockTemp(rs_rX86_ARG2); 521091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee LockTemp(rs_rX86_ARG3); 522dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 52358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_ARG4); 52458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_ARG5); 52558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG0); 52658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG1); 52758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG2); 52858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG3); 52958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG4); 53058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG5); 53158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG6); 53258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG7); 53358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 534efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 535efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 536efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* To be used when explicitly managing register use */ 5372ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromvoid X86Mir2Lir::FreeCallTemps() { 538091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee FreeTemp(rs_rX86_ARG0); 539091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee FreeTemp(rs_rX86_ARG1); 540091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee FreeTemp(rs_rX86_ARG2); 541091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee FreeTemp(rs_rX86_ARG3); 542dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 54358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_ARG4); 54458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_ARG5); 54558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG0); 54658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG1); 54758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG2); 54858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG3); 54958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG4); 55058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG5); 55158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG6); 55258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG7); 55358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 554efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 555efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 55699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusorubool X86Mir2Lir::ProvidesFullMemoryBarrier(X86OpCode opcode) { 55799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru switch (opcode) { 55899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru case kX86LockCmpxchgMR: 55999ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru case kX86LockCmpxchgAR: 5600f9b9c508814a62c6e21c6a06cfe4de39b5036c0Ian Rogers case kX86LockCmpxchg64M: 5610f9b9c508814a62c6e21c6a06cfe4de39b5036c0Ian Rogers case kX86LockCmpxchg64A: 56299ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru case kX86XchgMR: 56399ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru case kX86Mfence: 56499ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Atomic memory instructions provide full barrier. 56599ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru return true; 56699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru default: 56799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru break; 56899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 56999ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 57099ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Conservative if cannot prove it provides full barrier. 57199ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru return false; 57299ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru} 57399ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 574b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampebool X86Mir2Lir::GenMemBarrier(MemBarrierKind barrier_kind) { 575efc6369224b036a1fb77849f7ae65b3492c832c0buzbee#if ANDROID_SMP != 0 57699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Start off with using the last LIR as the barrier. If it is not enough, then we will update it. 57799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru LIR* mem_barrier = last_lir_insn_; 57899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 579b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe bool ret = false; 58099ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru /* 58148f5c47907654350ce30a8dfdda0e977f5d3d39fHans Boehm * According to the JSR-133 Cookbook, for x86 only StoreLoad/AnyAny barriers need memory fence. 58248f5c47907654350ce30a8dfdda0e977f5d3d39fHans Boehm * All other barriers (LoadAny, AnyStore, StoreStore) are nops due to the x86 memory model. 58348f5c47907654350ce30a8dfdda0e977f5d3d39fHans Boehm * For those cases, all we need to ensure is that there is a scheduling barrier in place. 58499ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru */ 58548f5c47907654350ce30a8dfdda0e977f5d3d39fHans Boehm if (barrier_kind == kAnyAny) { 58699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // If no LIR exists already that can be used a barrier, then generate an mfence. 58799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru if (mem_barrier == nullptr) { 58899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru mem_barrier = NewLIR0(kX86Mfence); 589b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe ret = true; 59099ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 59199ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 59299ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // If last instruction does not provide full barrier, then insert an mfence. 59399ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru if (ProvidesFullMemoryBarrier(static_cast<X86OpCode>(mem_barrier->opcode)) == false) { 59499ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru mem_barrier = NewLIR0(kX86Mfence); 595b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe ret = true; 59699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 59799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 59899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 59999ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Now ensure that a scheduling barrier is in place. 60099ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru if (mem_barrier == nullptr) { 60199ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru GenBarrier(); 60299ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } else { 60399ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Mark as a scheduling barrier. 60499ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru DCHECK(!mem_barrier->flags.use_def_invalid); 6058dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko mem_barrier->u.m.def_mask = &kEncodeAll; 60699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 607b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe return ret; 608b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe#else 609b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe return false; 610efc6369224b036a1fb77849f7ae65b3492c832c0buzbee#endif 611efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 61200e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee 6131fd3346740dfb7f47be9922312b68a4227fada96buzbeevoid X86Mir2Lir::CompilerInitializeRegAlloc() { 614dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 61576af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko reg_pool_ = new (arena_) RegisterPool(this, arena_, core_regs_64, core_regs_64q, sp_regs_64, 61676af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko dp_regs_64, reserved_regs_64, reserved_regs_64q, 61776af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko core_temps_64, core_temps_64q, sp_temps_64, dp_temps_64); 6189ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko } else { 619b01bf15d18f9b08d77e7a3c6e2897af0e02bf8cabuzbee reg_pool_ = new (arena_) RegisterPool(this, arena_, core_regs_32, empty_pool, sp_regs_32, 620b01bf15d18f9b08d77e7a3c6e2897af0e02bf8cabuzbee dp_regs_32, reserved_regs_32, empty_pool, 621b01bf15d18f9b08d77e7a3c6e2897af0e02bf8cabuzbee core_temps_32, empty_pool, sp_temps_32, dp_temps_32); 6229ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko } 623091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee 624091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // Target-specific adjustments. 625091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee 626fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Add in XMM registers. 627c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov const ArrayRef<const RegStorage> *xp_regs = cu_->target64 ? &xp_regs_64 : &xp_regs_32; 628c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov for (RegStorage reg : *xp_regs) { 629fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell RegisterInfo* info = new (arena_) RegisterInfo(reg, GetRegMaskCommon(reg)); 630fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell reginfo_map_.Put(reg.GetReg(), info); 631c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 632c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov const ArrayRef<const RegStorage> *xp_temps = cu_->target64 ? &xp_temps_64 : &xp_temps_32; 633c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov for (RegStorage reg : *xp_temps) { 634c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov RegisterInfo* xp_reg_info = GetRegInfo(reg); 635c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov xp_reg_info->SetIsTemp(true); 636fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 637fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 638091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // Alias single precision xmm to double xmms. 639091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // TODO: as needed, add larger vector sizes - alias all to the largest. 640091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee GrowableArray<RegisterInfo*>::Iterator it(®_pool_->sp_regs_); 641091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee for (RegisterInfo* info = it.Next(); info != nullptr; info = it.Next()) { 642091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee int sp_reg_num = info->GetReg().GetRegNum(); 643fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell RegStorage xp_reg = RegStorage::Solo128(sp_reg_num); 644fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell RegisterInfo* xp_reg_info = GetRegInfo(xp_reg); 645fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // 128-bit xmm vector register's master storage should refer to itself. 646fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell DCHECK_EQ(xp_reg_info, xp_reg_info->Master()); 647fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 648fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Redirect 32-bit vector's master storage to 128-bit vector. 649fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell info->SetMaster(xp_reg_info); 650fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 65176af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko RegStorage dp_reg = RegStorage::FloatSolo64(sp_reg_num); 652091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee RegisterInfo* dp_reg_info = GetRegInfo(dp_reg); 653fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Redirect 64-bit vector's master storage to 128-bit vector. 654fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell dp_reg_info->SetMaster(xp_reg_info); 65576af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // Singles should show a single 32-bit mask bit, at first referring to the low half. 65676af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko DCHECK_EQ(info->StorageMask(), 0x1U); 65776af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko } 65876af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko 659dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 66076af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // Alias 32bit W registers to corresponding 64bit X registers. 66176af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko GrowableArray<RegisterInfo*>::Iterator w_it(®_pool_->core_regs_); 66276af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko for (RegisterInfo* info = w_it.Next(); info != nullptr; info = w_it.Next()) { 66376af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko int x_reg_num = info->GetReg().GetRegNum(); 66476af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko RegStorage x_reg = RegStorage::Solo64(x_reg_num); 66576af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko RegisterInfo* x_reg_info = GetRegInfo(x_reg); 66676af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // 64bit X register's master storage should refer to itself. 66776af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko DCHECK_EQ(x_reg_info, x_reg_info->Master()); 66876af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // Redirect 32bit W master storage to 64bit X. 66976af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko info->SetMaster(x_reg_info); 67076af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // 32bit W should show a single 32-bit mask bit, at first referring to the low half. 67176af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko DCHECK_EQ(info->StorageMask(), 0x1U); 67276af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko } 673efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 674091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee 675091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // Don't start allocating temps at r0/s0/d0 or you may clobber return regs in early-exit methods. 676091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // TODO: adjust for x86/hard float calling convention. 677091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee reg_pool_->next_core_reg_ = 2; 678091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee reg_pool_->next_sp_reg_ = 2; 679091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee reg_pool_->next_dp_reg_ = 1; 680efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 681efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 68260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjiint X86Mir2Lir::VectorRegisterSize() { 68360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return 128; 68460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 68560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 68660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjiint X86Mir2Lir::NumReservableVectorRegisters(bool fp_used) { 68760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return fp_used ? 5 : 7; 68860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 68960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 6901fd3346740dfb7f47be9922312b68a4227fada96buzbeevoid X86Mir2Lir::SpillCoreRegs() { 6911fd3346740dfb7f47be9922312b68a4227fada96buzbee if (num_core_spills_ == 0) { 692efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return; 693efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 694efc6369224b036a1fb77849f7ae65b3492c832c0buzbee // Spill mask not including fake return address register 695091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee uint32_t mask = core_spill_mask_ & ~(1 << rs_rRET.GetRegNum()); 6969ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko int offset = frame_size_ - (GetInstructionSetPointerSize(cu_->instruction_set) * num_core_spills_); 697c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov OpSize size = cu_->target64 ? k64 : k32; 698efc6369224b036a1fb77849f7ae65b3492c832c0buzbee for (int reg = 0; mask; mask >>= 1, reg++) { 699efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (mask & 0x1) { 700c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov StoreBaseDisp(rs_rX86_SP, offset, cu_->target64 ? RegStorage::Solo64(reg) : RegStorage::Solo32(reg), 701c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov size, kNotVolatile); 7029ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko offset += GetInstructionSetPointerSize(cu_->instruction_set); 703efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 704efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 705efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 706efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 7071fd3346740dfb7f47be9922312b68a4227fada96buzbeevoid X86Mir2Lir::UnSpillCoreRegs() { 7081fd3346740dfb7f47be9922312b68a4227fada96buzbee if (num_core_spills_ == 0) { 709efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return; 710efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 711efc6369224b036a1fb77849f7ae65b3492c832c0buzbee // Spill mask not including fake return address register 712091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee uint32_t mask = core_spill_mask_ & ~(1 << rs_rRET.GetRegNum()); 7139ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko int offset = frame_size_ - (GetInstructionSetPointerSize(cu_->instruction_set) * num_core_spills_); 714c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov OpSize size = cu_->target64 ? k64 : k32; 715efc6369224b036a1fb77849f7ae65b3492c832c0buzbee for (int reg = 0; mask; mask >>= 1, reg++) { 716efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (mask & 0x1) { 717c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov LoadBaseDisp(rs_rX86_SP, offset, cu_->target64 ? RegStorage::Solo64(reg) : RegStorage::Solo32(reg), 718c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov size, kNotVolatile); 7199ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko offset += GetInstructionSetPointerSize(cu_->instruction_set); 720efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 721efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 722efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 723efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 724c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovvoid X86Mir2Lir::SpillFPRegs() { 725c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov if (num_fp_spills_ == 0) { 726c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov return; 727c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 728c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov uint32_t mask = fp_spill_mask_; 729c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov int offset = frame_size_ - (GetInstructionSetPointerSize(cu_->instruction_set) * (num_fp_spills_ + num_core_spills_)); 730c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov for (int reg = 0; mask; mask >>= 1, reg++) { 731c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov if (mask & 0x1) { 732c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov StoreBaseDisp(rs_rX86_SP, offset, RegStorage::FloatSolo64(reg), 733c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov k64, kNotVolatile); 734c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov offset += sizeof(double); 735c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 736c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 737c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov} 738c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovvoid X86Mir2Lir::UnSpillFPRegs() { 739c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov if (num_fp_spills_ == 0) { 740c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov return; 741c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 742c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov uint32_t mask = fp_spill_mask_; 743c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov int offset = frame_size_ - (GetInstructionSetPointerSize(cu_->instruction_set) * (num_fp_spills_ + num_core_spills_)); 744c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov for (int reg = 0; mask; mask >>= 1, reg++) { 745c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov if (mask & 0x1) { 746c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov LoadBaseDisp(rs_rX86_SP, offset, RegStorage::FloatSolo64(reg), 747c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov k64, kNotVolatile); 748c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov offset += sizeof(double); 749c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 750c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 751c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov} 752c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 753c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 7542ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstrombool X86Mir2Lir::IsUnconditionalBranch(LIR* lir) { 755cbd6d44c0a94f3d26671b5325aa21bbf1335ffe8buzbee return (lir->opcode == kX86Jmp8 || lir->opcode == kX86Jmp32); 756efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 757efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 758674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir MarkoRegisterClass X86Mir2Lir::RegClassForFieldLoadStore(OpSize size, bool is_volatile) { 759e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu // X86_64 can handle any size. 760dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 761e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu if (size == kReference) { 762e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu return kRefReg; 763e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu } 764e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu return kCoreReg; 765e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu } 766e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu 767674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko if (UNLIKELY(is_volatile)) { 768674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko // On x86, atomic 64-bit load/store requires an fp register. 769674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko // Smaller aligned load/store is atomic for both core and fp registers. 770674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko if (size == k64 || size == kDouble) { 771674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko return kFPReg; 772674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko } 773674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko } 774674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko return RegClassBySize(size); 775674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko} 776674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko 777dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena SayapinaX86Mir2Lir::X86Mir2Lir(CompilationUnit* cu, MIRGraph* mir_graph, ArenaAllocator* arena) 77855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell : Mir2Lir(cu, mir_graph, arena), 779dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers base_of_code_(nullptr), store_method_addr_(false), store_method_addr_used_(false), 78055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell method_address_insns_(arena, 100, kGrowableArrayMisc), 78155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell class_type_address_insns_(arena, 100, kGrowableArrayMisc), 782ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell call_method_insns_(arena, 100, kGrowableArrayMisc), 783dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina stack_decrement_(nullptr), stack_increment_(nullptr), 784d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell const_vectors_(nullptr) { 785d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell store_method_addr_used_ = false; 786dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers if (kIsDebugBuild) { 787dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers for (int i = 0; i < kX86Last; i++) { 788dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers if (X86Mir2Lir::EncodingMap[i].opcode != i) { 789dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers LOG(FATAL) << "Encoding order for " << X86Mir2Lir::EncodingMap[i].name 790d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell << " is wrong: expecting " << i << ", seeing " 791d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell << static_cast<int>(X86Mir2Lir::EncodingMap[i].opcode); 792dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers } 793efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 794efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 795dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 7969ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_SP = rs_rX86_SP_64; 7979ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 7989ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG0 = rs_rDI; 7999ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG1 = rs_rSI; 8009ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG2 = rs_rDX; 8019ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG3 = rs_rCX; 80258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_ARG4 = rs_r8; 80358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_ARG5 = rs_r9; 80458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG0 = rs_fr0; 80558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG1 = rs_fr1; 80658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG2 = rs_fr2; 80758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG3 = rs_fr3; 80858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG4 = rs_fr4; 80958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG5 = rs_fr5; 81058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG6 = rs_fr6; 81158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG7 = rs_fr7; 8129ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG0 = rDI; 8139ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG1 = rSI; 8149ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG2 = rDX; 8159ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG3 = rCX; 81658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_ARG4 = r8; 81758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_ARG5 = r9; 81858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG0 = fr0; 81958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG1 = fr1; 82058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG2 = fr2; 82158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG3 = fr3; 82258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG4 = fr4; 82358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG5 = fr5; 82458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG6 = fr6; 82558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG7 = fr7; 82655884bc1e2e1b324809b462455ccaf5811ffafd8Mark Mendell rs_rX86_INVOKE_TGT = rs_rDI; 8279ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko } else { 8289ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_SP = rs_rX86_SP_32; 8299ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 8309ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG0 = rs_rAX; 8319ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG1 = rs_rCX; 8329ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG2 = rs_rDX; 8339ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG3 = rs_rBX; 83458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_ARG4 = RegStorage::InvalidReg(); 83558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_ARG5 = RegStorage::InvalidReg(); 83658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG0 = rs_rAX; 83758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG1 = rs_rCX; 83858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG2 = rs_rDX; 83958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG3 = rs_rBX; 84058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG4 = RegStorage::InvalidReg(); 84158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG5 = RegStorage::InvalidReg(); 84258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG6 = RegStorage::InvalidReg(); 84358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG7 = RegStorage::InvalidReg(); 8449ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG0 = rAX; 8459ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG1 = rCX; 8469ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG2 = rDX; 8479ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG3 = rBX; 84858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG0 = rAX; 84958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG1 = rCX; 85058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG2 = rDX; 85158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG3 = rBX; 85255884bc1e2e1b324809b462455ccaf5811ffafd8Mark Mendell rs_rX86_INVOKE_TGT = rs_rAX; 85358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // TODO(64): Initialize with invalid reg 85458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko// rX86_ARG4 = RegStorage::InvalidReg(); 85558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko// rX86_ARG5 = RegStorage::InvalidReg(); 8569ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko } 8579ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_RET0 = rs_rAX; 8589ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_RET1 = rs_rDX; 8599ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_COUNT = rs_rCX; 8609ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_RET0 = rAX; 8619ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_RET1 = rDX; 8629ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_INVOKE_TGT = rAX; 8639ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_COUNT = rCX; 86460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 86560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Initialize the number of reserved vector registers 86660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji num_reserved_vector_regs_ = -1; 8671fd3346740dfb7f47be9922312b68a4227fada96buzbee} 8681fd3346740dfb7f47be9922312b68a4227fada96buzbee 869862a76027076c341c26aa6cd4a30a7cdd6dc2143buzbeeMir2Lir* X86CodeGenerator(CompilationUnit* const cu, MIRGraph* const mir_graph, 870862a76027076c341c26aa6cd4a30a7cdd6dc2143buzbee ArenaAllocator* const arena) { 871dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina return new X86Mir2Lir(cu, mir_graph, arena); 872efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 873efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 874984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe// Not used in x86(-64) 875984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas GampeRegStorage X86Mir2Lir::LoadHelper(QuickEntrypointEnum trampoline) { 8762f244e9faccfcca68af3c5484c397a01a1c3a342Andreas Gampe LOG(FATAL) << "Unexpected use of LoadHelper in x86"; 8772f244e9faccfcca68af3c5484c397a01a1c3a342Andreas Gampe return RegStorage::InvalidReg(); 8782f244e9faccfcca68af3c5484c397a01a1c3a342Andreas Gampe} 8792f244e9faccfcca68af3c5484c397a01a1c3a342Andreas Gampe 880b373e091eac39b1a79c11f2dcbd610af01e9e8a9Dave AllisonLIR* X86Mir2Lir::CheckSuspendUsingLoad() { 88169dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison // First load the pointer in fs:[suspend-trigger] into eax 88269dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison // Then use a test instruction to indirect via that address. 88369dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison NewLIR2(kX86Mov32RT, rs_rAX.GetReg(), cu_->target64 ? 88469dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison Thread::ThreadSuspendTriggerOffset<8>().Int32Value() : 88569dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison Thread::ThreadSuspendTriggerOffset<4>().Int32Value()); 88669dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison return NewLIR3(kX86Test32RM, rs_rAX.GetReg(), rs_rAX.GetReg(), 0); 887b373e091eac39b1a79c11f2dcbd610af01e9e8a9Dave Allison} 888b373e091eac39b1a79c11f2dcbd610af01e9e8a9Dave Allison 8892ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromuint64_t X86Mir2Lir::GetTargetInstFlags(int opcode) { 890409fe94ad529d9334587be80b9f6a3d166805508buzbee DCHECK(!IsPseudoLirOp(opcode)); 8911fd3346740dfb7f47be9922312b68a4227fada96buzbee return X86Mir2Lir::EncodingMap[opcode].flags; 8921bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee} 8931bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee 8942ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromconst char* X86Mir2Lir::GetTargetInstName(int opcode) { 895409fe94ad529d9334587be80b9f6a3d166805508buzbee DCHECK(!IsPseudoLirOp(opcode)); 8961fd3346740dfb7f47be9922312b68a4227fada96buzbee return X86Mir2Lir::EncodingMap[opcode].name; 8971bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee} 8981bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee 8992ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromconst char* X86Mir2Lir::GetTargetInstFmt(int opcode) { 900409fe94ad529d9334587be80b9f6a3d166805508buzbee DCHECK(!IsPseudoLirOp(opcode)); 9011fd3346740dfb7f47be9922312b68a4227fada96buzbee return X86Mir2Lir::EncodingMap[opcode].fmt; 9021bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee} 9031bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee 904d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbeevoid X86Mir2Lir::GenConstWide(RegLocation rl_dest, int64_t value) { 905d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee // Can we do this directly to memory? 906d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee rl_dest = UpdateLocWide(rl_dest); 907d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee if ((rl_dest.location == kLocDalvikFrame) || 908d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee (rl_dest.location == kLocCompilerTemp)) { 909d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee int32_t val_lo = Low32Bits(value); 910d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee int32_t val_hi = High32Bits(value); 911a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu int r_base = rs_rX86_SP.GetReg(); 912d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee int displacement = SRegOffset(rl_dest.s_reg_low); 913d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee 9148dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 9152700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LIR * store = NewLIR3(kX86Mov32MI, r_base, displacement + LOWORD_OFFSET, val_lo); 916d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee AnnotateDalvikRegAccess(store, (displacement + LOWORD_OFFSET) >> 2, 917d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee false /* is_load */, true /* is64bit */); 9182700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee store = NewLIR3(kX86Mov32MI, r_base, displacement + HIWORD_OFFSET, val_hi); 919d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee AnnotateDalvikRegAccess(store, (displacement + HIWORD_OFFSET) >> 2, 920d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee false /* is_load */, true /* is64bit */); 921d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee return; 922d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee } 923d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee 924d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee // Just use the standard code to do the generation. 925d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee Mir2Lir::GenConstWide(rl_dest, value); 926d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee} 927e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell 928e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell// TODO: Merge with existing RegLocation dumper in vreg_analysis.cc 929e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendellvoid X86Mir2Lir::DumpRegLocation(RegLocation loc) { 930e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell LOG(INFO) << "location: " << loc.location << ',' 931e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.wide ? " w" : " ") 932e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.defined ? " D" : " ") 933e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.is_const ? " c" : " ") 934e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.fp ? " F" : " ") 935e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.core ? " C" : " ") 936e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.ref ? " r" : " ") 937e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.high_word ? " h" : " ") 938e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.home ? " H" : " ") 9392700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee << ", low: " << static_cast<int>(loc.reg.GetLowReg()) 94000e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee << ", high: " << static_cast<int>(loc.reg.GetHighReg()) 941e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << ", s_reg: " << loc.s_reg_low 942e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << ", orig: " << loc.orig_sreg; 943e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell} 944e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell 94567c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendellvoid X86Mir2Lir::Materialize() { 94667c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell // A good place to put the analysis before starting. 94767c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell AnalyzeMIR(); 94867c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell 94967c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell // Now continue with regular code generation. 95067c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell Mir2Lir::Materialize(); 95167c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell} 95267c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell 95349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Haovoid X86Mir2Lir::LoadMethodAddress(const MethodReference& target_method, InvokeType type, 95455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell SpecialTargetRegister symbolic_reg) { 95555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell /* 95655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * For x86, just generate a 32 bit move immediate instruction, that will be filled 95755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * in at 'link time'. For now, put a unique value based on target to ensure that 95855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * code deduplication works. 95955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell */ 96049161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao int target_method_idx = target_method.dex_method_index; 96149161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile* target_dex_file = target_method.dex_file; 96249161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile::MethodId& target_method_id = target_dex_file->GetMethodId(target_method_idx); 96349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uintptr_t target_method_id_ptr = reinterpret_cast<uintptr_t>(&target_method_id); 96455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 96549161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao // Generate the move instruction with the unique pointer and save index, dex_file, and type. 966ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe LIR *move = RawLIR(current_dalvik_offset_, kX86Mov32RI, 967ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe TargetReg(symbolic_reg, kNotWide).GetReg(), 96849161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao static_cast<int>(target_method_id_ptr), target_method_idx, 96949161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao WrapPointer(const_cast<DexFile*>(target_dex_file)), type); 97055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell AppendLIR(move); 97155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell method_address_insns_.Insert(move); 97255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell} 97355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 97455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendellvoid X86Mir2Lir::LoadClassType(uint32_t type_idx, SpecialTargetRegister symbolic_reg) { 97555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell /* 97655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * For x86, just generate a 32 bit move immediate instruction, that will be filled 97755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * in at 'link time'. For now, put a unique value based on target to ensure that 97855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * code deduplication works. 97955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell */ 98055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell const DexFile::TypeId& id = cu_->dex_file->GetTypeId(type_idx); 98155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell uintptr_t ptr = reinterpret_cast<uintptr_t>(&id); 98255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 98355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // Generate the move instruction with the unique pointer and save index and type. 984ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe LIR *move = RawLIR(current_dalvik_offset_, kX86Mov32RI, 985ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe TargetReg(symbolic_reg, kNotWide).GetReg(), 98655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell static_cast<int>(ptr), type_idx); 98755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell AppendLIR(move); 98855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell class_type_address_insns_.Insert(move); 98955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell} 99055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 99149161cef10a308aedada18e9aa742498d6e6c8c7Jeff HaoLIR *X86Mir2Lir::CallWithLinkerFixup(const MethodReference& target_method, InvokeType type) { 99255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell /* 99355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * For x86, just generate a 32 bit call relative instruction, that will be filled 99455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * in at 'link time'. For now, put a unique value based on target to ensure that 99555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * code deduplication works. 99655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell */ 99749161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao int target_method_idx = target_method.dex_method_index; 99849161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile* target_dex_file = target_method.dex_file; 99949161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile::MethodId& target_method_id = target_dex_file->GetMethodId(target_method_idx); 100049161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uintptr_t target_method_id_ptr = reinterpret_cast<uintptr_t>(&target_method_id); 100149161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao 100249161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao // Generate the call instruction with the unique pointer and save index, dex_file, and type. 100349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao LIR *call = RawLIR(current_dalvik_offset_, kX86CallI, static_cast<int>(target_method_id_ptr), 100449161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao target_method_idx, WrapPointer(const_cast<DexFile*>(target_dex_file)), type); 100555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell AppendLIR(call); 100655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell call_method_insns_.Insert(call); 100755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell return call; 100855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell} 100955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 1010d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell/* 1011d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell * @brief Enter a 32 bit quantity into a buffer 1012d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell * @param buf buffer. 1013d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell * @param data Data value. 1014d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell */ 1015d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1016d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendellstatic void PushWord(std::vector<uint8_t>&buf, int32_t data) { 1017d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell buf.push_back(data & 0xff); 1018d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell buf.push_back((data >> 8) & 0xff); 1019d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell buf.push_back((data >> 16) & 0xff); 1020d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell buf.push_back((data >> 24) & 0xff); 1021d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 1022d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 102355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendellvoid X86Mir2Lir::InstallLiteralPools() { 102455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // These are handled differently for x86. 102555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK(code_literal_list_ == nullptr); 102655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK(method_literal_list_ == nullptr); 102755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK(class_literal_list_ == nullptr); 102855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 1029d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Align to 16 byte boundary. We have implicit knowledge that the start of the method is 1030d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // on a 4 byte boundary. How can I check this if it changes (other than aligned loads 1031d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // will fail at runtime)? 1032d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (const_vectors_ != nullptr) { 1033d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell int align_size = (16-4) - (code_buffer_.size() & 0xF); 1034d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (align_size < 0) { 1035d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell align_size += 16; 1036d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1037d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1038d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell while (align_size > 0) { 1039d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell code_buffer_.push_back(0); 1040d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell align_size--; 1041d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1042d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell for (LIR *p = const_vectors_; p != nullptr; p = p->next) { 1043d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell PushWord(code_buffer_, p->operands[0]); 1044d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell PushWord(code_buffer_, p->operands[1]); 1045d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell PushWord(code_buffer_, p->operands[2]); 1046d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell PushWord(code_buffer_, p->operands[3]); 1047d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1048d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1049d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 105055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // Handle the fixups for methods. 105155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell for (uint32_t i = 0; i < method_address_insns_.Size(); i++) { 105255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell LIR* p = method_address_insns_.Get(i); 105355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK_EQ(p->opcode, kX86Mov32RI); 105449161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uint32_t target_method_idx = p->operands[2]; 105549161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile* target_dex_file = 105649161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao reinterpret_cast<const DexFile*>(UnwrapPointer(p->operands[3])); 105755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 105855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // The offset to patch is the last 4 bytes of the instruction. 105955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell int patch_offset = p->offset + p->flags.size - 4; 106055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell cu_->compiler_driver->AddMethodPatch(cu_->dex_file, cu_->class_def_idx, 106155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell cu_->method_idx, cu_->invoke_type, 106249161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao target_method_idx, target_dex_file, 106349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao static_cast<InvokeType>(p->operands[4]), 106455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell patch_offset); 106555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell } 106655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 106755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // Handle the fixups for class types. 106855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell for (uint32_t i = 0; i < class_type_address_insns_.Size(); i++) { 106955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell LIR* p = class_type_address_insns_.Get(i); 107055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK_EQ(p->opcode, kX86Mov32RI); 107149161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uint32_t target_method_idx = p->operands[2]; 107255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 107355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // The offset to patch is the last 4 bytes of the instruction. 107455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell int patch_offset = p->offset + p->flags.size - 4; 107555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell cu_->compiler_driver->AddClassPatch(cu_->dex_file, cu_->class_def_idx, 107649161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao cu_->method_idx, target_method_idx, patch_offset); 107755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell } 107855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 107955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // And now the PC-relative calls to methods. 108055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell for (uint32_t i = 0; i < call_method_insns_.Size(); i++) { 108155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell LIR* p = call_method_insns_.Get(i); 108255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK_EQ(p->opcode, kX86CallI); 108349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uint32_t target_method_idx = p->operands[1]; 108449161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile* target_dex_file = 108549161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao reinterpret_cast<const DexFile*>(UnwrapPointer(p->operands[2])); 108655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 108755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // The offset to patch is the last 4 bytes of the instruction. 108855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell int patch_offset = p->offset + p->flags.size - 4; 108955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell cu_->compiler_driver->AddRelativeCodePatch(cu_->dex_file, cu_->class_def_idx, 109049161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao cu_->method_idx, cu_->invoke_type, 109149161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao target_method_idx, target_dex_file, 109249161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao static_cast<InvokeType>(p->operands[3]), 109355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell patch_offset, -4 /* offset */); 109455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell } 109555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 109655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // And do the normal processing. 109755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell Mir2Lir::InstallLiteralPools(); 109855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell} 109955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 110070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolovbool X86Mir2Lir::GenInlinedArrayCopyCharArray(CallInfo* info) { 110170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (cu_->target64) { 110270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // TODO: Implement ArrayCOpy intrinsic for x86_64 110370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov return false; 110470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 110570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 110670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_src = info->args[0]; 110770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_srcPos = info->args[1]; 110870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_dst = info->args[2]; 110970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_dstPos = info->args[3]; 111070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_length = info->args[4]; 111170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (rl_srcPos.is_const && (mir_graph_->ConstantValue(rl_srcPos) < 0)) { 111270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov return false; 111370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 111470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (rl_dstPos.is_const && (mir_graph_->ConstantValue(rl_dstPos) < 0)) { 111570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov return false; 111670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 111770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov ClobberCallerSave(); 111870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LockCallTemps(); // Using fixed registers 111970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_src , rs_rAX); 112070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dst , rs_rCX); 112170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* src_dst_same = OpCmpBranch(kCondEq, rs_rAX , rs_rCX, nullptr); 112270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* src_null_branch = OpCmpImmBranch(kCondEq, rs_rAX , 0, nullptr); 112370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* dst_null_branch = OpCmpImmBranch(kCondEq, rs_rCX , 0, nullptr); 112470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_length , rs_rDX); 112570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* len_negative = OpCmpImmBranch(kCondLt, rs_rDX , 0, nullptr); 112670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* len_too_big = OpCmpImmBranch(kCondGt, rs_rDX , 128, nullptr); 112770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_src , rs_rAX); 112870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadWordDisp(rs_rAX , mirror::Array::LengthOffset().Int32Value(), rs_rAX); 112970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* src_bad_len = nullptr; 113070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* srcPos_negative = nullptr; 113170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (!rl_srcPos.is_const) { 113270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_srcPos , rs_rBX); 113370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov srcPos_negative = OpCmpImmBranch(kCondLt, rs_rBX , 0, nullptr); 113470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegReg(kOpAdd, rs_rBX, rs_rDX); 113570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rBX, nullptr); 113670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } else { 113770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov int pos_val = mir_graph_->ConstantValue(rl_srcPos.orig_sreg); 113870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (pos_val == 0) { 113970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rDX, nullptr); 114070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } else { 114170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegRegImm(kOpAdd, rs_rBX, rs_rDX, pos_val); 114270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rBX, nullptr); 114370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 114470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 114570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* dstPos_negative = nullptr; 114670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* dst_bad_len = nullptr; 114770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dst, rs_rAX); 114870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadWordDisp(rs_rAX, mirror::Array::LengthOffset().Int32Value(), rs_rAX); 114970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (!rl_dstPos.is_const) { 115070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dstPos , rs_rBX); 115170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dstPos_negative = OpCmpImmBranch(kCondLt, rs_rBX , 0, nullptr); 115270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegRegReg(kOpAdd, rs_rBX, rs_rBX, rs_rDX); 115370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rBX, nullptr); 115470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } else { 115570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov int pos_val = mir_graph_->ConstantValue(rl_dstPos.orig_sreg); 115670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (pos_val == 0) { 115770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rDX, nullptr); 115870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } else { 115970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegRegImm(kOpAdd, rs_rBX, rs_rDX, pos_val); 116070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rBX, nullptr); 116170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 116270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 116370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // everything is checked now 116470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_src , rs_rAX); 116570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dst , rs_rBX); 116670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_srcPos , rs_rCX); 116770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov NewLIR5(kX86Lea32RA, rs_rAX.GetReg(), rs_rAX.GetReg(), 116870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov rs_rCX.GetReg() , 1, mirror::Array::DataOffset(2).Int32Value()); 116970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // RAX now holds the address of the first src element to be copied 117070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 117170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dstPos , rs_rCX); 117270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov NewLIR5(kX86Lea32RA, rs_rBX.GetReg(), rs_rBX.GetReg(), 117370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov rs_rCX.GetReg() , 1, mirror::Array::DataOffset(2).Int32Value() ); 117470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // RBX now holds the address of the first dst element to be copied 117570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 117670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // check if the number of elements to be copied is odd or even. If odd 117770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // then copy the first element (so that the remaining number of elements 117870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // is even). 117970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_length , rs_rCX); 118070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegImm(kOpAnd, rs_rCX, 1); 118170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* jmp_to_begin_loop = OpCmpImmBranch(kCondEq, rs_rCX, 0, nullptr); 118270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegImm(kOpSub, rs_rDX, 1); 118370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadBaseIndexedDisp(rs_rAX, rs_rDX, 1, 0, rs_rCX, kSignedHalf); 118470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov StoreBaseIndexedDisp(rs_rBX, rs_rDX, 1, 0, rs_rCX, kSignedHalf); 118570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 118670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // since the remaining number of elements is even, we will copy by 118770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // two elements at a time. 118870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR *beginLoop = NewLIR0(kPseudoTargetLabel); 118970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* jmp_to_ret = OpCmpImmBranch(kCondEq, rs_rDX , 0, nullptr); 119070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegImm(kOpSub, rs_rDX, 2); 119170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadBaseIndexedDisp(rs_rAX, rs_rDX, 1, 0, rs_rCX, kSingle); 119270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov StoreBaseIndexedDisp(rs_rBX, rs_rDX, 1, 0, rs_rCX, kSingle); 119370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpUnconditionalBranch(beginLoop); 119470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR *check_failed = NewLIR0(kPseudoTargetLabel); 119570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* launchpad_branch = OpUnconditionalBranch(nullptr); 119670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR *return_point = NewLIR0(kPseudoTargetLabel); 119770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov jmp_to_ret->target = return_point; 119870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov jmp_to_begin_loop->target = beginLoop; 119970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_dst_same->target = check_failed; 120070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov len_negative->target = check_failed; 120170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov len_too_big->target = check_failed; 120270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_null_branch->target = check_failed; 120370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (srcPos_negative != nullptr) 120470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov srcPos_negative ->target = check_failed; 120570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (src_bad_len != nullptr) 120670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_bad_len->target = check_failed; 120770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_null_branch->target = check_failed; 120870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (dstPos_negative != nullptr) 120970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dstPos_negative->target = check_failed; 121070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (dst_bad_len != nullptr) 121170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_bad_len->target = check_failed; 121270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov AddIntrinsicSlowPath(info, launchpad_branch, return_point); 121370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov return true; 121470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov} 121570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 121670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 12174028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell/* 12184028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell * Fast string.index_of(I) & (II). Inline check for simple case of char <= 0xffff, 12194028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell * otherwise bails to standard library code. 12204028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell */ 12214028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendellbool X86Mir2Lir::GenInlinedIndexOf(CallInfo* info, bool zero_based) { 12224028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell RegLocation rl_obj = info->args[0]; 12234028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell RegLocation rl_char = info->args[1]; 1224a44d4f508fa1642294e79d3ebecd790afe75ea60buzbee RegLocation rl_start; // Note: only present in III flavor or IndexOf. 1225c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // RBX is callee-save register in 64-bit mode. 1226c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk RegStorage rs_tmp = cu_->target64 ? rs_r11 : rs_rBX; 1227c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk int start_value = -1; 12284028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12294028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell uint32_t char_value = 12304028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell rl_char.is_const ? mir_graph_->ConstantValue(rl_char.orig_sreg) : 0; 12314028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12324028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (char_value > 0xFFFF) { 12334028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // We have to punt to the real String.indexOf. 12344028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell return false; 12354028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 12364028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12374028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Okay, we are commited to inlining this. 1238c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EAX: 16 bit character being searched. 1239c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // ECX: count: number of words to be searched. 1240c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EDI: String being searched. 1241c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EDX: temporary during execution. 1242c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EBX or R11: temporary during execution (depending on mode). 1243c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // REP SCASW: search instruction. 1244c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1245c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_rAX); 1246c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_rAX); 1247c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_rAX); 1248c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_rCX); 1249c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_rCX); 1250c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_rCX); 1251c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_rDX); 1252c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_rDX); 1253c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_rDX); 1254c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_tmp); 1255c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_tmp); 1256c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_tmp); 1257c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (cu_->target64) { 1258c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_rDI); 1259c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_rDI); 1260c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_rDI); 1261c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk } 1262c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1263a0cd2d701f29e0bc6275f1b13c0edfd4ec391879buzbee RegLocation rl_return = GetReturn(kCoreReg); 12644028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell RegLocation rl_dest = InlineTarget(info); 12654028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12664028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Is the string non-NULL? 12672700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LoadValueDirectFixed(rl_obj, rs_rDX); 12682700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee GenNullCheck(rs_rDX, info->opt_flags); 12693bc8615332b7848dec8c2297a40f7e4d176c0efbVladimir Marko info->opt_flags |= MIR_IGNORE_NULL_CHECK; // Record that we've null checked. 12704028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 1271c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LIR *slowpath_branch = nullptr, *length_compare = nullptr; 1272c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1273c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // We need the value in EAX. 12744028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (rl_char.is_const) { 12752700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LoadConstantNoClobber(rs_rAX, char_value); 12764028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } else { 1277c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Does the character fit in 16 bits? Compare it at runtime. 12782700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LoadValueDirectFixed(rl_char, rs_rAX); 12793a74d15ccc9a902874473ac9632e568b19b91b1cMingyao Yang slowpath_branch = OpCmpImmBranch(kCondGt, rs_rAX, 0xFFFF, nullptr); 12804028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 12814028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12824028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // From here down, we know that we are looking for a char that fits in 16 bits. 1283e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // Location of reference to data array within the String object. 1284e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell int value_offset = mirror::String::ValueOffset().Int32Value(); 1285e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // Location of count within the String object. 1286e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell int count_offset = mirror::String::CountOffset().Int32Value(); 1287e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // Starting offset within data array. 1288e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell int offset_offset = mirror::String::OffsetOffset().Int32Value(); 1289e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // Start of char data with array_. 1290e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell int data_offset = mirror::Array::DataOffset(sizeof(uint16_t)).Int32Value(); 12914028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 129269dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison // Compute the number of words to search in to rCX. 129369dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison Load32Disp(rs_rDX, count_offset, rs_rCX); 129469dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison 1295c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (!cu_->target64) { 1296c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Possible signal here due to null pointer dereference. 1297c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Note that the signal handler will expect the top word of 1298c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // the stack to be the ArtMethod*. If the PUSH edi instruction 1299c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // below is ahead of the load above then this will not be true 1300c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // and the signal handler will not work. 1301c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk MarkPossibleNullPointerException(0); 1302c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1303c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EDI is callee-save register in 32-bit mode. 1304c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk NewLIR1(kX86Push32R, rs_rDI.GetReg()); 1305c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk } 13064028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13074028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (zero_based) { 1308c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Start index is not present. 13094028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // We have to handle an empty string. Use special instruction JECXZ. 13104028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell length_compare = NewLIR0(kX86Jecxz8); 1311c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1312c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Copy the number of words to search in a temporary register. 1313c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // We will use the register at the end to calculate result. 1314c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpMov, rs_tmp, rs_rCX); 13154028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } else { 1316c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Start index is present. 1317a44d4f508fa1642294e79d3ebecd790afe75ea60buzbee rl_start = info->args[2]; 1318c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 13194028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // We have to offset by the start index. 13204028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (rl_start.is_const) { 13214028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell start_value = mir_graph_->ConstantValue(rl_start.orig_sreg); 13224028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell start_value = std::max(start_value, 0); 13234028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13244028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Is the start > count? 13252700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee length_compare = OpCmpImmBranch(kCondLe, rs_rCX, start_value, nullptr); 1326c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegImm(kOpMov, rs_rDI, start_value); 1327c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1328c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Copy the number of words to search in a temporary register. 1329c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // We will use the register at the end to calculate result. 1330c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpMov, rs_tmp, rs_rCX); 13314028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13324028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (start_value != 0) { 1333c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Decrease the number of words to search by the start index. 13342700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee OpRegImm(kOpSub, rs_rCX, start_value); 13354028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 13364028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } else { 1337c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Handle "start index < 0" case. 1338c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (!cu_->target64 && rl_start.location != kLocPhysReg) { 1339a1758d83e298c9ee31848bcae07c2a35f6efd618Alexei Zavjalov // Load the start index from stack, remembering that we pushed EDI. 1340c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk int displacement = SRegOffset(rl_start.s_reg_low) + sizeof(uint32_t); 13418dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko { 13428dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 1343c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Load32Disp(rs_rX86_SP, displacement, rs_rDI); 13448dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } 1345c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk } else { 1346c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LoadValueDirectFixed(rl_start, rs_rDI); 13474028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 1348c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpXor, rs_tmp, rs_tmp); 1349c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpCmp, rs_rDI, rs_tmp); 1350c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpCondRegReg(kOpCmov, kCondLt, rs_rDI, rs_tmp); 1351c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1352c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // The length of the string should be greater than the start index. 1353c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk length_compare = OpCmpBranch(kCondLe, rs_rCX, rs_rDI, nullptr); 1354c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1355c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Copy the number of words to search in a temporary register. 1356c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // We will use the register at the end to calculate result. 1357c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpMov, rs_tmp, rs_rCX); 1358c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1359c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Decrease the number of words to search by the start index. 1360c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpSub, rs_rCX, rs_rDI); 13614028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 13624028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 13634028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 1364c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Load the address of the string into EDI. 1365c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // In case of start index we have to add the address to existing value in EDI. 1366e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // The string starts at VALUE(String) + 2 * OFFSET(String) + DATA_OFFSET. 1367c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (zero_based || (!zero_based && rl_start.is_const && start_value == 0)) { 1368c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Load32Disp(rs_rDX, offset_offset, rs_rDI); 13694028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } else { 1370c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegMem(kOpAdd, rs_rDI, rs_rDX, offset_offset); 13714028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 1372c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegImm(kOpLsl, rs_rDI, 1); 1373c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegMem(kOpAdd, rs_rDI, rs_rDX, value_offset); 1374c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegImm(kOpAdd, rs_rDI, data_offset); 13754028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13764028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // EDI now contains the start of the string to be searched. 13774028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // We are all prepared to do the search for the character. 13784028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell NewLIR0(kX86RepneScasw); 13794028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13804028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Did we find a match? 13814028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell LIR* failed_branch = OpCondBranch(kCondNe, nullptr); 13824028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13834028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // yes, we matched. Compute the index of the result. 1384c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpSub, rs_tmp, rs_rCX); 1385c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk NewLIR3(kX86Lea32RM, rl_return.reg.GetReg(), rs_tmp.GetReg(), -1); 1386c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 13874028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell LIR *all_done = NewLIR1(kX86Jmp8, 0); 13884028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13894028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Failed to match; return -1. 13904028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell LIR *not_found = NewLIR0(kPseudoTargetLabel); 13914028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell length_compare->target = not_found; 13924028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell failed_branch->target = not_found; 13932700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LoadConstantNoClobber(rl_return.reg, -1); 13944028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13954028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // And join up at the end. 13964028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell all_done->target = NewLIR0(kPseudoTargetLabel); 1397c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1398c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (!cu_->target64) 1399c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk NewLIR1(kX86Pop32R, rs_rDI.GetReg()); 14004028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 14014028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Out of line code returns here. 14023a74d15ccc9a902874473ac9632e568b19b91b1cMingyao Yang if (slowpath_branch != nullptr) { 14034028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell LIR *return_point = NewLIR0(kPseudoTargetLabel); 14043a74d15ccc9a902874473ac9632e568b19b91b1cMingyao Yang AddIntrinsicSlowPath(info, slowpath_branch, return_point); 14054028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 14064028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 14074028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell StoreValue(rl_dest, rl_return); 1408c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1409c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_rAX); 1410c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_rCX); 1411c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_rDX); 1412c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_tmp); 1413c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (cu_->target64) { 1414c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_rDI); 1415c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk } 1416c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 14174028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell return true; 14184028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell} 14194028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 1420ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell/* 1421ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell * @brief Enter an 'advance LOC' into the FDE buffer 1422ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell * @param buf FDE buffer. 1423ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell * @param increment Amount by which to increase the current location. 1424ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell */ 1425ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendellstatic void AdvanceLoc(std::vector<uint8_t>&buf, uint32_t increment) { 1426ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell if (increment < 64) { 1427ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Encoding in opcode. 1428ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(0x1 << 6 | increment); 1429ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } else if (increment < 256) { 1430ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Single byte delta. 1431ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(0x02); 1432ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(increment); 1433ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } else if (increment < 256 * 256) { 1434ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Two byte delta. 1435ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(0x03); 1436ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(increment & 0xff); 1437ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back((increment >> 8) & 0xff); 1438ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } else { 1439ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Four byte delta. 1440ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(0x04); 1441ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(buf, increment); 1442ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1443ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1444ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1445ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 144635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shenstd::vector<uint8_t>* X86CFIInitialization(bool is_x86_64) { 144735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen return X86Mir2Lir::ReturnCommonCallFrameInformation(is_x86_64); 1448ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1449ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 145035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shenstatic void EncodeUnsignedLeb128(std::vector<uint8_t>& buf, uint32_t value) { 145135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen uint8_t buffer[12]; 145235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen uint8_t *ptr = EncodeUnsignedLeb128(buffer, value); 145335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen for (uint8_t *p = buffer; p < ptr; p++) { 145435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen buf.push_back(*p); 145535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 145635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen} 145735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 145835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shenstatic void EncodeSignedLeb128(std::vector<uint8_t>& buf, int32_t value) { 145935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen uint8_t buffer[12]; 146035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen uint8_t *ptr = EncodeSignedLeb128(buffer, value); 146135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen for (uint8_t *p = buffer; p < ptr; p++) { 146235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen buf.push_back(*p); 146335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 146435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen} 146535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 146635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shenstd::vector<uint8_t>* X86Mir2Lir::ReturnCommonCallFrameInformation(bool is_x86_64) { 1467ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell std::vector<uint8_t>*cfi_info = new std::vector<uint8_t>; 1468ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 146935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Length (will be filled in later in this routine). 147035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen PushWord(*cfi_info, 0); 1471ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 147235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // CIE id: always 0. 147335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen PushWord(*cfi_info, 0); 1474ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 147535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Version: always 1. 147635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x01); 1477ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 147835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Augmentation: 'zR\0' 147935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x7a); 148035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x52); 1481ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0); 1482ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1483ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Code alignment: 1. 148435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen EncodeUnsignedLeb128(*cfi_info, 1); 1485ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 148635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Data alignment. 148735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen if (is_x86_64) { 148835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen EncodeSignedLeb128(*cfi_info, -8); 148935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } else { 149035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen EncodeSignedLeb128(*cfi_info, -4); 149135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 1492ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 149335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Return address register. 149435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen if (is_x86_64) { 149535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // R16(RIP) 149635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x10); 149735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } else { 149835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // R8(EIP) 149935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x08); 150035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 1501ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 150235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Augmentation length: 1. 150335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(1); 1504ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 150535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Augmentation data: 0x03 ((DW_EH_PE_absptr << 4) | DW_EH_PE_udata4). 150635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x03); 1507ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 150835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Initial instructions. 150935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen if (is_x86_64) { 151035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // DW_CFA_def_cfa R7(RSP) 8. 151135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x0c); 151235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x07); 151335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x08); 1514ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 151535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // DW_CFA_offset R16(RIP) 1 (* -8). 151635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x90); 151735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x01); 151835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } else { 151935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // DW_CFA_def_cfa R4(ESP) 4. 152035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x0c); 152135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x04); 152235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x04); 152335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 152435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // DW_CFA_offset R8(EIP) 1 (* -4). 152535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x88); 152635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x01); 152735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 152835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 152935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Padding to a multiple of 4 153035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen while ((cfi_info->size() & 3) != 0) { 153135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // DW_CFA_nop is encoded as 0. 153235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0); 153335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 153435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 153535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Set the length of the CIE inside the generated bytes. 153635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen uint32_t length = cfi_info->size() - 4; 153735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen (*cfi_info)[0] = length; 153835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen (*cfi_info)[1] = length >> 8; 153935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen (*cfi_info)[2] = length >> 16; 154035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen (*cfi_info)[3] = length >> 24; 1541ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell return cfi_info; 1542ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1543ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 154435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shenstatic bool ARTRegIDToDWARFRegID(bool is_x86_64, int art_reg_id, int* dwarf_reg_id) { 154535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen if (is_x86_64) { 154635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen switch (art_reg_id) { 154735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 3 : *dwarf_reg_id = 3; return true; // %rbx 154835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // This is the only discrepancy between ART & DWARF register numbering. 154935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 5 : *dwarf_reg_id = 6; return true; // %rbp 155035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 12: *dwarf_reg_id = 12; return true; // %r12 155135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 13: *dwarf_reg_id = 13; return true; // %r13 155235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 14: *dwarf_reg_id = 14; return true; // %r14 155335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 15: *dwarf_reg_id = 15; return true; // %r15 155435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen default: return false; // Should not get here 155535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 155635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } else { 155735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen switch (art_reg_id) { 155835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 5: *dwarf_reg_id = 5; return true; // %ebp 155935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 6: *dwarf_reg_id = 6; return true; // %esi 156035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen case 7: *dwarf_reg_id = 7; return true; // %edi 156135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen default: return false; // Should not get here 156235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 1563ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1564ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1565ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1566ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendellstd::vector<uint8_t>* X86Mir2Lir::ReturnCallFrameInformation() { 1567ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell std::vector<uint8_t>*cfi_info = new std::vector<uint8_t>; 1568ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1569ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Generate the FDE for the method. 1570ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell DCHECK_NE(data_offset_, 0U); 1571ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1572ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Length (will be filled in later in this routine). 1573ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, 0); 1574ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 157535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // 'CIE_pointer' (filled in by linker). 1576ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, 0); 1577ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1578ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // 'initial_location' (filled in by linker). 1579ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, 0); 1580ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1581ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // 'address_range' (number of bytes in the method). 1582ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, data_offset_); 1583ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 158435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Augmentation length: 0 158535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0); 158635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 1587ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // The instructions in the FDE. 1588ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell if (stack_decrement_ != nullptr) { 1589ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Advance LOC to just past the stack decrement. 1590ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell uint32_t pc = NEXT_LIR(stack_decrement_)->offset; 1591ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell AdvanceLoc(*cfi_info, pc); 1592ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1593ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Now update the offset to the call frame: DW_CFA_def_cfa_offset frame_size. 1594ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0e); 1595ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell EncodeUnsignedLeb128(*cfi_info, frame_size_); 1596ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 159735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Handle register spills 159835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen const uint32_t kSpillInstLen = (cu_->target64) ? 5 : 4; 159935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen const int kDataAlignmentFactor = (cu_->target64) ? -8 : -4; 160035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen uint32_t mask = core_spill_mask_ & ~(1 << rs_rRET.GetRegNum()); 160135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen int offset = -(GetInstructionSetPointerSize(cu_->instruction_set) * num_core_spills_); 160235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen for (int reg = 0; mask; mask >>= 1, reg++) { 160335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen if (mask & 0x1) { 160435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen pc += kSpillInstLen; 160535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 160635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // Advance LOC to pass this instruction 160735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen AdvanceLoc(*cfi_info, kSpillInstLen); 160835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 160935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen int dwarf_reg_id; 161035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen if (ARTRegIDToDWARFRegID(cu_->target64, reg, &dwarf_reg_id)) { 161135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // DW_CFA_offset_extended_sf reg_no offset 161235e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen cfi_info->push_back(0x11); 161335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen EncodeUnsignedLeb128(*cfi_info, dwarf_reg_id); 161435e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen EncodeSignedLeb128(*cfi_info, offset / kDataAlignmentFactor); 161535e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 161635e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 161735e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen offset += GetInstructionSetPointerSize(cu_->instruction_set); 161835e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 161935e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen } 162035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen 1621ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // We continue with that stack until the epilogue. 1622ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell if (stack_increment_ != nullptr) { 1623ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell uint32_t new_pc = NEXT_LIR(stack_increment_)->offset; 1624ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell AdvanceLoc(*cfi_info, new_pc - pc); 1625ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1626ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // We probably have code snippets after the epilogue, so save the 1627ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // current state: DW_CFA_remember_state. 1628ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0a); 1629ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 163035e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // We have now popped the stack: DW_CFA_def_cfa_offset 4/8. 163135e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen // There is only the return PC on the stack now. 1632ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0e); 163335e1e6ad4b50f1adbe9f93fe467766f042491896Tong Shen EncodeUnsignedLeb128(*cfi_info, GetInstructionSetPointerSize(cu_->instruction_set)); 1634ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1635ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Everything after that is the same as before the epilogue. 1636ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Stack bump was followed by RET instruction. 1637ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell LIR *post_ret_insn = NEXT_LIR(NEXT_LIR(stack_increment_)); 1638ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell if (post_ret_insn != nullptr) { 1639ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell pc = new_pc; 1640ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell new_pc = post_ret_insn->offset; 1641ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell AdvanceLoc(*cfi_info, new_pc - pc); 1642ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Restore the state: DW_CFA_restore_state. 1643ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0b); 1644ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1645ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1646ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1647ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1648ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Padding to a multiple of 4 1649ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell while ((cfi_info->size() & 3) != 0) { 1650ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // DW_CFA_nop is encoded as 0. 1651ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0); 1652ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1653ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1654ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Set the length of the FDE inside the generated bytes. 1655ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell uint32_t length = cfi_info->size() - 4; 1656ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell (*cfi_info)[0] = length; 1657ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell (*cfi_info)[1] = length >> 8; 1658ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell (*cfi_info)[2] = length >> 16; 1659ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell (*cfi_info)[3] = length >> 24; 1660ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell return cfi_info; 1661ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1662ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1663d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendellvoid X86Mir2Lir::GenMachineSpecificExtendedMethodMIR(BasicBlock* bb, MIR* mir) { 1664d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell switch (static_cast<ExtendedMIROpcode>(mir->dalvikInsn.opcode)) { 166560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpReserveVectorRegisters: 166660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji ReserveVectorRegisters(mir); 166760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 166860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpReturnVectorRegisters: 166960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji ReturnVectorRegisters(); 167060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 1671d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell case kMirOpConstVector: 1672d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell GenConst128(bb, mir); 1673d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell break; 1674fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpMoveVector: 1675fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenMoveVector(bb, mir); 1676fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1677fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedMultiply: 1678fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenMultiplyVector(bb, mir); 1679fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1680fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedAddition: 1681fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenAddVector(bb, mir); 1682fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1683fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedSubtract: 1684fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenSubtractVector(bb, mir); 1685fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1686fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedShiftLeft: 1687fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenShiftLeftVector(bb, mir); 1688fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1689fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedSignedShiftRight: 1690fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenSignedShiftRightVector(bb, mir); 1691fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1692fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedUnsignedShiftRight: 1693fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenUnsignedShiftRightVector(bb, mir); 1694fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1695fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedAnd: 1696fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenAndVector(bb, mir); 1697fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1698fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedOr: 1699fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenOrVector(bb, mir); 1700fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1701fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedXor: 1702fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenXorVector(bb, mir); 1703fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1704fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedAddReduce: 1705fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenAddReduceVector(bb, mir); 1706fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1707fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedReduce: 1708fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenReduceVector(bb, mir); 1709fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1710fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedSet: 1711fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenSetVector(bb, mir); 1712fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1713d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell default: 1714d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell break; 1715d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1716d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 1717d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 171860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::ReserveVectorRegisters(MIR* mir) { 171960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // We should not try to reserve twice without returning the registers 172060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_NE(num_reserved_vector_regs_, -1); 172160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 172260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int num_vector_reg = mir->dalvikInsn.vA; 172360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (int i = 0; i < num_vector_reg; i++) { 172460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage xp_reg = RegStorage::Solo128(i); 172560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegisterInfo *xp_reg_info = GetRegInfo(xp_reg); 172660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji Clobber(xp_reg); 172760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 172860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (RegisterInfo *info = xp_reg_info->GetAliasChain(); 172960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji info != nullptr; 173060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji info = info->GetAliasChain()) { 173160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (info->GetReg().IsSingle()) { 173260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_pool_->sp_regs_.Delete(info); 173360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 173460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_pool_->dp_regs_.Delete(info); 173560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 173660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 173760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 173860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 173960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji num_reserved_vector_regs_ = num_vector_reg; 174060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 174160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 174260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::ReturnVectorRegisters() { 174360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Return all the reserved registers 174460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (int i = 0; i < num_reserved_vector_regs_; i++) { 174560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage xp_reg = RegStorage::Solo128(i); 174660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegisterInfo *xp_reg_info = GetRegInfo(xp_reg); 174760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 174860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (RegisterInfo *info = xp_reg_info->GetAliasChain(); 174960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji info != nullptr; 175060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji info = info->GetAliasChain()) { 175160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (info->GetReg().IsSingle()) { 175260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_pool_->sp_regs_.Insert(info); 175360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 175460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_pool_->dp_regs_.Insert(info); 175560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 175660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 175760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 175860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 175960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // We don't have anymore reserved vector registers 176060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji num_reserved_vector_regs_ = -1; 176160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 176260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 1763d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendellvoid X86Mir2Lir::GenConst128(BasicBlock* bb, MIR* mir) { 176460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji store_method_addr_used_ = true; 176560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int type_size = mir->dalvikInsn.vB; 1766d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // We support 128 bit vectors. 1767d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell DCHECK_EQ(type_size & 0xFFFF, 128); 176860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest = RegStorage::Solo128(mir->dalvikInsn.vA); 1769d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell uint32_t *args = mir->dalvikInsn.arg; 1770fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int reg = rs_dest.GetReg(); 1771d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Check for all 0 case. 1772d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (args[0] == 0 && args[1] == 0 && args[2] == 0 && args[3] == 0) { 1773d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell NewLIR2(kX86XorpsRR, reg, reg); 1774d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell return; 1775d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 177660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 177760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Append the mov const vector to reg opcode. 177860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AppendOpcodeWithConst(kX86MovupsRM, reg, mir); 177960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 178060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 178160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::AppendOpcodeWithConst(X86OpCode opcode, int reg, MIR* mir) { 1782d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Okay, load it from the constant vector area. 1783d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell LIR *data_target = ScanVectorLiteral(mir); 1784d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (data_target == nullptr) { 1785d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell data_target = AddVectorLiteral(mir); 1786d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1787d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1788d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Address the start of the method. 1789d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell RegLocation rl_method = mir_graph_->GetRegLocation(base_of_code_->s_reg_low); 1790e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu if (rl_method.wide) { 1791e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu rl_method = LoadValueWide(rl_method, kCoreReg); 1792e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu } else { 1793e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu rl_method = LoadValue(rl_method, kCoreReg); 1794e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu } 1795d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1796d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Load the proper value from the literal area. 1797d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // We don't know the proper offset for the value, so pick one that will force 1798d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // 4 byte offset. We will fix this up in the assembler later to have the right 1799d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // value. 18008dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kLiteral); 180160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji LIR *load = NewLIR2(opcode, reg, rl_method.reg.GetReg()); 1802d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell load->flags.fixup = kFixupLoad; 1803d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell load->target = data_target; 1804d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 1805d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1806fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenMoveVector(BasicBlock *bb, MIR *mir) { 1807fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // We only support 128 bit registers. 180860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 180960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest = RegStorage::Solo128(mir->dalvikInsn.vA); 181060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src = RegStorage::Solo128(mir->dalvikInsn.vB); 1811fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(kX86Mova128RR, rs_dest.GetReg(), rs_src.GetReg()); 1812fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1813fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 181460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::GenMultiplyVectorSignedByte(BasicBlock *bb, MIR *mir) { 181560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const int BYTE_SIZE = 8; 181660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 181760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 181860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src1_high_tmp = Get128BitRegister(AllocTempWide()); 181960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 182060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji /* 182160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * Emulate the behavior of a kSignedByte by separating out the 16 values in the two XMM 182260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * and multiplying 8 at a time before recombining back into one XMM register. 182360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * 182460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * let xmm1, xmm2 be real srcs (keep low bits of 16bit lanes) 182560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm3 is tmp (operate on high bits of 16bit lanes) 182660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * 182760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm3 = xmm1 182860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 .* xmm2 182960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 & 0x00ff00ff00ff00ff00ff00ff00ff00ff // xmm1 now has low bits 183060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm3 = xmm3 .>> 8 183160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm2 & 0xff00ff00ff00ff00ff00ff00ff00ff00 183260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm2 .* xmm3 // xmm2 now has high bits 183360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 | xmm2 // combine results 183460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji */ 183560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 183660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Copy xmm1. 183760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Mova128RR, rs_src1_high_tmp.GetReg(), rs_dest_src1.GetReg()); 183860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 183960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Multiply low bits. 184060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PmullwRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 184160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 184260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // xmm1 now has low bits. 184360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AndMaskVectorRegister(rs_dest_src1, 0x00FF00FF, 0x00FF00FF, 0x00FF00FF, 0x00FF00FF); 184460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 184560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Prepare high bits for multiplication. 184660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PsrlwRI, rs_src1_high_tmp.GetReg(), BYTE_SIZE); 184760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AndMaskVectorRegister(rs_src2, 0xFF00FF00, 0xFF00FF00, 0xFF00FF00, 0xFF00FF00); 184860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 184960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Multiply high bits and xmm2 now has high bits. 185060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PmullwRR, rs_src2.GetReg(), rs_src1_high_tmp.GetReg()); 185160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 185260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Combine back into dest XMM register. 185360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PorRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 185460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 185560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 1856fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenMultiplyVector(BasicBlock *bb, MIR *mir) { 185760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 185860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 185960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 186060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 1861fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1862fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 1863fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1864fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PmulldRR; 1865fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1866fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1867fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PmullwRR; 1868fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1869fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSingle: 1870fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86MulpsRR; 1871fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1872fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kDouble: 1873fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86MulpdRR; 1874fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 187560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 187660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // HW doesn't support 16x16 byte multiplication so emulate it. 187760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji GenMultiplyVectorSignedByte(bb, mir); 187860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 1879fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1880fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector multiply " << opsize; 1881fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1882fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1883fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), rs_src2.GetReg()); 1884fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1885fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1886fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenAddVector(BasicBlock *bb, MIR *mir) { 188760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 188860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 188960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 189060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 1891fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1892fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 1893fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1894fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PadddRR; 1895fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1896fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1897fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 1898fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PaddwRR; 1899fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1900fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedByte: 1901fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedByte: 1902fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PaddbRR; 1903fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1904fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSingle: 1905fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86AddpsRR; 1906fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1907fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kDouble: 1908fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86AddpdRR; 1909fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1910fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1911fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector addition " << opsize; 1912fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1913fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1914fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), rs_src2.GetReg()); 1915fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1916fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1917fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenSubtractVector(BasicBlock *bb, MIR *mir) { 191860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 191960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 192060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 192160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 1922fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1923fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 1924fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1925fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsubdRR; 1926fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1927fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1928fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 1929fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsubwRR; 1930fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1931fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedByte: 1932fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedByte: 1933fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsubbRR; 1934fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1935fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSingle: 1936fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86SubpsRR; 1937fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1938fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kDouble: 1939fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86SubpdRR; 1940fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1941fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1942fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector subtraction " << opsize; 1943fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1944fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1945fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), rs_src2.GetReg()); 1946fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1947fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 194860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::GenShiftByteVector(BasicBlock *bb, MIR *mir) { 194960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 195060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_tmp = Get128BitRegister(AllocTempWide()); 195160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 195260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int opcode = 0; 195360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int imm = mir->dalvikInsn.vB; 195460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 195560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji switch (static_cast<ExtendedMIROpcode>(mir->dalvikInsn.opcode)) { 195660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpPackedShiftLeft: 195760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji opcode = kX86PsllwRI; 195860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 195960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpPackedSignedShiftRight: 196060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji opcode = kX86PsrawRI; 196160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 196260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpPackedUnsignedShiftRight: 196360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji opcode = kX86PsrlwRI; 196460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 196560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji default: 196660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji LOG(FATAL) << "Unsupported shift operation on byte vector " << opcode; 196760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 196860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 196960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 197060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji /* 197160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 will have low bits 197260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 will have high bits 197360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * 197460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm1 197560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 .<< N 197660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm2 && 0xFF00FF00FF00FF00FF00FF00FF00FF00 197760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm2 .<< N 197860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 | xmm2 197960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji */ 198060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 198160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Copy xmm1. 198260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Mova128RR, rs_tmp.GetReg(), rs_dest_src1.GetReg()); 198360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 198460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Shift lower values. 198560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(opcode, rs_dest_src1.GetReg(), imm); 198660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 198760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Mask bottom bits. 198860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AndMaskVectorRegister(rs_tmp, 0xFF00FF00, 0xFF00FF00, 0xFF00FF00, 0xFF00FF00); 198960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 199060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Shift higher values. 199160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(opcode, rs_tmp.GetReg(), imm); 199260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 199360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Combine back into dest XMM register. 199460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PorRR, rs_dest_src1.GetReg(), rs_tmp.GetReg()); 199560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 199660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 1997fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenShiftLeftVector(BasicBlock *bb, MIR *mir) { 199860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 199960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 200060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 200160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int imm = mir->dalvikInsn.vB; 2002fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 2003fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2004fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 2005fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PslldRI; 2006fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2007fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k64: 2008fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsllqRI; 2009fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2010fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2011fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 2012fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsllwRI; 2013fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 201460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 201560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 201660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji GenShiftByteVector(bb, mir); 201760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 2018fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 2019fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector shift left " << opsize; 2020fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2021fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2022fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), imm); 2023fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2024fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2025fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenSignedShiftRightVector(BasicBlock *bb, MIR *mir) { 202660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 202760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 202860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 202960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int imm = mir->dalvikInsn.vB; 2030fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 2031fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2032fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 2033fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsradRI; 2034fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2035fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2036fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 2037fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsrawRI; 2038fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 203960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 204060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 204160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji GenShiftByteVector(bb, mir); 204260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 2043fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 2044fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector signed shift right " << opsize; 2045fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2046fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2047fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), imm); 2048fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2049fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2050fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenUnsignedShiftRightVector(BasicBlock *bb, MIR *mir) { 205160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 205260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 205360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 205460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int imm = mir->dalvikInsn.vB; 2055fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 2056fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2057fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 2058fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsrldRI; 2059fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2060fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k64: 2061fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsrlqRI; 2062fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2063fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2064fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 2065fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsrlwRI; 2066fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 206760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 206860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 206960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji GenShiftByteVector(bb, mir); 207060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 2071fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 2072fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector unsigned shift right " << opsize; 2073fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2074fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2075fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), imm); 2076fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2077fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2078fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenAndVector(BasicBlock *bb, MIR *mir) { 2079fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // We only support 128 bit registers. 208060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 208160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 208260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 2083fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(kX86PandRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 2084fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2085fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2086fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenOrVector(BasicBlock *bb, MIR *mir) { 2087fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // We only support 128 bit registers. 208860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 208960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 209060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 2091fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(kX86PorRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 2092fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2093fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2094fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenXorVector(BasicBlock *bb, MIR *mir) { 2095fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // We only support 128 bit registers. 209660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 209760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 209860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 2099fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(kX86PxorRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 2100fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2101fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 210260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::AndMaskVectorRegister(RegStorage rs_src1, uint32_t m1, uint32_t m2, uint32_t m3, uint32_t m4) { 210360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji MaskVectorRegister(kX86PandRM, rs_src1, m1, m2, m3, m4); 210460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 210560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 210660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::MaskVectorRegister(X86OpCode opcode, RegStorage rs_src1, uint32_t m0, uint32_t m1, uint32_t m2, uint32_t m3) { 210760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Create temporary MIR as container for 128-bit binary mask. 210860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji MIR const_mir; 210960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji MIR* const_mirp = &const_mir; 211060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.opcode = static_cast<Instruction::Code>(kMirOpConstVector); 211160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.arg[0] = m0; 211260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.arg[1] = m1; 211360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.arg[2] = m2; 211460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.arg[3] = m3; 211560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 211660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Mask vector with const from literal pool. 211760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AppendOpcodeWithConst(opcode, rs_src1.GetReg(), const_mirp); 211860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 211960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 2120fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenAddReduceVector(BasicBlock *bb, MIR *mir) { 212160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 212260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src1 = RegStorage::Solo128(mir->dalvikInsn.vB); 212360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegLocation rl_dest = mir_graph_->GetDest(mir); 212460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_tmp; 212560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 212660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int vec_bytes = (mir->dalvikInsn.vC & 0xFFFF) / 8; 212760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int vec_unit_size = 0; 2128fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 212960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int extr_opcode = 0; 213060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegLocation rl_result; 213160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 2132fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2133fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 213460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = kX86PextrdRRI; 2135fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PhadddRR; 213660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji vec_unit_size = 4; 213760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 213860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 213960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 214060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = kX86PextrbRRI; 214160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji opcode = kX86PhaddwRR; 214260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji vec_unit_size = 2; 2143fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2144fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2145fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 214660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = kX86PextrwRRI; 2147fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PhaddwRR; 214860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji vec_unit_size = 2; 2149fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 215060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSingle: 215160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result = EvalLoc(rl_dest, kFPReg, true); 215260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji vec_unit_size = 4; 215360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (int i = 0; i < 3; i++) { 215460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86AddssRR, rl_result.reg.GetReg(), rs_src1.GetReg()); 215560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(kX86ShufpsRRI, rs_src1.GetReg(), rs_src1.GetReg(), 0x39); 215660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 215760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86AddssRR, rl_result.reg.GetReg(), rs_src1.GetReg()); 215860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji StoreValue(rl_dest, rl_result); 215960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 216060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // For single-precision floats, we are done here 216160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 2162fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 2163fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector add reduce " << opsize; 2164fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2165fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 216660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 216760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int elems = vec_bytes / vec_unit_size; 216860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 216960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Emulate horizontal add instruction by reducing 2 vectors with 8 values before adding them again 217060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // TODO is overflow handled correctly? 217160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (opsize == kSignedByte || opsize == kUnsignedByte) { 217260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rs_tmp = Get128BitRegister(AllocTempWide()); 217360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 217460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // tmp = xmm1 .>> 8. 217560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Mova128RR, rs_tmp.GetReg(), rs_src1.GetReg()); 217660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PsrlwRI, rs_tmp.GetReg(), 8); 217760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 217860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Zero extend low bits in xmm1. 217960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AndMaskVectorRegister(rs_src1, 0x00FF00FF, 0x00FF00FF, 0x00FF00FF, 0x00FF00FF); 218060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 218160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 218260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji while (elems > 1) { 218360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (opsize == kSignedByte || opsize == kUnsignedByte) { 218460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(opcode, rs_tmp.GetReg(), rs_tmp.GetReg()); 218560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 218660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(opcode, rs_src1.GetReg(), rs_src1.GetReg()); 218760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji elems >>= 1; 218860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 218960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 219060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Combine the results if we separated them. 219160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (opsize == kSignedByte || opsize == kUnsignedByte) { 219260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PaddbRR, rs_src1.GetReg(), rs_tmp.GetReg()); 219360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 219460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 219560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // We need to extract to a GPR. 219660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage temp = AllocTemp(); 219760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(extr_opcode, temp.GetReg(), rs_src1.GetReg(), 0); 219860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 219960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Can we do this directly into memory? 220060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result = UpdateLocTyped(rl_dest, kCoreReg); 220160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (rl_result.location == kLocPhysReg) { 220260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Ensure res is in a core reg 220360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result = EvalLoc(rl_dest, kCoreReg, true); 220460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpRegReg(kOpAdd, rl_result.reg, temp); 220560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji StoreFinalValue(rl_dest, rl_result); 220660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 220760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpMemReg(kOpAdd, rl_result, temp.GetReg()); 220860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 220960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 221060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji FreeTemp(temp); 2211fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2212fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2213fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenReduceVector(BasicBlock *bb, MIR *mir) { 221460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 221560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegLocation rl_dest = mir_graph_->GetDest(mir); 221660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src1 = RegStorage::Solo128(mir->dalvikInsn.vB); 221760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int extract_index = mir->dalvikInsn.arg[0]; 221860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int extr_opcode = 0; 221960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegLocation rl_result; 222060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji bool is_wide = false; 222160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 2222fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2223fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 222460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result = UpdateLocTyped(rl_dest, kCoreReg); 222560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = (rl_result.location == kLocPhysReg) ? kX86PextrdMRI : kX86PextrdRRI; 2226fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2227fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2228fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 222960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result= UpdateLocTyped(rl_dest, kCoreReg); 223060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = (rl_result.location == kLocPhysReg) ? kX86PextrwMRI : kX86PextrwRRI; 2231fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2232fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 223360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji LOG(FATAL) << "Unsupported vector add reduce " << opsize; 223460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 2235fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2236fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2237fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 223860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (rl_result.location == kLocPhysReg) { 223960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(extr_opcode, rl_result.reg.GetReg(), rs_src1.GetReg(), extract_index); 224060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (is_wide == true) { 224160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji StoreFinalValue(rl_dest, rl_result); 224260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 224360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji StoreFinalValueWide(rl_dest, rl_result); 224460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 224560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 224660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int displacement = SRegOffset(rl_result.s_reg_low); 224760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji LIR *l = NewLIR3(extr_opcode, rs_rX86_SP.GetReg(), displacement, rs_src1.GetReg()); 224860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AnnotateDalvikRegAccess(l, displacement >> 2, true /* is_load */, is_wide /* is_64bit */); 224960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AnnotateDalvikRegAccess(l, displacement >> 2, false /* is_load */, is_wide /* is_64bit */); 225060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 2251fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2252fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2253fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenSetVector(BasicBlock *bb, MIR *mir) { 225460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 225560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 225660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest = RegStorage::Solo128(mir->dalvikInsn.vA); 225760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int op_low = 0, op_high = 0, imm = 0, op_mov = kX86MovdxrRR; 225860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegisterClass reg_type = kCoreReg; 225960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 2260fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2261fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 2262fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell op_low = kX86PshufdRRI; 2263fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 226460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSingle: 226560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_low = kX86PshufdRRI; 226660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_mov = kX86Mova128RR; 226760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_type = kFPReg; 226860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 226960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case k64: 227060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_low = kX86PshufdRRI; 227160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji imm = 0x44; 227260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 227360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kDouble: 227460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_low = kX86PshufdRRI; 227560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_mov = kX86Mova128RR; 227660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_type = kFPReg; 227760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji imm = 0x44; 227860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 227960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 228060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 228160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Shuffle 8 bit value into 16 bit word. 228260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // We set val = val + (val << 8) below and use 16 bit shuffle. 2283fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2284fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 2285fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Handles low quadword. 2286fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell op_low = kX86PshuflwRRI; 2287fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Handles upper quadword. 2288fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell op_high = kX86PshufdRRI; 2289fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2290fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 2291fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector set " << opsize; 2292fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2293fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2294fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2295fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell RegLocation rl_src = mir_graph_->GetSrc(mir, 0); 229660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 229760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Load the value from the VR into the reg. 229860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (rl_src.wide == 0) { 229960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_src = LoadValue(rl_src, reg_type); 230060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 230160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_src = LoadValueWide(rl_src, reg_type); 230260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 230360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 230460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // If opsize is 8 bits wide then double value and use 16 bit shuffle instead. 230560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (opsize == kSignedByte || opsize == kUnsignedByte) { 230660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage temp = AllocTemp(); 230760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // val = val + (val << 8). 230860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Mov32RR, temp.GetReg(), rl_src.reg.GetReg()); 230960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Sal32RI, temp.GetReg(), 8); 231060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Or32RR, rl_src.reg.GetReg(), temp.GetReg()); 231160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji FreeTemp(temp); 231260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 2313fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2314fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Load the value into the XMM register. 231560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(op_mov, rs_dest.GetReg(), rl_src.reg.GetReg()); 2316fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2317fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Now shuffle the value across the destination. 231860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(op_low, rs_dest.GetReg(), rs_dest.GetReg(), imm); 2319fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2320fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // And then repeat as needed. 2321fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell if (op_high != 0) { 232260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(op_high, rs_dest.GetReg(), rs_dest.GetReg(), imm); 2323fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2324fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2325fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2326d65c51a556e6649db4e18bd083c8fec37607a442Mark MendellLIR *X86Mir2Lir::ScanVectorLiteral(MIR *mir) { 2327d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell int *args = reinterpret_cast<int*>(mir->dalvikInsn.arg); 2328d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell for (LIR *p = const_vectors_; p != nullptr; p = p->next) { 2329d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (args[0] == p->operands[0] && args[1] == p->operands[1] && 2330d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell args[2] == p->operands[2] && args[3] == p->operands[3]) { 2331d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell return p; 2332d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 2333d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 2334d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell return nullptr; 2335d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 2336d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 2337d65c51a556e6649db4e18bd083c8fec37607a442Mark MendellLIR *X86Mir2Lir::AddVectorLiteral(MIR *mir) { 2338d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell LIR* new_value = static_cast<LIR*>(arena_->Alloc(sizeof(LIR), kArenaAllocData)); 2339d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell int *args = reinterpret_cast<int*>(mir->dalvikInsn.arg); 2340d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->operands[0] = args[0]; 2341d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->operands[1] = args[1]; 2342d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->operands[2] = args[2]; 2343d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->operands[3] = args[3]; 2344d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->next = const_vectors_; 2345d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (const_vectors_ == nullptr) { 2346d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell estimated_native_code_size_ += 12; // Amount needed to align to 16 byte boundary. 2347d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 2348d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell estimated_native_code_size_ += 16; // Space for one vector. 2349d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell const_vectors_ = new_value; 2350d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell return new_value; 2351d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 2352d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 235358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko// ------------ ABI support: mapping of args to physical registers ------------- 2354ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas GampeRegStorage X86Mir2Lir::InToRegStorageX86_64Mapper::GetNextReg(bool is_double_or_float, bool is_wide, 2355ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe bool is_ref) { 2356a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu const SpecialTargetRegister coreArgMappingToPhysicalReg[] = {kArg1, kArg2, kArg3, kArg4, kArg5}; 2357ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe const int coreArgMappingToPhysicalRegSize = sizeof(coreArgMappingToPhysicalReg) / 2358ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe sizeof(SpecialTargetRegister); 2359a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu const SpecialTargetRegister fpArgMappingToPhysicalReg[] = {kFArg0, kFArg1, kFArg2, kFArg3, 2360ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe kFArg4, kFArg5, kFArg6, kFArg7}; 2361ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe const int fpArgMappingToPhysicalRegSize = sizeof(fpArgMappingToPhysicalReg) / 2362ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe sizeof(SpecialTargetRegister); 236358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 236458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (is_double_or_float) { 236558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (cur_fp_reg_ < fpArgMappingToPhysicalRegSize) { 2366ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe return ml_->TargetReg(fpArgMappingToPhysicalReg[cur_fp_reg_++], is_wide ? kWide : kNotWide); 236758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 236858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 236958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (cur_core_reg_ < coreArgMappingToPhysicalRegSize) { 2370ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe return ml_->TargetReg(coreArgMappingToPhysicalReg[cur_core_reg_++], 2371ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe is_ref ? kRef : (is_wide ? kWide : kNotWide)); 237258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 237358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 2374a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu return RegStorage::InvalidReg(); 237558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 237658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 237758994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage X86Mir2Lir::InToRegStorageMapping::Get(int in_position) { 237858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko DCHECK(IsInitialized()); 237958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko auto res = mapping_.find(in_position); 238058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return res != mapping_.end() ? res->second : RegStorage::InvalidReg(); 238158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 238258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 2383ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampevoid X86Mir2Lir::InToRegStorageMapping::Initialize(RegLocation* arg_locs, int count, 2384ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe InToRegStorageMapper* mapper) { 238558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko DCHECK(mapper != nullptr); 238658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko max_mapped_in_ = -1; 238758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko is_there_stack_mapped_ = false; 238858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko for (int in_position = 0; in_position < count; in_position++) { 2389407a9d2847161b843966a443b71760b1280bd396Serguei Katkov RegStorage reg = mapper->GetNextReg(arg_locs[in_position].fp, 2390407a9d2847161b843966a443b71760b1280bd396Serguei Katkov arg_locs[in_position].wide, arg_locs[in_position].ref); 239158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (reg.Valid()) { 239258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko mapping_[in_position] = reg; 239358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko max_mapped_in_ = std::max(max_mapped_in_, in_position); 2394407a9d2847161b843966a443b71760b1280bd396Serguei Katkov if (arg_locs[in_position].wide) { 239558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // We covered 2 args, so skip the next one 239658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko in_position++; 239758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 239858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 239958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko is_there_stack_mapped_ = true; 240058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 240158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 240258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko initialized_ = true; 240358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 240458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 240558994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage X86Mir2Lir::GetArgMappingToPhysicalReg(int arg_num) { 2406dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) { 240758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return GetCoreArgMappingToPhysicalReg(arg_num); 240858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 240958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 241058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (!in_to_reg_storage_mapping_.IsInitialized()) { 241158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int start_vreg = cu_->num_dalvik_registers - cu_->num_ins; 241258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation* arg_locs = &mir_graph_->reg_location_[start_vreg]; 241358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 2414a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu InToRegStorageX86_64Mapper mapper(this); 241558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko in_to_reg_storage_mapping_.Initialize(arg_locs, cu_->num_ins, &mapper); 241658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 241758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return in_to_reg_storage_mapping_.Get(arg_num); 241858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 241958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 242058994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage X86Mir2Lir::GetCoreArgMappingToPhysicalReg(int core_arg_num) { 242158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // For the 32-bit internal ABI, the first 3 arguments are passed in registers. 242258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Not used for 64-bit, TODO: Move X86_32 to the same framework 242358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko switch (core_arg_num) { 242458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case 0: 242558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return rs_rX86_ARG1; 242658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case 1: 242758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return rs_rX86_ARG2; 242858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case 2: 242958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return rs_rX86_ARG3; 243058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko default: 243158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return RegStorage::InvalidReg(); 243258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 243358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 243458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 243558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko// ---------End of ABI support: mapping of args to physical registers ------------- 243658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 243758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko/* 243858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * If there are any ins passed in registers that have not been promoted 243958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * to a callee-save register, flush them to the frame. Perform initial 244058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * assignment of promoted arguments. 244158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * 244258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * ArgLocs is an array of location records describing the incoming arguments 244358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * with one location record per word of argument. 244458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 244558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenkovoid X86Mir2Lir::FlushIns(RegLocation* ArgLocs, RegLocation rl_method) { 2446dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) return Mir2Lir::FlushIns(ArgLocs, rl_method); 244758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* 244858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Dummy up a RegLocation for the incoming Method* 244958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * It will attempt to keep kArg0 live (or copy it to home location 245058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * if promoted). 245158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 245258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 245358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation rl_src = rl_method; 245458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rl_src.location = kLocPhysReg; 2455ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe rl_src.reg = TargetReg(kArg0, kRef); 245658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rl_src.home = false; 245758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko MarkLive(rl_src); 245858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko StoreValue(rl_method, rl_src); 245958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // If Method* has been promoted, explicitly flush 246058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (rl_method.location == kLocPhysReg) { 2461ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe StoreRefDisp(rs_rX86_SP, 0, As32BitReg(TargetReg(kArg0, kRef)), kNotVolatile); 246258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 246358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 246458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (cu_->num_ins == 0) { 246558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return; 246658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 246758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 246858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int start_vreg = cu_->num_dalvik_registers - cu_->num_ins; 246958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* 247058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Copy incoming arguments to their proper home locations. 247158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * NOTE: an older version of dx had an issue in which 247258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * it would reuse static method argument registers. 247358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * This could result in the same Dalvik virtual register 247458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * being promoted to both core and fp regs. To account for this, 247558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * we only copy to the corresponding promoted physical register 247658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * if it matches the type of the SSA name for the incoming 247758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * argument. It is also possible that long and double arguments 247858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * end up half-promoted. In those cases, we must flush the promoted 247958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * half to memory as well. 248058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 24818dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 248258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko for (int i = 0; i < cu_->num_ins; i++) { 248358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // get reg corresponding to input 24844d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko RegStorage reg = GetArgMappingToPhysicalReg(i); 248558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 24864d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko RegLocation* t_loc = &ArgLocs[i]; 248758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (reg.Valid()) { 24884d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // If arriving in register. 248958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 24904d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // We have already updated the arg location with promoted info 24914d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // so we can be based on it. 24924d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->location == kLocPhysReg) { 24934d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // Just copy it. 24944d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko OpRegCopy(t_loc->reg, reg); 24954d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko } else { 24964d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // Needs flush. 24974d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->ref) { 2498a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreRefDisp(rs_rX86_SP, SRegOffset(start_vreg + i), reg, kNotVolatile); 249958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 2500a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, SRegOffset(start_vreg + i), reg, t_loc->wide ? k64 : k32, 25014d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko kNotVolatile); 250258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 250358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 250458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 25054d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // If arriving in frame & promoted. 25064d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->location == kLocPhysReg) { 25074d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->ref) { 2508a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu LoadRefDisp(rs_rX86_SP, SRegOffset(start_vreg + i), t_loc->reg, kNotVolatile); 25094d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko } else { 2510a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu LoadBaseDisp(rs_rX86_SP, SRegOffset(start_vreg + i), t_loc->reg, 25114d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko t_loc->wide ? k64 : k32, kNotVolatile); 25124d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko } 251358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 251458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 25154d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->wide) { 25164d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // Increment i to skip the next one. 25174d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko i++; 25184d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko } 251958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 252058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 252158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 252258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko/* 252358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Load up to 5 arguments, the first three of which will be in 252458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * kArg1 .. kArg3. On entry kArg0 contains the current method pointer, 252558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * and as part of the load sequence, it must be replaced with 252658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * the target method pointer. Note, this may also be called 252758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * for "range" variants if the number of arguments is 5 or fewer. 252858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 252958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenkoint X86Mir2Lir::GenDalvikArgsNoRange(CallInfo* info, 253058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int call_state, LIR** pcrLabel, NextCallInsn next_call_insn, 253158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const MethodReference& target_method, 253258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko uint32_t vtable_idx, uintptr_t direct_code, 253358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko uintptr_t direct_method, InvokeType type, bool skip_this) { 2534dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) { 253558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return Mir2Lir::GenDalvikArgsNoRange(info, 253658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state, pcrLabel, next_call_insn, 253758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko target_method, 253858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko vtable_idx, direct_code, 253958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko direct_method, type, skip_this); 254058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 254158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return GenDalvikArgsRange(info, 254258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state, pcrLabel, next_call_insn, 254358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko target_method, 254458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko vtable_idx, direct_code, 254558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko direct_method, type, skip_this); 254658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 254758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 254858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko/* 254958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * May have 0+ arguments (also used for jumbo). Note that 255058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * source virtual registers may be in physical registers, so may 255158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * need to be flushed to home location before copying. This 255258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * applies to arg3 and above (see below). 255358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * 255458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Two general strategies: 255558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * If < 20 arguments 255658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Pass args 3-18 using vldm/vstm block copy 255758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Pass arg0, arg1 & arg2 in kArg1-kArg3 255858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * If 20+ arguments 255958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Pass args arg19+ using memcpy block copy 256058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Pass arg0, arg1 & arg2 in kArg1-kArg3 256158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * 256258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 256358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenkoint X86Mir2Lir::GenDalvikArgsRange(CallInfo* info, int call_state, 256458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR** pcrLabel, NextCallInsn next_call_insn, 256558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const MethodReference& target_method, 256658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko uint32_t vtable_idx, uintptr_t direct_code, uintptr_t direct_method, 256758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko InvokeType type, bool skip_this) { 2568dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) { 256958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return Mir2Lir::GenDalvikArgsRange(info, call_state, 257058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko pcrLabel, next_call_insn, 257158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko target_method, 257258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko vtable_idx, direct_code, direct_method, 257358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko type, skip_this); 257458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 257558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 257658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* If no arguments, just return */ 257758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (info->num_arg_words == 0) 257858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return call_state; 257958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 258058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const int start_index = skip_this ? 1 : 0; 258158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 2582a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu InToRegStorageX86_64Mapper mapper(this); 258358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko InToRegStorageMapping in_to_reg_storage_mapping; 258458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko in_to_reg_storage_mapping.Initialize(info->args, info->num_arg_words, &mapper); 258558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const int last_mapped_in = in_to_reg_storage_mapping.GetMaxMappedIn(); 258658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const int size_of_the_last_mapped = last_mapped_in == -1 ? 1 : 25878e3acdd132aef1391676a5db2696804900aacd8eSerguei Katkov info->args[last_mapped_in].wide ? 2 : 1; 258858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int regs_left_to_pass_via_stack = info->num_arg_words - (last_mapped_in + size_of_the_last_mapped); 258958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 259058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Fisrt of all, check whether it make sense to use bulk copying 259158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Optimization is aplicable only for range case 259258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // TODO: make a constant instead of 2 259358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (info->is_range && regs_left_to_pass_via_stack >= 2) { 259458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Scan the rest of the args - if in phys_reg flush to memory 259558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko for (int next_arg = last_mapped_in + size_of_the_last_mapped; next_arg < info->num_arg_words;) { 259658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation loc = info->args[next_arg]; 259758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (loc.wide) { 259858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko loc = UpdateLocWide(loc); 259958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (loc.location == kLocPhysReg) { 26008dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 2601a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, SRegOffset(loc.s_reg_low), loc.reg, k64, kNotVolatile); 260258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 260358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko next_arg += 2; 260458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 260558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko loc = UpdateLoc(loc); 260658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (loc.location == kLocPhysReg) { 26078dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 2608a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, SRegOffset(loc.s_reg_low), loc.reg, k32, kNotVolatile); 260958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 261058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko next_arg++; 261158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 261258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 261358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 261458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Logic below assumes that Method pointer is at offset zero from SP. 261558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko DCHECK_EQ(VRegOffset(static_cast<int>(kVRegMethodPtrBaseReg)), 0); 261658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 261758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // The rest can be copied together 261858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int start_offset = SRegOffset(info->args[last_mapped_in + size_of_the_last_mapped].s_reg_low); 2619ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe int outs_offset = StackVisitor::GetOutVROffset(last_mapped_in + size_of_the_last_mapped, 2620ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe cu_->instruction_set); 262158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 262258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int current_src_offset = start_offset; 262358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int current_dest_offset = outs_offset; 262458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 26258dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko // Only davik regs are accessed in this loop; no next_call_insn() calls. 26268dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 262758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko while (regs_left_to_pass_via_stack > 0) { 262858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // This is based on the knowledge that the stack itself is 16-byte aligned. 262958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bool src_is_16b_aligned = (current_src_offset & 0xF) == 0; 263058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bool dest_is_16b_aligned = (current_dest_offset & 0xF) == 0; 263158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko size_t bytes_to_move; 263258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 263358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* 263458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * The amount to move defaults to 32-bit. If there are 4 registers left to move, then do a 263558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * a 128-bit move because we won't get the chance to try to aligned. If there are more than 263658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * 4 registers left to move, consider doing a 128-bit only if either src or dest are aligned. 263758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * We do this because we could potentially do a smaller move to align. 263858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 263958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (regs_left_to_pass_via_stack == 4 || 264058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko (regs_left_to_pass_via_stack > 4 && (src_is_16b_aligned || dest_is_16b_aligned))) { 264158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Moving 128-bits via xmm register. 264258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bytes_to_move = sizeof(uint32_t) * 4; 264358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 264458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Allocate a free xmm temp. Since we are working through the calling sequence, 264558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // we expect to have an xmm temporary available. AllocTempDouble will abort if 264658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // there are no free registers. 264758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegStorage temp = AllocTempDouble(); 264858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 264958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR* ld1 = nullptr; 265058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR* ld2 = nullptr; 265158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR* st1 = nullptr; 265258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR* st2 = nullptr; 265358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 265458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* 265558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * The logic is similar for both loads and stores. If we have 16-byte alignment, 265658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * do an aligned move. If we have 8-byte alignment, then do the move in two 265758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * parts. This approach prevents possible cache line splits. Finally, fall back 265858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * to doing an unaligned move. In most cases we likely won't split the cache 265958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * line but we cannot prove it and thus take a conservative approach. 266058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 266158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bool src_is_8b_aligned = (current_src_offset & 0x7) == 0; 266258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bool dest_is_8b_aligned = (current_dest_offset & 0x7) == 0; 266358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 26648dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 266558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (src_is_16b_aligned) { 2666a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu ld1 = OpMovRegMem(temp, rs_rX86_SP, current_src_offset, kMovA128FP); 266758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else if (src_is_8b_aligned) { 2668a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu ld1 = OpMovRegMem(temp, rs_rX86_SP, current_src_offset, kMovLo128FP); 2669a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu ld2 = OpMovRegMem(temp, rs_rX86_SP, current_src_offset + (bytes_to_move >> 1), 267058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko kMovHi128FP); 267158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 2672a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu ld1 = OpMovRegMem(temp, rs_rX86_SP, current_src_offset, kMovU128FP); 267358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 267458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 267558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (dest_is_16b_aligned) { 2676a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu st1 = OpMovMemReg(rs_rX86_SP, current_dest_offset, temp, kMovA128FP); 267758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else if (dest_is_8b_aligned) { 2678a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu st1 = OpMovMemReg(rs_rX86_SP, current_dest_offset, temp, kMovLo128FP); 2679a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu st2 = OpMovMemReg(rs_rX86_SP, current_dest_offset + (bytes_to_move >> 1), 268058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko temp, kMovHi128FP); 268158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 2682a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu st1 = OpMovMemReg(rs_rX86_SP, current_dest_offset, temp, kMovU128FP); 268358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 268458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 268558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // TODO If we could keep track of aliasing information for memory accesses that are wider 268658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // than 64-bit, we wouldn't need to set up a barrier. 268758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (ld1 != nullptr) { 268858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (ld2 != nullptr) { 268958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // For 64-bit load we can actually set up the aliasing information. 269058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko AnnotateDalvikRegAccess(ld1, current_src_offset >> 2, true, true); 269158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko AnnotateDalvikRegAccess(ld2, (current_src_offset + (bytes_to_move >> 1)) >> 2, true, true); 269258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 269358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Set barrier for 128-bit load. 26948dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ld1->u.m.def_mask = &kEncodeAll; 269558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 269658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 269758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (st1 != nullptr) { 269858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (st2 != nullptr) { 269958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // For 64-bit store we can actually set up the aliasing information. 270058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko AnnotateDalvikRegAccess(st1, current_dest_offset >> 2, false, true); 270158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko AnnotateDalvikRegAccess(st2, (current_dest_offset + (bytes_to_move >> 1)) >> 2, false, true); 270258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 270358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Set barrier for 128-bit store. 27048dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko st1->u.m.def_mask = &kEncodeAll; 270558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 270658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 270758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 270858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Free the temporary used for the data movement. 270958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(temp); 271058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 271158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Moving 32-bits via general purpose register. 271258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bytes_to_move = sizeof(uint32_t); 271358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 271458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Instead of allocating a new temp, simply reuse one of the registers being used 271558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // for argument passing. 2716ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe RegStorage temp = TargetReg(kArg3, kNotWide); 271758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 271858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Now load the argument VR and store to the outs. 2719a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu Load32Disp(rs_rX86_SP, current_src_offset, temp); 2720a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu Store32Disp(rs_rX86_SP, current_dest_offset, temp); 272158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 272258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 272358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko current_src_offset += bytes_to_move; 272458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko current_dest_offset += bytes_to_move; 272558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko regs_left_to_pass_via_stack -= (bytes_to_move >> 2); 272658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 272758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko DCHECK_EQ(regs_left_to_pass_via_stack, 0); 272858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 272958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 273058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Now handle rest not registers if they are 273158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (in_to_reg_storage_mapping.IsThereStackMapped()) { 2732ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe RegStorage regSingle = TargetReg(kArg2, kNotWide); 2733ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe RegStorage regWide = TargetReg(kArg3, kWide); 2734b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu for (int i = start_index; 2735b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu i < last_mapped_in + size_of_the_last_mapped + regs_left_to_pass_via_stack; i++) { 273658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation rl_arg = info->args[i]; 273758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rl_arg = UpdateRawLoc(rl_arg); 273858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegStorage reg = in_to_reg_storage_mapping.Get(i); 273958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (!reg.Valid()) { 274058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int out_offset = StackVisitor::GetOutVROffset(i, cu_->instruction_set); 274158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 27428dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko { 27438dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 27448dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (rl_arg.wide) { 27458dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (rl_arg.location == kLocPhysReg) { 2746a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, out_offset, rl_arg.reg, k64, kNotVolatile); 27478dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } else { 27488dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko LoadValueDirectWideFixed(rl_arg, regWide); 2749a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, out_offset, regWide, k64, kNotVolatile); 27508dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } 275158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 27528dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (rl_arg.location == kLocPhysReg) { 2753a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, out_offset, rl_arg.reg, k32, kNotVolatile); 27548dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } else { 27558dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko LoadValueDirectFixed(rl_arg, regSingle); 2756a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, out_offset, regSingle, k32, kNotVolatile); 27578dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } 275858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 275958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 276058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state = next_call_insn(cu_, info, call_state, target_method, 276158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko vtable_idx, direct_code, direct_method, type); 276258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 2763b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu if (rl_arg.wide) { 2764b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu i++; 2765b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu } 276658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 276758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 276858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 276958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Finish with mapped registers 277058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko for (int i = start_index; i <= last_mapped_in; i++) { 277158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation rl_arg = info->args[i]; 277258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rl_arg = UpdateRawLoc(rl_arg); 277358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegStorage reg = in_to_reg_storage_mapping.Get(i); 277458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (reg.Valid()) { 277558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (rl_arg.wide) { 277658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LoadValueDirectWideFixed(rl_arg, reg); 277758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 277858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LoadValueDirectFixed(rl_arg, reg); 277958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 278058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state = next_call_insn(cu_, info, call_state, target_method, vtable_idx, 278158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko direct_code, direct_method, type); 278258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 2783b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu if (rl_arg.wide) { 2784b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu i++; 2785b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu } 278658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 278758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 278858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state = next_call_insn(cu_, info, call_state, target_method, vtable_idx, 278958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko direct_code, direct_method, type); 279058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (pcrLabel) { 279169dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison if (!cu_->compiler_driver->GetCompilerOptions().GetImplicitNullChecks()) { 2792ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe *pcrLabel = GenExplicitNullCheck(TargetReg(kArg1, kRef), info->opt_flags); 279358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 279458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko *pcrLabel = nullptr; 279558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // In lieu of generating a check for kArg1 being null, we need to 279658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // perform a load when doing implicit checks. 279758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegStorage tmp = AllocTemp(); 2798ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe Load32Disp(TargetReg(kArg1, kRef), 0, tmp); 279958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko MarkPossibleNullPointerException(info->opt_flags); 280058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(tmp); 280158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 280258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 280358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return call_state; 280458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 280558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 2806984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampebool X86Mir2Lir::GenInlinedCharAt(CallInfo* info) { 2807984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Location of reference to data array 2808984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe int value_offset = mirror::String::ValueOffset().Int32Value(); 2809984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Location of count 2810984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe int count_offset = mirror::String::CountOffset().Int32Value(); 2811984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Starting offset within data array 2812984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe int offset_offset = mirror::String::OffsetOffset().Int32Value(); 2813984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Start of char data with array_ 2814984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe int data_offset = mirror::Array::DataOffset(sizeof(uint16_t)).Int32Value(); 2815984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe 2816984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegLocation rl_obj = info->args[0]; 2817984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegLocation rl_idx = info->args[1]; 2818984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe rl_obj = LoadValue(rl_obj, kRefReg); 2819984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // X86 wants to avoid putting a constant index into a register. 2820984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (!rl_idx.is_const) { 2821984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe rl_idx = LoadValue(rl_idx, kCoreReg); 2822984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2823984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegStorage reg_max; 2824984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe GenNullCheck(rl_obj.reg, info->opt_flags); 2825984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe bool range_check = (!(info->opt_flags & MIR_IGNORE_RANGE_CHECK)); 2826984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe LIR* range_check_branch = nullptr; 2827984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegStorage reg_off; 2828984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegStorage reg_ptr; 2829984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (range_check) { 2830984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // On x86, we can compare to memory directly 2831984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Set up a launch pad to allow retry in case of bounds violation */ 2832984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (rl_idx.is_const) { 2833984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe LIR* comparison; 2834984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe range_check_branch = OpCmpMemImmBranch( 2835984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe kCondUlt, RegStorage::InvalidReg(), rl_obj.reg, count_offset, 2836984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe mir_graph_->ConstantValue(rl_idx.orig_sreg), nullptr, &comparison); 2837984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe MarkPossibleNullPointerExceptionAfter(0, comparison); 2838984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } else { 2839984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe OpRegMem(kOpCmp, rl_idx.reg, rl_obj.reg, count_offset); 2840984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe MarkPossibleNullPointerException(0); 2841984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe range_check_branch = OpCondBranch(kCondUge, nullptr); 2842984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2843984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2844984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe reg_off = AllocTemp(); 2845984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe reg_ptr = AllocTempRef(); 2846984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe Load32Disp(rl_obj.reg, offset_offset, reg_off); 2847984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe LoadRefDisp(rl_obj.reg, value_offset, reg_ptr, kNotVolatile); 2848984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (rl_idx.is_const) { 2849984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe OpRegImm(kOpAdd, reg_off, mir_graph_->ConstantValue(rl_idx.orig_sreg)); 2850984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } else { 2851984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe OpRegReg(kOpAdd, reg_off, rl_idx.reg); 2852984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2853984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe FreeTemp(rl_obj.reg); 2854984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (rl_idx.location == kLocPhysReg) { 2855984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe FreeTemp(rl_idx.reg); 2856984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2857984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegLocation rl_dest = InlineTarget(info); 2858984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegLocation rl_result = EvalLoc(rl_dest, kCoreReg, true); 2859984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe LoadBaseIndexedDisp(reg_ptr, reg_off, 1, data_offset, rl_result.reg, kUnsignedHalf); 2860984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe FreeTemp(reg_off); 2861984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe FreeTemp(reg_ptr); 2862984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe StoreValue(rl_dest, rl_result); 2863984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (range_check) { 2864984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe DCHECK(range_check_branch != nullptr); 2865984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe info->opt_flags |= MIR_IGNORE_NULL_CHECK; // Record that we've already null checked. 2866984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe AddIntrinsicSlowPath(info, range_check_branch); 2867984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2868984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe return true; 2869984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe} 2870984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe 28717934ac288acfb2552bb0b06ec1f61e5820d924a4Brian Carlstrom} // namespace art 2872