target_x86.cc revision 984305917bf57b3f8d92965e4715a0370cc5bcfb
1efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* 2efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Copyright (C) 2012 The Android Open Source Project 3efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * 4efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Licensed under the Apache License, Version 2.0 (the "License"); 5efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * you may not use this file except in compliance with the License. 6efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * You may obtain a copy of the License at 7efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * 8efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * http://www.apache.org/licenses/LICENSE-2.0 9efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * 10efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Unless required by applicable law or agreed to in writing, software 11efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * distributed under the License is distributed on an "AS IS" BASIS, 12efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * See the License for the specific language governing permissions and 14efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * limitations under the License. 
15efc6369224b036a1fb77849f7ae65b3492c832c0buzbee */ 16efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 17f3e2cc4a38389aa75eb8ee3973a535254bf1c8d2Nicolas Geoffray#include <string> 18f3e2cc4a38389aa75eb8ee3973a535254bf1c8d2Nicolas Geoffray#include <inttypes.h> 19f3e2cc4a38389aa75eb8ee3973a535254bf1c8d2Nicolas Geoffray 2002031b185b4653e6c72e21f7a51238b903f6d638buzbee#include "codegen_x86.h" 217940e44f4517de5e2634a7e07d58d0fb26160513Brian Carlstrom#include "dex/compiler_internals.h" 227940e44f4517de5e2634a7e07d58d0fb26160513Brian Carlstrom#include "dex/quick/mir_to_lir-inl.h" 23b5860fb459f1ed71f39d8a87b45bee6727d79fe8buzbee#include "dex/reg_storage_eq.h" 24e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell#include "mirror/array.h" 25e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell#include "mirror/string.h" 26641ce0371c2f0dc95d26be02d8366124c8b66653Brian Carlstrom#include "x86_lir.h" 27efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 28efc6369224b036a1fb77849f7ae65b3492c832c0buzbeenamespace art { 29efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 30089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_regs_arr_32[] = { 319ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rAX, rs_rCX, rs_rDX, rs_rBX, rs_rX86_SP_32, rs_rBP, rs_rSI, rs_rDI, 329ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 33089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_regs_arr_64[] = { 3476af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko rs_rAX, rs_rCX, rs_rDX, rs_rBX, rs_rX86_SP_32, rs_rBP, rs_rSI, rs_rDI, 35091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_r8, rs_r9, rs_r10, rs_r11, rs_r12, rs_r13, rs_r14, rs_r15 36efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 37089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_regs_arr_64q[] = { 380999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko rs_r0q, rs_r1q, rs_r2q, rs_r3q, rs_rX86_SP_64, rs_r5q, rs_r6q, rs_r7q, 
39a20468c004264592f309a548fc71ba62a69b8742Dmitry Petrochenko rs_r8q, rs_r9q, rs_r10q, rs_r11q, rs_r12q, rs_r13q, rs_r14q, rs_r15q 400999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko}; 41089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage sp_regs_arr_32[] = { 429ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, 439ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 44089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage sp_regs_arr_64[] = { 45091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, 46091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_fr8, rs_fr9, rs_fr10, rs_fr11, rs_fr12, rs_fr13, rs_fr14, rs_fr15 47efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 48089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage dp_regs_arr_32[] = { 499ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, 509ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 51089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage dp_regs_arr_64[] = { 52091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, 53091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_dr8, rs_dr9, rs_dr10, rs_dr11, rs_dr12, rs_dr13, rs_dr14, rs_dr15 54efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 55c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovstatic constexpr RegStorage xp_regs_arr_32[] = { 56c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_xr0, rs_xr1, rs_xr2, rs_xr3, rs_xr4, rs_xr5, rs_xr6, rs_xr7, 57c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov}; 58c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovstatic constexpr RegStorage xp_regs_arr_64[] = { 59c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 
rs_xr0, rs_xr1, rs_xr2, rs_xr3, rs_xr4, rs_xr5, rs_xr6, rs_xr7, 60c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_xr8, rs_xr9, rs_xr10, rs_xr11, rs_xr12, rs_xr13, rs_xr14, rs_xr15 61c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov}; 62089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage reserved_regs_arr_32[] = {rs_rX86_SP_32}; 6376af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenkostatic constexpr RegStorage reserved_regs_arr_64[] = {rs_rX86_SP_32}; 64089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage reserved_regs_arr_64q[] = {rs_rX86_SP_64}; 65089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_temps_arr_32[] = {rs_rAX, rs_rCX, rs_rDX, rs_rBX}; 66089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_temps_arr_64[] = { 679ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rAX, rs_rCX, rs_rDX, rs_rSI, rs_rDI, 689ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_r8, rs_r9, rs_r10, rs_r11 699ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 70c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 71c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// How to add register to be available for promotion: 72c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 1) Remove register from array defining temp 73c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 2) Update ClobberCallerSave 74c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 3) Update JNI compiler ABI: 75c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 3.1) add reg in JniCallingConvention method 76c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 3.2) update CoreSpillMask/FpSpillMask 77c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 4) Update entrypoints 78c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov// 4.1) Update constants in asm_support_x86_64.h for new frame size 
//    4.2) Remove entry in SmashCallerSaves
//    4.3) Update jni_entrypoints to spill/unspill new callee save reg
//    4.4) Update quick_entrypoints to spill/unspill new callee save reg
// 5) Update runtime ABI
//    5.1) Update quick_method_frame_info with new required spills
//    5.2) Update QuickArgumentVisitor with new offsets to gprs and xmms
// Note that you cannot use registers corresponding to incoming args
// according to the ABI, and QCG needs one additional XMM temp for
// bulk copy in preparation for a call.
88089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage core_temps_arr_64q[] = { 890999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko rs_r0q, rs_r1q, rs_r2q, rs_r6q, rs_r7q, 900999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko rs_r8q, rs_r9q, rs_r10q, rs_r11q 910999a6f7c83d10aa59b75f079f0d2fdbac982cf7Dmitry Petrochenko}; 92089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage sp_temps_arr_32[] = { 939ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, 949ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 95089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage sp_temps_arr_64[] = { 96091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, 97c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_fr8, rs_fr9, rs_fr10, rs_fr11 98091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee}; 99089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage dp_temps_arr_32[] = { 1009ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, 1019ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko}; 102089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage dp_temps_arr_64[] = { 103091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, 104c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_dr8, rs_dr9, rs_dr10, rs_dr11 105091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee}; 106091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee 107089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage xp_temps_arr_32[] = { 108fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell rs_xr0, rs_xr1, rs_xr2, rs_xr3, rs_xr4, rs_xr5, rs_xr6, rs_xr7, 
109fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell}; 110089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr RegStorage xp_temps_arr_64[] = { 111fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell rs_xr0, rs_xr1, rs_xr2, rs_xr3, rs_xr4, rs_xr5, rs_xr6, rs_xr7, 112c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov rs_xr8, rs_xr9, rs_xr10, rs_xr11 113fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell}; 114fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 115089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> empty_pool; 116089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_regs_32(core_regs_arr_32); 117089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_regs_64(core_regs_arr_64); 118089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_regs_64q(core_regs_arr_64q); 119089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> sp_regs_32(sp_regs_arr_32); 120089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> sp_regs_64(sp_regs_arr_64); 121089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> dp_regs_32(dp_regs_arr_32); 122089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> dp_regs_64(dp_regs_arr_64); 123c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovstatic constexpr ArrayRef<const RegStorage> xp_regs_32(xp_regs_arr_32); 124c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovstatic constexpr ArrayRef<const RegStorage> xp_regs_64(xp_regs_arr_64); 125089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> reserved_regs_32(reserved_regs_arr_32); 126089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr 
ArrayRef<const RegStorage> reserved_regs_64(reserved_regs_arr_64); 127089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> reserved_regs_64q(reserved_regs_arr_64q); 128089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_temps_32(core_temps_arr_32); 129089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_temps_64(core_temps_arr_64); 130089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> core_temps_64q(core_temps_arr_64q); 131089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> sp_temps_32(sp_temps_arr_32); 132089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> sp_temps_64(sp_temps_arr_64); 133089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> dp_temps_32(dp_temps_arr_32); 134089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> dp_temps_64(dp_temps_arr_64); 135089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Marko 136089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> xp_temps_32(xp_temps_arr_32); 137089142cf1d0c028b5a7c703baf0b97f4a4ada3f7Vladimir Markostatic constexpr ArrayRef<const RegStorage> xp_temps_64(xp_temps_arr_64); 138fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1399ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_SP; 1409ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 1419ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_ARG0; 1429ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_ARG1; 1439ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_ARG2; 1449ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry 
PetrochenkoX86NativeRegisterPool rX86_ARG3; 14558994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_ARG4; 14658994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_ARG5; 1479ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_FARG0; 1489ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_FARG1; 1499ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_FARG2; 1509ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_FARG3; 15158994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_FARG4; 15258994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_FARG5; 15358994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_FARG6; 15458994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoX86NativeRegisterPool rX86_FARG7; 1559ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_RET0; 1569ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_RET1; 1579ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_INVOKE_TGT; 1589ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoX86NativeRegisterPool rX86_COUNT; 1599ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 1609ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_ARG0; 1619ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_ARG1; 1629ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_ARG2; 1639ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_ARG3; 16458994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_ARG4; 16558994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_ARG5; 
1669ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_FARG0; 1679ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_FARG1; 1689ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_FARG2; 1699ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_FARG3; 17058994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_FARG4; 17158994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_FARG5; 17258994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_FARG6; 17358994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage rs_rX86_FARG7; 1749ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_RET0; 1759ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_RET1; 1769ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_INVOKE_TGT; 1779ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry PetrochenkoRegStorage rs_rX86_COUNT; 178efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 1792ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::LocCReturn() { 18000e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee return x86_loc_c_return; 181efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 182efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 183a0cd2d701f29e0bc6275f1b13c0edfd4ec391879buzbeeRegLocation X86Mir2Lir::LocCReturnRef() { 184a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu return cu_->target64 ? x86_64_loc_c_return_ref : x86_loc_c_return_ref; 185a0cd2d701f29e0bc6275f1b13c0edfd4ec391879buzbee} 186a0cd2d701f29e0bc6275f1b13c0edfd4ec391879buzbee 1872ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::LocCReturnWide() { 188dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina return cu_->target64 ? 
x86_64_loc_c_return_wide : x86_loc_c_return_wide; 189efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 190efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 1912ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::LocCReturnFloat() { 19200e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee return x86_loc_c_return_float; 193efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 194efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 1952ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::LocCReturnDouble() { 19600e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee return x86_loc_c_return_double; 197efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 198efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 199a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu// Return a target-dependent special register for 32-bit. 200a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying FuRegStorage X86Mir2Lir::TargetReg32(SpecialTargetRegister reg) { 201091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee RegStorage res_reg = RegStorage::InvalidReg(); 202efc6369224b036a1fb77849f7ae65b3492c832c0buzbee switch (reg) { 203091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kSelf: res_reg = RegStorage::InvalidReg(); break; 204091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kSuspend: res_reg = RegStorage::InvalidReg(); break; 205091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kLr: res_reg = RegStorage::InvalidReg(); break; 206091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kPc: res_reg = RegStorage::InvalidReg(); break; 207ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe case kSp: res_reg = rs_rX86_SP_32; break; // This must be the concrete one, as _SP is target- 208ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe // specific size. 
209091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kArg0: res_reg = rs_rX86_ARG0; break; 210091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kArg1: res_reg = rs_rX86_ARG1; break; 211091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kArg2: res_reg = rs_rX86_ARG2; break; 212091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kArg3: res_reg = rs_rX86_ARG3; break; 21358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kArg4: res_reg = rs_rX86_ARG4; break; 21458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kArg5: res_reg = rs_rX86_ARG5; break; 215091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kFArg0: res_reg = rs_rX86_FARG0; break; 216091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kFArg1: res_reg = rs_rX86_FARG1; break; 217091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kFArg2: res_reg = rs_rX86_FARG2; break; 218091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kFArg3: res_reg = rs_rX86_FARG3; break; 21958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kFArg4: res_reg = rs_rX86_FARG4; break; 22058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kFArg5: res_reg = rs_rX86_FARG5; break; 22158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kFArg6: res_reg = rs_rX86_FARG6; break; 22258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case kFArg7: res_reg = rs_rX86_FARG7; break; 223091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kRet0: res_reg = rs_rX86_RET0; break; 224091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kRet1: res_reg = rs_rX86_RET1; break; 225091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kInvokeTgt: res_reg = rs_rX86_INVOKE_TGT; break; 226091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kHiddenArg: res_reg = rs_rAX; break; 227dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina case kHiddenFpArg: DCHECK(!cu_->target64); res_reg = rs_fr0; break; 228091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee case kCount: res_reg = rs_rX86_COUNT; break; 
22958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko default: res_reg = RegStorage::InvalidReg(); 230091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee } 231091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee return res_reg; 232efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 233efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 234a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying FuRegStorage X86Mir2Lir::TargetReg(SpecialTargetRegister reg) { 235a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu LOG(FATAL) << "Do not use this function!!!"; 236a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu return RegStorage::InvalidReg(); 237a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu} 238a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu 239efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* 240efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Decode the register id. 241efc6369224b036a1fb77849f7ae65b3492c832c0buzbee */ 2428dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir MarkoResourceMask X86Mir2Lir::GetRegMaskCommon(const RegStorage& reg) const { 2438dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko /* Double registers in x86 are just a single FP register. This is always just a single bit. */ 2448dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko return ResourceMask::Bit( 2458dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko /* FP register starts at bit position 16 */ 2468dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ((reg.IsFloat() || reg.StorageSize() > 8) ? 
kX86FPReg0 : 0) + reg.GetRegNum()); 2478dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko} 2488dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko 2498dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir MarkoResourceMask X86Mir2Lir::GetPCUseDefEncoding() const { 2508dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko return kEncodeNone; 251efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 252efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 2538dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Markovoid X86Mir2Lir::SetupTargetResourceMasks(LIR* lir, uint64_t flags, 2548dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ResourceMask* use_mask, ResourceMask* def_mask) { 2556a58cb16d803c9a7b3a75ccac8be19dd9d4e520dDmitry Petrochenko DCHECK(cu_->instruction_set == kX86 || cu_->instruction_set == kX86_64); 256b48819db07f9a0992a72173380c24249d7fc648abuzbee DCHECK(!lir->flags.use_def_invalid); 257efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 258efc6369224b036a1fb77849f7ae65b3492c832c0buzbee // X86-specific resource map setup here. 
259efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_USE_SP) { 2608dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko use_mask->SetBit(kX86RegSP); 261efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 262efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 263efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_DEF_SP) { 2648dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko def_mask->SetBit(kX86RegSP); 265efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 266efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 267efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_DEFA) { 2688dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(def_mask, rs_rAX.GetReg()); 269efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 270efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 271efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_DEFD) { 2728dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(def_mask, rs_rDX.GetReg()); 273efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 274efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_USEA) { 2758dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rAX.GetReg()); 276efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 277efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 278efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_USEC) { 2798dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rCX.GetReg()); 280efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 281efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 282efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (flags & REG_USED) { 2838dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rDX.GetReg()); 284efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 28570b797d998f2a28e39f7d6ffc8a07c9cbc47da14Vladimir Marko 28670b797d998f2a28e39f7d6ffc8a07c9cbc47da14Vladimir Marko if (flags & REG_USEB) { 2878dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir 
Marko SetupRegMask(use_mask, rs_rBX.GetReg()); 28870b797d998f2a28e39f7d6ffc8a07c9cbc47da14Vladimir Marko } 2894028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 2904028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Fixup hard to describe instruction: Uses rAX, rCX, rDI; sets rDI. 2914028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (lir->opcode == kX86RepneScasw) { 2928dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rAX.GetReg()); 2938dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rCX.GetReg()); 2948dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(use_mask, rs_rDI.GetReg()); 2958dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko SetupRegMask(def_mask, rs_rDI.GetReg()); 2964028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 297e90501da0222717d75c126ebf89569db3976927eSerguei Katkov 298e90501da0222717d75c126ebf89569db3976927eSerguei Katkov if (flags & USE_FP_STACK) { 2998dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko use_mask->SetBit(kX86FPStack); 3008dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko def_mask->SetBit(kX86FPStack); 301e90501da0222717d75c126ebf89569db3976927eSerguei Katkov } 302efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 303efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 304efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* For dumping instructions */ 305efc6369224b036a1fb77849f7ae65b3492c832c0buzbeestatic const char* x86RegName[] = { 306efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", 307efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15" 308efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 309efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 310efc6369224b036a1fb77849f7ae65b3492c832c0buzbeestatic const char* x86CondName[] = { 311efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "O", 312efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NO", 
313efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "B/NAE/C", 314efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NB/AE/NC", 315efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "Z/EQ", 316efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NZ/NE", 317efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "BE/NA", 318efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NBE/A", 319efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "S", 320efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NS", 321efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "P/PE", 322efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NP/PO", 323efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "L/NGE", 324efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NL/GE", 325efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "LE/NG", 326efc6369224b036a1fb77849f7ae65b3492c832c0buzbee "NLE/G" 327efc6369224b036a1fb77849f7ae65b3492c832c0buzbee}; 328efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 329efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* 330efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * Interpret a format string and build a string no longer than size 331efc6369224b036a1fb77849f7ae65b3492c832c0buzbee * See format key in Assemble.cc. 
332efc6369224b036a1fb77849f7ae65b3492c832c0buzbee */ 3331fd3346740dfb7f47be9922312b68a4227fada96buzbeestd::string X86Mir2Lir::BuildInsnString(const char *fmt, LIR *lir, unsigned char* base_addr) { 334efc6369224b036a1fb77849f7ae65b3492c832c0buzbee std::string buf; 335efc6369224b036a1fb77849f7ae65b3492c832c0buzbee size_t i = 0; 336efc6369224b036a1fb77849f7ae65b3492c832c0buzbee size_t fmt_len = strlen(fmt); 337efc6369224b036a1fb77849f7ae65b3492c832c0buzbee while (i < fmt_len) { 338efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (fmt[i] != '!') { 339efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += fmt[i]; 340efc6369224b036a1fb77849f7ae65b3492c832c0buzbee i++; 341efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } else { 342efc6369224b036a1fb77849f7ae65b3492c832c0buzbee i++; 343efc6369224b036a1fb77849f7ae65b3492c832c0buzbee DCHECK_LT(i, fmt_len); 344efc6369224b036a1fb77849f7ae65b3492c832c0buzbee char operand_number_ch = fmt[i]; 345efc6369224b036a1fb77849f7ae65b3492c832c0buzbee i++; 346efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (operand_number_ch == '!') { 347efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += "!"; 348efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } else { 349efc6369224b036a1fb77849f7ae65b3492c832c0buzbee int operand_number = operand_number_ch - '0'; 350efc6369224b036a1fb77849f7ae65b3492c832c0buzbee DCHECK_LT(operand_number, 6); // Expect upto 6 LIR operands. 
351efc6369224b036a1fb77849f7ae65b3492c832c0buzbee DCHECK_LT(i, fmt_len); 352efc6369224b036a1fb77849f7ae65b3492c832c0buzbee int operand = lir->operands[operand_number]; 353efc6369224b036a1fb77849f7ae65b3492c832c0buzbee switch (fmt[i]) { 354efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 'c': 355efc6369224b036a1fb77849f7ae65b3492c832c0buzbee DCHECK_LT(static_cast<size_t>(operand), sizeof(x86CondName)); 356efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += x86CondName[operand]; 357efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 358efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 'd': 359efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += StringPrintf("%d", operand); 360efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 3615192cbb12856b12620dc346758605baaa1469cedYixin Shou case 'q': { 3625192cbb12856b12620dc346758605baaa1469cedYixin Shou int64_t value = static_cast<int64_t>(static_cast<int64_t>(operand) << 32 | 3635192cbb12856b12620dc346758605baaa1469cedYixin Shou static_cast<uint32_t>(lir->operands[operand_number+1])); 3645192cbb12856b12620dc346758605baaa1469cedYixin Shou buf +=StringPrintf("%" PRId64, value); 3655192cbb12856b12620dc346758605baaa1469cedYixin Shou } 366efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 'p': { 3670d82948094d9a198e01aa95f64012bdedd5b6fc9buzbee EmbeddedData *tab_rec = reinterpret_cast<EmbeddedData*>(UnwrapPointer(operand)); 368fa57c47f1b72916371a9c2d5c1389219bce655b4buzbee buf += StringPrintf("0x%08x", tab_rec->offset); 369efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 370efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 371efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 'r': 372091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee if (RegStorage::IsFloat(operand)) { 373091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee int fp_reg = RegStorage::RegNum(operand); 374efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += StringPrintf("xmm%d", fp_reg); 375efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } else { 
376091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee int reg_num = RegStorage::RegNum(operand); 377091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee DCHECK_LT(static_cast<size_t>(reg_num), sizeof(x86RegName)); 378091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee buf += x86RegName[reg_num]; 379efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 380efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 381efc6369224b036a1fb77849f7ae65b3492c832c0buzbee case 't': 382107c31e598b649a8bb8d959d6a0377937e63e624Ian Rogers buf += StringPrintf("0x%08" PRIxPTR " (L%p)", 383107c31e598b649a8bb8d959d6a0377937e63e624Ian Rogers reinterpret_cast<uintptr_t>(base_addr) + lir->offset + operand, 384107c31e598b649a8bb8d959d6a0377937e63e624Ian Rogers lir->target); 385efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 386efc6369224b036a1fb77849f7ae65b3492c832c0buzbee default: 387efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf += StringPrintf("DecodeError '%c'", fmt[i]); 388efc6369224b036a1fb77849f7ae65b3492c832c0buzbee break; 389efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 390efc6369224b036a1fb77849f7ae65b3492c832c0buzbee i++; 391efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 392efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 393efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 394efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return buf; 395efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 396efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 3978dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Markovoid X86Mir2Lir::DumpResourceMask(LIR *x86LIR, const ResourceMask& mask, const char *prefix) { 398efc6369224b036a1fb77849f7ae65b3492c832c0buzbee char buf[256]; 399efc6369224b036a1fb77849f7ae65b3492c832c0buzbee buf[0] = 0; 400efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 4018dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.Equals(kEncodeAll)) { 402efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcpy(buf, "all"); 403efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } else { 
404efc6369224b036a1fb77849f7ae65b3492c832c0buzbee char num[8]; 405efc6369224b036a1fb77849f7ae65b3492c832c0buzbee int i; 406efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 407efc6369224b036a1fb77849f7ae65b3492c832c0buzbee for (i = 0; i < kX86RegEnd; i++) { 4088dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(i)) { 409988e6ea9ac66edf1e205851df9bb53de3f3763f3Ian Rogers snprintf(num, arraysize(num), "%d ", i); 410efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, num); 411efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 412efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 413efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 4148dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(ResourceMask::kCCode)) { 415efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, "cc "); 416efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 417efc6369224b036a1fb77849f7ae65b3492c832c0buzbee /* Memory bits */ 4188dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (x86LIR && (mask.HasBit(ResourceMask::kDalvikReg))) { 419988e6ea9ac66edf1e205851df9bb53de3f3763f3Ian Rogers snprintf(buf + strlen(buf), arraysize(buf) - strlen(buf), "dr%d%s", 420988e6ea9ac66edf1e205851df9bb53de3f3763f3Ian Rogers DECODE_ALIAS_INFO_REG(x86LIR->flags.alias_info), 421988e6ea9ac66edf1e205851df9bb53de3f3763f3Ian Rogers (DECODE_ALIAS_INFO_WIDE(x86LIR->flags.alias_info)) ? 
"(+1)" : ""); 422efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 4238dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(ResourceMask::kLiteral)) { 424efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, "lit "); 425efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 426efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 4278dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(ResourceMask::kHeapRef)) { 428efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, "heap "); 429efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 4308dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (mask.HasBit(ResourceMask::kMustNotAlias)) { 431efc6369224b036a1fb77849f7ae65b3492c832c0buzbee strcat(buf, "noalias "); 432efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 433efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 434efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (buf[0]) { 435efc6369224b036a1fb77849f7ae65b3492c832c0buzbee LOG(INFO) << prefix << ": " << buf; 436efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 437efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 43802031b185b4653e6c72e21f7a51238b903f6d638buzbee 4391fd3346740dfb7f47be9922312b68a4227fada96buzbeevoid X86Mir2Lir::AdjustSpillMask() { 440efc6369224b036a1fb77849f7ae65b3492c832c0buzbee // Adjustment for LR spilling, x86 has no LR so nothing to do here 441091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee core_spill_mask_ |= (1 << rs_rRET.GetRegNum()); 4421fd3346740dfb7f47be9922312b68a4227fada96buzbee num_core_spills_++; 443efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 444efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 445e87f9b5185379c8cf8392d65a63e7bf7e51b97e7Mark MendellRegStorage X86Mir2Lir::AllocateByteRegister() { 4467e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu RegStorage reg = AllocTypedTemp(false, kCoreReg); 447dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) { 4487e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu DCHECK_LT(reg.GetRegNum(), 
rs_rX86_SP.GetRegNum()); 4497e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu } 4507e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu return reg; 4517e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu} 4527e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fu 45360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan BanerjiRegStorage X86Mir2Lir::Get128BitRegister(RegStorage reg) { 45460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return GetRegInfo(reg)->FindMatchingView(RegisterInfo::k128SoloStorageMask)->GetReg(); 45560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 45660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 4577e399fd3a99ba9c9dbfafdf14f75dd318fa7d454Chao-ying Fubool X86Mir2Lir::IsByteRegister(RegStorage reg) { 458dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina return cu_->target64 || reg.GetRegNum() < rs_rX86_SP.GetRegNum(); 459e87f9b5185379c8cf8392d65a63e7bf7e51b97e7Mark Mendell} 460e87f9b5185379c8cf8392d65a63e7bf7e51b97e7Mark Mendell 461efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* Clobber all regs that might be used by an external C call */ 46231c2aac7137b69d5622eea09597500731fbee2efVladimir Markovoid X86Mir2Lir::ClobberCallerSave() { 463dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 464c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rAX); 465c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rCX); 466c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rDX); 467c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rSI); 468c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rDI); 469c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 47035ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_r8); 47135ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_r9); 47235ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_r10); 47335ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_r11); 
47435ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu 47535ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_fr8); 47635ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_fr9); 47735ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_fr10); 47835ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu Clobber(rs_fr11); 479c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } else { 480c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rAX); 481c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rCX); 482c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rDX); 483c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_rBX); 48435ec2b5faf9a2dbc3c0cddb7ebc09952b8a27d2aChao-ying Fu } 485c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 486c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr0); 487c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr1); 488c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr2); 489c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr3); 490c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr4); 491c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr5); 492c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr6); 493c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov Clobber(rs_fr7); 494efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 495efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 4961fd3346740dfb7f47be9922312b68a4227fada96buzbeeRegLocation X86Mir2Lir::GetReturnWideAlt() { 49752a77fc135f0e0df57ee24641c3f5ae415ff7bd6buzbee RegLocation res = LocCReturnWide(); 498091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee DCHECK(res.reg.GetLowReg() == rs_rAX.GetReg()); 499091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee DCHECK(res.reg.GetHighReg() == rs_rDX.GetReg()); 500091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee Clobber(rs_rAX); 
501091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee Clobber(rs_rDX); 502091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee MarkInUse(rs_rAX); 503091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee MarkInUse(rs_rDX); 504091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee MarkWide(res.reg); 505efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return res; 506efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 507efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 5082ce745c06271d5223d57dbf08117b20d5b60694aBrian CarlstromRegLocation X86Mir2Lir::GetReturnAlt() { 50952a77fc135f0e0df57ee24641c3f5ae415ff7bd6buzbee RegLocation res = LocCReturn(); 510091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee res.reg.SetReg(rs_rDX.GetReg()); 511091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee Clobber(rs_rDX); 512091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee MarkInUse(rs_rDX); 513efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return res; 514efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 515efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 516efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* To be used when explicitly managing register use */ 5172ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromvoid X86Mir2Lir::LockCallTemps() { 518091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee LockTemp(rs_rX86_ARG0); 519091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee LockTemp(rs_rX86_ARG1); 520091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee LockTemp(rs_rX86_ARG2); 521091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee LockTemp(rs_rX86_ARG3); 522dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 52358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_ARG4); 52458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_ARG5); 52558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG0); 52658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG1); 52758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 
LockTemp(rs_rX86_FARG2); 52858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG3); 52958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG4); 53058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG5); 53158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG6); 53258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LockTemp(rs_rX86_FARG7); 53358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 534efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 535efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 536efc6369224b036a1fb77849f7ae65b3492c832c0buzbee/* To be used when explicitly managing register use */ 5372ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromvoid X86Mir2Lir::FreeCallTemps() { 538091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee FreeTemp(rs_rX86_ARG0); 539091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee FreeTemp(rs_rX86_ARG1); 540091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee FreeTemp(rs_rX86_ARG2); 541091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee FreeTemp(rs_rX86_ARG3); 542dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 54358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_ARG4); 54458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_ARG5); 54558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG0); 54658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG1); 54758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG2); 54858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG3); 54958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG4); 55058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG5); 55158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG6); 
55258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(rs_rX86_FARG7); 55358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 554efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 555efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 55699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusorubool X86Mir2Lir::ProvidesFullMemoryBarrier(X86OpCode opcode) { 55799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru switch (opcode) { 55899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru case kX86LockCmpxchgMR: 55999ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru case kX86LockCmpxchgAR: 5600f9b9c508814a62c6e21c6a06cfe4de39b5036c0Ian Rogers case kX86LockCmpxchg64M: 5610f9b9c508814a62c6e21c6a06cfe4de39b5036c0Ian Rogers case kX86LockCmpxchg64A: 56299ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru case kX86XchgMR: 56399ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru case kX86Mfence: 56499ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Atomic memory instructions provide full barrier. 56599ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru return true; 56699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru default: 56799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru break; 56899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 56999ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 57099ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Conservative if cannot prove it provides full barrier. 
57199ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru return false; 57299ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru} 57399ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 574b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampebool X86Mir2Lir::GenMemBarrier(MemBarrierKind barrier_kind) { 575efc6369224b036a1fb77849f7ae65b3492c832c0buzbee#if ANDROID_SMP != 0 57699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Start off with using the last LIR as the barrier. If it is not enough, then we will update it. 57799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru LIR* mem_barrier = last_lir_insn_; 57899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 579b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe bool ret = false; 58099ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru /* 58148f5c47907654350ce30a8dfdda0e977f5d3d39fHans Boehm * According to the JSR-133 Cookbook, for x86 only StoreLoad/AnyAny barriers need memory fence. 58248f5c47907654350ce30a8dfdda0e977f5d3d39fHans Boehm * All other barriers (LoadAny, AnyStore, StoreStore) are nops due to the x86 memory model. 58348f5c47907654350ce30a8dfdda0e977f5d3d39fHans Boehm * For those cases, all we need to ensure is that there is a scheduling barrier in place. 58499ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru */ 58548f5c47907654350ce30a8dfdda0e977f5d3d39fHans Boehm if (barrier_kind == kAnyAny) { 58699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // If no LIR exists already that can be used a barrier, then generate an mfence. 
58799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru if (mem_barrier == nullptr) { 58899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru mem_barrier = NewLIR0(kX86Mfence); 589b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe ret = true; 59099ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 59199ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 59299ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // If last instruction does not provide full barrier, then insert an mfence. 59399ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru if (ProvidesFullMemoryBarrier(static_cast<X86OpCode>(mem_barrier->opcode)) == false) { 59499ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru mem_barrier = NewLIR0(kX86Mfence); 595b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe ret = true; 59699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 59799ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 59899ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru 59999ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Now ensure that a scheduling barrier is in place. 60099ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru if (mem_barrier == nullptr) { 60199ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru GenBarrier(); 60299ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } else { 60399ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru // Mark as a scheduling barrier. 
60499ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru DCHECK(!mem_barrier->flags.use_def_invalid); 6058dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko mem_barrier->u.m.def_mask = &kEncodeAll; 60699ad7230ccaace93bf323dea9790f35fe991a4a2Razvan A Lupusoru } 607b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe return ret; 608b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe#else 609b14329f90f725af0f67c45dfcb94933a426d63ceAndreas Gampe return false; 610efc6369224b036a1fb77849f7ae65b3492c832c0buzbee#endif 611efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 61200e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee 6131fd3346740dfb7f47be9922312b68a4227fada96buzbeevoid X86Mir2Lir::CompilerInitializeRegAlloc() { 614dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 61576af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko reg_pool_ = new (arena_) RegisterPool(this, arena_, core_regs_64, core_regs_64q, sp_regs_64, 61676af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko dp_regs_64, reserved_regs_64, reserved_regs_64q, 61776af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko core_temps_64, core_temps_64q, sp_temps_64, dp_temps_64); 6189ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko } else { 619b01bf15d18f9b08d77e7a3c6e2897af0e02bf8cabuzbee reg_pool_ = new (arena_) RegisterPool(this, arena_, core_regs_32, empty_pool, sp_regs_32, 620b01bf15d18f9b08d77e7a3c6e2897af0e02bf8cabuzbee dp_regs_32, reserved_regs_32, empty_pool, 621b01bf15d18f9b08d77e7a3c6e2897af0e02bf8cabuzbee core_temps_32, empty_pool, sp_temps_32, dp_temps_32); 6229ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko } 623091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee 624091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // Target-specific adjustments. 625091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee 626fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Add in XMM registers. 
627c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov const ArrayRef<const RegStorage> *xp_regs = cu_->target64 ? &xp_regs_64 : &xp_regs_32; 628c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov for (RegStorage reg : *xp_regs) { 629fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell RegisterInfo* info = new (arena_) RegisterInfo(reg, GetRegMaskCommon(reg)); 630fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell reginfo_map_.Put(reg.GetReg(), info); 631c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 632c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov const ArrayRef<const RegStorage> *xp_temps = cu_->target64 ? &xp_temps_64 : &xp_temps_32; 633c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov for (RegStorage reg : *xp_temps) { 634c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov RegisterInfo* xp_reg_info = GetRegInfo(reg); 635c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov xp_reg_info->SetIsTemp(true); 636fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 637fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 638091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // Alias single precision xmm to double xmms. 639091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // TODO: as needed, add larger vector sizes - alias all to the largest. 640091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee GrowableArray<RegisterInfo*>::Iterator it(®_pool_->sp_regs_); 641091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee for (RegisterInfo* info = it.Next(); info != nullptr; info = it.Next()) { 642091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee int sp_reg_num = info->GetReg().GetRegNum(); 643fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell RegStorage xp_reg = RegStorage::Solo128(sp_reg_num); 644fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell RegisterInfo* xp_reg_info = GetRegInfo(xp_reg); 645fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // 128-bit xmm vector register's master storage should refer to itself. 
646fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell DCHECK_EQ(xp_reg_info, xp_reg_info->Master()); 647fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 648fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Redirect 32-bit vector's master storage to 128-bit vector. 649fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell info->SetMaster(xp_reg_info); 650fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 65176af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko RegStorage dp_reg = RegStorage::FloatSolo64(sp_reg_num); 652091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee RegisterInfo* dp_reg_info = GetRegInfo(dp_reg); 653fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Redirect 64-bit vector's master storage to 128-bit vector. 654fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell dp_reg_info->SetMaster(xp_reg_info); 65576af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // Singles should show a single 32-bit mask bit, at first referring to the low half. 65676af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko DCHECK_EQ(info->StorageMask(), 0x1U); 65776af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko } 65876af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko 659dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 66076af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // Alias 32bit W registers to corresponding 64bit X registers. 
66176af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko GrowableArray<RegisterInfo*>::Iterator w_it(®_pool_->core_regs_); 66276af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko for (RegisterInfo* info = w_it.Next(); info != nullptr; info = w_it.Next()) { 66376af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko int x_reg_num = info->GetReg().GetRegNum(); 66476af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko RegStorage x_reg = RegStorage::Solo64(x_reg_num); 66576af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko RegisterInfo* x_reg_info = GetRegInfo(x_reg); 66676af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // 64bit X register's master storage should refer to itself. 66776af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko DCHECK_EQ(x_reg_info, x_reg_info->Master()); 66876af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // Redirect 32bit W master storage to 64bit X. 66976af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko info->SetMaster(x_reg_info); 67076af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko // 32bit W should show a single 32-bit mask bit, at first referring to the low half. 67176af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko DCHECK_EQ(info->StorageMask(), 0x1U); 67276af0d307194045ece429dbaf62e93d3e08c6c20Dmitry Petrochenko } 673efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 674091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee 675091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // Don't start allocating temps at r0/s0/d0 or you may clobber return regs in early-exit methods. 676091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee // TODO: adjust for x86/hard float calling convention. 
677091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee reg_pool_->next_core_reg_ = 2; 678091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee reg_pool_->next_sp_reg_ = 2; 679091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee reg_pool_->next_dp_reg_ = 1; 680efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 681efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 68260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjiint X86Mir2Lir::VectorRegisterSize() { 68360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return 128; 68460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 68560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 68660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjiint X86Mir2Lir::NumReservableVectorRegisters(bool fp_used) { 68760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return fp_used ? 5 : 7; 68860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 68960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 6901fd3346740dfb7f47be9922312b68a4227fada96buzbeevoid X86Mir2Lir::SpillCoreRegs() { 6911fd3346740dfb7f47be9922312b68a4227fada96buzbee if (num_core_spills_ == 0) { 692efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return; 693efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 694efc6369224b036a1fb77849f7ae65b3492c832c0buzbee // Spill mask not including fake return address register 695091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee uint32_t mask = core_spill_mask_ & ~(1 << rs_rRET.GetRegNum()); 6969ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko int offset = frame_size_ - (GetInstructionSetPointerSize(cu_->instruction_set) * num_core_spills_); 697c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov OpSize size = cu_->target64 ? k64 : k32; 698efc6369224b036a1fb77849f7ae65b3492c832c0buzbee for (int reg = 0; mask; mask >>= 1, reg++) { 699efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (mask & 0x1) { 700c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov StoreBaseDisp(rs_rX86_SP, offset, cu_->target64 ? 
RegStorage::Solo64(reg) : RegStorage::Solo32(reg), 701c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov size, kNotVolatile); 7029ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko offset += GetInstructionSetPointerSize(cu_->instruction_set); 703efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 704efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 705efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 706efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 7071fd3346740dfb7f47be9922312b68a4227fada96buzbeevoid X86Mir2Lir::UnSpillCoreRegs() { 7081fd3346740dfb7f47be9922312b68a4227fada96buzbee if (num_core_spills_ == 0) { 709efc6369224b036a1fb77849f7ae65b3492c832c0buzbee return; 710efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 711efc6369224b036a1fb77849f7ae65b3492c832c0buzbee // Spill mask not including fake return address register 712091cc408e9dc87e60fb64c61e186bea568fc3d3abuzbee uint32_t mask = core_spill_mask_ & ~(1 << rs_rRET.GetRegNum()); 7139ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko int offset = frame_size_ - (GetInstructionSetPointerSize(cu_->instruction_set) * num_core_spills_); 714c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov OpSize size = cu_->target64 ? k64 : k32; 715efc6369224b036a1fb77849f7ae65b3492c832c0buzbee for (int reg = 0; mask; mask >>= 1, reg++) { 716efc6369224b036a1fb77849f7ae65b3492c832c0buzbee if (mask & 0x1) { 717c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov LoadBaseDisp(rs_rX86_SP, offset, cu_->target64 ? 
RegStorage::Solo64(reg) : RegStorage::Solo32(reg), 718c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov size, kNotVolatile); 7199ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko offset += GetInstructionSetPointerSize(cu_->instruction_set); 720efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 721efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 722efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 723efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 724c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovvoid X86Mir2Lir::SpillFPRegs() { 725c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov if (num_fp_spills_ == 0) { 726c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov return; 727c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 728c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov uint32_t mask = fp_spill_mask_; 729c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov int offset = frame_size_ - (GetInstructionSetPointerSize(cu_->instruction_set) * (num_fp_spills_ + num_core_spills_)); 730c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov for (int reg = 0; mask; mask >>= 1, reg++) { 731c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov if (mask & 0x1) { 732c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov StoreBaseDisp(rs_rX86_SP, offset, RegStorage::FloatSolo64(reg), 733c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov k64, kNotVolatile); 734c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov offset += sizeof(double); 735c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 736c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 737c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov} 738c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkovvoid X86Mir2Lir::UnSpillFPRegs() { 739c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov if (num_fp_spills_ == 0) { 740c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov return; 741c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 
742c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov uint32_t mask = fp_spill_mask_; 743c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov int offset = frame_size_ - (GetInstructionSetPointerSize(cu_->instruction_set) * (num_fp_spills_ + num_core_spills_)); 744c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov for (int reg = 0; mask; mask >>= 1, reg++) { 745c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov if (mask & 0x1) { 746c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov LoadBaseDisp(rs_rX86_SP, offset, RegStorage::FloatSolo64(reg), 747c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov k64, kNotVolatile); 748c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov offset += sizeof(double); 749c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 750c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov } 751c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov} 752c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 753c380191f3048db2a3796d65db8e5d5a5e7b08c65Serguei Katkov 7542ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstrombool X86Mir2Lir::IsUnconditionalBranch(LIR* lir) { 755cbd6d44c0a94f3d26671b5325aa21bbf1335ffe8buzbee return (lir->opcode == kX86Jmp8 || lir->opcode == kX86Jmp32); 756efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 757efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 758674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir MarkoRegisterClass X86Mir2Lir::RegClassForFieldLoadStore(OpSize size, bool is_volatile) { 759e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu // X86_64 can handle any size. 
760dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 761e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu if (size == kReference) { 762e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu return kRefReg; 763e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu } 764e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu return kCoreReg; 765e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu } 766e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu 767674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko if (UNLIKELY(is_volatile)) { 768674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko // On x86, atomic 64-bit load/store requires an fp register. 769674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko // Smaller aligned load/store is atomic for both core and fp registers. 770674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko if (size == k64 || size == kDouble) { 771674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko return kFPReg; 772674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko } 773674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko } 774674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko return RegClassBySize(size); 775674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko} 776674744e635ddbdfb311fbd25b5a27356560d30c3Vladimir Marko 777dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena SayapinaX86Mir2Lir::X86Mir2Lir(CompilationUnit* cu, MIRGraph* mir_graph, ArenaAllocator* arena) 77855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell : Mir2Lir(cu, mir_graph, arena), 779dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers base_of_code_(nullptr), store_method_addr_(false), store_method_addr_used_(false), 78055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell method_address_insns_(arena, 100, kGrowableArrayMisc), 78155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell class_type_address_insns_(arena, 100, kGrowableArrayMisc), 782ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell call_method_insns_(arena, 100, 
kGrowableArrayMisc), 783dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina stack_decrement_(nullptr), stack_increment_(nullptr), 784d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell const_vectors_(nullptr) { 785d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell store_method_addr_used_ = false; 786dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers if (kIsDebugBuild) { 787dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers for (int i = 0; i < kX86Last; i++) { 788dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers if (X86Mir2Lir::EncodingMap[i].opcode != i) { 789dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers LOG(FATAL) << "Encoding order for " << X86Mir2Lir::EncodingMap[i].name 790d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell << " is wrong: expecting " << i << ", seeing " 791d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell << static_cast<int>(X86Mir2Lir::EncodingMap[i].opcode); 792dd7624d2b9e599d57762d12031b10b89defc9807Ian Rogers } 793efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 794efc6369224b036a1fb77849f7ae65b3492c832c0buzbee } 795dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (cu_->target64) { 7969ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_SP = rs_rX86_SP_64; 7979ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 7989ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG0 = rs_rDI; 7999ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG1 = rs_rSI; 8009ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG2 = rs_rDX; 8019ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG3 = rs_rCX; 80258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_ARG4 = rs_r8; 80358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_ARG5 = rs_r9; 80458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG0 = rs_fr0; 80558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG1 = rs_fr1; 
80658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG2 = rs_fr2; 80758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG3 = rs_fr3; 80858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG4 = rs_fr4; 80958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG5 = rs_fr5; 81058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG6 = rs_fr6; 81158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG7 = rs_fr7; 8129ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG0 = rDI; 8139ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG1 = rSI; 8149ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG2 = rDX; 8159ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG3 = rCX; 81658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_ARG4 = r8; 81758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_ARG5 = r9; 81858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG0 = fr0; 81958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG1 = fr1; 82058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG2 = fr2; 82158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG3 = fr3; 82258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG4 = fr4; 82358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG5 = fr5; 82458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG6 = fr6; 82558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG7 = fr7; 82655884bc1e2e1b324809b462455ccaf5811ffafd8Mark Mendell rs_rX86_INVOKE_TGT = rs_rDI; 8279ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko } else { 8289ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_SP = rs_rX86_SP_32; 8299ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 8309ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko 
rs_rX86_ARG0 = rs_rAX; 8319ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG1 = rs_rCX; 8329ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG2 = rs_rDX; 8339ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_ARG3 = rs_rBX; 83458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_ARG4 = RegStorage::InvalidReg(); 83558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_ARG5 = RegStorage::InvalidReg(); 83658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG0 = rs_rAX; 83758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG1 = rs_rCX; 83858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG2 = rs_rDX; 83958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG3 = rs_rBX; 84058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG4 = RegStorage::InvalidReg(); 84158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG5 = RegStorage::InvalidReg(); 84258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG6 = RegStorage::InvalidReg(); 84358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rs_rX86_FARG7 = RegStorage::InvalidReg(); 8449ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG0 = rAX; 8459ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG1 = rCX; 8469ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG2 = rDX; 8479ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_ARG3 = rBX; 84858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG0 = rAX; 84958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG1 = rCX; 85058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG2 = rDX; 85158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rX86_FARG3 = rBX; 85255884bc1e2e1b324809b462455ccaf5811ffafd8Mark Mendell rs_rX86_INVOKE_TGT = rs_rAX; 
85358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // TODO(64): Initialize with invalid reg 85458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko// rX86_ARG4 = RegStorage::InvalidReg(); 85558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko// rX86_ARG5 = RegStorage::InvalidReg(); 8569ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko } 8579ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_RET0 = rs_rAX; 8589ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_RET1 = rs_rDX; 8599ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rs_rX86_COUNT = rs_rCX; 8609ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_RET0 = rAX; 8619ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_RET1 = rDX; 8629ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_INVOKE_TGT = rAX; 8639ee801f5308aa3c62ae3bedae2658612762ffb91Dmitry Petrochenko rX86_COUNT = rCX; 86460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 86560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Initialize the number of reserved vector registers 86660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji num_reserved_vector_regs_ = -1; 8671fd3346740dfb7f47be9922312b68a4227fada96buzbee} 8681fd3346740dfb7f47be9922312b68a4227fada96buzbee 869862a76027076c341c26aa6cd4a30a7cdd6dc2143buzbeeMir2Lir* X86CodeGenerator(CompilationUnit* const cu, MIRGraph* const mir_graph, 870862a76027076c341c26aa6cd4a30a7cdd6dc2143buzbee ArenaAllocator* const arena) { 871dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina return new X86Mir2Lir(cu, mir_graph, arena); 872efc6369224b036a1fb77849f7ae65b3492c832c0buzbee} 873efc6369224b036a1fb77849f7ae65b3492c832c0buzbee 874984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe// Not used in x86(-64) 875984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas GampeRegStorage X86Mir2Lir::LoadHelper(QuickEntrypointEnum trampoline) { 8762f244e9faccfcca68af3c5484c397a01a1c3a342Andreas Gampe LOG(FATAL) << 
"Unexpected use of LoadHelper in x86"; 8772f244e9faccfcca68af3c5484c397a01a1c3a342Andreas Gampe return RegStorage::InvalidReg(); 8782f244e9faccfcca68af3c5484c397a01a1c3a342Andreas Gampe} 8792f244e9faccfcca68af3c5484c397a01a1c3a342Andreas Gampe 880b373e091eac39b1a79c11f2dcbd610af01e9e8a9Dave AllisonLIR* X86Mir2Lir::CheckSuspendUsingLoad() { 88169dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison // First load the pointer in fs:[suspend-trigger] into eax 88269dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison // Then use a test instruction to indirect via that address. 88369dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison NewLIR2(kX86Mov32RT, rs_rAX.GetReg(), cu_->target64 ? 88469dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison Thread::ThreadSuspendTriggerOffset<8>().Int32Value() : 88569dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison Thread::ThreadSuspendTriggerOffset<4>().Int32Value()); 88669dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison return NewLIR3(kX86Test32RM, rs_rAX.GetReg(), rs_rAX.GetReg(), 0); 887b373e091eac39b1a79c11f2dcbd610af01e9e8a9Dave Allison} 888b373e091eac39b1a79c11f2dcbd610af01e9e8a9Dave Allison 8892ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromuint64_t X86Mir2Lir::GetTargetInstFlags(int opcode) { 890409fe94ad529d9334587be80b9f6a3d166805508buzbee DCHECK(!IsPseudoLirOp(opcode)); 8911fd3346740dfb7f47be9922312b68a4227fada96buzbee return X86Mir2Lir::EncodingMap[opcode].flags; 8921bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee} 8931bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee 8942ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromconst char* X86Mir2Lir::GetTargetInstName(int opcode) { 895409fe94ad529d9334587be80b9f6a3d166805508buzbee DCHECK(!IsPseudoLirOp(opcode)); 8961fd3346740dfb7f47be9922312b68a4227fada96buzbee return X86Mir2Lir::EncodingMap[opcode].name; 8971bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee} 8981bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee 8992ce745c06271d5223d57dbf08117b20d5b60694aBrian Carlstromconst char* 
X86Mir2Lir::GetTargetInstFmt(int opcode) { 900409fe94ad529d9334587be80b9f6a3d166805508buzbee DCHECK(!IsPseudoLirOp(opcode)); 9011fd3346740dfb7f47be9922312b68a4227fada96buzbee return X86Mir2Lir::EncodingMap[opcode].fmt; 9021bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee} 9031bc37c60da71c923ea9a2e99d31ba1b3d76d79a8buzbee 904d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbeevoid X86Mir2Lir::GenConstWide(RegLocation rl_dest, int64_t value) { 905d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee // Can we do this directly to memory? 906d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee rl_dest = UpdateLocWide(rl_dest); 907d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee if ((rl_dest.location == kLocDalvikFrame) || 908d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee (rl_dest.location == kLocCompilerTemp)) { 909d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee int32_t val_lo = Low32Bits(value); 910d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee int32_t val_hi = High32Bits(value); 911a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu int r_base = rs_rX86_SP.GetReg(); 912d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee int displacement = SRegOffset(rl_dest.s_reg_low); 913d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee 9148dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 9152700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LIR * store = NewLIR3(kX86Mov32MI, r_base, displacement + LOWORD_OFFSET, val_lo); 916d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee AnnotateDalvikRegAccess(store, (displacement + LOWORD_OFFSET) >> 2, 917d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee false /* is_load */, true /* is64bit */); 9182700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee store = NewLIR3(kX86Mov32MI, r_base, displacement + HIWORD_OFFSET, val_hi); 919d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee AnnotateDalvikRegAccess(store, (displacement + HIWORD_OFFSET) >> 2, 
920d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee false /* is_load */, true /* is64bit */); 921d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee return; 922d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee } 923d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee 924d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee // Just use the standard code to do the generation. 925d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee Mir2Lir::GenConstWide(rl_dest, value); 926d61ba4ba6fcde666adb5d5c81b1c32f0534fb2c8Bill Buzbee} 927e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell 928e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell// TODO: Merge with existing RegLocation dumper in vreg_analysis.cc 929e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendellvoid X86Mir2Lir::DumpRegLocation(RegLocation loc) { 930e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell LOG(INFO) << "location: " << loc.location << ',' 931e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.wide ? " w" : " ") 932e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.defined ? " D" : " ") 933e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.is_const ? " c" : " ") 934e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.fp ? " F" : " ") 935e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.core ? " C" : " ") 936e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.ref ? " r" : " ") 937e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.high_word ? " h" : " ") 938e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << (loc.home ? 
" H" : " ") 9392700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee << ", low: " << static_cast<int>(loc.reg.GetLowReg()) 94000e1ec6581b5b7b46ca4c314c2854e9caa647dd2Bill Buzbee << ", high: " << static_cast<int>(loc.reg.GetHighReg()) 941e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << ", s_reg: " << loc.s_reg_low 942e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell << ", orig: " << loc.orig_sreg; 943e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell} 944e02d48fb24747f90fd893e1c3572bb3c500afcedMark Mendell 94567c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendellvoid X86Mir2Lir::Materialize() { 94667c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell // A good place to put the analysis before starting. 94767c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell AnalyzeMIR(); 94867c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell 94967c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell // Now continue with regular code generation. 95067c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell Mir2Lir::Materialize(); 95167c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell} 95267c39c4aefca23cb136157b889c09ee200b3dec6Mark Mendell 95349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Haovoid X86Mir2Lir::LoadMethodAddress(const MethodReference& target_method, InvokeType type, 95455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell SpecialTargetRegister symbolic_reg) { 95555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell /* 95655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * For x86, just generate a 32 bit move immediate instruction, that will be filled 95755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * in at 'link time'. For now, put a unique value based on target to ensure that 95855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * code deduplication works. 
95955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell */ 96049161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao int target_method_idx = target_method.dex_method_index; 96149161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile* target_dex_file = target_method.dex_file; 96249161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile::MethodId& target_method_id = target_dex_file->GetMethodId(target_method_idx); 96349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uintptr_t target_method_id_ptr = reinterpret_cast<uintptr_t>(&target_method_id); 96455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 96549161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao // Generate the move instruction with the unique pointer and save index, dex_file, and type. 966ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe LIR *move = RawLIR(current_dalvik_offset_, kX86Mov32RI, 967ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe TargetReg(symbolic_reg, kNotWide).GetReg(), 96849161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao static_cast<int>(target_method_id_ptr), target_method_idx, 96949161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao WrapPointer(const_cast<DexFile*>(target_dex_file)), type); 97055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell AppendLIR(move); 97155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell method_address_insns_.Insert(move); 97255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell} 97355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 97455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendellvoid X86Mir2Lir::LoadClassType(uint32_t type_idx, SpecialTargetRegister symbolic_reg) { 97555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell /* 97655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * For x86, just generate a 32 bit move immediate instruction, that will be filled 97755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * in at 'link time'. 
For now, put a unique value based on target to ensure that 97855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * code deduplication works. 97955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell */ 98055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell const DexFile::TypeId& id = cu_->dex_file->GetTypeId(type_idx); 98155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell uintptr_t ptr = reinterpret_cast<uintptr_t>(&id); 98255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 98355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // Generate the move instruction with the unique pointer and save index and type. 984ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe LIR *move = RawLIR(current_dalvik_offset_, kX86Mov32RI, 985ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe TargetReg(symbolic_reg, kNotWide).GetReg(), 98655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell static_cast<int>(ptr), type_idx); 98755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell AppendLIR(move); 98855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell class_type_address_insns_.Insert(move); 98955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell} 99055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 99149161cef10a308aedada18e9aa742498d6e6c8c7Jeff HaoLIR *X86Mir2Lir::CallWithLinkerFixup(const MethodReference& target_method, InvokeType type) { 99255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell /* 99355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * For x86, just generate a 32 bit call relative instruction, that will be filled 99455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * in at 'link time'. For now, put a unique value based on target to ensure that 99555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell * code deduplication works. 
99655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell */ 99749161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao int target_method_idx = target_method.dex_method_index; 99849161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile* target_dex_file = target_method.dex_file; 99949161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile::MethodId& target_method_id = target_dex_file->GetMethodId(target_method_idx); 100049161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uintptr_t target_method_id_ptr = reinterpret_cast<uintptr_t>(&target_method_id); 100149161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao 100249161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao // Generate the call instruction with the unique pointer and save index, dex_file, and type. 100349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao LIR *call = RawLIR(current_dalvik_offset_, kX86CallI, static_cast<int>(target_method_id_ptr), 100449161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao target_method_idx, WrapPointer(const_cast<DexFile*>(target_dex_file)), type); 100555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell AppendLIR(call); 100655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell call_method_insns_.Insert(call); 100755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell return call; 100855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell} 100955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 1010d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell/* 1011d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell * @brief Enter a 32 bit quantity into a buffer 1012d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell * @param buf buffer. 1013d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell * @param data Data value. 
1014d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell */ 1015d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1016d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendellstatic void PushWord(std::vector<uint8_t>&buf, int32_t data) { 1017d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell buf.push_back(data & 0xff); 1018d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell buf.push_back((data >> 8) & 0xff); 1019d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell buf.push_back((data >> 16) & 0xff); 1020d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell buf.push_back((data >> 24) & 0xff); 1021d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 1022d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 102355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendellvoid X86Mir2Lir::InstallLiteralPools() { 102455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // These are handled differently for x86. 102555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK(code_literal_list_ == nullptr); 102655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK(method_literal_list_ == nullptr); 102755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK(class_literal_list_ == nullptr); 102855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 1029d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Align to 16 byte boundary. We have implicit knowledge that the start of the method is 1030d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // on a 4 byte boundary. How can I check this if it changes (other than aligned loads 1031d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // will fail at runtime)? 
1032d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (const_vectors_ != nullptr) { 1033d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell int align_size = (16-4) - (code_buffer_.size() & 0xF); 1034d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (align_size < 0) { 1035d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell align_size += 16; 1036d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1037d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1038d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell while (align_size > 0) { 1039d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell code_buffer_.push_back(0); 1040d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell align_size--; 1041d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1042d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell for (LIR *p = const_vectors_; p != nullptr; p = p->next) { 1043d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell PushWord(code_buffer_, p->operands[0]); 1044d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell PushWord(code_buffer_, p->operands[1]); 1045d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell PushWord(code_buffer_, p->operands[2]); 1046d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell PushWord(code_buffer_, p->operands[3]); 1047d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1048d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1049d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 105055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // Handle the fixups for methods. 
105155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell for (uint32_t i = 0; i < method_address_insns_.Size(); i++) { 105255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell LIR* p = method_address_insns_.Get(i); 105355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK_EQ(p->opcode, kX86Mov32RI); 105449161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uint32_t target_method_idx = p->operands[2]; 105549161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile* target_dex_file = 105649161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao reinterpret_cast<const DexFile*>(UnwrapPointer(p->operands[3])); 105755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 105855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // The offset to patch is the last 4 bytes of the instruction. 105955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell int patch_offset = p->offset + p->flags.size - 4; 106055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell cu_->compiler_driver->AddMethodPatch(cu_->dex_file, cu_->class_def_idx, 106155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell cu_->method_idx, cu_->invoke_type, 106249161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao target_method_idx, target_dex_file, 106349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao static_cast<InvokeType>(p->operands[4]), 106455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell patch_offset); 106555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell } 106655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 106755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // Handle the fixups for class types. 
106855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell for (uint32_t i = 0; i < class_type_address_insns_.Size(); i++) { 106955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell LIR* p = class_type_address_insns_.Get(i); 107055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK_EQ(p->opcode, kX86Mov32RI); 107149161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uint32_t target_method_idx = p->operands[2]; 107255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 107355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // The offset to patch is the last 4 bytes of the instruction. 107455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell int patch_offset = p->offset + p->flags.size - 4; 107555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell cu_->compiler_driver->AddClassPatch(cu_->dex_file, cu_->class_def_idx, 107649161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao cu_->method_idx, target_method_idx, patch_offset); 107755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell } 107855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 107955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // And now the PC-relative calls to methods. 108055d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell for (uint32_t i = 0; i < call_method_insns_.Size(); i++) { 108155d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell LIR* p = call_method_insns_.Get(i); 108255d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell DCHECK_EQ(p->opcode, kX86CallI); 108349161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao uint32_t target_method_idx = p->operands[1]; 108449161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao const DexFile* target_dex_file = 108549161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao reinterpret_cast<const DexFile*>(UnwrapPointer(p->operands[2])); 108655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 108755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // The offset to patch is the last 4 bytes of the instruction. 
108855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell int patch_offset = p->offset + p->flags.size - 4; 108955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell cu_->compiler_driver->AddRelativeCodePatch(cu_->dex_file, cu_->class_def_idx, 109049161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao cu_->method_idx, cu_->invoke_type, 109149161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao target_method_idx, target_dex_file, 109249161cef10a308aedada18e9aa742498d6e6c8c7Jeff Hao static_cast<InvokeType>(p->operands[3]), 109355d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell patch_offset, -4 /* offset */); 109455d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell } 109555d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 109655d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell // And do the normal processing. 109755d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell Mir2Lir::InstallLiteralPools(); 109855d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell} 109955d0eac918321e0525f6e6491f36a80977e0d416Mark Mendell 110070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolovbool X86Mir2Lir::GenInlinedArrayCopyCharArray(CallInfo* info) { 110170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (cu_->target64) { 110270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // TODO: Implement ArrayCOpy intrinsic for x86_64 110370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov return false; 110470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 110570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 110670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_src = info->args[0]; 110770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_srcPos = info->args[1]; 110870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_dst = info->args[2]; 110970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_dstPos = info->args[3]; 111070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov RegLocation rl_length = info->args[4]; 
111170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (rl_srcPos.is_const && (mir_graph_->ConstantValue(rl_srcPos) < 0)) { 111270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov return false; 111370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 111470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (rl_dstPos.is_const && (mir_graph_->ConstantValue(rl_dstPos) < 0)) { 111570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov return false; 111670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 111770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov ClobberCallerSave(); 111870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LockCallTemps(); // Using fixed registers 111970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_src , rs_rAX); 112070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dst , rs_rCX); 112170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* src_dst_same = OpCmpBranch(kCondEq, rs_rAX , rs_rCX, nullptr); 112270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* src_null_branch = OpCmpImmBranch(kCondEq, rs_rAX , 0, nullptr); 112370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* dst_null_branch = OpCmpImmBranch(kCondEq, rs_rCX , 0, nullptr); 112470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_length , rs_rDX); 112570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* len_negative = OpCmpImmBranch(kCondLt, rs_rDX , 0, nullptr); 112670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* len_too_big = OpCmpImmBranch(kCondGt, rs_rDX , 128, nullptr); 112770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_src , rs_rAX); 112870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadWordDisp(rs_rAX , mirror::Array::LengthOffset().Int32Value(), rs_rAX); 112970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* src_bad_len = nullptr; 113070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 
LIR* srcPos_negative = nullptr; 113170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (!rl_srcPos.is_const) { 113270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_srcPos , rs_rBX); 113370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov srcPos_negative = OpCmpImmBranch(kCondLt, rs_rBX , 0, nullptr); 113470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegReg(kOpAdd, rs_rBX, rs_rDX); 113570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rBX, nullptr); 113670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } else { 113770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov int pos_val = mir_graph_->ConstantValue(rl_srcPos.orig_sreg); 113870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (pos_val == 0) { 113970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rDX, nullptr); 114070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } else { 114170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegRegImm(kOpAdd, rs_rBX, rs_rDX, pos_val); 114270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rBX, nullptr); 114370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 114470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 114570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* dstPos_negative = nullptr; 114670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* dst_bad_len = nullptr; 114770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dst, rs_rAX); 114870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadWordDisp(rs_rAX, mirror::Array::LengthOffset().Int32Value(), rs_rAX); 114970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (!rl_dstPos.is_const) { 115070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dstPos , rs_rBX); 115170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 
dstPos_negative = OpCmpImmBranch(kCondLt, rs_rBX , 0, nullptr); 115270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegRegReg(kOpAdd, rs_rBX, rs_rBX, rs_rDX); 115370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rBX, nullptr); 115470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } else { 115570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov int pos_val = mir_graph_->ConstantValue(rl_dstPos.orig_sreg); 115670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (pos_val == 0) { 115770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rDX, nullptr); 115870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } else { 115970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegRegImm(kOpAdd, rs_rBX, rs_rDX, pos_val); 116070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_bad_len = OpCmpBranch(kCondLt, rs_rAX , rs_rBX, nullptr); 116170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 116270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov } 116370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // everything is checked now 116470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_src , rs_rAX); 116570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dst , rs_rBX); 116670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_srcPos , rs_rCX); 116770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov NewLIR5(kX86Lea32RA, rs_rAX.GetReg(), rs_rAX.GetReg(), 116870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov rs_rCX.GetReg() , 1, mirror::Array::DataOffset(2).Int32Value()); 116970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // RAX now holds the address of the first src element to be copied 117070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 117170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_dstPos , rs_rCX); 
117270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov NewLIR5(kX86Lea32RA, rs_rBX.GetReg(), rs_rBX.GetReg(), 117370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov rs_rCX.GetReg() , 1, mirror::Array::DataOffset(2).Int32Value() ); 117470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // RBX now holds the address of the first dst element to be copied 117570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 117670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // check if the number of elements to be copied is odd or even. If odd 117770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // then copy the first element (so that the remaining number of elements 117870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // is even). 117970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadValueDirectFixed(rl_length , rs_rCX); 118070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegImm(kOpAnd, rs_rCX, 1); 118170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* jmp_to_begin_loop = OpCmpImmBranch(kCondEq, rs_rCX, 0, nullptr); 118270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegImm(kOpSub, rs_rDX, 1); 118370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadBaseIndexedDisp(rs_rAX, rs_rDX, 1, 0, rs_rCX, kSignedHalf); 118470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov StoreBaseIndexedDisp(rs_rBX, rs_rDX, 1, 0, rs_rCX, kSignedHalf); 118570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 118670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // since the remaining number of elements is even, we will copy by 118770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov // two elements at a time. 
118870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR *beginLoop = NewLIR0(kPseudoTargetLabel); 118970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* jmp_to_ret = OpCmpImmBranch(kCondEq, rs_rDX , 0, nullptr); 119070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpRegImm(kOpSub, rs_rDX, 2); 119170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LoadBaseIndexedDisp(rs_rAX, rs_rDX, 1, 0, rs_rCX, kSingle); 119270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov StoreBaseIndexedDisp(rs_rBX, rs_rDX, 1, 0, rs_rCX, kSingle); 119370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov OpUnconditionalBranch(beginLoop); 119470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR *check_failed = NewLIR0(kPseudoTargetLabel); 119570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR* launchpad_branch = OpUnconditionalBranch(nullptr); 119670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov LIR *return_point = NewLIR0(kPseudoTargetLabel); 119770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov jmp_to_ret->target = return_point; 119870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov jmp_to_begin_loop->target = beginLoop; 119970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_dst_same->target = check_failed; 120070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov len_negative->target = check_failed; 120170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov len_too_big->target = check_failed; 120270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_null_branch->target = check_failed; 120370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (srcPos_negative != nullptr) 120470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov srcPos_negative ->target = check_failed; 120570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (src_bad_len != nullptr) 120670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov src_bad_len->target = check_failed; 120770c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_null_branch->target = 
check_failed; 120870c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (dstPos_negative != nullptr) 120970c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dstPos_negative->target = check_failed; 121070c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov if (dst_bad_len != nullptr) 121170c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov dst_bad_len->target = check_failed; 121270c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov AddIntrinsicSlowPath(info, launchpad_branch, return_point); 121370c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov return true; 121470c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov} 121570c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 121670c4f06f9965cdb9319a2c85f65acda20086d765DaniilSokolov 12174028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell/* 12184028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell * Fast string.index_of(I) & (II). Inline check for simple case of char <= 0xffff, 12194028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell * otherwise bails to standard library code. 12204028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell */ 12214028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendellbool X86Mir2Lir::GenInlinedIndexOf(CallInfo* info, bool zero_based) { 12224028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell RegLocation rl_obj = info->args[0]; 12234028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell RegLocation rl_char = info->args[1]; 1224a44d4f508fa1642294e79d3ebecd790afe75ea60buzbee RegLocation rl_start; // Note: only present in III flavor or IndexOf. 1225c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // RBX is callee-save register in 64-bit mode. 1226c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk RegStorage rs_tmp = cu_->target64 ? 
rs_r11 : rs_rBX; 1227c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk int start_value = -1; 12284028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12294028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell uint32_t char_value = 12304028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell rl_char.is_const ? mir_graph_->ConstantValue(rl_char.orig_sreg) : 0; 12314028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12324028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (char_value > 0xFFFF) { 12334028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // We have to punt to the real String.indexOf. 12344028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell return false; 12354028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 12364028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12374028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Okay, we are commited to inlining this. 1238c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EAX: 16 bit character being searched. 1239c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // ECX: count: number of words to be searched. 1240c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EDI: String being searched. 1241c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EDX: temporary during execution. 1242c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EBX or R11: temporary during execution (depending on mode). 1243c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // REP SCASW: search instruction. 
1244c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1245c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_rAX); 1246c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_rAX); 1247c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_rAX); 1248c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_rCX); 1249c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_rCX); 1250c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_rCX); 1251c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_rDX); 1252c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_rDX); 1253c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_rDX); 1254c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_tmp); 1255c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_tmp); 1256c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_tmp); 1257c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (cu_->target64) { 1258c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FlushReg(rs_rDI); 1259c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Clobber(rs_rDI); 1260c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LockTemp(rs_rDI); 1261c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk } 1262c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1263a0cd2d701f29e0bc6275f1b13c0edfd4ec391879buzbee RegLocation rl_return = GetReturn(kCoreReg); 12644028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell RegLocation rl_dest = InlineTarget(info); 12654028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12664028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Is the string non-NULL? 
12672700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LoadValueDirectFixed(rl_obj, rs_rDX); 12682700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee GenNullCheck(rs_rDX, info->opt_flags); 12693bc8615332b7848dec8c2297a40f7e4d176c0efbVladimir Marko info->opt_flags |= MIR_IGNORE_NULL_CHECK; // Record that we've null checked. 12704028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 1271c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LIR *slowpath_branch = nullptr, *length_compare = nullptr; 1272c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1273c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // We need the value in EAX. 12744028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (rl_char.is_const) { 12752700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LoadConstantNoClobber(rs_rAX, char_value); 12764028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } else { 1277c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Does the character fit in 16 bits? Compare it at runtime. 12782700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LoadValueDirectFixed(rl_char, rs_rAX); 12793a74d15ccc9a902874473ac9632e568b19b91b1cMingyao Yang slowpath_branch = OpCmpImmBranch(kCondGt, rs_rAX, 0xFFFF, nullptr); 12804028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 12814028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 12824028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // From here down, we know that we are looking for a char that fits in 16 bits. 1283e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // Location of reference to data array within the String object. 1284e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell int value_offset = mirror::String::ValueOffset().Int32Value(); 1285e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // Location of count within the String object. 
1286e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell int count_offset = mirror::String::CountOffset().Int32Value(); 1287e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // Starting offset within data array. 1288e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell int offset_offset = mirror::String::OffsetOffset().Int32Value(); 1289e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // Start of char data with array_. 1290e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell int data_offset = mirror::Array::DataOffset(sizeof(uint16_t)).Int32Value(); 12914028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 129269dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison // Compute the number of words to search in to rCX. 129369dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison Load32Disp(rs_rDX, count_offset, rs_rCX); 129469dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison 1295c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (!cu_->target64) { 1296c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Possible signal here due to null pointer dereference. 1297c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Note that the signal handler will expect the top word of 1298c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // the stack to be the ArtMethod*. If the PUSH edi instruction 1299c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // below is ahead of the load above then this will not be true 1300c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // and the signal handler will not work. 1301c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk MarkPossibleNullPointerException(0); 1302c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1303c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // EDI is callee-save register in 32-bit mode. 
1304c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk NewLIR1(kX86Push32R, rs_rDI.GetReg()); 1305c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk } 13064028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13074028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (zero_based) { 1308c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Start index is not present. 13094028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // We have to handle an empty string. Use special instruction JECXZ. 13104028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell length_compare = NewLIR0(kX86Jecxz8); 1311c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1312c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Copy the number of words to search in a temporary register. 1313c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // We will use the register at the end to calculate result. 1314c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpMov, rs_tmp, rs_rCX); 13154028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } else { 1316c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Start index is present. 1317a44d4f508fa1642294e79d3ebecd790afe75ea60buzbee rl_start = info->args[2]; 1318c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 13194028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // We have to offset by the start index. 13204028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (rl_start.is_const) { 13214028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell start_value = mir_graph_->ConstantValue(rl_start.orig_sreg); 13224028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell start_value = std::max(start_value, 0); 13234028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13244028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Is the start > count? 
13252700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee length_compare = OpCmpImmBranch(kCondLe, rs_rCX, start_value, nullptr); 1326c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegImm(kOpMov, rs_rDI, start_value); 1327c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1328c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Copy the number of words to search in a temporary register. 1329c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // We will use the register at the end to calculate result. 1330c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpMov, rs_tmp, rs_rCX); 13314028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13324028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell if (start_value != 0) { 1333c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Decrease the number of words to search by the start index. 13342700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee OpRegImm(kOpSub, rs_rCX, start_value); 13354028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 13364028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } else { 1337c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Handle "start index < 0" case. 1338c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (!cu_->target64 && rl_start.location != kLocPhysReg) { 1339a1758d83e298c9ee31848bcae07c2a35f6efd618Alexei Zavjalov // Load the start index from stack, remembering that we pushed EDI. 
1340c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk int displacement = SRegOffset(rl_start.s_reg_low) + sizeof(uint32_t); 13418dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko { 13428dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 1343c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Load32Disp(rs_rX86_SP, displacement, rs_rDI); 13448dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } 1345c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk } else { 1346c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk LoadValueDirectFixed(rl_start, rs_rDI); 13474028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 1348c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpXor, rs_tmp, rs_tmp); 1349c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpCmp, rs_rDI, rs_tmp); 1350c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpCondRegReg(kOpCmov, kCondLt, rs_rDI, rs_tmp); 1351c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1352c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // The length of the string should be greater than the start index. 1353c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk length_compare = OpCmpBranch(kCondLe, rs_rCX, rs_rDI, nullptr); 1354c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1355c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Copy the number of words to search in a temporary register. 1356c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // We will use the register at the end to calculate result. 1357c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpMov, rs_tmp, rs_rCX); 1358c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1359c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Decrease the number of words to search by the start index. 
1360c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpSub, rs_rCX, rs_rDI); 13614028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 13624028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 13634028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 1364c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // Load the address of the string into EDI. 1365c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk // In case of start index we have to add the address to existing value in EDI. 1366e19c91fdb88ff6fd4e88bc5984772dcfb1e86f80Mark Mendell // The string starts at VALUE(String) + 2 * OFFSET(String) + DATA_OFFSET. 1367c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (zero_based || (!zero_based && rl_start.is_const && start_value == 0)) { 1368c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk Load32Disp(rs_rDX, offset_offset, rs_rDI); 13694028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } else { 1370c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegMem(kOpAdd, rs_rDI, rs_rDX, offset_offset); 13714028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 1372c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegImm(kOpLsl, rs_rDI, 1); 1373c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegMem(kOpAdd, rs_rDI, rs_rDX, value_offset); 1374c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegImm(kOpAdd, rs_rDI, data_offset); 13754028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13764028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // EDI now contains the start of the string to be searched. 13774028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // We are all prepared to do the search for the character. 13784028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell NewLIR0(kX86RepneScasw); 13794028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13804028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Did we find a match? 
13814028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell LIR* failed_branch = OpCondBranch(kCondNe, nullptr); 13824028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13834028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // yes, we matched. Compute the index of the result. 1384c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk OpRegReg(kOpSub, rs_tmp, rs_rCX); 1385c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk NewLIR3(kX86Lea32RM, rl_return.reg.GetReg(), rs_tmp.GetReg(), -1); 1386c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 13874028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell LIR *all_done = NewLIR1(kX86Jmp8, 0); 13884028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13894028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Failed to match; return -1. 13904028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell LIR *not_found = NewLIR0(kPseudoTargetLabel); 13914028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell length_compare->target = not_found; 13924028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell failed_branch->target = not_found; 13932700f7e1edbcd2518f4978e4cd0e05a4149f91b6buzbee LoadConstantNoClobber(rl_return.reg, -1); 13944028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 13954028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // And join up at the end. 13964028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell all_done->target = NewLIR0(kPseudoTargetLabel); 1397c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1398c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (!cu_->target64) 1399c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk NewLIR1(kX86Pop32R, rs_rDI.GetReg()); 14004028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 14014028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell // Out of line code returns here. 
14023a74d15ccc9a902874473ac9632e568b19b91b1cMingyao Yang if (slowpath_branch != nullptr) { 14034028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell LIR *return_point = NewLIR0(kPseudoTargetLabel); 14043a74d15ccc9a902874473ac9632e568b19b91b1cMingyao Yang AddIntrinsicSlowPath(info, slowpath_branch, return_point); 14054028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell } 14064028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 14074028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell StoreValue(rl_dest, rl_return); 1408c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 1409c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_rAX); 1410c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_rCX); 1411c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_rDX); 1412c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_tmp); 1413c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk if (cu_->target64) { 1414c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk FreeTemp(rs_rDI); 1415c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk } 1416c3561ae381960cbd52a83b7591504f158ec06920nikolay serdjuk 14174028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell return true; 14184028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell} 14194028a6c83a339036864999fdfd2855b012a9f1a7Mark Mendell 1420ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell/* 1421ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell * @brief Enter an 'advance LOC' into the FDE buffer 1422ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell * @param buf FDE buffer. 1423ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell * @param increment Amount by which to increase the current location. 
1424ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell */ 1425ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendellstatic void AdvanceLoc(std::vector<uint8_t>&buf, uint32_t increment) { 1426ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell if (increment < 64) { 1427ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Encoding in opcode. 1428ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(0x1 << 6 | increment); 1429ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } else if (increment < 256) { 1430ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Single byte delta. 1431ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(0x02); 1432ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(increment); 1433ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } else if (increment < 256 * 256) { 1434ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Two byte delta. 1435ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(0x03); 1436ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(increment & 0xff); 1437ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back((increment >> 8) & 0xff); 1438ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } else { 1439ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Four byte delta. 
1440ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(0x04); 1441ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(buf, increment); 1442ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1443ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1444ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1445ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1446ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendellstd::vector<uint8_t>* X86CFIInitialization() { 1447ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell return X86Mir2Lir::ReturnCommonCallFrameInformation(); 1448ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1449ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1450ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendellstd::vector<uint8_t>* X86Mir2Lir::ReturnCommonCallFrameInformation() { 1451ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell std::vector<uint8_t>*cfi_info = new std::vector<uint8_t>; 1452ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1453ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Length of the CIE (except for this field). 1454ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, 16); 1455ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1456ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // CIE id. 1457ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, 0xFFFFFFFFU); 1458ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1459ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Version: 3. 1460ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x03); 1461ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1462ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Augmentation: empty string. 1463ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0); 1464ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1465ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Code alignment: 1. 
1466ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x01); 1467ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1468ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Data alignment: -4. 1469ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x7C); 1470ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1471ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Return address register (R8). 1472ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x08); 1473ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1474ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Initial return PC is 4(ESP): DW_CFA_def_cfa R4 4. 1475ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0C); 1476ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x04); 1477ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x04); 1478ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1479ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Return address location: 0(SP): DW_CFA_offset R8 1 (* -4);. 1480ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x2 << 6 | 0x08); 1481ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x01); 1482ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1483ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // And 2 Noops to align to 4 byte boundary. 
1484ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0); 1485ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0); 1486ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1487ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell DCHECK_EQ(cfi_info->size() & 3, 0U); 1488ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell return cfi_info; 1489ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1490ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1491ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendellstatic void EncodeUnsignedLeb128(std::vector<uint8_t>& buf, uint32_t value) { 1492ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell uint8_t buffer[12]; 1493ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell uint8_t *ptr = EncodeUnsignedLeb128(buffer, value); 1494ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell for (uint8_t *p = buffer; p < ptr; p++) { 1495ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell buf.push_back(*p); 1496ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1497ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1498ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1499ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendellstd::vector<uint8_t>* X86Mir2Lir::ReturnCallFrameInformation() { 1500ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell std::vector<uint8_t>*cfi_info = new std::vector<uint8_t>; 1501ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1502ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Generate the FDE for the method. 1503ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell DCHECK_NE(data_offset_, 0U); 1504ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1505ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Length (will be filled in later in this routine). 
1506ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, 0); 1507ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1508ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // CIE_pointer (can be filled in by linker); might be left at 0 if there is only 1509ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // one CIE for the whole debug_frame section. 1510ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, 0); 1511ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1512ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // 'initial_location' (filled in by linker). 1513ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, 0); 1514ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1515ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // 'address_range' (number of bytes in the method). 1516ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell PushWord(*cfi_info, data_offset_); 1517ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1518ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // The instructions in the FDE. 1519ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell if (stack_decrement_ != nullptr) { 1520ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Advance LOC to just past the stack decrement. 1521ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell uint32_t pc = NEXT_LIR(stack_decrement_)->offset; 1522ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell AdvanceLoc(*cfi_info, pc); 1523ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1524ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Now update the offset to the call frame: DW_CFA_def_cfa_offset frame_size. 
1525ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0e); 1526ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell EncodeUnsignedLeb128(*cfi_info, frame_size_); 1527ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1528ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // We continue with that stack until the epilogue. 1529ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell if (stack_increment_ != nullptr) { 1530ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell uint32_t new_pc = NEXT_LIR(stack_increment_)->offset; 1531ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell AdvanceLoc(*cfi_info, new_pc - pc); 1532ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1533ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // We probably have code snippets after the epilogue, so save the 1534ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // current state: DW_CFA_remember_state. 1535ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0a); 1536ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1537ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // We have now popped the stack: DW_CFA_def_cfa_offset 4. There is only the return 1538ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // PC on the stack now. 1539ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0e); 1540ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell EncodeUnsignedLeb128(*cfi_info, 4); 1541ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1542ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Everything after that is the same as before the epilogue. 1543ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Stack bump was followed by RET instruction. 
1544ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell LIR *post_ret_insn = NEXT_LIR(NEXT_LIR(stack_increment_)); 1545ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell if (post_ret_insn != nullptr) { 1546ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell pc = new_pc; 1547ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell new_pc = post_ret_insn->offset; 1548ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell AdvanceLoc(*cfi_info, new_pc - pc); 1549ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Restore the state: DW_CFA_restore_state. 1550ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0x0b); 1551ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1552ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1553ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1554ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1555ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Padding to a multiple of 4 1556ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell while ((cfi_info->size() & 3) != 0) { 1557ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // DW_CFA_nop is encoded as 0. 1558ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell cfi_info->push_back(0); 1559ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell } 1560ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1561ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell // Set the length of the FDE inside the generated bytes. 
1562ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell uint32_t length = cfi_info->size() - 4; 1563ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell (*cfi_info)[0] = length; 1564ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell (*cfi_info)[1] = length >> 8; 1565ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell (*cfi_info)[2] = length >> 16; 1566ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell (*cfi_info)[3] = length >> 24; 1567ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell return cfi_info; 1568ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell} 1569ae9fd93c39a341e2dffe15c61cc7d9e841fa92c4Mark Mendell 1570d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendellvoid X86Mir2Lir::GenMachineSpecificExtendedMethodMIR(BasicBlock* bb, MIR* mir) { 1571d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell switch (static_cast<ExtendedMIROpcode>(mir->dalvikInsn.opcode)) { 157260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpReserveVectorRegisters: 157360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji ReserveVectorRegisters(mir); 157460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 157560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpReturnVectorRegisters: 157660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji ReturnVectorRegisters(); 157760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 1578d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell case kMirOpConstVector: 1579d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell GenConst128(bb, mir); 1580d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell break; 1581fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpMoveVector: 1582fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenMoveVector(bb, mir); 1583fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1584fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedMultiply: 1585fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenMultiplyVector(bb, mir); 
1586fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1587fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedAddition: 1588fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenAddVector(bb, mir); 1589fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1590fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedSubtract: 1591fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenSubtractVector(bb, mir); 1592fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1593fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedShiftLeft: 1594fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenShiftLeftVector(bb, mir); 1595fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1596fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedSignedShiftRight: 1597fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenSignedShiftRightVector(bb, mir); 1598fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1599fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedUnsignedShiftRight: 1600fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenUnsignedShiftRightVector(bb, mir); 1601fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1602fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedAnd: 1603fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenAndVector(bb, mir); 1604fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1605fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedOr: 1606fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenOrVector(bb, mir); 1607fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1608fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedXor: 1609fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenXorVector(bb, mir); 1610fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1611fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case 
kMirOpPackedAddReduce: 1612fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenAddReduceVector(bb, mir); 1613fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1614fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedReduce: 1615fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenReduceVector(bb, mir); 1616fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1617fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kMirOpPackedSet: 1618fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell GenSetVector(bb, mir); 1619fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1620d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell default: 1621d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell break; 1622d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1623d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 1624d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 162560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::ReserveVectorRegisters(MIR* mir) { 162660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // We should not try to reserve twice without returning the registers 162760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_NE(num_reserved_vector_regs_, -1); 162860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 162960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int num_vector_reg = mir->dalvikInsn.vA; 163060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (int i = 0; i < num_vector_reg; i++) { 163160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage xp_reg = RegStorage::Solo128(i); 163260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegisterInfo *xp_reg_info = GetRegInfo(xp_reg); 163360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji Clobber(xp_reg); 163460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 163560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (RegisterInfo *info = xp_reg_info->GetAliasChain(); 
163660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji info != nullptr; 163760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji info = info->GetAliasChain()) { 163860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (info->GetReg().IsSingle()) { 163960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_pool_->sp_regs_.Delete(info); 164060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 164160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_pool_->dp_regs_.Delete(info); 164260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 164360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 164460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 164560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 164660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji num_reserved_vector_regs_ = num_vector_reg; 164760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 164860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 164960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::ReturnVectorRegisters() { 165060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Return all the reserved registers 165160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (int i = 0; i < num_reserved_vector_regs_; i++) { 165260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage xp_reg = RegStorage::Solo128(i); 165360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegisterInfo *xp_reg_info = GetRegInfo(xp_reg); 165460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 165560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (RegisterInfo *info = xp_reg_info->GetAliasChain(); 165660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji info != nullptr; 165760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji info = info->GetAliasChain()) { 165860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (info->GetReg().IsSingle()) { 165960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 
reg_pool_->sp_regs_.Insert(info); 166060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 166160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_pool_->dp_regs_.Insert(info); 166260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 166360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 166460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 166560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 166660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // We don't have anymore reserved vector registers 166760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji num_reserved_vector_regs_ = -1; 166860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 166960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 1670d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendellvoid X86Mir2Lir::GenConst128(BasicBlock* bb, MIR* mir) { 167160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji store_method_addr_used_ = true; 167260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int type_size = mir->dalvikInsn.vB; 1673d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // We support 128 bit vectors. 1674d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell DCHECK_EQ(type_size & 0xFFFF, 128); 167560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest = RegStorage::Solo128(mir->dalvikInsn.vA); 1676d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell uint32_t *args = mir->dalvikInsn.arg; 1677fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int reg = rs_dest.GetReg(); 1678d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Check for all 0 case. 
1679d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (args[0] == 0 && args[1] == 0 && args[2] == 0 && args[3] == 0) { 1680d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell NewLIR2(kX86XorpsRR, reg, reg); 1681d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell return; 1682d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 168360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 168460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Append the mov const vector to reg opcode. 168560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AppendOpcodeWithConst(kX86MovupsRM, reg, mir); 168660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 168760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 168860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::AppendOpcodeWithConst(X86OpCode opcode, int reg, MIR* mir) { 1689d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Okay, load it from the constant vector area. 1690d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell LIR *data_target = ScanVectorLiteral(mir); 1691d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (data_target == nullptr) { 1692d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell data_target = AddVectorLiteral(mir); 1693d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 1694d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1695d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Address the start of the method. 
1696d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell RegLocation rl_method = mir_graph_->GetRegLocation(base_of_code_->s_reg_low); 1697e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu if (rl_method.wide) { 1698e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu rl_method = LoadValueWide(rl_method, kCoreReg); 1699e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu } else { 1700e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu rl_method = LoadValue(rl_method, kCoreReg); 1701e0ccdc0dd166136cd43e5f54201179a4496d33e8Chao-ying Fu } 1702d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1703d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // Load the proper value from the literal area. 1704d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // We don't know the proper offset for the value, so pick one that will force 1705d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // 4 byte offset. We will fix this up in the assembler later to have the right 1706d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell // value. 17078dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kLiteral); 170860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji LIR *load = NewLIR2(opcode, reg, rl_method.reg.GetReg()); 1709d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell load->flags.fixup = kFixupLoad; 1710d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell load->target = data_target; 1711d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 1712d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 1713fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenMoveVector(BasicBlock *bb, MIR *mir) { 1714fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // We only support 128 bit registers. 
171560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 171660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest = RegStorage::Solo128(mir->dalvikInsn.vA); 171760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src = RegStorage::Solo128(mir->dalvikInsn.vB); 1718fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(kX86Mova128RR, rs_dest.GetReg(), rs_src.GetReg()); 1719fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1720fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 172160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::GenMultiplyVectorSignedByte(BasicBlock *bb, MIR *mir) { 172260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const int BYTE_SIZE = 8; 172360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 172460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 172560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src1_high_tmp = Get128BitRegister(AllocTempWide()); 172660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 172760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji /* 172860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * Emulate the behavior of a kSignedByte by separating out the 16 values in the two XMM 172960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * and multiplying 8 at a time before recombining back into one XMM register. 
173060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * 173160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * let xmm1, xmm2 be real srcs (keep low bits of 16bit lanes) 173260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm3 is tmp (operate on high bits of 16bit lanes) 173360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * 173460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm3 = xmm1 173560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 .* xmm2 173660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 & 0x00ff00ff00ff00ff00ff00ff00ff00ff // xmm1 now has low bits 173760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm3 = xmm3 .>> 8 173860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm2 & 0xff00ff00ff00ff00ff00ff00ff00ff00 173960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm2 .* xmm3 // xmm2 now has high bits 174060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 | xmm2 // combine results 174160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji */ 174260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 174360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Copy xmm1. 174460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Mova128RR, rs_src1_high_tmp.GetReg(), rs_dest_src1.GetReg()); 174560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 174660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Multiply low bits. 174760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PmullwRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 174860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 174960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // xmm1 now has low bits. 
175060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AndMaskVectorRegister(rs_dest_src1, 0x00FF00FF, 0x00FF00FF, 0x00FF00FF, 0x00FF00FF); 175160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 175260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Prepare high bits for multiplication. 175360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PsrlwRI, rs_src1_high_tmp.GetReg(), BYTE_SIZE); 175460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AndMaskVectorRegister(rs_src2, 0xFF00FF00, 0xFF00FF00, 0xFF00FF00, 0xFF00FF00); 175560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 175660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Multiply high bits and xmm2 now has high bits. 175760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PmullwRR, rs_src2.GetReg(), rs_src1_high_tmp.GetReg()); 175860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 175960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Combine back into dest XMM register. 
176060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PorRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 176160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 176260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 1763fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenMultiplyVector(BasicBlock *bb, MIR *mir) { 176460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 176560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 176660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 176760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 1768fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1769fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 1770fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1771fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PmulldRR; 1772fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1773fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1774fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PmullwRR; 1775fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1776fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSingle: 1777fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86MulpsRR; 1778fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1779fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kDouble: 1780fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86MulpdRR; 1781fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 178260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 178360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // HW doesn't support 
16x16 byte multiplication so emulate it. 178460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji GenMultiplyVectorSignedByte(bb, mir); 178560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 1786fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1787fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector multiply " << opsize; 1788fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1789fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1790fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), rs_src2.GetReg()); 1791fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1792fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1793fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenAddVector(BasicBlock *bb, MIR *mir) { 179460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 179560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 179660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 179760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 1798fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1799fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 1800fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1801fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PadddRR; 1802fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1803fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1804fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 1805fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PaddwRR; 1806fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 
1807fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedByte: 1808fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedByte: 1809fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PaddbRR; 1810fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1811fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSingle: 1812fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86AddpsRR; 1813fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1814fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kDouble: 1815fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86AddpdRR; 1816fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1817fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1818fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector addition " << opsize; 1819fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1820fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1821fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), rs_src2.GetReg()); 1822fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1823fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1824fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenSubtractVector(BasicBlock *bb, MIR *mir) { 182560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 182660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 182760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 182860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 1829fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1830fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 
1831fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1832fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsubdRR; 1833fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1834fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1835fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 1836fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsubwRR; 1837fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1838fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedByte: 1839fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedByte: 1840fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsubbRR; 1841fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1842fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSingle: 1843fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86SubpsRR; 1844fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1845fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kDouble: 1846fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86SubpdRR; 1847fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1848fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1849fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector subtraction " << opsize; 1850fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1851fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1852fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), rs_src2.GetReg()); 1853fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1854fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 185560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::GenShiftByteVector(BasicBlock *bb, MIR *mir) { 185660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = 
RegStorage::Solo128(mir->dalvikInsn.vA); 185760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_tmp = Get128BitRegister(AllocTempWide()); 185860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 185960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int opcode = 0; 186060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int imm = mir->dalvikInsn.vB; 186160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 186260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji switch (static_cast<ExtendedMIROpcode>(mir->dalvikInsn.opcode)) { 186360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpPackedShiftLeft: 186460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji opcode = kX86PsllwRI; 186560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 186660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpPackedSignedShiftRight: 186760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji opcode = kX86PsrawRI; 186860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 186960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kMirOpPackedUnsignedShiftRight: 187060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji opcode = kX86PsrlwRI; 187160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 187260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji default: 187360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji LOG(FATAL) << "Unsupported shift operation on byte vector " << opcode; 187460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 187560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 187660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 187760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji /* 187860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 will have low bits 187960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 will have high bits 188060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * 
188160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm1 188260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 .<< N 188360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm2 && 0xFF00FF00FF00FF00FF00FF00FF00FF00 188460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm2 = xmm2 .<< N 188560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji * xmm1 = xmm1 | xmm2 188660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji */ 188760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 188860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Copy xmm1. 188960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Mova128RR, rs_tmp.GetReg(), rs_dest_src1.GetReg()); 189060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 189160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Shift lower values. 189260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(opcode, rs_dest_src1.GetReg(), imm); 189360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 189460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Mask bottom bits. 189560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AndMaskVectorRegister(rs_tmp, 0xFF00FF00, 0xFF00FF00, 0xFF00FF00, 0xFF00FF00); 189660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 189760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Shift higher values. 189860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(opcode, rs_tmp.GetReg(), imm); 189960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 190060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Combine back into dest XMM register. 
190160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PorRR, rs_dest_src1.GetReg(), rs_tmp.GetReg()); 190260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 190360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 1904fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenShiftLeftVector(BasicBlock *bb, MIR *mir) { 190560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 190660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 190760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 190860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int imm = mir->dalvikInsn.vB; 1909fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1910fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 1911fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1912fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PslldRI; 1913fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1914fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k64: 1915fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsllqRI; 1916fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1917fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1918fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 1919fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsllwRI; 1920fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 192160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 192260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 192360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji GenShiftByteVector(bb, mir); 192460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 
1925fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1926fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector shift left " << opsize; 1927fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1928fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1929fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), imm); 1930fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1931fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1932fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenSignedShiftRightVector(BasicBlock *bb, MIR *mir) { 193360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 193460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 193560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 193660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int imm = mir->dalvikInsn.vB; 1937fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1938fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 1939fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1940fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsradRI; 1941fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1942fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1943fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 1944fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsrawRI; 1945fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 194660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 194760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 194860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji GenShiftByteVector(bb, mir); 
194960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 1950fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1951fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector signed shift right " << opsize; 1952fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1953fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1954fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), imm); 1955fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1956fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1957fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenUnsignedShiftRightVector(BasicBlock *bb, MIR *mir) { 195860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 195960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 196060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 196160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int imm = mir->dalvikInsn.vB; 1962fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 1963fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 1964fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 1965fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsrldRI; 1966fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1967fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k64: 1968fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsrlqRI; 1969fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1970fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 1971fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 1972fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PsrlwRI; 
1973fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 197460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 197560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 197660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji GenShiftByteVector(bb, mir); 197760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 1978fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 1979fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector unsigned shift right " << opsize; 1980fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 1981fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 1982fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(opcode, rs_dest_src1.GetReg(), imm); 1983fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1984fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1985fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenAndVector(BasicBlock *bb, MIR *mir) { 1986fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // We only support 128 bit registers. 198760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 198860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 198960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 1990fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(kX86PandRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 1991fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 1992fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 1993fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenOrVector(BasicBlock *bb, MIR *mir) { 1994fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // We only support 128 bit registers. 
199560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 199660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 199760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 1998fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(kX86PorRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 1999fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2000fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2001fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenXorVector(BasicBlock *bb, MIR *mir) { 2002fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // We only support 128 bit registers. 200360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 200460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest_src1 = RegStorage::Solo128(mir->dalvikInsn.vA); 200560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src2 = RegStorage::Solo128(mir->dalvikInsn.vB); 2006fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell NewLIR2(kX86PxorRR, rs_dest_src1.GetReg(), rs_src2.GetReg()); 2007fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2008fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 200960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::AndMaskVectorRegister(RegStorage rs_src1, uint32_t m1, uint32_t m2, uint32_t m3, uint32_t m4) { 201060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji MaskVectorRegister(kX86PandRM, rs_src1, m1, m2, m3, m4); 201160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 201260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 201360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerjivoid X86Mir2Lir::MaskVectorRegister(X86OpCode opcode, RegStorage rs_src1, uint32_t m0, uint32_t m1, uint32_t m2, uint32_t m3) { 
201460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Create temporary MIR as container for 128-bit binary mask. 201560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji MIR const_mir; 201660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji MIR* const_mirp = &const_mir; 201760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.opcode = static_cast<Instruction::Code>(kMirOpConstVector); 201860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.arg[0] = m0; 201960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.arg[1] = m1; 202060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.arg[2] = m2; 202160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji const_mirp->dalvikInsn.arg[3] = m3; 202260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 202360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Mask vector with const from literal pool. 202460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AppendOpcodeWithConst(opcode, rs_src1.GetReg(), const_mirp); 202560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji} 202660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 2027fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenAddReduceVector(BasicBlock *bb, MIR *mir) { 202860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 202960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src1 = RegStorage::Solo128(mir->dalvikInsn.vB); 203060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegLocation rl_dest = mir_graph_->GetDest(mir); 203160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_tmp; 203260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 203360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int vec_bytes = (mir->dalvikInsn.vC & 0xFFFF) / 8; 203460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int 
vec_unit_size = 0; 2035fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell int opcode = 0; 203660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int extr_opcode = 0; 203760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegLocation rl_result; 203860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 2039fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2040fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 204160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = kX86PextrdRRI; 2042fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PhadddRR; 204360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji vec_unit_size = 4; 204460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 204560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 204660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 204760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = kX86PextrbRRI; 204860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji opcode = kX86PhaddwRR; 204960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji vec_unit_size = 2; 2050fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2051fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2052fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 205360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = kX86PextrwRRI; 2054fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell opcode = kX86PhaddwRR; 205560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji vec_unit_size = 2; 2056fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 205760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSingle: 205860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result = EvalLoc(rl_dest, kFPReg, true); 205960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji vec_unit_size = 4; 
206060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji for (int i = 0; i < 3; i++) { 206160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86AddssRR, rl_result.reg.GetReg(), rs_src1.GetReg()); 206260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(kX86ShufpsRRI, rs_src1.GetReg(), rs_src1.GetReg(), 0x39); 206360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 206460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86AddssRR, rl_result.reg.GetReg(), rs_src1.GetReg()); 206560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji StoreValue(rl_dest, rl_result); 206660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 206760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // For single-precision floats, we are done here 206860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 2069fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 2070fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector add reduce " << opsize; 2071fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2072fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 207360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 207460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int elems = vec_bytes / vec_unit_size; 207560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 207660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Emulate horizontal add instruction by reducing 2 vectors with 8 values before adding them again 207760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // TODO is overflow handled correctly? 207860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (opsize == kSignedByte || opsize == kUnsignedByte) { 207960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rs_tmp = Get128BitRegister(AllocTempWide()); 208060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 208160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // tmp = xmm1 .>> 8. 
208260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Mova128RR, rs_tmp.GetReg(), rs_src1.GetReg()); 208360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PsrlwRI, rs_tmp.GetReg(), 8); 208460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 208560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Zero extend low bits in xmm1. 208660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AndMaskVectorRegister(rs_src1, 0x00FF00FF, 0x00FF00FF, 0x00FF00FF, 0x00FF00FF); 208760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 208860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 208960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji while (elems > 1) { 209060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (opsize == kSignedByte || opsize == kUnsignedByte) { 209160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(opcode, rs_tmp.GetReg(), rs_tmp.GetReg()); 209260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 209360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(opcode, rs_src1.GetReg(), rs_src1.GetReg()); 209460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji elems >>= 1; 209560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 209660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 209760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Combine the results if we separated them. 209860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (opsize == kSignedByte || opsize == kUnsignedByte) { 209960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86PaddbRR, rs_src1.GetReg(), rs_tmp.GetReg()); 210060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 210160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 210260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // We need to extract to a GPR. 
210360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage temp = AllocTemp(); 210460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(extr_opcode, temp.GetReg(), rs_src1.GetReg(), 0); 210560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 210660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Can we do this directly into memory? 210760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result = UpdateLocTyped(rl_dest, kCoreReg); 210860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (rl_result.location == kLocPhysReg) { 210960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Ensure res is in a core reg 211060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result = EvalLoc(rl_dest, kCoreReg, true); 211160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpRegReg(kOpAdd, rl_result.reg, temp); 211260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji StoreFinalValue(rl_dest, rl_result); 211360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 211460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpMemReg(kOpAdd, rl_result, temp.GetReg()); 211560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 211660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 211760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji FreeTemp(temp); 2118fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2119fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2120fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenReduceVector(BasicBlock *bb, MIR *mir) { 212160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 212260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegLocation rl_dest = mir_graph_->GetDest(mir); 212360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_src1 = RegStorage::Solo128(mir->dalvikInsn.vB); 212460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int extract_index = 
mir->dalvikInsn.arg[0]; 212560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int extr_opcode = 0; 212660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegLocation rl_result; 212760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji bool is_wide = false; 212860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 2129fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2130fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 213160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result = UpdateLocTyped(rl_dest, kCoreReg); 213260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = (rl_result.location == kLocPhysReg) ? kX86PextrdMRI : kX86PextrdRRI; 2133fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2134fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2135fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 213660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_result= UpdateLocTyped(rl_dest, kCoreReg); 213760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji extr_opcode = (rl_result.location == kLocPhysReg) ? 
kX86PextrwMRI : kX86PextrwRRI; 2138fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2139fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 214060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji LOG(FATAL) << "Unsupported vector add reduce " << opsize; 214160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji return; 2142fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2143fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2144fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 214560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (rl_result.location == kLocPhysReg) { 214660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(extr_opcode, rl_result.reg.GetReg(), rs_src1.GetReg(), extract_index); 214760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (is_wide == true) { 214860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji StoreFinalValue(rl_dest, rl_result); 214960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 215060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji StoreFinalValueWide(rl_dest, rl_result); 215160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 215260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 215360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int displacement = SRegOffset(rl_result.s_reg_low); 215460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji LIR *l = NewLIR3(extr_opcode, rs_rX86_SP.GetReg(), displacement, rs_src1.GetReg()); 215560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AnnotateDalvikRegAccess(l, displacement >> 2, true /* is_load */, is_wide /* is_64bit */); 215660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji AnnotateDalvikRegAccess(l, displacement >> 2, false /* is_load */, is_wide /* is_64bit */); 215760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 2158fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2159fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 
2160fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendellvoid X86Mir2Lir::GenSetVector(BasicBlock *bb, MIR *mir) { 216160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji DCHECK_EQ(mir->dalvikInsn.vC & 0xFFFF, 128U); 216260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji OpSize opsize = static_cast<OpSize>(mir->dalvikInsn.vC >> 16); 216360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage rs_dest = RegStorage::Solo128(mir->dalvikInsn.vA); 216460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji int op_low = 0, op_high = 0, imm = 0, op_mov = kX86MovdxrRR; 216560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegisterClass reg_type = kCoreReg; 216660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 2167fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell switch (opsize) { 2168fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case k32: 2169fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell op_low = kX86PshufdRRI; 2170fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 217160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSingle: 217260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_low = kX86PshufdRRI; 217360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_mov = kX86Mova128RR; 217460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji reg_type = kFPReg; 217560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 217660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case k64: 217760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_low = kX86PshufdRRI; 217860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji imm = 0x44; 217960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 218060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kDouble: 218160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_low = kX86PshufdRRI; 218260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji op_mov = kX86Mova128RR; 218360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 
reg_type = kFPReg; 218460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji imm = 0x44; 218560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji break; 218660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kSignedByte: 218760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji case kUnsignedByte: 218860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Shuffle 8 bit value into 16 bit word. 218960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // We set val = val + (val << 8) below and use 16 bit shuffle. 2190fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kSignedHalf: 2191fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell case kUnsignedHalf: 2192fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Handles low quadword. 2193fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell op_low = kX86PshuflwRRI; 2194fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Handles upper quadword. 2195fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell op_high = kX86PshufdRRI; 2196fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2197fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell default: 2198fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell LOG(FATAL) << "Unsupported vector set " << opsize; 2199fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell break; 2200fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2201fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2202fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell RegLocation rl_src = mir_graph_->GetSrc(mir, 0); 220360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 220460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // Load the value from the VR into the reg. 
220560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (rl_src.wide == 0) { 220660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_src = LoadValue(rl_src, reg_type); 220760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } else { 220860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji rl_src = LoadValueWide(rl_src, reg_type); 220960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 221060bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji 221160bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // If opsize is 8 bits wide then double value and use 16 bit shuffle instead. 221260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji if (opsize == kSignedByte || opsize == kUnsignedByte) { 221360bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji RegStorage temp = AllocTemp(); 221460bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji // val = val + (val << 8). 221560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Mov32RR, temp.GetReg(), rl_src.reg.GetReg()); 221660bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Sal32RI, temp.GetReg(), 8); 221760bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(kX86Or32RR, rl_src.reg.GetReg(), temp.GetReg()); 221860bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji FreeTemp(temp); 221960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji } 2220fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2221fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Load the value into the XMM register. 222260bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR2(op_mov, rs_dest.GetReg(), rl_src.reg.GetReg()); 2223fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2224fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // Now shuffle the value across the destination. 
222560bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(op_low, rs_dest.GetReg(), rs_dest.GetReg(), imm); 2226fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2227fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell // And then repeat as needed. 2228fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell if (op_high != 0) { 222960bfe7b3e8f00f0a8ef3f5d8716adfdf86b71f43Udayan Banerji NewLIR3(op_high, rs_dest.GetReg(), rs_dest.GetReg(), imm); 2230fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell } 2231fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell} 2232fe94578b63380f464c3abd5c156b7b31d068db6cMark Mendell 2233d65c51a556e6649db4e18bd083c8fec37607a442Mark MendellLIR *X86Mir2Lir::ScanVectorLiteral(MIR *mir) { 2234d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell int *args = reinterpret_cast<int*>(mir->dalvikInsn.arg); 2235d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell for (LIR *p = const_vectors_; p != nullptr; p = p->next) { 2236d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (args[0] == p->operands[0] && args[1] == p->operands[1] && 2237d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell args[2] == p->operands[2] && args[3] == p->operands[3]) { 2238d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell return p; 2239d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 2240d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 2241d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell return nullptr; 2242d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 2243d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 2244d65c51a556e6649db4e18bd083c8fec37607a442Mark MendellLIR *X86Mir2Lir::AddVectorLiteral(MIR *mir) { 2245d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell LIR* new_value = static_cast<LIR*>(arena_->Alloc(sizeof(LIR), kArenaAllocData)); 2246d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell int *args = reinterpret_cast<int*>(mir->dalvikInsn.arg); 2247d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 
new_value->operands[0] = args[0]; 2248d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->operands[1] = args[1]; 2249d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->operands[2] = args[2]; 2250d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->operands[3] = args[3]; 2251d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell new_value->next = const_vectors_; 2252d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell if (const_vectors_ == nullptr) { 2253d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell estimated_native_code_size_ += 12; // Amount needed to align to 16 byte boundary. 2254d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell } 2255d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell estimated_native_code_size_ += 16; // Space for one vector. 2256d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell const_vectors_ = new_value; 2257d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell return new_value; 2258d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell} 2259d65c51a556e6649db4e18bd083c8fec37607a442Mark Mendell 226058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko// ------------ ABI support: mapping of args to physical registers ------------- 2261ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas GampeRegStorage X86Mir2Lir::InToRegStorageX86_64Mapper::GetNextReg(bool is_double_or_float, bool is_wide, 2262ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe bool is_ref) { 2263a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu const SpecialTargetRegister coreArgMappingToPhysicalReg[] = {kArg1, kArg2, kArg3, kArg4, kArg5}; 2264ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe const int coreArgMappingToPhysicalRegSize = sizeof(coreArgMappingToPhysicalReg) / 2265ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe sizeof(SpecialTargetRegister); 2266a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu const SpecialTargetRegister fpArgMappingToPhysicalReg[] = {kFArg0, kFArg1, kFArg2, kFArg3, 
2267ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe kFArg4, kFArg5, kFArg6, kFArg7}; 2268ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe const int fpArgMappingToPhysicalRegSize = sizeof(fpArgMappingToPhysicalReg) / 2269ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe sizeof(SpecialTargetRegister); 227058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 227158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (is_double_or_float) { 227258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (cur_fp_reg_ < fpArgMappingToPhysicalRegSize) { 2273ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe return ml_->TargetReg(fpArgMappingToPhysicalReg[cur_fp_reg_++], is_wide ? kWide : kNotWide); 227458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 227558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 227658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (cur_core_reg_ < coreArgMappingToPhysicalRegSize) { 2277ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe return ml_->TargetReg(coreArgMappingToPhysicalReg[cur_core_reg_++], 2278ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe is_ref ? kRef : (is_wide ? kWide : kNotWide)); 227958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 228058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 2281a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu return RegStorage::InvalidReg(); 228258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 228358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 228458994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage X86Mir2Lir::InToRegStorageMapping::Get(int in_position) { 228558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko DCHECK(IsInitialized()); 228658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko auto res = mapping_.find(in_position); 228758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return res != mapping_.end() ? 
res->second : RegStorage::InvalidReg(); 228858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 228958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 2290ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampevoid X86Mir2Lir::InToRegStorageMapping::Initialize(RegLocation* arg_locs, int count, 2291ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe InToRegStorageMapper* mapper) { 229258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko DCHECK(mapper != nullptr); 229358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko max_mapped_in_ = -1; 229458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko is_there_stack_mapped_ = false; 229558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko for (int in_position = 0; in_position < count; in_position++) { 2296407a9d2847161b843966a443b71760b1280bd396Serguei Katkov RegStorage reg = mapper->GetNextReg(arg_locs[in_position].fp, 2297407a9d2847161b843966a443b71760b1280bd396Serguei Katkov arg_locs[in_position].wide, arg_locs[in_position].ref); 229858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (reg.Valid()) { 229958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko mapping_[in_position] = reg; 230058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko max_mapped_in_ = std::max(max_mapped_in_, in_position); 2301407a9d2847161b843966a443b71760b1280bd396Serguei Katkov if (arg_locs[in_position].wide) { 230258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // We covered 2 args, so skip the next one 230358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko in_position++; 230458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 230558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 230658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko is_there_stack_mapped_ = true; 230758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 230858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 
230958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko initialized_ = true; 231058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 231158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 231258994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage X86Mir2Lir::GetArgMappingToPhysicalReg(int arg_num) { 2313dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) { 231458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return GetCoreArgMappingToPhysicalReg(arg_num); 231558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 231658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 231758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (!in_to_reg_storage_mapping_.IsInitialized()) { 231858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int start_vreg = cu_->num_dalvik_registers - cu_->num_ins; 231958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation* arg_locs = &mir_graph_->reg_location_[start_vreg]; 232058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 2321a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu InToRegStorageX86_64Mapper mapper(this); 232258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko in_to_reg_storage_mapping_.Initialize(arg_locs, cu_->num_ins, &mapper); 232358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 232458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return in_to_reg_storage_mapping_.Get(arg_num); 232558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 232658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 232758994cdb00b323339bd83828eddc53976048006fDmitry PetrochenkoRegStorage X86Mir2Lir::GetCoreArgMappingToPhysicalReg(int core_arg_num) { 232858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // For the 32-bit internal ABI, the first 3 arguments are passed in registers. 
232958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Not used for 64-bit, TODO: Move X86_32 to the same framework 233058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko switch (core_arg_num) { 233158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case 0: 233258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return rs_rX86_ARG1; 233358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case 1: 233458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return rs_rX86_ARG2; 233558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko case 2: 233658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return rs_rX86_ARG3; 233758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko default: 233858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return RegStorage::InvalidReg(); 233958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 234058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 234158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 234258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko// ---------End of ABI support: mapping of args to physical registers ------------- 234358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 234458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko/* 234558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * If there are any ins passed in registers that have not been promoted 234658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * to a callee-save register, flush them to the frame. Perform initial 234758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * assignment of promoted arguments. 234858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * 234958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * ArgLocs is an array of location records describing the incoming arguments 235058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * with one location record per word of argument. 
235158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 235258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenkovoid X86Mir2Lir::FlushIns(RegLocation* ArgLocs, RegLocation rl_method) { 2353dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) return Mir2Lir::FlushIns(ArgLocs, rl_method); 235458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* 235558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Dummy up a RegLocation for the incoming Method* 235658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * It will attempt to keep kArg0 live (or copy it to home location 235758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * if promoted). 235858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 235958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 236058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation rl_src = rl_method; 236158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rl_src.location = kLocPhysReg; 2362ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe rl_src.reg = TargetReg(kArg0, kRef); 236358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rl_src.home = false; 236458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko MarkLive(rl_src); 236558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko StoreValue(rl_method, rl_src); 236658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // If Method* has been promoted, explicitly flush 236758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (rl_method.location == kLocPhysReg) { 2368ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe StoreRefDisp(rs_rX86_SP, 0, As32BitReg(TargetReg(kArg0, kRef)), kNotVolatile); 236958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 237058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 237158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (cu_->num_ins == 0) { 
237258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return; 237358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 237458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 237558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int start_vreg = cu_->num_dalvik_registers - cu_->num_ins; 237658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* 237758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Copy incoming arguments to their proper home locations. 237858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * NOTE: an older version of dx had an issue in which 237958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * it would reuse static method argument registers. 238058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * This could result in the same Dalvik virtual register 238158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * being promoted to both core and fp regs. To account for this, 238258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * we only copy to the corresponding promoted physical register 238358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * if it matches the type of the SSA name for the incoming 238458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * argument. It is also possible that long and double arguments 238558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * end up half-promoted. In those cases, we must flush the promoted 238658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * half to memory as well. 
238758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 23888dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 238958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko for (int i = 0; i < cu_->num_ins; i++) { 239058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // get reg corresponding to input 23914d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko RegStorage reg = GetArgMappingToPhysicalReg(i); 239258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 23934d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko RegLocation* t_loc = &ArgLocs[i]; 239458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (reg.Valid()) { 23954d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // If arriving in register. 239658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 23974d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // We have already updated the arg location with promoted info 23984d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // so we can be based on it. 23994d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->location == kLocPhysReg) { 24004d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // Just copy it. 24014d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko OpRegCopy(t_loc->reg, reg); 24024d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko } else { 24034d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // Needs flush. 24044d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->ref) { 2405a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreRefDisp(rs_rX86_SP, SRegOffset(start_vreg + i), reg, kNotVolatile); 240658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 2407a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, SRegOffset(start_vreg + i), reg, t_loc->wide ? 
k64 : k32, 24084d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko kNotVolatile); 240958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 241058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 241158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 24124d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // If arriving in frame & promoted. 24134d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->location == kLocPhysReg) { 24144d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->ref) { 2415a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu LoadRefDisp(rs_rX86_SP, SRegOffset(start_vreg + i), t_loc->reg, kNotVolatile); 24164d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko } else { 2417a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu LoadBaseDisp(rs_rX86_SP, SRegOffset(start_vreg + i), t_loc->reg, 24184d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko t_loc->wide ? k64 : k32, kNotVolatile); 24194d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko } 242058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 242158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 24224d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko if (t_loc->wide) { 24234d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko // Increment i to skip the next one. 24244d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko i++; 24254d5d794382cd6d3a25392d17543d5987e432d314Dmitry Petrochenko } 242658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 242758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 242858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 242958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko/* 243058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Load up to 5 arguments, the first three of which will be in 243158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * kArg1 .. kArg3. 
On entry kArg0 contains the current method pointer, 243258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * and as part of the load sequence, it must be replaced with 243358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * the target method pointer. Note, this may also be called 243458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * for "range" variants if the number of arguments is 5 or fewer. 243558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 243658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenkoint X86Mir2Lir::GenDalvikArgsNoRange(CallInfo* info, 243758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int call_state, LIR** pcrLabel, NextCallInsn next_call_insn, 243858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const MethodReference& target_method, 243958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko uint32_t vtable_idx, uintptr_t direct_code, 244058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko uintptr_t direct_method, InvokeType type, bool skip_this) { 2441dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) { 244258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return Mir2Lir::GenDalvikArgsNoRange(info, 244358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state, pcrLabel, next_call_insn, 244458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko target_method, 244558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko vtable_idx, direct_code, 244658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko direct_method, type, skip_this); 244758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 244858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return GenDalvikArgsRange(info, 244958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state, pcrLabel, next_call_insn, 245058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko target_method, 
245158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko vtable_idx, direct_code, 245258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko direct_method, type, skip_this); 245358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 245458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 245558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko/* 245658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * May have 0+ arguments (also used for jumbo). Note that 245758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * source virtual registers may be in physical registers, so may 245858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * need to be flushed to home location before copying. This 245958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * applies to arg3 and above (see below). 246058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * 246158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Two general strategies: 246258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * If < 20 arguments 246358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Pass args 3-18 using vldm/vstm block copy 246458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Pass arg0, arg1 & arg2 in kArg1-kArg3 246558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * If 20+ arguments 246658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Pass args arg19+ using memcpy block copy 246758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * Pass arg0, arg1 & arg2 in kArg1-kArg3 246858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * 246958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 247058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenkoint X86Mir2Lir::GenDalvikArgsRange(CallInfo* info, int call_state, 247158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR** pcrLabel, NextCallInsn next_call_insn, 
247258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const MethodReference& target_method, 247358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko uint32_t vtable_idx, uintptr_t direct_code, uintptr_t direct_method, 247458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko InvokeType type, bool skip_this) { 2475dd64450b37776f68b9bfc47f8d9a88bc72c95727Elena Sayapina if (!cu_->target64) { 247658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return Mir2Lir::GenDalvikArgsRange(info, call_state, 247758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko pcrLabel, next_call_insn, 247858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko target_method, 247958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko vtable_idx, direct_code, direct_method, 248058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko type, skip_this); 248158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 248258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 248358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* If no arguments, just return */ 248458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (info->num_arg_words == 0) 248558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return call_state; 248658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 248758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const int start_index = skip_this ? 
1 : 0; 248858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 2489a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu InToRegStorageX86_64Mapper mapper(this); 249058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko InToRegStorageMapping in_to_reg_storage_mapping; 249158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko in_to_reg_storage_mapping.Initialize(info->args, info->num_arg_words, &mapper); 249258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const int last_mapped_in = in_to_reg_storage_mapping.GetMaxMappedIn(); 249358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko const int size_of_the_last_mapped = last_mapped_in == -1 ? 1 : 24948e3acdd132aef1391676a5db2696804900aacd8eSerguei Katkov info->args[last_mapped_in].wide ? 2 : 1; 249558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int regs_left_to_pass_via_stack = info->num_arg_words - (last_mapped_in + size_of_the_last_mapped); 249658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 249758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Fisrt of all, check whether it make sense to use bulk copying 249858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Optimization is aplicable only for range case 249958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // TODO: make a constant instead of 2 250058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (info->is_range && regs_left_to_pass_via_stack >= 2) { 250158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Scan the rest of the args - if in phys_reg flush to memory 250258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko for (int next_arg = last_mapped_in + size_of_the_last_mapped; next_arg < info->num_arg_words;) { 250358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation loc = info->args[next_arg]; 250458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (loc.wide) { 250558994cdb00b323339bd83828eddc53976048006fDmitry 
Petrochenko loc = UpdateLocWide(loc); 250658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (loc.location == kLocPhysReg) { 25078dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 2508a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, SRegOffset(loc.s_reg_low), loc.reg, k64, kNotVolatile); 250958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 251058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko next_arg += 2; 251158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 251258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko loc = UpdateLoc(loc); 251358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (loc.location == kLocPhysReg) { 25148dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 2515a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, SRegOffset(loc.s_reg_low), loc.reg, k32, kNotVolatile); 251658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 251758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko next_arg++; 251858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 251958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 252058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 252158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Logic below assumes that Method pointer is at offset zero from SP. 
252258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko DCHECK_EQ(VRegOffset(static_cast<int>(kVRegMethodPtrBaseReg)), 0); 252358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 252458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // The rest can be copied together 252558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int start_offset = SRegOffset(info->args[last_mapped_in + size_of_the_last_mapped].s_reg_low); 2526ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe int outs_offset = StackVisitor::GetOutVROffset(last_mapped_in + size_of_the_last_mapped, 2527ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe cu_->instruction_set); 252858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 252958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int current_src_offset = start_offset; 253058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int current_dest_offset = outs_offset; 253158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 25328dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko // Only davik regs are accessed in this loop; no next_call_insn() calls. 25338dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 253458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko while (regs_left_to_pass_via_stack > 0) { 253558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // This is based on the knowledge that the stack itself is 16-byte aligned. 
253658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bool src_is_16b_aligned = (current_src_offset & 0xF) == 0; 253758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bool dest_is_16b_aligned = (current_dest_offset & 0xF) == 0; 253858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko size_t bytes_to_move; 253958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 254058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* 254158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * The amount to move defaults to 32-bit. If there are 4 registers left to move, then do a 254258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * a 128-bit move because we won't get the chance to try to aligned. If there are more than 254358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * 4 registers left to move, consider doing a 128-bit only if either src or dest are aligned. 254458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * We do this because we could potentially do a smaller move to align. 254558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 254658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (regs_left_to_pass_via_stack == 4 || 254758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko (regs_left_to_pass_via_stack > 4 && (src_is_16b_aligned || dest_is_16b_aligned))) { 254858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Moving 128-bits via xmm register. 254958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bytes_to_move = sizeof(uint32_t) * 4; 255058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 255158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Allocate a free xmm temp. Since we are working through the calling sequence, 255258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // we expect to have an xmm temporary available. 
AllocTempDouble will abort if 255358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // there are no free registers. 255458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegStorage temp = AllocTempDouble(); 255558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 255658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR* ld1 = nullptr; 255758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR* ld2 = nullptr; 255858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR* st1 = nullptr; 255958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LIR* st2 = nullptr; 256058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 256158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko /* 256258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * The logic is similar for both loads and stores. If we have 16-byte alignment, 256358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * do an aligned move. If we have 8-byte alignment, then do the move in two 256458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * parts. This approach prevents possible cache line splits. Finally, fall back 256558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * to doing an unaligned move. In most cases we likely won't split the cache 256658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko * line but we cannot prove it and thus take a conservative approach. 
256758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko */ 256858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bool src_is_8b_aligned = (current_src_offset & 0x7) == 0; 256958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bool dest_is_8b_aligned = (current_dest_offset & 0x7) == 0; 257058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 25718dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 257258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (src_is_16b_aligned) { 2573a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu ld1 = OpMovRegMem(temp, rs_rX86_SP, current_src_offset, kMovA128FP); 257458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else if (src_is_8b_aligned) { 2575a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu ld1 = OpMovRegMem(temp, rs_rX86_SP, current_src_offset, kMovLo128FP); 2576a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu ld2 = OpMovRegMem(temp, rs_rX86_SP, current_src_offset + (bytes_to_move >> 1), 257758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko kMovHi128FP); 257858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 2579a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu ld1 = OpMovRegMem(temp, rs_rX86_SP, current_src_offset, kMovU128FP); 258058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 258158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 258258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (dest_is_16b_aligned) { 2583a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu st1 = OpMovMemReg(rs_rX86_SP, current_dest_offset, temp, kMovA128FP); 258458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else if (dest_is_8b_aligned) { 2585a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu st1 = OpMovMemReg(rs_rX86_SP, current_dest_offset, temp, kMovLo128FP); 2586a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu st2 = OpMovMemReg(rs_rX86_SP, 
current_dest_offset + (bytes_to_move >> 1), 258758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko temp, kMovHi128FP); 258858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 2589a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu st1 = OpMovMemReg(rs_rX86_SP, current_dest_offset, temp, kMovU128FP); 259058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 259158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 259258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // TODO If we could keep track of aliasing information for memory accesses that are wider 259358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // than 64-bit, we wouldn't need to set up a barrier. 259458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (ld1 != nullptr) { 259558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (ld2 != nullptr) { 259658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // For 64-bit load we can actually set up the aliasing information. 259758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko AnnotateDalvikRegAccess(ld1, current_src_offset >> 2, true, true); 259858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko AnnotateDalvikRegAccess(ld2, (current_src_offset + (bytes_to_move >> 1)) >> 2, true, true); 259958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 260058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Set barrier for 128-bit load. 
26018dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ld1->u.m.def_mask = &kEncodeAll; 260258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 260358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 260458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (st1 != nullptr) { 260558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (st2 != nullptr) { 260658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // For 64-bit store we can actually set up the aliasing information. 260758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko AnnotateDalvikRegAccess(st1, current_dest_offset >> 2, false, true); 260858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko AnnotateDalvikRegAccess(st2, (current_dest_offset + (bytes_to_move >> 1)) >> 2, false, true); 260958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 261058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Set barrier for 128-bit store. 26118dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko st1->u.m.def_mask = &kEncodeAll; 261258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 261358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 261458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 261558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Free the temporary used for the data movement. 261658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(temp); 261758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 261858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Moving 32-bits via general purpose register. 
261958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko bytes_to_move = sizeof(uint32_t); 262058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 262158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Instead of allocating a new temp, simply reuse one of the registers being used 262258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // for argument passing. 2623ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe RegStorage temp = TargetReg(kArg3, kNotWide); 262458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 262558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Now load the argument VR and store to the outs. 2626a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu Load32Disp(rs_rX86_SP, current_src_offset, temp); 2627a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu Store32Disp(rs_rX86_SP, current_dest_offset, temp); 262858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 262958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 263058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko current_src_offset += bytes_to_move; 263158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko current_dest_offset += bytes_to_move; 263258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko regs_left_to_pass_via_stack -= (bytes_to_move >> 2); 263358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 263458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko DCHECK_EQ(regs_left_to_pass_via_stack, 0); 263558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 263658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 263758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Now handle rest not registers if they are 263858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (in_to_reg_storage_mapping.IsThereStackMapped()) { 2639ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe RegStorage regSingle = TargetReg(kArg2, kNotWide); 
2640ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe RegStorage regWide = TargetReg(kArg3, kWide); 2641b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu for (int i = start_index; 2642b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu i < last_mapped_in + size_of_the_last_mapped + regs_left_to_pass_via_stack; i++) { 264358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation rl_arg = info->args[i]; 264458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rl_arg = UpdateRawLoc(rl_arg); 264558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegStorage reg = in_to_reg_storage_mapping.Get(i); 264658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (!reg.Valid()) { 264758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko int out_offset = StackVisitor::GetOutVROffset(i, cu_->instruction_set); 264858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 26498dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko { 26508dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko ScopedMemRefType mem_ref_type(this, ResourceMask::kDalvikReg); 26518dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (rl_arg.wide) { 26528dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (rl_arg.location == kLocPhysReg) { 2653a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, out_offset, rl_arg.reg, k64, kNotVolatile); 26548dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } else { 26558dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko LoadValueDirectWideFixed(rl_arg, regWide); 2656a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, out_offset, regWide, k64, kNotVolatile); 26578dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } 265858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 26598dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko if (rl_arg.location == kLocPhysReg) { 2660a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu 
StoreBaseDisp(rs_rX86_SP, out_offset, rl_arg.reg, k32, kNotVolatile); 26618dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } else { 26628dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko LoadValueDirectFixed(rl_arg, regSingle); 2663a77ee5103532abb197f492c14a9e6fb437054e2aChao-ying Fu StoreBaseDisp(rs_rX86_SP, out_offset, regSingle, k32, kNotVolatile); 26648dea81ca9c0201ceaa88086b927a5838a06a3e69Vladimir Marko } 266558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 266658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 266758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state = next_call_insn(cu_, info, call_state, target_method, 266858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko vtable_idx, direct_code, direct_method, type); 266958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 2670b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu if (rl_arg.wide) { 2671b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu i++; 2672b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu } 267358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 267458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 267558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 267658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // Finish with mapped registers 267758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko for (int i = start_index; i <= last_mapped_in; i++) { 267858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegLocation rl_arg = info->args[i]; 267958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko rl_arg = UpdateRawLoc(rl_arg); 268058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegStorage reg = in_to_reg_storage_mapping.Get(i); 268158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (reg.Valid()) { 268258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (rl_arg.wide) { 268358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 
LoadValueDirectWideFixed(rl_arg, reg); 268458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 268558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko LoadValueDirectFixed(rl_arg, reg); 268658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 268758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state = next_call_insn(cu_, info, call_state, target_method, vtable_idx, 268858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko direct_code, direct_method, type); 268958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 2690b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu if (rl_arg.wide) { 2691b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu i++; 2692b6564c19c5e14a3caa3f8da423b0da510fda7026Chao-ying Fu } 269358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 269458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 269558994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko call_state = next_call_insn(cu_, info, call_state, target_method, vtable_idx, 269658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko direct_code, direct_method, type); 269758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko if (pcrLabel) { 269869dfe51b684dd9d510dbcb63295fe180f998efdeDave Allison if (!cu_->compiler_driver->GetCompilerOptions().GetImplicitNullChecks()) { 2699ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe *pcrLabel = GenExplicitNullCheck(TargetReg(kArg1, kRef), info->opt_flags); 270058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } else { 270158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko *pcrLabel = nullptr; 270258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // In lieu of generating a check for kArg1 being null, we need to 270358994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko // perform a load when doing implicit checks. 
270458994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko RegStorage tmp = AllocTemp(); 2705ccc60264229ac96d798528d2cb7dbbdd0deca993Andreas Gampe Load32Disp(TargetReg(kArg1, kRef), 0, tmp); 270658994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko MarkPossibleNullPointerException(info->opt_flags); 270758994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko FreeTemp(tmp); 270858994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 270958994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko } 271058994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko return call_state; 271158994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko} 271258994cdb00b323339bd83828eddc53976048006fDmitry Petrochenko 2713984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampebool X86Mir2Lir::GenInlinedCharAt(CallInfo* info) { 2714984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Location of reference to data array 2715984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe int value_offset = mirror::String::ValueOffset().Int32Value(); 2716984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Location of count 2717984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe int count_offset = mirror::String::CountOffset().Int32Value(); 2718984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Starting offset within data array 2719984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe int offset_offset = mirror::String::OffsetOffset().Int32Value(); 2720984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Start of char data with array_ 2721984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe int data_offset = mirror::Array::DataOffset(sizeof(uint16_t)).Int32Value(); 2722984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe 2723984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegLocation rl_obj = info->args[0]; 2724984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegLocation rl_idx = info->args[1]; 2725984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas 
Gampe rl_obj = LoadValue(rl_obj, kRefReg); 2726984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // X86 wants to avoid putting a constant index into a register. 2727984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (!rl_idx.is_const) { 2728984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe rl_idx = LoadValue(rl_idx, kCoreReg); 2729984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2730984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegStorage reg_max; 2731984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe GenNullCheck(rl_obj.reg, info->opt_flags); 2732984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe bool range_check = (!(info->opt_flags & MIR_IGNORE_RANGE_CHECK)); 2733984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe LIR* range_check_branch = nullptr; 2734984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegStorage reg_off; 2735984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegStorage reg_ptr; 2736984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (range_check) { 2737984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // On x86, we can compare to memory directly 2738984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe // Set up a launch pad to allow retry in case of bounds violation */ 2739984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (rl_idx.is_const) { 2740984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe LIR* comparison; 2741984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe range_check_branch = OpCmpMemImmBranch( 2742984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe kCondUlt, RegStorage::InvalidReg(), rl_obj.reg, count_offset, 2743984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe mir_graph_->ConstantValue(rl_idx.orig_sreg), nullptr, &comparison); 2744984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe MarkPossibleNullPointerExceptionAfter(0, comparison); 2745984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } else { 2746984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe 
OpRegMem(kOpCmp, rl_idx.reg, rl_obj.reg, count_offset); 2747984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe MarkPossibleNullPointerException(0); 2748984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe range_check_branch = OpCondBranch(kCondUge, nullptr); 2749984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2750984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2751984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe reg_off = AllocTemp(); 2752984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe reg_ptr = AllocTempRef(); 2753984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe Load32Disp(rl_obj.reg, offset_offset, reg_off); 2754984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe LoadRefDisp(rl_obj.reg, value_offset, reg_ptr, kNotVolatile); 2755984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (rl_idx.is_const) { 2756984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe OpRegImm(kOpAdd, reg_off, mir_graph_->ConstantValue(rl_idx.orig_sreg)); 2757984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } else { 2758984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe OpRegReg(kOpAdd, reg_off, rl_idx.reg); 2759984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2760984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe FreeTemp(rl_obj.reg); 2761984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (rl_idx.location == kLocPhysReg) { 2762984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe FreeTemp(rl_idx.reg); 2763984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2764984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegLocation rl_dest = InlineTarget(info); 2765984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe RegLocation rl_result = EvalLoc(rl_dest, kCoreReg, true); 2766984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe LoadBaseIndexedDisp(reg_ptr, reg_off, 1, data_offset, rl_result.reg, kUnsignedHalf); 2767984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe FreeTemp(reg_off); 
2768984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe FreeTemp(reg_ptr); 2769984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe StoreValue(rl_dest, rl_result); 2770984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe if (range_check) { 2771984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe DCHECK(range_check_branch != nullptr); 2772984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe info->opt_flags |= MIR_IGNORE_NULL_CHECK; // Record that we've already null checked. 2773984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe AddIntrinsicSlowPath(info, range_check_branch); 2774984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe } 2775984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe return true; 2776984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe} 2777984305917bf57b3f8d92965e4715a0370cc5bcfbAndreas Gampe 27787934ac288acfb2552bb0b06ec1f61e5820d924a4Brian Carlstrom} // namespace art 2779