regexp-macro-assembler-x64.h revision eab96aab0834f21954b5d6aa6366bcfb348ed811
1// Copyright 2009 the V8 project authors. All rights reserved. 2// Redistribution and use in source and binary forms, with or without 3// modification, are permitted provided that the following conditions are 4// met: 5// 6// * Redistributions of source code must retain the above copyright 7// notice, this list of conditions and the following disclaimer. 8// * Redistributions in binary form must reproduce the above 9// copyright notice, this list of conditions and the following 10// disclaimer in the documentation and/or other materials provided 11// with the distribution. 12// * Neither the name of Google Inc. nor the names of its 13// contributors may be used to endorse or promote products derived 14// from this software without specific prior written permission. 15// 16// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 17// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 18// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 19// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 20// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 21// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 22// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 23// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 24// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 25// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 26// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 27 28#ifndef V8_X64_REGEXP_MACRO_ASSEMBLER_X64_H_ 29#define V8_X64_REGEXP_MACRO_ASSEMBLER_X64_H_ 30 31namespace v8 { 32namespace internal { 33 34#ifdef V8_NATIVE_REGEXP 35 36class RegExpMacroAssemblerX64: public NativeRegExpMacroAssembler { 37 public: 38 RegExpMacroAssemblerX64(Mode mode, int registers_to_save); 39 virtual ~RegExpMacroAssemblerX64(); 40 virtual int stack_limit_slack(); 41 virtual void AdvanceCurrentPosition(int by); 42 virtual void AdvanceRegister(int reg, int by); 43 virtual void Backtrack(); 44 virtual void Bind(Label* label); 45 virtual void CheckAtStart(Label* on_at_start); 46 virtual void CheckCharacter(uint32_t c, Label* on_equal); 47 virtual void CheckCharacterAfterAnd(uint32_t c, 48 uint32_t mask, 49 Label* on_equal); 50 virtual void CheckCharacterGT(uc16 limit, Label* on_greater); 51 virtual void CheckCharacterLT(uc16 limit, Label* on_less); 52 virtual void CheckCharacters(Vector<const uc16> str, 53 int cp_offset, 54 Label* on_failure, 55 bool check_end_of_string); 56 // A "greedy loop" is a loop that is both greedy and with a simple 57 // body. It has a particularly simple implementation. 58 virtual void CheckGreedyLoop(Label* on_tos_equals_current_position); 59 virtual void CheckNotAtStart(Label* on_not_at_start); 60 virtual void CheckNotBackReference(int start_reg, Label* on_no_match); 61 virtual void CheckNotBackReferenceIgnoreCase(int start_reg, 62 Label* on_no_match); 63 virtual void CheckNotRegistersEqual(int reg1, int reg2, Label* on_not_equal); 64 virtual void CheckNotCharacter(uint32_t c, Label* on_not_equal); 65 virtual void CheckNotCharacterAfterAnd(uint32_t c, 66 uint32_t mask, 67 Label* on_not_equal); 68 virtual void CheckNotCharacterAfterMinusAnd(uc16 c, 69 uc16 minus, 70 uc16 mask, 71 Label* on_not_equal); 72 // Checks whether the given offset from the current position is before 73 // the end of the string. 74 virtual void CheckPosition(int cp_offset, Label* on_outside_input); 75 virtual bool CheckSpecialCharacterClass(uc16 type, 76 Label* on_no_match); 77 virtual void Fail(); 78 virtual Handle<Object> GetCode(Handle<String> source); 79 virtual void GoTo(Label* label); 80 virtual void IfRegisterGE(int reg, int comparand, Label* if_ge); 81 virtual void IfRegisterLT(int reg, int comparand, Label* if_lt); 82 virtual void IfRegisterEqPos(int reg, Label* if_eq); 83 virtual IrregexpImplementation Implementation(); 84 virtual void LoadCurrentCharacter(int cp_offset, 85 Label* on_end_of_input, 86 bool check_bounds = true, 87 int characters = 1); 88 virtual void PopCurrentPosition(); 89 virtual void PopRegister(int register_index); 90 virtual void PushBacktrack(Label* label); 91 virtual void PushCurrentPosition(); 92 virtual void PushRegister(int register_index, 93 StackCheckFlag check_stack_limit); 94 virtual void ReadCurrentPositionFromRegister(int reg); 95 virtual void ReadStackPointerFromRegister(int reg); 96 virtual void SetRegister(int register_index, int to); 97 virtual void Succeed(); 98 virtual void WriteCurrentPositionToRegister(int reg, int cp_offset); 99 virtual void ClearRegisters(int reg_from, int reg_to); 100 virtual void WriteStackPointerToRegister(int reg); 101 102 static Result Match(Handle<Code> regexp, 103 Handle<String> subject, 104 int* offsets_vector, 105 int offsets_vector_length, 106 int previous_index); 107 108 static Result Execute(Code* code, 109 String* input, 110 int start_offset, 111 const byte* input_start, 112 const byte* input_end, 113 int* output, 114 bool at_start); 115 116 // Called from RegExp if the stack-guard is triggered. 117 // If the code object is relocated, the return address is fixed before 118 // returning. 119 static int CheckStackGuardState(Address* return_address, 120 Code* re_code, 121 Address re_frame); 122 123 private: 124 // Offsets from rbp of function parameters and stored registers. 125 static const int kFramePointer = 0; 126 // Above the frame pointer - function parameters and return address. 127 static const int kReturn_eip = kFramePointer + kPointerSize; 128 static const int kFrameAlign = kReturn_eip + kPointerSize; 129 130#ifdef _WIN64 131 // Parameters (first four passed as registers, but with room on stack). 132 // In Microsoft 64-bit Calling Convention, there is room on the callers 133 // stack (before the return address) to spill parameter registers. We 134 // use this space to store the register passed parameters. 135 static const int kInputString = kFrameAlign; 136 // StartIndex is passed as 32 bit int. 137 static const int kStartIndex = kInputString + kPointerSize; 138 static const int kInputStart = kStartIndex + kPointerSize; 139 static const int kInputEnd = kInputStart + kPointerSize; 140 static const int kRegisterOutput = kInputEnd + kPointerSize; 141 // AtStart is passed as 32 bit int (values 0 or 1). 142 static const int kAtStart = kRegisterOutput + kPointerSize; 143 static const int kStackHighEnd = kAtStart + kPointerSize; 144 // DirectCall is passed as 32 bit int (values 0 or 1). 145 static const int kDirectCall = kStackHighEnd + kPointerSize; 146#else 147 // In AMD64 ABI Calling Convention, the first six integer parameters 148 // are passed as registers, and caller must allocate space on the stack 149 // if it wants them stored. We push the parameters after the frame pointer. 150 static const int kInputString = kFramePointer - kPointerSize; 151 static const int kStartIndex = kInputString - kPointerSize; 152 static const int kInputStart = kStartIndex - kPointerSize; 153 static const int kInputEnd = kInputStart - kPointerSize; 154 static const int kRegisterOutput = kInputEnd - kPointerSize; 155 static const int kAtStart = kRegisterOutput - kPointerSize; 156 static const int kStackHighEnd = kFrameAlign; 157 static const int kDirectCall = kStackHighEnd + kPointerSize; 158#endif 159 160#ifdef _WIN64 161 // Microsoft calling convention has three callee-saved registers 162 // (that we are using). We push these after the frame pointer. 163 static const int kBackup_rsi = kFramePointer - kPointerSize; 164 static const int kBackup_rdi = kBackup_rsi - kPointerSize; 165 static const int kBackup_rbx = kBackup_rdi - kPointerSize; 166 static const int kLastCalleeSaveRegister = kBackup_rbx; 167#else 168 // AMD64 Calling Convention has only one callee-save register that 169 // we use. We push this after the frame pointer (and after the 170 // parameters). 171 static const int kBackup_rbx = kAtStart - kPointerSize; 172 static const int kLastCalleeSaveRegister = kBackup_rbx; 173#endif 174 175 // When adding local variables remember to push space for them in 176 // the frame in GetCode. 177 static const int kInputStartMinusOne = 178 kLastCalleeSaveRegister - kPointerSize; 179 180 // First register address. Following registers are below it on the stack. 181 static const int kRegisterZero = kInputStartMinusOne - kPointerSize; 182 183 // Initial size of code buffer. 184 static const size_t kRegExpCodeSize = 1024; 185 186 // Load a number of characters at the given offset from the 187 // current position, into the current-character register. 188 void LoadCurrentCharacterUnchecked(int cp_offset, int character_count); 189 190 // Check whether preemption has been requested. 191 void CheckPreemption(); 192 193 // Check whether we are exceeding the stack limit on the backtrack stack. 194 void CheckStackLimit(); 195 196 // Generate a call to CheckStackGuardState. 197 void CallCheckStackGuardState(); 198 199 // The rbp-relative location of a regexp register. 200 Operand register_location(int register_index); 201 202 // The register containing the current character after LoadCurrentCharacter. 203 inline Register current_character() { return rdx; } 204 205 // The register containing the backtrack stack top. Provides a meaningful 206 // name to the register. 207 inline Register backtrack_stackpointer() { return rcx; } 208 209 // The registers containing a self pointer to this code's Code object. 210 inline Register code_object_pointer() { return r8; } 211 212 // Byte size of chars in the string to match (decided by the Mode argument) 213 inline int char_size() { return static_cast<int>(mode_); } 214 215 // Equivalent to a conditional branch to the label, unless the label 216 // is NULL, in which case it is a conditional Backtrack. 217 void BranchOrBacktrack(Condition condition, Label* to); 218 219 void MarkPositionForCodeRelativeFixup() { 220 code_relative_fixup_positions_.Add(masm_->pc_offset()); 221 } 222 223 void FixupCodeRelativePositions(); 224 225 // Call and return internally in the generated code in a way that 226 // is GC-safe (i.e., doesn't leave absolute code addresses on the stack) 227 inline void SafeCall(Label* to); 228 inline void SafeCallTarget(Label* label); 229 inline void SafeReturn(); 230 231 // Pushes the value of a register on the backtrack stack. Decrements the 232 // stack pointer (rcx) by a word size and stores the register's value there. 233 inline void Push(Register source); 234 235 // Pushes a value on the backtrack stack. Decrements the stack pointer (rcx) 236 // by a word size and stores the value there. 237 inline void Push(Immediate value); 238 239 // Pushes the Code object relative offset of a label on the backtrack stack 240 // (i.e., a backtrack target). Decrements the stack pointer (rcx) 241 // by a word size and stores the value there. 242 inline void Push(Label* label); 243 244 // Pops a value from the backtrack stack. Reads the word at the stack pointer 245 // (rcx) and increments it by a word size. 246 inline void Pop(Register target); 247 248 // Drops the top value from the backtrack stack without reading it. 249 // Increments the stack pointer (rcx) by a word size. 250 inline void Drop(); 251 252 // Before calling a C-function from generated code, align arguments on stack. 253 // After aligning the frame, arguments must be stored in esp[0], esp[4], 254 // etc., not pushed. The argument count assumes all arguments are word sized. 255 // Some compilers/platforms require the stack to be aligned when calling 256 // C++ code. 257 // Needs a scratch register to do some arithmetic. This register will be 258 // trashed. 259 inline void FrameAlign(int num_arguments); 260 261 // Calls a C function and cleans up the space for arguments allocated 262 // by FrameAlign. The called function is not allowed to trigger a garbage 263 // collection, since that might move the code and invalidate the return 264 // address (unless this is somehow accounted for by the called function). 265 inline void CallCFunction(ExternalReference function, int num_arguments); 266 267 MacroAssembler* masm_; 268 269 ZoneList<int> code_relative_fixup_positions_; 270 271 // Which mode to generate code for (ASCII or UC16). 272 Mode mode_; 273 274 // One greater than maximal register index actually used. 275 int num_registers_; 276 277 // Number of registers to output at the end (the saved registers 278 // are always 0..num_saved_registers_-1) 279 int num_saved_registers_; 280 281 // Labels used internally. 282 Label entry_label_; 283 Label start_label_; 284 Label success_label_; 285 Label backtrack_label_; 286 Label exit_label_; 287 Label check_preempt_label_; 288 Label stack_overflow_label_; 289}; 290 291#endif // V8_NATIVE_REGEXP 292 293}} // namespace v8::internal 294 295#endif // V8_X64_REGEXP_MACRO_ASSEMBLER_X64_H_ 296