CompilerTemplateAsm-armv5te-vfp.S revision 72e93344b4d1ffc71e9c832ec23de0657e5b04a5
1/*
2 * This file was generated automatically by gen-template.py for 'armv5te-vfp'.
3 *
4 * --> DO NOT EDIT <--
5 */
6
7/* File: armv5te/header.S */
8/*
9 * Copyright (C) 2008 The Android Open Source Project
10 *
11 * Licensed under the Apache License, Version 2.0 (the "License");
12 * you may not use this file except in compliance with the License.
13 * You may obtain a copy of the License at
14 *
15 *      http://www.apache.org/licenses/LICENSE-2.0
16 *
17 * Unless required by applicable law or agreed to in writing, software
18 * distributed under the License is distributed on an "AS IS" BASIS,
19 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
20 * See the License for the specific language governing permissions and
21 * limitations under the License.
22 */
23
24#if defined(WITH_JIT)
25
26/*
27 * ARMv5 definitions and declarations.
28 */
29
30/*
31ARM EABI general notes:
32
33r0-r3 hold first 4 args to a method; they are not preserved across method calls
34r4-r8 are available for general use
35r9 is given special treatment in some situations, but not for us
36r10 (sl) seems to be generally available
37r11 (fp) is used by gcc (unless -fomit-frame-pointer is set)
38r12 (ip) is scratch -- not preserved across method calls
39r13 (sp) should be managed carefully in case a signal arrives
40r14 (lr) must be preserved
41r15 (pc) can be tinkered with directly
42
43r0 holds returns of <= 4 bytes
44r0-r1 hold returns of 8 bytes, low word in r0
45
46Callee must save/restore r4+ (except r12) if it modifies them.
47
48Stack is "full descending".  Only the arguments that don't fit in the first 4
49registers are placed on the stack.  "sp" points at the first stacked argument
50(i.e. the 5th arg).
51
52VFP: single-precision results in s0, double-precision results in d0.
53
54In the EABI, "sp" must be 64-bit aligned on entry to a function, and any
5564-bit quantities (long long, double) must be 64-bit aligned.
56*/
57
58/*
59JIT and ARM notes:
60
61The following registers have fixed assignments:
62
63  reg nick      purpose
64  r5  rFP       interpreted frame pointer, used for accessing locals and args
65  r6  rGLUE     MterpGlue pointer
66
67The following registers have fixed assignments in mterp but are scratch
68registers in compiled code
69
70  reg nick      purpose
71  r4  rPC       interpreted program counter, used for fetching instructions
72  r7  rINST     first 16-bit code unit of current instruction
73  r8  rIBASE    interpreted instruction base pointer, used for computed goto
74
75Macros are provided for common operations.  Each macro MUST emit only
76one instruction to make instruction-counting easier.  They MUST NOT alter
77unspecified registers or condition codes.
78*/
79
80/* single-purpose registers, given names for clarity */
81#define rPC     r4
82#define rFP     r5
83#define rGLUE   r6
84#define rINST   r7
85#define rIBASE  r8
86
87/*
88 * Given a frame pointer, find the stack save area.
89 *
90 * In C this is "((StackSaveArea*)(_fp) -1)".
91 */
92#define SAVEAREA_FROM_FP(_reg, _fpreg) \
93    sub     _reg, _fpreg, #sizeofStackSaveArea
94
95/*
96 * This is a #include, not a %include, because we want the C pre-processor
97 * to expand the macros into assembler assignment statements.
98 */
99#include "../../../mterp/common/asm-constants.h"
100
101
102/* File: armv5te/platform.S */
103/*
104 * ===========================================================================
105 *  CPU-version-specific defines
106 * ===========================================================================
107 */
108
109/*
110 * Macro for "MOV LR,PC / LDR PC,xxx", which is not allowed pre-ARMv5.
111 * Jump to subroutine.
112 *
113 * May modify IP and LR.
114 */
115.macro  LDR_PC_LR source
116    mov     lr, pc
117    ldr     pc, \source
118.endm
119
120
121    .global dvmCompilerTemplateStart
122    .type   dvmCompilerTemplateStart, %function
123    .text
124
125dvmCompilerTemplateStart:
126
127/* ------------------------------ */
128    .balign 4
129    .global dvmCompiler_TEMPLATE_CMP_LONG
130dvmCompiler_TEMPLATE_CMP_LONG:
131/* File: armv5te/TEMPLATE_CMP_LONG.S */
132    /*
133     * Compare two 64-bit values.  Puts 0, 1, or -1 into the destination
134     * register based on the results of the comparison.
135     *
136     * We load the full values with LDM, but in practice many values could
137     * be resolved by only looking at the high word.  This could be made
138     * faster or slower by splitting the LDM into a pair of LDRs.
139     *
140     * If we just wanted to set condition flags, we could do this:
141     *  subs    ip, r0, r2
142     *  sbcs    ip, r1, r3
143     *  subeqs  ip, r0, r2
144     * Leaving { <0, 0, >0 } in ip.  However, we have to set it to a specific
145     * integer value, which we can do with 2 conditional mov/mvn instructions
146     * (set 1, set -1; if they're equal we already have 0 in ip), giving
147     * us a constant 5-cycle path plus a branch at the end to the
148     * instruction epilogue code.  The multi-compare approach below needs
149     * 2 or 3 cycles + branch if the high word doesn't match, 6 + branch
150     * in the worst case (the 64-bit values are equal).
151     */
152    /* cmp-long vAA, vBB, vCC */
153    cmp     r1, r3                      @ compare (vBB+1, vCC+1)
154    blt     .LTEMPLATE_CMP_LONG_less            @ signed compare on high part
155    bgt     .LTEMPLATE_CMP_LONG_greater
156    subs    r0, r0, r2                  @ r0<- r0 - r2
157    bxeq     lr
158    bhi     .LTEMPLATE_CMP_LONG_greater         @ unsigned compare on low part
159.LTEMPLATE_CMP_LONG_less:
160    mvn     r0, #0                      @ r0<- -1
161    bx      lr
162.LTEMPLATE_CMP_LONG_greater:
163    mov     r0, #1                      @ r0<- 1
164    bx      lr
165
166
167/* ------------------------------ */
168    .balign 4
169    .global dvmCompiler_TEMPLATE_RETURN
170dvmCompiler_TEMPLATE_RETURN:
171/* File: armv5te/TEMPLATE_RETURN.S */
172    /*
173     * Unwind a frame from the Dalvik stack for compiled OP_RETURN_XXX.
174     * If the stored value in returnAddr
175     * is non-zero, the caller is compiled by the JIT thus return to the
176     * address in the code cache following the invoke instruction. Otherwise
177     * return to the special dvmJitToInterpNoChain entry point.
178     */
179    SAVEAREA_FROM_FP(r0, rFP)           @ r0<- saveArea (old)
180    ldr     r10, [r0, #offStackSaveArea_prevFrame] @ r10<- saveArea->prevFrame
181    ldr     r8, [rGLUE, #offGlue_pSelfSuspendCount] @ r8<- &suspendCount
182    ldr     rPC, [r0, #offStackSaveArea_savedPc] @ rPC<- saveArea->savedPc
183    ldr     r9,  [r0, #offStackSaveArea_returnAddr] @ r9<- chaining cell ret
184    ldr     r2, [r10, #(offStackSaveArea_method - sizeofStackSaveArea)]
185                                        @ r2<- method we're returning to
186    ldr     r3, [rGLUE, #offGlue_self]  @ r3<- glue->self
187    cmp     r2, #0                      @ break frame?
188    beq     1f                          @ bail to interpreter
189    ldr     r0, .LdvmJitToInterpNoChain @ defined in footer.S
190    mov     rFP, r10                    @ publish new FP
191    ldrne   r10, [r2, #offMethod_clazz] @ r10<- method->clazz
192    ldr     r8, [r8]                    @ r8<- suspendCount
193
194    str     r2, [rGLUE, #offGlue_method]@ glue->method = newSave->method
195    ldr     r1, [r10, #offClassObject_pDvmDex] @ r1<- method->clazz->pDvmDex
196    str     rFP, [r3, #offThread_curFrame] @ self->curFrame = fp
197    add     rPC, rPC, #6                @ publish new rPC (advance 6 bytes)
198    str     r1, [rGLUE, #offGlue_methodClassDex]
199    cmp     r8, #0                      @ check the suspendCount
200    movne   r9, #0                      @ clear the chaining cell address
201    cmp     r9, #0                      @ chaining cell exists?
202    blxne   r9                          @ jump to the chaining cell
203    mov     pc, r0                      @ callsite is interpreted
2041:
205    stmia   rGLUE, {rPC, rFP}           @ SAVE_PC_FP_TO_GLUE()
206    ldr     r2, .LdvmMterpStdBail       @ defined in footer.S
207    mov     r1, #0                      @ changeInterp = false
208    mov     r0, rGLUE                   @ Expecting rGLUE in r0
209    blx     r2                          @ exit the interpreter
210
211/* ------------------------------ */
212    .balign 4
213    .global dvmCompiler_TEMPLATE_INVOKE_METHOD_NO_OPT
214dvmCompiler_TEMPLATE_INVOKE_METHOD_NO_OPT:
215/* File: armv5te/TEMPLATE_INVOKE_METHOD_NO_OPT.S */
216    /*
217     * For polymorphic callsites - setup the Dalvik frame and load Dalvik PC
218     * into rPC then jump to dvmJitToInterpNoChain to dispatch the
219     * runtime-resolved callee.
220     */
221    @ r0 = methodToCall, r1 = returnCell, rPC = dalvikCallsite
222    ldrh    r7, [r0, #offMethod_registersSize]  @ r7<- methodToCall->regsSize
223    ldrh    r2, [r0, #offMethod_outsSize]  @ r2<- methodToCall->outsSize
224    ldr     r9, [rGLUE, #offGlue_interpStackEnd]    @ r9<- interpStackEnd
225    ldr     r8, [rGLUE, #offGlue_pSelfSuspendCount] @ r8<- &suspendCount
226    add     r3, r1, #1  @ Thumb addr is odd
227    SAVEAREA_FROM_FP(r1, rFP)           @ r1<- stack save area
228    sub     r1, r1, r7, lsl #2          @ r1<- newFp (old savearea - regsSize)
229    SAVEAREA_FROM_FP(r10, r1)           @ r10<- stack save area
230    sub     r10, r10, r2, lsl #2        @ r10<- bottom (newsave - outsSize)
231    ldr     r8, [r8]                    @ r3<- suspendCount (int)
232    cmp     r10, r9                     @ bottom < interpStackEnd?
233    bxlt    lr                          @ return to raise stack overflow excep.
234    @ r1 = newFP, r0 = methodToCall, r3 = returnCell, rPC = dalvikCallsite
235    ldr     r9, [r0, #offMethod_clazz]      @ r9<- method->clazz
236    ldr     r10, [r0, #offMethod_accessFlags] @ r10<- methodToCall->accessFlags
237    str     rPC, [rFP, #(offStackSaveArea_currentPc - sizeofStackSaveArea)]
238    str     rPC, [r1, #(offStackSaveArea_savedPc - sizeofStackSaveArea)]
239    ldr     rPC, [r0, #offMethod_insns]     @ rPC<- methodToCall->insns
240
241
242    @ set up newSaveArea
243    str     rFP, [r1, #(offStackSaveArea_prevFrame - sizeofStackSaveArea)]
244    str     r3, [r1, #(offStackSaveArea_returnAddr - sizeofStackSaveArea)]
245    str     r0, [r1, #(offStackSaveArea_method - sizeofStackSaveArea)]
246    cmp     r8, #0                      @ suspendCount != 0
247    bxne    lr                          @ bail to the interpreter
248    tst     r10, #ACC_NATIVE
249    bne     .LinvokeNative
250
251    ldr     r10, .LdvmJitToInterpNoChain
252    ldr     r3, [r9, #offClassObject_pDvmDex] @ r3<- method->clazz->pDvmDex
253    ldr     r2, [rGLUE, #offGlue_self]      @ r2<- glue->self
254
255    @ Update "glue" values for the new method
256    str     r0, [rGLUE, #offGlue_method]    @ glue->method = methodToCall
257    str     r3, [rGLUE, #offGlue_methodClassDex] @ glue->methodClassDex = ...
258    mov     rFP, r1                         @ fp = newFp
259    str     rFP, [r2, #offThread_curFrame]  @ self->curFrame = newFp
260
261    @ Start executing the callee
262    mov     pc, r10                         @ dvmJitToInterpNoChain
263
264/* ------------------------------ */
265    .balign 4
266    .global dvmCompiler_TEMPLATE_INVOKE_METHOD_CHAIN
267dvmCompiler_TEMPLATE_INVOKE_METHOD_CHAIN:
268/* File: armv5te/TEMPLATE_INVOKE_METHOD_CHAIN.S */
269    /*
270     * For monomorphic callsite, setup the Dalvik frame and return to the
271     * Thumb code through the link register to transfer control to the callee
272     * method through a dedicated chaining cell.
273     */
274    @ r0 = methodToCall, r1 = returnCell, rPC = dalvikCallsite
275    @ methodToCall is guaranteed to be non-native
276.LinvokeChain:
277    ldrh    r7, [r0, #offMethod_registersSize]  @ r7<- methodToCall->regsSize
278    ldrh    r2, [r0, #offMethod_outsSize]  @ r2<- methodToCall->outsSize
279    ldr     r9, [rGLUE, #offGlue_interpStackEnd]    @ r9<- interpStackEnd
280    ldr     r8, [rGLUE, #offGlue_pSelfSuspendCount] @ r8<- &suspendCount
281    add     r3, r1, #1  @ Thumb addr is odd
282    SAVEAREA_FROM_FP(r1, rFP)           @ r1<- stack save area
283    sub     r1, r1, r7, lsl #2          @ r1<- newFp (old savearea - regsSize)
284    SAVEAREA_FROM_FP(r10, r1)           @ r10<- stack save area
285    add     r12, lr, #2                 @ setup the punt-to-interp address
286    sub     r10, r10, r2, lsl #2        @ r10<- bottom (newsave - outsSize)
287    ldr     r8, [r8]                    @ r3<- suspendCount (int)
288    cmp     r10, r9                     @ bottom < interpStackEnd?
289    bxlt    r12                         @ return to raise stack overflow excep.
290    @ r1 = newFP, r0 = methodToCall, r3 = returnCell, rPC = dalvikCallsite
291    ldr     r9, [r0, #offMethod_clazz]      @ r9<- method->clazz
292    str     rPC, [rFP, #(offStackSaveArea_currentPc - sizeofStackSaveArea)]
293    str     rPC, [r1, #(offStackSaveArea_savedPc - sizeofStackSaveArea)]
294    ldr     rPC, [r0, #offMethod_insns]     @ rPC<- methodToCall->insns
295
296
297    @ set up newSaveArea
298    str     rFP, [r1, #(offStackSaveArea_prevFrame - sizeofStackSaveArea)]
299    str     r3, [r1, #(offStackSaveArea_returnAddr - sizeofStackSaveArea)]
300    str     r0, [r1, #(offStackSaveArea_method - sizeofStackSaveArea)]
301    cmp     r8, #0                      @ suspendCount != 0
302    bxne    r12                         @ bail to the interpreter
303
304    ldr     r3, [r9, #offClassObject_pDvmDex] @ r3<- method->clazz->pDvmDex
305    ldr     r2, [rGLUE, #offGlue_self]      @ r2<- glue->self
306
307    @ Update "glue" values for the new method
308    str     r0, [rGLUE, #offGlue_method]    @ glue->method = methodToCall
309    str     r3, [rGLUE, #offGlue_methodClassDex] @ glue->methodClassDex = ...
310    mov     rFP, r1                         @ fp = newFp
311    str     rFP, [r2, #offThread_curFrame]  @ self->curFrame = newFp
312
313    bx      lr                              @ return to the callee-chaining cell
314
315
316
317/* ------------------------------ */
318    .balign 4
319    .global dvmCompiler_TEMPLATE_INVOKE_METHOD_PREDICTED_CHAIN
320dvmCompiler_TEMPLATE_INVOKE_METHOD_PREDICTED_CHAIN:
321/* File: armv5te/TEMPLATE_INVOKE_METHOD_PREDICTED_CHAIN.S */
322    /*
323     * For polymorphic callsite, check whether the cached class pointer matches
324     * the current one. If so setup the Dalvik frame and return to the
325     * Thumb code through the link register to transfer control to the callee
326     * method through a dedicated chaining cell.
327     *
328     * The predicted chaining cell is declared in ArmLIR.h with the
329     * following layout:
330     *
331     *  typedef struct PredictedChainingCell {
332     *      u4 branch;
333     *      const ClassObject *clazz;
334     *      const Method *method;
335     *      u4 counter;
336     *  } PredictedChainingCell;
337     *
338     * Upon returning to the callsite:
339     *    - lr  : to branch to the chaining cell
340     *    - lr+2: to punt to the interpreter
341     *    - lr+4: to fully resolve the callee and may rechain.
342     *            r3 <- class
343     *            r9 <- counter
344     */
345    @ r0 = this, r1 = returnCell, r2 = predictedChainCell, rPC = dalvikCallsite
346    ldr     r3, [r0, #offObject_clazz]  @ r3 <- this->class
347    ldr     r8, [r2, #4]    @ r8 <- predictedChainCell->clazz
348    ldr     r0, [r2, #8]    @ r0 <- predictedChainCell->method
349    ldr     r9, [r2, #12]   @ r9 <- predictedChainCell->counter
350    cmp     r3, r8          @ predicted class == actual class?
351    beq     .LinvokeChain   @ predicted chain is valid
352    ldr     r7, [r3, #offClassObject_vtable] @ r7 <- this->class->vtable
353    sub     r1, r9, #1      @ count--
354    str     r1, [r2, #12]   @ write back to PredictedChainingCell->counter
355    add     lr, lr, #4      @ return to fully-resolve landing pad
356    /*
357     * r1 <- count
358     * r2 <- &predictedChainCell
359     * r3 <- this->class
360     * r4 <- dPC
361     * r7 <- this->class->vtable
362     */
363    bx      lr
364
365/* ------------------------------ */
366    .balign 4
367    .global dvmCompiler_TEMPLATE_INVOKE_METHOD_NATIVE
368dvmCompiler_TEMPLATE_INVOKE_METHOD_NATIVE:
369/* File: armv5te/TEMPLATE_INVOKE_METHOD_NATIVE.S */
370    @ r0 = methodToCall, r1 = returnCell, rPC = dalvikCallsite
371    ldrh    r7, [r0, #offMethod_registersSize]  @ r7<- methodToCall->regsSize
372    ldr     r9, [rGLUE, #offGlue_interpStackEnd]    @ r9<- interpStackEnd
373    ldr     r8, [rGLUE, #offGlue_pSelfSuspendCount] @ r8<- &suspendCount
374    add     r3, r1, #1  @ Thumb addr is odd
375    SAVEAREA_FROM_FP(r1, rFP)           @ r1<- stack save area
376    sub     r1, r1, r7, lsl #2          @ r1<- newFp (old savearea - regsSize)
377    SAVEAREA_FROM_FP(r10, r1)           @ r10<- stack save area
378    ldr     r8, [r8]                    @ r3<- suspendCount (int)
379    cmp     r10, r9                     @ bottom < interpStackEnd?
380    bxlt    lr                          @ return to raise stack overflow excep.
381    @ r1 = newFP, r0 = methodToCall, r3 = returnCell, rPC = dalvikCallsite
382    str     rPC, [rFP, #(offStackSaveArea_currentPc - sizeofStackSaveArea)]
383    str     rPC, [r1, #(offStackSaveArea_savedPc - sizeofStackSaveArea)]
384    ldr     rPC, [r0, #offMethod_insns]     @ rPC<- methodToCall->insns
385
386
387    @ set up newSaveArea
388    str     rFP, [r1, #(offStackSaveArea_prevFrame - sizeofStackSaveArea)]
389    str     r3, [r1, #(offStackSaveArea_returnAddr - sizeofStackSaveArea)]
390    ldr     r3, [rGLUE, #offGlue_self]      @ r3<- glue->self
391    str     r0, [r1, #(offStackSaveArea_method - sizeofStackSaveArea)]
392    cmp     r8, #0                      @ suspendCount != 0
393    ldr     r8, [r0, #offMethod_nativeFunc] @ r8<- method->nativeFunc
394    bxne    lr                          @ bail to the interpreter
395
396    @ go ahead and transfer control to the native code
397    ldr     r9, [r3, #offThread_jniLocal_topCookie] @ r9<- thread->localRef->...
398    str     r1, [r3, #offThread_curFrame]   @ self->curFrame = newFp
399    str     r9, [r1, #(offStackSaveArea_localRefCookie - sizeofStackSaveArea)]
400                                        @ newFp->localRefCookie=top
401    mov     r9, r3                      @ r9<- glue->self (preserve)
402    SAVEAREA_FROM_FP(r10, r1)           @ r10<- new stack save area
403
404    mov     r2, r0                      @ r2<- methodToCall
405    mov     r0, r1                      @ r0<- newFP
406    add     r1, rGLUE, #offGlue_retval  @ r1<- &retval
407
408    blx     r8                          @ off to the native code
409
410    @ native return; r9=self, r10=newSaveArea
411    @ equivalent to dvmPopJniLocals
412    ldr     r2, [r10, #offStackSaveArea_returnAddr] @ r2 = chaining cell ret
413    ldr     r0, [r10, #offStackSaveArea_localRefCookie] @ r0<- saved->top
414    ldr     r1, [r9, #offThread_exception] @ check for exception
415    str     rFP, [r9, #offThread_curFrame]  @ self->curFrame = fp
416    cmp     r1, #0                      @ null?
417    str     r0, [r9, #offThread_jniLocal_topCookie] @ new top <- old top
418    bne     .LhandleException             @ no, handle exception
419    bx      r2
420
421
422/* ------------------------------ */
423    .balign 4
424    .global dvmCompiler_TEMPLATE_MUL_LONG
425dvmCompiler_TEMPLATE_MUL_LONG:
426/* File: armv5te/TEMPLATE_MUL_LONG.S */
427    /*
428     * Signed 64-bit integer multiply.
429     *
430     * For JIT: op1 in r0/r1, op2 in r2/r3, return in r0/r1
431     *
432     * Consider WXxYZ (r1r0 x r3r2) with a long multiply:
433     *        WX
434     *      x YZ
435     *  --------
436     *     ZW ZX
437     *  YW YX
438     *
439     * The low word of the result holds ZX, the high word holds
440     * (ZW+YX) + (the high overflow from ZX).  YW doesn't matter because
441     * it doesn't fit in the low 64 bits.
442     *
443     * Unlike most ARM math operations, multiply instructions have
444     * restrictions on using the same register more than once (Rd and Rm
445     * cannot be the same).
446     */
447    /* mul-long vAA, vBB, vCC */
448    mul     ip, r2, r1                  @  ip<- ZxW
449    umull   r9, r10, r2, r0             @  r9/r10 <- ZxX
450    mla     r2, r0, r3, ip              @  r2<- YxX + (ZxW)
451    add     r10, r2, r10                @  r10<- r10 + low(ZxW + (YxX))
452    mov     r0,r9
453    mov     r1,r10
454    bx      lr
455
456/* ------------------------------ */
457    .balign 4
458    .global dvmCompiler_TEMPLATE_SHL_LONG
459dvmCompiler_TEMPLATE_SHL_LONG:
460/* File: armv5te/TEMPLATE_SHL_LONG.S */
461    /*
462     * Long integer shift.  This is different from the generic 32/64-bit
463     * binary operations because vAA/vBB are 64-bit but vCC (the shift
464     * distance) is 32-bit.  Also, Dalvik requires us to ignore all but the low
465     * 6 bits.
466     */
467    /* shl-long vAA, vBB, vCC */
468    and     r2, r2, #63                 @ r2<- r2 & 0x3f
469    mov     r1, r1, asl r2              @  r1<- r1 << r2
470    rsb     r3, r2, #32                 @  r3<- 32 - r2
471    orr     r1, r1, r0, lsr r3          @  r1<- r1 | (r0 << (32-r2))
472    subs    ip, r2, #32                 @  ip<- r2 - 32
473    movpl   r1, r0, asl ip              @  if r2 >= 32, r1<- r0 << (r2-32)
474    mov     r0, r0, asl r2              @  r0<- r0 << r2
475    bx      lr
476
477/* ------------------------------ */
478    .balign 4
479    .global dvmCompiler_TEMPLATE_SHR_LONG
480dvmCompiler_TEMPLATE_SHR_LONG:
481/* File: armv5te/TEMPLATE_SHR_LONG.S */
482    /*
483     * Long integer shift.  This is different from the generic 32/64-bit
484     * binary operations because vAA/vBB are 64-bit but vCC (the shift
485     * distance) is 32-bit.  Also, Dalvik requires us to ignore all but the low
486     * 6 bits.
487     */
488    /* shr-long vAA, vBB, vCC */
489    and     r2, r2, #63                 @ r0<- r0 & 0x3f
490    mov     r0, r0, lsr r2              @  r0<- r2 >> r2
491    rsb     r3, r2, #32                 @  r3<- 32 - r2
492    orr     r0, r0, r1, asl r3          @  r0<- r0 | (r1 << (32-r2))
493    subs    ip, r2, #32                 @  ip<- r2 - 32
494    movpl   r0, r1, asr ip              @  if r2 >= 32, r0<-r1 >> (r2-32)
495    mov     r1, r1, asr r2              @  r1<- r1 >> r2
496    bx      lr
497
498
499/* ------------------------------ */
500    .balign 4
501    .global dvmCompiler_TEMPLATE_USHR_LONG
502dvmCompiler_TEMPLATE_USHR_LONG:
503/* File: armv5te/TEMPLATE_USHR_LONG.S */
504    /*
505     * Long integer shift.  This is different from the generic 32/64-bit
506     * binary operations because vAA/vBB are 64-bit but vCC (the shift
507     * distance) is 32-bit.  Also, Dalvik requires us to ignore all but the low
508     * 6 bits.
509     */
510    /* ushr-long vAA, vBB, vCC */
511    and     r2, r2, #63                 @ r0<- r0 & 0x3f
512    mov     r0, r0, lsr r2              @  r0<- r2 >> r2
513    rsb     r3, r2, #32                 @  r3<- 32 - r2
514    orr     r0, r0, r1, asl r3          @  r0<- r0 | (r1 << (32-r2))
515    subs    ip, r2, #32                 @  ip<- r2 - 32
516    movpl   r0, r1, lsr ip              @  if r2 >= 32, r0<-r1 >>> (r2-32)
517    mov     r1, r1, lsr r2              @  r1<- r1 >>> r2
518    bx      lr
519
520
521/* ------------------------------ */
522    .balign 4
523    .global dvmCompiler_TEMPLATE_ADD_FLOAT_VFP
524dvmCompiler_TEMPLATE_ADD_FLOAT_VFP:
525/* File: armv5te-vfp/TEMPLATE_ADD_FLOAT_VFP.S */
526/* File: armv5te-vfp/fbinop.S */
527    /*
528     * Generic 32-bit floating point operation.  Provide an "instr" line that
529     * specifies an instruction that performs s2 = s0 op s1.
530     *
531     * On entry:
532     *     r0 = target dalvik register address
533     *     r1 = op1 address
534     *     r2 = op2 address
535     */
536     flds    s0,[r1]
537     flds    s1,[r2]
538     fadds   s2, s0, s1
539     fsts    s2,[r0]
540     bx      lr
541
542
543/* ------------------------------ */
544    .balign 4
545    .global dvmCompiler_TEMPLATE_SUB_FLOAT_VFP
546dvmCompiler_TEMPLATE_SUB_FLOAT_VFP:
547/* File: armv5te-vfp/TEMPLATE_SUB_FLOAT_VFP.S */
548/* File: armv5te-vfp/fbinop.S */
549    /*
550     * Generic 32-bit floating point operation.  Provide an "instr" line that
551     * specifies an instruction that performs s2 = s0 op s1.
552     *
553     * On entry:
554     *     r0 = target dalvik register address
555     *     r1 = op1 address
556     *     r2 = op2 address
557     */
558     flds    s0,[r1]
559     flds    s1,[r2]
560     fsubs   s2, s0, s1
561     fsts    s2,[r0]
562     bx      lr
563
564
565/* ------------------------------ */
566    .balign 4
567    .global dvmCompiler_TEMPLATE_MUL_FLOAT_VFP
568dvmCompiler_TEMPLATE_MUL_FLOAT_VFP:
569/* File: armv5te-vfp/TEMPLATE_MUL_FLOAT_VFP.S */
570/* File: armv5te-vfp/fbinop.S */
571    /*
572     * Generic 32-bit floating point operation.  Provide an "instr" line that
573     * specifies an instruction that performs s2 = s0 op s1.
574     *
575     * On entry:
576     *     r0 = target dalvik register address
577     *     r1 = op1 address
578     *     r2 = op2 address
579     */
580     flds    s0,[r1]
581     flds    s1,[r2]
582     fmuls   s2, s0, s1
583     fsts    s2,[r0]
584     bx      lr
585
586
587/* ------------------------------ */
588    .balign 4
589    .global dvmCompiler_TEMPLATE_DIV_FLOAT_VFP
590dvmCompiler_TEMPLATE_DIV_FLOAT_VFP:
591/* File: armv5te-vfp/TEMPLATE_DIV_FLOAT_VFP.S */
592/* File: armv5te-vfp/fbinop.S */
593    /*
594     * Generic 32-bit floating point operation.  Provide an "instr" line that
595     * specifies an instruction that performs s2 = s0 op s1.
596     *
597     * On entry:
598     *     r0 = target dalvik register address
599     *     r1 = op1 address
600     *     r2 = op2 address
601     */
602     flds    s0,[r1]
603     flds    s1,[r2]
604     fdivs   s2, s0, s1
605     fsts    s2,[r0]
606     bx      lr
607
608
609/* ------------------------------ */
610    .balign 4
611    .global dvmCompiler_TEMPLATE_ADD_DOUBLE_VFP
612dvmCompiler_TEMPLATE_ADD_DOUBLE_VFP:
613/* File: armv5te-vfp/TEMPLATE_ADD_DOUBLE_VFP.S */
614/* File: armv5te-vfp/fbinopWide.S */
615    /*
616     * Generic 64-bit floating point operation.  Provide an "instr" line that
617     * specifies an instruction that performs s2 = s0 op s1.
618     *
619     * On entry:
620     *     r0 = target dalvik register address
621     *     r1 = op1 address
622     *     r2 = op2 address
623     */
624     fldd    d0,[r1]
625     fldd    d1,[r2]
626     faddd   d2, d0, d1
627     fstd    d2,[r0]
628     bx      lr
629
630
631/* ------------------------------ */
632    .balign 4
633    .global dvmCompiler_TEMPLATE_SUB_DOUBLE_VFP
634dvmCompiler_TEMPLATE_SUB_DOUBLE_VFP:
635/* File: armv5te-vfp/TEMPLATE_SUB_DOUBLE_VFP.S */
636/* File: armv5te-vfp/fbinopWide.S */
637    /*
638     * Generic 64-bit floating point operation.  Provide an "instr" line that
639     * specifies an instruction that performs s2 = s0 op s1.
640     *
641     * On entry:
642     *     r0 = target dalvik register address
643     *     r1 = op1 address
644     *     r2 = op2 address
645     */
646     fldd    d0,[r1]
647     fldd    d1,[r2]
648     fsubd   d2, d0, d1
649     fstd    d2,[r0]
650     bx      lr
651
652
653/* ------------------------------ */
654    .balign 4
655    .global dvmCompiler_TEMPLATE_MUL_DOUBLE_VFP
656dvmCompiler_TEMPLATE_MUL_DOUBLE_VFP:
657/* File: armv5te-vfp/TEMPLATE_MUL_DOUBLE_VFP.S */
658/* File: armv5te-vfp/fbinopWide.S */
659    /*
660     * Generic 64-bit floating point operation.  Provide an "instr" line that
661     * specifies an instruction that performs s2 = s0 op s1.
662     *
663     * On entry:
664     *     r0 = target dalvik register address
665     *     r1 = op1 address
666     *     r2 = op2 address
667     */
668     fldd    d0,[r1]
669     fldd    d1,[r2]
670     fmuld   d2, d0, d1
671     fstd    d2,[r0]
672     bx      lr
673
674
675/* ------------------------------ */
676    .balign 4
677    .global dvmCompiler_TEMPLATE_DIV_DOUBLE_VFP
678dvmCompiler_TEMPLATE_DIV_DOUBLE_VFP:
679/* File: armv5te-vfp/TEMPLATE_DIV_DOUBLE_VFP.S */
680/* File: armv5te-vfp/fbinopWide.S */
681    /*
682     * Generic 64-bit floating point operation.  Provide an "instr" line that
683     * specifies an instruction that performs s2 = s0 op s1.
684     *
685     * On entry:
686     *     r0 = target dalvik register address
687     *     r1 = op1 address
688     *     r2 = op2 address
689     */
690     fldd    d0,[r1]
691     fldd    d1,[r2]
692     fdivd   d2, d0, d1
693     fstd    d2,[r0]
694     bx      lr
695
696
697/* ------------------------------ */
698    .balign 4
699    .global dvmCompiler_TEMPLATE_DOUBLE_TO_FLOAT_VFP
700dvmCompiler_TEMPLATE_DOUBLE_TO_FLOAT_VFP:
701/* File: armv5te-vfp/TEMPLATE_DOUBLE_TO_FLOAT_VFP.S */
702/* File: armv5te-vfp/funopNarrower.S */
703    /*
704     * Generic 64bit-to-32bit floating point unary operation.  Provide an
705     * "instr" line that specifies an instruction that performs "s0 = op d0".
706     *
707     * For: double-to-int, double-to-float
708     *
709     * On entry:
710     *     r0 = target dalvik register address
711     *     r1 = src dalvik register address
712     */
713    /* unop vA, vB */
714    fldd    d0, [r1]                    @ d0<- vB
715    fcvtsd  s0, d0                              @ s0<- op d0
716    fsts    s0, [r0]                    @ vA<- s0
717    bx      lr
718
719
720/* ------------------------------ */
721    .balign 4
722    .global dvmCompiler_TEMPLATE_DOUBLE_TO_INT_VFP
723dvmCompiler_TEMPLATE_DOUBLE_TO_INT_VFP:
724/* File: armv5te-vfp/TEMPLATE_DOUBLE_TO_INT_VFP.S */
725/* File: armv5te-vfp/funopNarrower.S */
726    /*
727     * Generic 64bit-to-32bit floating point unary operation.  Provide an
728     * "instr" line that specifies an instruction that performs "s0 = op d0".
729     *
730     * For: double-to-int, double-to-float
731     *
732     * On entry:
733     *     r0 = target dalvik register address
734     *     r1 = src dalvik register address
735     */
736    /* unop vA, vB */
737    fldd    d0, [r1]                    @ d0<- vB
738    ftosizd  s0, d0                              @ s0<- op d0
739    fsts    s0, [r0]                    @ vA<- s0
740    bx      lr
741
742
743/* ------------------------------ */
744    .balign 4
745    .global dvmCompiler_TEMPLATE_FLOAT_TO_DOUBLE_VFP
746dvmCompiler_TEMPLATE_FLOAT_TO_DOUBLE_VFP:
747/* File: armv5te-vfp/TEMPLATE_FLOAT_TO_DOUBLE_VFP.S */
748/* File: armv5te-vfp/funopWider.S */
749    /*
750     * Generic 32bit-to-64bit floating point unary operation.  Provide an
751     * "instr" line that specifies an instruction that performs "d0 = op s0".
752     *
753     * For: int-to-double, float-to-double
754     *
755     * On entry:
756     *     r0 = target dalvik register address
757     *     r1 = src dalvik register address
758     */
759    /* unop vA, vB */
760    flds    s0, [r1]                    @ s0<- vB
761    fcvtds  d0, s0                              @ d0<- op s0
762    fstd    d0, [r0]                    @ vA<- d0
763    bx      lr
764
765
766/* ------------------------------ */
767    .balign 4
768    .global dvmCompiler_TEMPLATE_FLOAT_TO_INT_VFP
769dvmCompiler_TEMPLATE_FLOAT_TO_INT_VFP:
770/* File: armv5te-vfp/TEMPLATE_FLOAT_TO_INT_VFP.S */
771/* File: armv5te-vfp/funop.S */
772    /*
773     * Generic 32bit-to-32bit floating point unary operation.  Provide an
774     * "instr" line that specifies an instruction that performs "s1 = op s0".
775     *
776     * For: float-to-int, int-to-float
777     *
778     * On entry:
779     *     r0 = target dalvik register address
780     *     r1 = src dalvik register address
781     */
782    /* unop vA, vB */
783    flds    s0, [r1]                    @ s0<- vB
784    ftosizs s1, s0                              @ s1<- op s0
785    fsts    s1, [r0]                    @ vA<- s1
786    bx      lr
787
788
789/* ------------------------------ */
790    .balign 4
791    .global dvmCompiler_TEMPLATE_INT_TO_DOUBLE_VFP
792dvmCompiler_TEMPLATE_INT_TO_DOUBLE_VFP:
793/* File: armv5te-vfp/TEMPLATE_INT_TO_DOUBLE_VFP.S */
794/* File: armv5te-vfp/funopWider.S */
795    /*
796     * Generic 32bit-to-64bit floating point unary operation.  Provide an
797     * "instr" line that specifies an instruction that performs "d0 = op s0".
798     *
799     * For: int-to-double, float-to-double
800     *
801     * On entry:
802     *     r0 = target dalvik register address
803     *     r1 = src dalvik register address
804     */
805    /* unop vA, vB */
806    flds    s0, [r1]                    @ s0<- vB
807    fsitod  d0, s0                              @ d0<- op s0
808    fstd    d0, [r0]                    @ vA<- d0
809    bx      lr
810
811
812/* ------------------------------ */
813    .balign 4
814    .global dvmCompiler_TEMPLATE_INT_TO_FLOAT_VFP
815dvmCompiler_TEMPLATE_INT_TO_FLOAT_VFP:
816/* File: armv5te-vfp/TEMPLATE_INT_TO_FLOAT_VFP.S */
817/* File: armv5te-vfp/funop.S */
818    /*
819     * Generic 32bit-to-32bit floating point unary operation.  Provide an
820     * "instr" line that specifies an instruction that performs "s1 = op s0".
821     *
822     * For: float-to-int, int-to-float
823     *
824     * On entry:
825     *     r0 = target dalvik register address
826     *     r1 = src dalvik register address
827     */
828    /* unop vA, vB */
829    flds    s0, [r1]                    @ s0<- vB
830    fsitos  s1, s0                              @ s1<- op s0
831    fsts    s1, [r0]                    @ vA<- s1
832    bx      lr
833
834
835/* ------------------------------ */
836    .balign 4
837    .global dvmCompiler_TEMPLATE_CMPG_DOUBLE_VFP
838dvmCompiler_TEMPLATE_CMPG_DOUBLE_VFP:
839/* File: armv5te-vfp/TEMPLATE_CMPG_DOUBLE_VFP.S */
840    /*
841     * Compare two floating-point values.  Puts 0, 1, or -1 into the
842     * destination register based on the results of the comparison.
843     *
844     * int compare(x, y) {
845     *     if (x == y) {
846     *         return 0;
847     *     } else if (x < y) {
848     *         return -1;
849     *     } else if (x > y) {
850     *         return 1;
851     *     } else {
852     *         return 1;
853     *     }
854     * }
855     *
856     * On entry:
857     *    r0 = &op1 [vBB]
858     *    r1 = &op2 [vCC]
859     */
860    /* op vAA, vBB, vCC */
861    fldd    d0, [r0]                    @ d0<- vBB
862    fldd    d1, [r1]                    @ d1<- vCC
863    fcmped  d0, d1                      @ compare (vBB, vCC)
864    mov     r0, #1                      @ r0<- 1 (default)
865    fmstat                              @ export status flags
866    mvnmi   r0, #0                      @ (less than) r0<- -1
867    moveq   r0, #0                      @ (equal) r0<- 0
868    bx      lr
869
870
871/* ------------------------------ */
872    .balign 4
873    .global dvmCompiler_TEMPLATE_CMPL_DOUBLE_VFP
874dvmCompiler_TEMPLATE_CMPL_DOUBLE_VFP:
875/* File: armv5te-vfp/TEMPLATE_CMPL_DOUBLE_VFP.S */
876    /*
877     * Compare two floating-point values.  Puts 0, 1, or -1 into the
878     * destination register based on the results of the comparison.
879     *
880     * int compare(x, y) {
881     *     if (x == y) {
882     *         return 0;
883     *     } else if (x > y) {
884     *         return 1;
885     *     } else if (x < y) {
886     *         return -1;
887     *     } else {
888     *         return -1;
889     *     }
890     * }
891     * On entry:
892     *    r0 = &op1 [vBB]
893     *    r1 = &op2 [vCC]
894     */
895    /* op vAA, vBB, vCC */
896    fldd    d0, [r0]                    @ d0<- vBB
897    fldd    d1, [r1]                    @ d1<- vCC
898    fcmped  d0, d1                      @ compare (vBB, vCC)
899    mvn     r0, #0                      @ r0<- -1 (default)
900    fmstat                              @ export status flags
901    movgt   r0, #1                      @ (greater than) r0<- 1
902    moveq   r0, #0                      @ (equal) r0<- 0
903    bx      lr
904
905/* ------------------------------ */
906    .balign 4
907    .global dvmCompiler_TEMPLATE_CMPG_FLOAT_VFP
908dvmCompiler_TEMPLATE_CMPG_FLOAT_VFP:
909/* File: armv5te-vfp/TEMPLATE_CMPG_FLOAT_VFP.S */
910    /*
911     * Compare two floating-point values.  Puts 0, 1, or -1 into the
912     * destination register based on the results of the comparison.
913     *
914     * int compare(x, y) {
915     *     if (x == y) {
916     *         return 0;
917     *     } else if (x < y) {
918     *         return -1;
919     *     } else if (x > y) {
920     *         return 1;
921     *     } else {
922     *         return 1;
923     *     }
924     * }
925     * On entry:
926     *    r0 = &op1 [vBB]
927     *    r1 = &op2 [vCC]
928     */
929    /* op vAA, vBB, vCC */
930    flds    s0, [r0]                    @ d0<- vBB
931    flds    s1, [r1]                    @ d1<- vCC
932    fcmpes  s0, s1                      @ compare (vBB, vCC)
933    mov     r0, #1                      @ r0<- 1 (default)
934    fmstat                              @ export status flags
935    mvnmi   r0, #0                      @ (less than) r0<- -1
936    moveq   r0, #0                      @ (equal) r0<- 0
937    bx      lr
938
939/* ------------------------------ */
940    .balign 4
941    .global dvmCompiler_TEMPLATE_CMPL_FLOAT_VFP
942dvmCompiler_TEMPLATE_CMPL_FLOAT_VFP:
943/* File: armv5te-vfp/TEMPLATE_CMPL_FLOAT_VFP.S */
944    /*
945     * Compare two floating-point values.  Puts 0, 1, or -1 into the
946     * destination register based on the results of the comparison.
947     *
948     * int compare(x, y) {
949     *     if (x == y) {
950     *         return 0;
951     *     } else if (x > y) {
952     *         return 1;
953     *     } else if (x < y) {
954     *         return -1;
955     *     } else {
956     *         return -1;
957     *     }
958     * }
959     * On entry:
960     *    r0 = &op1 [vBB]
961     *    r1 = &op2 [vCC]
962     */
963    /* op vAA, vBB, vCC */
964    flds    s0, [r0]                    @ d0<- vBB
965    flds    s1, [r1]                    @ d1<- vCC
966    fcmpes  s0, s1                      @ compare (vBB, vCC)
967    mvn     r0, #0                      @ r0<- -1 (default)
968    fmstat                              @ export status flags
969    movgt   r0, #1                      @ (greater than) r0<- 1
970    moveq   r0, #0                      @ (equal) r0<- 0
971    bx      lr
972
973/* ------------------------------ */
974    .balign 4
975    .global dvmCompiler_TEMPLATE_SQRT_DOUBLE_VFP
976dvmCompiler_TEMPLATE_SQRT_DOUBLE_VFP:
977/* File: armv5te-vfp/TEMPLATE_SQRT_DOUBLE_VFP.S */
978    /*
979     * 64-bit floating point vfp sqrt operation.
980     * If the result is a NaN, bail out to library code to do
981     * the right thing.
982     *
983     * On entry:
984     *     r2 src addr of op1
985     * On exit:
986     *     r0,r1 = res
987     */
988    fldd    d0, [r2]
989    fsqrtd  d1, d0
990    fcmpd   d1, d1
991    fmstat
992    fmrrd   r0, r1, d1
993    bxeq    lr   @ Result OK - return
994    ldr     r2, .Lsqrt
995    fmrrd   r0, r1, d0   @ reload orig operand
996    bx      r2   @ tail call to sqrt library routine
997
998.Lsqrt:
999    .word   sqrt
1000
1001    .size   dvmCompilerTemplateStart, .-dvmCompilerTemplateStart
1002/* File: armv5te/footer.S */
1003/*
1004 * ===========================================================================
1005 *  Common subroutines and data
1006 * ===========================================================================
1007 */
1008
1009    .text
1010    .align  2
1011.LinvokeNative:
1012    @ Prep for the native call
1013    @ r1 = newFP, r0 = methodToCall
1014    ldr     r3, [rGLUE, #offGlue_self]      @ r3<- glue->self
1015    ldr     r9, [r3, #offThread_jniLocal_topCookie] @ r9<- thread->localRef->...
1016    str     r1, [r3, #offThread_curFrame]   @ self->curFrame = newFp
1017    str     r9, [r1, #(offStackSaveArea_localRefCookie - sizeofStackSaveArea)]
1018                                        @ newFp->localRefCookie=top
1019    mov     r9, r3                      @ r9<- glue->self (preserve)
1020    SAVEAREA_FROM_FP(r10, r1)           @ r10<- new stack save area
1021
1022    mov     r2, r0                      @ r2<- methodToCall
1023    mov     r0, r1                      @ r0<- newFP
1024    add     r1, rGLUE, #offGlue_retval  @ r1<- &retval
1025
1026    LDR_PC_LR "[r2, #offMethod_nativeFunc]"
1027
1028    @ native return; r9=self, r10=newSaveArea
1029    @ equivalent to dvmPopJniLocals
1030    ldr     r2, [r10, #offStackSaveArea_returnAddr] @ r2 = chaining cell ret
1031    ldr     r0, [r10, #offStackSaveArea_localRefCookie] @ r0<- saved->top
1032    ldr     r1, [r9, #offThread_exception] @ check for exception
1033    str     rFP, [r9, #offThread_curFrame]  @ self->curFrame = fp
1034    cmp     r1, #0                      @ null?
1035    str     r0, [r9, #offThread_jniLocal_topCookie] @ new top <- old top
1036    bne     .LhandleException             @ no, handle exception
1037    bx      r2
1038
1039/* NOTE - this path can be exercised if the JIT threshold is set to 5 */
1040.LhandleException:
1041    ldr     r0, .LdvmMterpCommonExceptionThrown @ PIC way of getting &func
1042    ldr     rIBASE, .LdvmAsmInstructionStart    @ same as above
1043    ldr     rPC, [r10, #offStackSaveArea_savedPc] @ reload rPC
1044    mov     pc, r0                  @ branch to dvmMterpCommonExceptionThrown
1045
1046    .align  2
1047.LdvmAsmInstructionStart:
1048    .word   dvmAsmInstructionStart
1049.LdvmJitToInterpNoChain:
1050    .word   dvmJitToInterpNoChain
1051.LdvmMterpStdBail:
1052    .word   dvmMterpStdBail
1053.LdvmMterpCommonExceptionThrown:
1054    .word   dvmMterpCommonExceptionThrown
1055.L__aeabi_cdcmple:
1056    .word   __aeabi_cdcmple
1057.L__aeabi_cfcmple:
1058    .word   __aeabi_cfcmple
1059
1060    .global dmvCompilerTemplateEnd
1061dmvCompilerTemplateEnd:
1062
1063#endif /* WITH_JIT */
1064
1065