;
;  Copyright (c) 2011 The WebM project authors. All Rights Reserved.
;
;  Use of this source code is governed by a BSD-style license
;  that can be found in the LICENSE file in the root of the source
;  tree. An additional intellectual property rights grant can be found
;  in the file PATENTS.  All contributing project authors may
;  be found in the AUTHORS file in the root of the source tree.
;


    EXPORT  |vp8_sad16x16_armv6|

    ARM
    REQUIRE8
    PRESERVE8

    AREA ||.text||, CODE, READONLY, ALIGN=2

;-----------------------------------------------------------------------
; vp8_sad16x16_armv6
;
; Sum of absolute differences (SAD) between a 16x16 block of source
; pixels and a 16x16 block of reference pixels.
;
; In:
;   r0    const unsigned char *src_ptr
;   r1    int  src_stride
;   r2    const unsigned char *ref_ptr
;   r3    int  ref_stride
;   stack max_sad (not used; this routine never reads it)
; Out:
;   r0    SAD accumulated over 16 rows of 16 pixels
;
; Register roles inside the loop:
;   r4        running SAD total
;   r5        iteration counter (8 iterations, two rows per iteration)
;   r6,  r7   source pixels, bytes 0-7 of the current row
;   r8,  r9   reference pixels, bytes 0-7 of the current row;
;             once r8 has been consumed it is reused as a second,
;             independent partial sum that is folded into r4 later
;   r10, r11  source pixels, bytes 8-15 of the current row
;   r12, lr   reference pixels, bytes 8-15 of the current row
;
; Loads, USAD8/USADA8 and pointer updates are interleaved on purpose;
; keep the instruction order when editing.
;
; NOTE(review): pixels are fetched with word loads (ldr) straight from
; src_ptr/ref_ptr. This presumably relies on the target permitting
; unaligned word loads when callers pass unaligned pointers - confirm.
;-----------------------------------------------------------------------
|vp8_sad16x16_armv6| PROC
    ; r12 is saved along with r4-r11 and lr: ten registers = 40 bytes,
    ; so sp stays a multiple of 8 (see PRESERVE8 above).
    stmfd   sp!, {r4-r12, lr}

    ; Prefetch hints for the next row and the row after it, for both
    ; blocks (base + stride and base + 2 * stride).
    pld     [r0, r1, lsl #0]
    pld     [r2, r3, lsl #0]
    pld     [r0, r1, lsl #1]
    pld     [r2, r3, lsl #1]

    mov     r4, #0              ; sad = 0;
    mov     r5, #8              ; loop count: 8 x 2 rows = 16 rows

loop
    ; 1st row
    ldr     r6, [r0, #0x0]      ; load 4 src pixels (1A)
    ldr     r8, [r2, #0x0]      ; load 4 ref pixels (1A)
    ldr     r7, [r0, #0x4]      ; load 4 src pixels (1A)
    ldr     r9, [r2, #0x4]      ; load 4 ref pixels (1A)
    ldr     r10, [r0, #0x8]     ; load 4 src pixels (1B)
    ldr     r11, [r0, #0xC]     ; load 4 src pixels (1B)

    usada8  r4, r8, r6, r4      ; sad += |ref - src| over bytes 0-3
    usad8   r8, r7, r9          ; r8 = partial sad over bytes 4-7
                                ; (r8 is free: its ref pixels were just used)

    ldr     r12, [r2, #0x8]     ; load 4 ref pixels (1B)
    ldr     lr, [r2, #0xC]      ; load 4 ref pixels (1B)

    add     r0, r0, r1          ; set src pointer to next row
    add     r2, r2, r3          ; set ref pointer to next row

    ; Prefetch hint two rows beyond the row the pointers now address.
    pld     [r0, r1, lsl #1]
    pld     [r2, r3, lsl #1]

    usada8  r4, r10, r12, r4    ; sad += |src - ref| over bytes 8-11
    usada8  r8, r11, lr, r8     ; partial += |src - ref| over bytes 12-15

    ; 2nd row (its first two src loads are issued before the 1st row's
    ; partial sum is folded into the total)
    ldr     r6, [r0, #0x0]      ; load 4 src pixels (2A)
    ldr     r7, [r0, #0x4]      ; load 4 src pixels (2A)
    add     r4, r4, r8          ; add partial sad values

    ldr     r8, [r2, #0x0]      ; load 4 ref pixels (2A)
    ldr     r9, [r2, #0x4]      ; load 4 ref pixels (2A)
    ldr     r10, [r0, #0x8]     ; load 4 src pixels (2B)
    ldr     r11, [r0, #0xC]     ; load 4 src pixels (2B)

    usada8  r4, r6, r8, r4      ; sad += |src - ref| over bytes 0-3
    usad8   r8, r7, r9          ; r8 = partial sad over bytes 4-7

    ldr     r12, [r2, #0x8]     ; load 4 ref pixels (2B)
    ldr     lr, [r2, #0xC]      ; load 4 ref pixels (2B)

    add     r0, r0, r1          ; set src pointer to next row
    add     r2, r2, r3          ; set ref pointer to next row

    usada8  r4, r10, r12, r4    ; sad += |src - ref| over bytes 8-11
    usada8  r8, r11, lr, r8     ; partial += |src - ref| over bytes 12-15

    pld     [r0, r1, lsl #1]
    pld     [r2, r3, lsl #1]

    subs    r5, r5, #1          ; decrement loop counter (sets Z for bne)
    add     r4, r4, r8          ; add partial sad values (flags untouched)

    bne     loop

    mov     r0, r4              ; return sad
    ldmfd   sp!, {r4-r12, pc}   ; restore registers and return

    ENDP

    END