armVCM4P10_TransformResidual4x4_s.S revision 78e52bfac041d71ce53b5b13c2abf78af742b09d
1/*
2 * Copyright (C) 2007-2008 ARM Limited
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 *      http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 *
16 */
17/*
18 *
19 */
20
21    .eabi_attribute 24, 1
22    .eabi_attribute 25, 1
23
24    .arm
25    .fpu neon
26    .text
27
28    .global armVCM4P10_TransformResidual4x4
29    .func   armVCM4P10_TransformResidual4x4
30armVCM4P10_TransformResidual4x4:
31    VPUSH    {d8}
32    VLD4.16  {d0,d1,d2,d3},[r1]
33    VMOV.I16 d4,#0
34    VADD.I16 d5,d0,d2
35    VSUB.I16 d6,d0,d2
36    VHADD.S16 d7,d1,d4
37    VHADD.S16 d8,d3,d4
38    VSUB.I16 d7,d7,d3
39    VADD.I16 d8,d1,d8
40    VADD.I16 d0,d5,d8
41    VADD.I16 d1,d6,d7
42    VSUB.I16 d2,d6,d7
43    VSUB.I16 d3,d5,d8
44    VTRN.16  d0,d1
45    VTRN.16  d2,d3
46    VTRN.32  q0,q1
47    VADD.I16 d5,d0,d2
48    VSUB.I16 d6,d0,d2
49    VHADD.S16 d7,d1,d4
50    VHADD.S16 d8,d3,d4
51    VSUB.I16 d7,d7,d3
52    VADD.I16 d8,d1,d8
53    VADD.I16 d0,d5,d8
54    VADD.I16 d1,d6,d7
55    VSUB.I16 d2,d6,d7
56    VSUB.I16 d3,d5,d8
57    VRSHR.S16 d0,d0,#6
58    VRSHR.S16 d1,d1,#6
59    VRSHR.S16 d2,d2,#6
60    VRSHR.S16 d3,d3,#6
61    VST1.16  {d0,d1,d2,d3},[r0]
62    VPOP     {d8}
63    BX       lr
64    .endfunc
65
66    .end
67
68