10d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@/*****************************************************************************
20d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
30d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* Copyright (C) 2012 Ittiam Systems Pvt Ltd, Bangalore
40d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
50d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* Licensed under the Apache License, Version 2.0 (the "License");
60d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* you may not use this file except in compliance with the License.
70d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* You may obtain a copy of the License at:
80d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
90d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* http://www.apache.org/licenses/LICENSE-2.0
100d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
110d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* Unless required by applicable law or agreed to in writing, software
120d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* distributed under the License is distributed on an "AS IS" BASIS,
130d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
140d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* See the License for the specific language governing permissions and
150d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* limitations under the License.
160d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
170d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*****************************************************************************/
180d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@/**
190d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@/*******************************************************************************
200d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* @file
210d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  ihevcd_fmt_conv_420sp_to_rgba8888.s
220d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
230d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* @brief
240d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  contains function definitions for format conversions
250d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
260d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* @author
270d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  ittiam
280d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
290d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* @par list of functions:
300d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
310d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
320d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@* @remarks
330d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  none
340d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*
350d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*******************************************************************************/
360d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    .equ DO1STROUNDING, 0
370d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
380d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @ ARM
390d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @
400d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @ PRESERVE8
410d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
420d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar.text
430d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar.p2align 2
440d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
450d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
460d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
470d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
480d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@/*****************************************************************************
490d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
500d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Function Name    : ihevcd_fmt_conv_420sp_to_rgba8888()                    *
510d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
520d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Description      : This function converts the image from YUV420SP color   *
530d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     space to RGBA8888 color space. The function can be     *
540d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     invoked at the MB level.                               *
550d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
560d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Arguments        : R0           pubY                                      *
570d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     R1           pubUV                                     *
580d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     R2           pusRGB                                    *
590d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     R3           usWidth                                   *
600d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     [R13 #40]    usHeight                                  *
610d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     [R13 #44]    usStrideY                                 *
620d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     [R13 #48]    usStrideUV                                *
630d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     [R13 #52]    usStrideRGB                               *
660d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
670d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Values Returned  : None                                                   *
680d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
690d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Register Usage   : R0 - R14                                               *
700d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
710d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Stack Usage      : 40 Bytes                                               *
720d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
730d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Interruptibility : Interruptible                                          *
740d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
750d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Known Limitations                                                         *
760d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*       Assumptions: Image Width:     Assumed to be multiple of 16 and       *
770d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     greater than or equal to 16                *
780d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                     Image Height:    Assumed to be even.                   *
790d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*                                                                            *
800d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*  Revision History :                                                        *
810d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*         DD MM YYYY   Author(s)       Changes (Describe the changes made)   *
820d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*         07 06 2010   Varshita        Draft                                 *
830d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*         07 06 2010   Naveen Kr T     Completed                             *
840d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*         05 08 2013   Naveen K P      Modified for HEVC                     *
850d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar@*****************************************************************************/
860d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    .global ihevcd_fmt_conv_420sp_to_rgba8888_a9q
870d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar.type ihevcd_fmt_conv_420sp_to_rgba8888_a9q, function
880d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakarihevcd_fmt_conv_420sp_to_rgba8888_a9q:
890d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
900d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @// push the registers on the stack
910d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    STMFD       SP!,{R4-R12,LR}
920d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
930d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
940d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R0 - Y PTR
950d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R1 - UV PTR
960d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R2 - RGB PTR
970d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R3 - RGB PTR
980d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R4 - PIC WIDTH
990d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R5 - PIC HT
1000d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R6 - STRIDE Y
1010d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R7 - STRIDE U
1020d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R8 - STRIDE V
1030d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//R9 - STRIDE RGB
1040d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1050d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//ONE ROW PROCESSING AT A TIME
1060d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1070d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//THE FOUR CONSTANTS ARE:
1080d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//C1=0x3311,C2=0xF379,C3=0xE5F8,C4=0x4092
1090d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1100d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @PLD        [R0]
1110d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @PLD        [R1]
1120d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @PLD        [R2]
1130d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1140d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1150d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @/* can be loaded from a defined const type */
1160d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    MOVW        R10,#0x3311
1170d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.16     D0[0],R10                   @//C1
1180d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1190d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    MOVW        R10,#0xF379
1200d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.16     D0[1],R10                   @//C2
1210d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1220d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    MOVW        R10,#0xE5F8
1230d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.16     D0[2],R10                   @//C3
1240d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1250d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    MOVW        R10,#0x4092
1260d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.16     D0[3],R10                   @//C4
1270d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1280d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//LOAD CONSTANT 128 INTO A CORTEX REGISTER
1290d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    MOV         R10,#128
1300d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VDUP.8      D1,R10
1310d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1320d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//D0 HAS C1-C2-C3-C4
1330d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @// load other parameters from stack
1340d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    LDR         R5,[sp,#40]
1350d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @LDR  R4,[sp,#44]
1360d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    LDR         R6,[sp,#44]
1370d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    LDR         R7,[sp,#48]
1380d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @LDR  R8,[sp,#52]
1390d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    LDR         R9,[sp,#52]
1400d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1410d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @// calculate offsets, offset = stride - width
1420d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    SUB         R10,R6,R3                   @// luma offset
1430d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    SUB         R11,R7,R3
1440d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @, LSR #1   @// u offset
1450d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @SUB     R12,R8,R3, LSR #1  @// v offset
1460d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    SUB         R14,R9,R3                   @// rgb offset in pixels
1470d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1480d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @// calculate height loop count
1490d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    MOV         R5,R5, LSR #1               @// height_cnt = height / 16
1500d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1510d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @// create next row pointers for rgb and luma data
1520d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R7,R0,R6                    @// luma_next_row = luma + luma_stride
1530d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R8,R2,R9,LSL #2             @// rgb_next_row = rgb + rgb_stride
1540d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1550d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish MahendrakarLABEL_YUV420SP_TO_RGB8888_HEIGHT_LOOP:
1560d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1570d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//LOAD VALUES OF U&V AND COMPUTE THE R,G,B WEIGHT VALUES.
1580d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VLD1.8      {D2,D3},[R1]!               @//LOAD 8 VALUES OF UV
1590d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//VLD1.8 {D3},[R2]!            @//LOAD 8 VALUES OF V
1600d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1610d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @// calculate width loop count
1620d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    MOV         R6,R3, LSR #4               @// width_cnt = width / 16
1630d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1640d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//COMPUTE THE ACTUAL RGB VALUES,WE CAN DO TWO ROWS AT A TIME
1650d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//LOAD VALUES OF Y 8-BIT VALUES
1660d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VLD2.8      {D30,D31},[R0]!             @//D0 - Y0,Y2,Y4,Y6,Y8,Y10,Y12,Y14 row 1
1670d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar                                            @//D1 - Y1,Y3,Y5,Y7,Y9,Y11,Y13,Y15
1680d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VLD2.8      {D28,D29},[R7]!             @//D0 - Y0,Y2,Y4,Y6,Y8,Y10,Y12,Y14 row2
1690d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar                                            @//D1 - Y1,Y3,Y5,Y7,Y9,Y11,Y13,Y15
1700d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1710d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    SUBS        R6,R6,#1
1720d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    BEQ         LABEL_YUV420SP_TO_RGB8888_WIDTH_LOOP_SKIP
1730d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1740d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish MahendrakarLABEL_YUV420SP_TO_RGB8888_WIDTH_LOOP:
1750d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @VMOV.I8 Q1,#128
1760d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VUZP.8      D2,D3
1770d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1780d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1790d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NEED TO SUBTRACT (U-128) AND (V-128)
1800d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//(D2-D1),(D3-D1)
1810d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VSUBL.U8    Q2,D2,D1                    @//(U-128)
1820d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VSUBL.U8    Q3,D3,D1                    @//(V-128)
1830d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1840d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//LOAD VALUES OF U&V for next row
1850d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VLD1.8      {D2,D3},[R1]!               @//LOAD 8 VALUES OF U
1860d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//VLD1.8 {D3},[R2]!            @//LOAD 8 VALUES OF V
1870d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1880d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @PLD        [R0]
1890d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    PLD         [R1]
1900d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1910d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NEED TO MULTIPLY Q2,Q3 WITH COEFFICIENTS
1920d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q4,D4,D0[3]                 @//(U-128)*C4 FOR B
1930d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q5,D5,D0[3]                 @//(U-128)*C4 FOR B
1940d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1950d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q10,D6,D0[0]                @//(V-128)*C1 FOR R
1960d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q11,D7,D0[0]                @//(V-128)*C1 FOR R
1970d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
1980d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q6,D4,D0[1]                 @//(U-128)*C2 FOR G
1990d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMLAL.S16   Q6,D6,D0[2]                 @//Q6 = (U-128)*C2 + (V-128)*C3
2000d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q7,D5,D0[1]                 @//(U-128)*C2 FOR G
2010d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMLAL.S16   Q7,D7,D0[2]                 @//Q7 = (U-128)*C2 + (V-128)*C3
2020d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2030d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NARROW RIGHT SHIFT BY 13 FOR R&B
2040d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D8,Q4,#13                   @//D8 = (U-128)*C4>>13 4 16-BIT VALUES
2050d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D9,Q5,#13                   @//D9 = (U-128)*C4>>13 4 16-BIT VALUES
2060d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//Q4 - WEIGHT FOR B
2070d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2080d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NARROW RIGHT SHIFT BY 13 FOR R&B
2090d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D10,Q10,#13                 @//D10 = (V-128)*C1>>13 4 16-BIT VALUES
2100d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D11,Q11,#13                 @//D11 = (V-128)*C1>>13 4 16-BIT VALUES
2110d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//Q5 - WEIGHT FOR R
2120d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2130d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NARROW RIGHT SHIFT BY 13 FOR G
2140d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D12,Q6,#13                  @//D12 = [(U-128)*C2 + (V-128)*C3]>>13 4 16-BIT VALUES
2150d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D13,Q7,#13                  @//D13 = [(U-128)*C2 + (V-128)*C3]>>13 4 16-BIT VALUES
2160d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//Q6 - WEIGHT FOR G
2170d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2180d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q7,Q4,D30                   @//Q7 - HAS Y + B
2190d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q8,Q5,D30                   @//Q8 - HAS Y + R
2200d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q9,Q6,D30                   @//Q9 - HAS Y + G
2210d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2220d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q10,Q4,D31                  @//Q10 - HAS Y + B
2230d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q11,Q5,D31                  @//Q11 - HAS Y + R
2240d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q12,Q6,D31                  @//Q12 - HAS Y + G
2250d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2260d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D14,Q7
2270d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D15,Q9
2280d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D16,Q8
2290d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.I8     D17,#0
2300d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2310d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D14,D15
2320d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D16,D17
2330d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.16     Q7,Q8
2340d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2350d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2360d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D20,Q10
2370d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D21,Q12
2380d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D22,Q11
2390d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.I8     D23,#0
2400d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2410d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D20,D21
2420d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D22,D23
2430d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.16     Q10,Q11
2440d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2450d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.32     Q7,Q10
2460d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.32     Q8,Q11
2470d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2480d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D14,[R2]!
2490d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D15,[R2]!
2500d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D20,[R2]!
2510d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D21,[R2]!
2520d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D16,[R2]!
2530d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D17,[R2]!
2540d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D22,[R2]!
2550d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D23,[R2]!
2560d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2570d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//D14-D20 - TOTALLY HAVE 16 VALUES
2580d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//WE NEED TO SHIFT R,G,B VALUES TO GET 5BIT,6BIT AND 5BIT COMBINATIONS
2590d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q7,Q4,D28                   @//Q7 - HAS Y + B
2600d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q8,Q5,D28                   @//Q2 - HAS Y + R
2610d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q9,Q6,D28                   @//Q3 - HAS Y + G
2620d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2630d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q10,Q4,D29                  @//Q10 - HAS Y + B
2640d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q11,Q5,D29                  @//Q11 - HAS Y + R
2650d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q12,Q6,D29                  @//Q12 - HAS Y + G
2660d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2670d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//COMPUTE THE ACTUAL RGB VALUES,WE CAN DO TWO ROWS AT A TIME
2680d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//LOAD VALUES OF Y 8-BIT VALUES
2690d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VLD2.8      {D30,D31},[R0]!             @//D0 - Y0,Y2,Y4,Y6,Y8,Y10,Y12,Y14 row 1
2700d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar                                            @//D1 - Y1,Y3,Y5,Y7,Y9,Y11,Y13,Y15
2710d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VLD2.8      {D28,D29},[R7]!             @//D0 - Y0,Y2,Y4,Y6,Y8,Y10,Y12,Y14 row2
2720d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar                                            @//D1 - Y1,Y3,Y5,Y7,Y9,Y11,Y13,Y15
2730d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2740d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    PLD         [R0]
2750d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    PLD         [R7]
2760d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2770d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D14,Q7
2780d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D15,Q9
2790d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D16,Q8
2800d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.I8     D17,#0
2810d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2820d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D14,D15
2830d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D16,D17
2840d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.16     Q7,Q8
2850d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2860d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2870d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D20,Q10
2880d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D21,Q12
2890d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D22,Q11
2900d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.I8     D23,#0
2910d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2920d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D20,D21
2930d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D22,D23
2940d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.16     Q10,Q11
2950d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2960d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.32     Q7,Q10
2970d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.32     Q8,Q11
2980d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
2990d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D14,[R8]!
3000d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D15,[R8]!
3010d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D20,[R8]!
3020d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D21,[R8]!
3030d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D16,[R8]!
3040d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D17,[R8]!
3050d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D22,[R8]!
3060d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D23,[R8]!
3070d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3080d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    SUBS        R6,R6,#1                    @// width_cnt -= 1
3090d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    BNE         LABEL_YUV420SP_TO_RGB8888_WIDTH_LOOP
3100d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3110d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish MahendrakarLABEL_YUV420SP_TO_RGB8888_WIDTH_LOOP_SKIP:
3120d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @VMOV.I8 Q1,#128
3130d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VUZP.8      D2,D3
3140d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3150d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3160d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NEED TO SUBTRACT (U-128) AND (V-128)
3170d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//(D2-D1),(D3-D1)
3180d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VSUBL.U8    Q2,D2,D1                    @//(U-128)
3190d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VSUBL.U8    Q3,D3,D1                    @//(V-128)
3200d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3210d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3220d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NEED TO MULTIPLY Q2,Q3 WITH COEFFICIENTS
3230d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q4,D4,D0[3]                 @//(U-128)*C4 FOR B
3240d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q5,D5,D0[3]                 @//(U-128)*C4 FOR B
3250d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3260d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q10,D6,D0[0]                @//(V-128)*C1 FOR R
3270d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q11,D7,D0[0]                @//(V-128)*C1 FOR R
3280d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3290d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q6,D4,D0[1]                 @//(U-128)*C2 FOR G
3300d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMLAL.S16   Q6,D6,D0[2]                 @//Q6 = (U-128)*C2 + (V-128)*C3
3310d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMULL.S16   Q7,D5,D0[1]                 @//(U-128)*C2 FOR G
3320d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMLAL.S16   Q7,D7,D0[2]                 @//Q7 = (U-128)*C2 + (V-128)*C3
3330d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3340d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NARROW RIGHT SHIFT BY 13 FOR R&B
3350d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D8,Q4,#13                   @//D8 = (U-128)*C4>>13 4 16-BIT VALUES
3360d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D9,Q5,#13                   @//D9 = (U-128)*C4>>13 4 16-BIT VALUES
3370d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//Q4 - WEIGHT FOR B
3380d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3390d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NARROW RIGHT SHIFT BY 13 FOR R&B
3400d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D10,Q10,#13                 @//D10 = (V-128)*C1>>13 4 16-BIT VALUES
3410d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D11,Q11,#13                 @//D11 = (V-128)*C1>>13 4 16-BIT VALUES
3420d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//Q5 - WEIGHT FOR R
3430d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3440d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//NARROW RIGHT SHIFT BY 13 FOR G
3450d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D12,Q6,#13                  @//D12 = [(U-128)*C2 + (V-128)*C3]>>13 4 16-BIT VALUES
3460d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQSHRN.S32  D13,Q7,#13                  @//D13 = [(U-128)*C2 + (V-128)*C3]>>13 4 16-BIT VALUES
3470d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//Q6 - WEIGHT FOR G
3480d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3490d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q7,Q4,D30                   @//Q7 - HAS Y + B
3500d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q8,Q5,D30                   @//Q8 - HAS Y + R
3510d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q9,Q6,D30                   @//Q9 - HAS Y + G
3520d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3530d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q10,Q4,D31                  @//Q10 - HAS Y + B
3540d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q11,Q5,D31                  @//Q11 - HAS Y + R
3550d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q12,Q6,D31                  @//Q12 - HAS Y + G
3560d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3570d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D14,Q7
3580d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D15,Q9
3590d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D16,Q8
3600d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.I8     D17,#0
3610d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3620d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D14,D15
3630d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D16,D17
3640d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.16     Q7,Q8
3650d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3660d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3670d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D20,Q10
3680d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D21,Q12
3690d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D22,Q11
3700d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.I8     D23,#0
3710d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3720d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D20,D21
3730d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D22,D23
3740d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.16     Q10,Q11
3750d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3760d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.32     Q7,Q10
3770d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.32     Q8,Q11
3780d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3790d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D14,[R2]!
3800d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D15,[R2]!
3810d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D20,[R2]!
3820d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D21,[R2]!
3830d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D16,[R2]!
3840d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D17,[R2]!
3850d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D22,[R2]!
3860d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D23,[R2]!
3870d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3880d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//D14-D20 - TOALLY HAVE 16 VALUES
3890d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//WE NEED TO SHIFT R,G,B VALUES TO GET 5BIT,6BIT AND 5BIT COMBINATIONS
3900d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q7,Q4,D28                   @//Q7 - HAS Y + B
3910d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q8,Q5,D28                   @//Q2 - HAS Y + R
3920d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q9,Q6,D28                   @//Q3 - HAS Y + G
3930d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3940d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q10,Q4,D29                  @//Q10 - HAS Y + B
3950d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q11,Q5,D29                  @//Q11 - HAS Y + R
3960d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VADDW.U8    Q12,Q6,D29                  @//Q12 - HAS Y + G
3970d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3980d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
3990d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D14,Q7
4000d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D15,Q9
4010d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D16,Q8
4020d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.I8     D17,#0
4030d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4040d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D14,D15
4050d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D16,D17
4060d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.16     Q7,Q8
4070d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4080d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4090d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D20,Q10
4100d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D21,Q12
4110d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VQMOVUN.S16 D22,Q11
4120d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VMOV.I8     D23,#0
4130d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4140d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D20,D21
4150d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.8      D22,D23
4160d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.16     Q10,Q11
4170d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4180d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.32     Q7,Q10
4190d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VZIP.32     Q8,Q11
4200d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4210d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D14,[R8]!
4220d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D15,[R8]!
4230d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D20,[R8]!
4240d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D21,[R8]!
4250d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D16,[R8]!
4260d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D17,[R8]!
4270d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D22,[R8]!
4280d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    VST1.32     D23,[R8]!
4290d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4300d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @// Adjust the address pointers
4310d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R0,R7,R10                   @// luma = luma_next + offset
4320d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R2,R8,R14,LSL #2            @// rgb = rgb_next + offset
4330d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4340d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R7,R0,R3                    @// luma_next = luma + width
4350d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R8,R2,R3,LSL #2             @// rgb_next_row = rgb + width
4360d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4370d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R1,R1,R11                   @// adjust u pointer
4380d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @ADD        R2,R2,R12           @// adjust v pointer
4390d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4400d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R7,R7,R10                   @// luma_next = luma + width + offset (because of register crunch)
4410d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    ADD         R8,R8,R14,LSL #2            @// rgb_next_row = rgb + width + offset
4420d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4430d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    SUBS        R5,R5,#1                    @// height_cnt -= 1
4440d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4450d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    BNE         LABEL_YUV420SP_TO_RGB8888_HEIGHT_LOOP
4460d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4470d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    @//POP THE REGISTERS
4480d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    LDMFD       SP!,{R4-R12,PC}
4490d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4500d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4510d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4520d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
4530d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar    .section .note.GNU-stack,"",%progbits
4540d8951cef4b1a1dbf4ff5ba3e8796cf1d4503098Harish Mahendrakar
455