aboutsummaryrefslogtreecommitdiff
path: root/decoder/armv7/ixheaacd_no_lap1.s
blob: 28841911d50d8dd49cbdd80826544540d93693a7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
@/******************************************************************************
@ *
@ * Copyright (C) 2018 The Android Open Source Project
@ *
@ * Licensed under the Apache License, Version 2.0 (the "License");
@ * you may not use this file except in compliance with the License.
@ * You may obtain a copy of the License at:
@ *
@ * http://www.apache.org/licenses/LICENSE-2.0
@ *
@ * Unless required by applicable law or agreed to in writing, software
@ * distributed under the License is distributed on an "AS IS" BASIS,
@ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
@ * See the License for the specific language governing permissions and
@ * limitations under the License.
@ *
@ *****************************************************************************
@ * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
@*/


.text
.p2align 2
    .global ixheaacd_neg_shift_spec_armv7

ixheaacd_neg_shift_spec_armv7:
    STMFD           sp!, {R4-R12, R14}
    VPUSH           {D8 - D15}
    MOV             R5, #448
    SUB             R6, R5, #1
    MOV             R6, R6, LSL #2
    ADD             R6, R6, R0
    MOV             R8, #-16
    SUB             R6, R6, #12
    MOV             R7, R3, LSL #1
    VDUP.32         Q1, R2
    MOV             R4, #0x8000
    VDUP.32         Q2, R4

    VLD1.32         {D0, D1}, [R6], R8
    VQNEG.S32       Q0, Q0


    VLD1.32         {D6, D7}, [R6], R8
    VQSHL.S32       Q15, Q0, Q1
    VQADD.S32       Q14, Q15, Q2
    VSHR.S32        Q13, Q14, #16
    VREV64.32       Q13, Q13
    SUB             R5, R5, #8

    VUZP.16         D27, D26
    VQNEG.S32       Q3, Q3


LOOP_1:


    VST1.16         D27[0], [R1], R7
    VQSHL.S32       Q12, Q3, Q1
    VLD1.32         {D0, D1}, [R6], R8
    VST1.16         D27[1], [R1], R7
    VQADD.S32       Q11, Q12, Q2
    VST1.16         D27[2], [R1], R7
    VQNEG.S32       Q0, Q0
    VST1.16         D27[3], [R1], R7
    VSHR.S32        Q10, Q11, #16
    VREV64.32       Q10, Q10
    SUBS            R5, R5, #8


    VUZP.16         D21, D20
    VQSHL.S32       Q15, Q0, Q1
    VST1.16         D21[0], [R1], R7
    VLD1.32         {D6, D7}, [R6], R8
    VQADD.S32       Q14, Q15, Q2
    VST1.16         D21[1], [R1], R7
    VSHR.S32        Q13, Q14, #16
    VST1.16         D21[2], [R1], R7
    VREV64.32       Q13, Q13
    VST1.16         D21[3], [R1], R7


    VUZP.16         D27, D26
    VQNEG.S32       Q3, Q3



    BGT             LOOP_1

    VST1.16         D27[0], [R1], R7
    VQSHL.S32       Q12, Q3, Q1
    VST1.16         D27[1], [R1], R7
    VST1.16         D27[2], [R1], R7
    VQADD.S32       Q11, Q12, Q2
    VST1.16         D27[3], [R1], R7
    VSHR.S32        Q10, Q11, #16


    VREV64.32       Q10, Q10

    VUZP.16         D21, D20

    VST1.16         D21[0], [R1], R7
    VST1.16         D21[1], [R1], R7
    VST1.16         D21[2], [R1], R7
    VST1.16         D21[3], [R1], R7
    VPOP            {D8 - D15}
    LDMFD           sp!, {R4-R12, R15}
.end