diff options
Diffstat (limited to 'src/libmpg123/tabinit_mmx.S')
-rw-r--r-- | src/libmpg123/tabinit_mmx.S | 213 |
1 files changed, 213 insertions, 0 deletions
/*
	tabinit_mmx: make_decode_tables_mmx

	copyright ?-2006 by the mpg123 project - free software under the terms of the LGPL 2.1
	see COPYING and AUTHORS files in distribution or http://mpg123.org
	initially written by the mysterious higway (apparently)
*/

/*
	Syntax: GNU as, AT&T operand order, 32-bit x86, preprocessed by cpp.
	ASM_NAME() and ALIGN32 come from mangle.h.
*/

#include "mangle.h"

/* Layout of the walk over intwinbase (257 signed 16-bit entries). */
#define TI_INTWIN_STEP        2     /* bytes per intwinbase entry */
#define TI_INTWIN_TURN        256   /* iteration count at which the walk direction is reversed */
#define TI_INTWIN_BIAS_OFFSET 444   /* byte offset of entry 222, the first one stored minus the bias */
#define TI_INTWIN_BIAS        60000 /* added back to entries at or beyond TI_INTWIN_BIAS_OFFSET */

/* Layout of the output index kept in %ecx. */
#define TI_OUT_STRIDE         32    /* added to the output index every iteration */
#define TI_OUT_WRAP           1023  /* subtracted from the output index on every 32nd iteration */
#define TI_OUT_LIMIT          528   /* entries with an output index >= this are not stored */
#define TI_OUT_MIRROR_LIMIT   512   /* the mirrored 16-bit store happens only below this index */
#define TI_OUT_MIRROR_BASE    1055  /* mirrored 16-bit store goes to index (this - output index) */

/* Saturation bound for the 16-bit table; applied symmetrically. */
#define TI_CLIP_MAX           32767

.data
	ALIGN32
/*
	31 raw 32-bit constants exported for use outside this file; nothing here reads them.
	NOTE(review): presumably IEEE-754 single precision bit patterns of cosine
	coefficients (going by the symbol name) - confirm against the users of the table.
*/
.globl ASM_NAME(costab_mmxsse)
ASM_NAME(costab_mmxsse):
	.long 1056974725
	.long 1057056395
	.long 1057223771
	.long 1057485416
	.long 1057855544
	.long 1058356026
	.long 1059019886
	.long 1059897405
	.long 1061067246
	.long 1062657950
	.long 1064892987
	.long 1066774581
	.long 1069414683
	.long 1073984175
	.long 1079645762
	.long 1092815430
	.long 1057005197
	.long 1057342072
	.long 1058087743
	.long 1059427869
	.long 1061799040
	.long 1065862217
	.long 1071413542
	.long 1084439708
	.long 1057128951
	.long 1058664893
	.long 1063675095
	.long 1076102863
	.long 1057655764
	.long 1067924853
	.long 1060439283
	ALIGN32
/*
	Integer window base table: 257 signed 16-bit entries.
	Entries from index 222 (byte offset TI_INTWIN_BIAS_OFFSET) onwards do not fit
	into 16 bits and are stored with TI_INTWIN_BIAS subtracted; the code below
	adds the bias back after sign-extending the entry.
*/
intwinbase:
	.value      0,    -1,    -1,    -1,    -1,    -1,    -1,    -2
	.value     -2,    -2,    -2,    -3,    -3,    -4,    -4,    -5
	.value     -5,    -6,    -7,    -7,    -8,    -9,   -10,   -11
	.value    -13,   -14,   -16,   -17,   -19,   -21,   -24,   -26
	.value    -29,   -31,   -35,   -38,   -41,   -45,   -49,   -53
	.value    -58,   -63,   -68,   -73,   -79,   -85,   -91,   -97
	.value   -104,  -111,  -117,  -125,  -132,  -139,  -147,  -154
	.value   -161,  -169,  -176,  -183,  -190,  -196,  -202,  -208
	.value   -213,  -218,  -222,  -225,  -227,  -228,  -228,  -227
	.value   -224,  -221,  -215,  -208,  -200,  -189,  -177,  -163
	.value   -146,  -127,  -106,   -83,   -57,   -29,     2,    36
	.value     72,   111,   153,   197,   244,   294,   347,   401
	.value    459,   519,   581,   645,   711,   779,   848,   919
	.value    991,  1064,  1137,  1210,  1283,  1356,  1428,  1498
	.value   1567,  1634,  1698,  1759,  1817,  1870,  1919,  1962
	.value   2001,  2032,  2057,  2075,  2085,  2087,  2080,  2063
	.value   2037,  2000,  1952,  1893,  1822,  1739,  1644,  1535
	.value   1414,  1280,  1131,   970,   794,   605,   402,   185
	.value    -45,  -288,  -545,  -814, -1095, -1388, -1692, -2006
	.value  -2330, -2663, -3004, -3351, -3705, -4063, -4425, -4788
	.value  -5153, -5517, -5879, -6237, -6589, -6935, -7271, -7597
	.value  -7910, -8209, -8491, -8755, -8998, -9219, -9416, -9585
	.value  -9727, -9838, -9916, -9959, -9966, -9935, -9863, -9750
	.value  -9592, -9389, -9139, -8840, -8492, -8092, -7640, -7134
	.value  -6574, -5959, -5288, -4561, -3776, -2935, -2037, -1082
	.value    -70,   998,  2122,  3300,  4533,  5818,  7154,  8540
	.value   9975, 11455, 12980, 14548, 16155, 17799, 19478, 21189
	.value  22929, 24694, 26482, 28289, 30112, 31947,-26209,-24360
	.value -22511,-20664,-18824,-16994,-15179,-13383,-11610, -9863
	.value  -8147, -6466, -4822, -3222, -1667,  -162,  1289,  2684
	.value   4019,  5290,  6494,  7629,  8692,  9679, 10590, 11420
	.value  12169, 12835, 13415, 13908, 14313, 14630, 14856, 14992
	.value  15038

/* Divisor applied to every entry in the floating point pass. */
intwindiv:
	.long 0x47800000 /* 65536.0 as a single precision bit pattern */

.text
	ALIGN32
/*
	void make_decode_tables_mmx_asm(long scaleval, float* decwin_mmx, float *decwins);

	Fills two window tables from intwinbase in two passes over the same index
	sequence:
	  pass 1 (x87): decwin_mmx[i] and decwin_mmx[i+16] get
	                (entry / 65536.0) * scaleval as 32-bit floats;
	  pass 2 (int): decwins gets (entry * scaleval) >> 17, saturated to
	                +-TI_CLIP_MAX, written as 16-bit words at i, i+16 and, for
	                i < TI_OUT_MIRROR_LIMIT, at the mirrored positions
	                TI_OUT_MIRROR_BASE-i and TI_OUT_MIRROR_BASE-i-16.
	NOTE(review): the prototype above says float *decwins, but every store to
	decwins below is a 16-bit movw - confirm the intended element type with the caller.

	Calling convention: arguments are read from the stack (4/8/12(%esp) on entry).
	Preserved: %ebx, %esi, %edi (pushed/popped here).
	Clobbered: %eax, %ecx, %edx, flags; the x87 stack is used but left balanced.
	The scaleval argument slot on the stack is modified in place (sign flips).

	Register roles inside both loops:
	  %edi  pointer into intwinbase, moved by the step on top of the stack
	  %ebx  iteration counter
	  %ecx  output index i
	  %esi  constant TI_OUT_STRIDE
	  (%esp) current step through intwinbase: +TI_INTWIN_STEP, negated at
	         iteration TI_INTWIN_TURN so the table is walked up and back down

	NOTE(review): intwinbase and intwindiv are referenced by absolute address,
	which implies text relocations if this object ends up in position
	independent code - confirm against the build configuration.
*/
.globl ASM_NAME(make_decode_tables_mmx_asm)
ASM_NAME(make_decode_tables_mmx_asm):
	pushl	%edi
	pushl	%esi
	pushl	%ebx
/* stack: 0=ebx, 4=esi, 8=edi, 12=back, 16=scaleval, 20=decwin_mmx, 24=decwins */

	xorl	%ecx,%ecx			/* output index = 0 */
	xorl	%ebx,%ebx			/* iteration counter = 0 */
	movl	$TI_OUT_STRIDE,%esi
	movl	$intwinbase,%edi
	negl	16(%esp)			/* scaleval = -scaleval */
	pushl	$TI_INTWIN_STEP			/* intwinbase step */
/* stack: 20=scaleval 24=decwin_mmx, 28=decwins */

/* ---- pass 1: floating point table ---- */
.Lflt_loop:
	cmpl	$TI_OUT_LIMIT,%ecx
	jae	.Lflt_advance			/* index out of range: nothing to store */
	movswl	(%edi),%eax			/* sign-extended table entry */
	cmpl	$intwinbase+TI_INTWIN_BIAS_OFFSET,%edi
	jb	.Lflt_scale
	addl	$TI_INTWIN_BIAS,%eax		/* undo the storage bias of the upper entries */
.Lflt_scale:
	pushl	%eax				/* spill so the x87 unit can load the integer */
/* stack: 24=scaleval 28=decwin_mmx, 32=decwins */
	fildl	(%esp)
	fdivs	intwindiv
	fimull	24(%esp)			/* scaleval */
/* eax is free again until the popl below, so it carries the table pointer */
	movl	28(%esp),%eax			/* decwin_mmx */
	fsts	(%eax,%ecx,4)			/* decwin_mmx[i] */
	fstps	64(%eax,%ecx,4)			/* decwin_mmx[i+16]; pops the x87 stack */
	popl	%eax
/* stack: 20=scaleval 24=decwin_mmx, 28=decwins */
.Lflt_advance:
	leal	-1(%esi),%edx			/* mask = stride - 1 */
	andl	%ebx,%edx
	cmpl	$31,%edx
	jnz	.Lflt_step			/* not the last iteration of a group of 32 */
	addl	$-TI_OUT_WRAP,%ecx		/* wrap the output index back */
	testl	%esi,%ebx
	jz	.Lflt_step
	negl	20(%esp)			/* flip the sign of scaleval */
.Lflt_step:
	addl	%esi,%ecx
	addl	(%esp),%edi			/* move through intwinbase by the current step */
	incl	%ebx
	cmpl	$intwinbase,%edi
	jz	.Lflt_done			/* walked back to the table start: pass finished */
	cmpl	$TI_INTWIN_TURN,%ebx
	jnz	.Lflt_loop
	negl	(%esp)				/* reached the table end: walk backwards from here */
	jmp	.Lflt_loop
.Lflt_done:
	popl	%eax				/* drop the (now negative) step */

/* ---- pass 2: 16-bit integer table ---- */
	xorl	%ecx,%ecx
	xorl	%ebx,%ebx
	pushl	$TI_INTWIN_STEP			/* fresh forward step, paired with popl above */
/* stack: 20=scaleval 24=decwin_mmx, 28=decwins */
.Lint_loop:
	cmpl	$TI_OUT_LIMIT,%ecx
	jae	.Lint_advance
	movswl	(%edi),%eax
	cmpl	$intwinbase+TI_INTWIN_BIAS_OFFSET,%edi
	jb	.Lint_scale
	addl	$TI_INTWIN_BIAS,%eax
.Lint_scale:
/* one-operand imull writes the full product to edx:eax and ignores the old edx */
	imull	20(%esp)			/* edx:eax = entry * scaleval */
	shrdl	$17,%edx,%eax			/* eax = bits 17..48 of the product */
	cmpl	$TI_CLIP_MAX,%eax
	movl	$TI_OUT_MIRROR_BASE,%edx	/* movl leaves the flags of the cmpl untouched */
	jle	.Lint_clip_low
	movl	$TI_CLIP_MAX,%eax
	jmp	.Lint_store
.Lint_clip_low:
	cmpl	$-TI_CLIP_MAX,%eax
	jge	.Lint_store
	movl	$-TI_CLIP_MAX,%eax
.Lint_store:
/* going to use ebx for decwins, watch the jumps */
	pushl	%ebx
/* stack: 24=scaleval 28=decwin_mmx, 32=decwins */
	movl	32(%esp),%ebx			/* decwins */
	cmpl	$TI_OUT_MIRROR_LIMIT,%ecx
	jae	.Lint_sign
	subl	%ecx,%edx			/* edx = TI_OUT_MIRROR_BASE - i */
	movw	%ax,(%ebx,%edx,2)		/* mirrored entry */
	movw	%ax,-32(%ebx,%edx,2)		/* and the one 16 words below it */
.Lint_sign:
	testl	$1,%ecx
	jnz	.Lint_store_fwd
	negl	%eax				/* even index: store with inverted sign */
.Lint_store_fwd:
	movw	%ax,(%ebx,%ecx,2)		/* entry i */
	movw	%ax,32(%ebx,%ecx,2)		/* entry i+16 */
	popl	%ebx				/* that has to match the pushl before */
/* stack: 20=scaleval 24=decwin_mmx, 28=decwins */
.Lint_advance:
	leal	-1(%esi),%edx
	andl	%ebx,%edx
	cmpl	$31,%edx
	jnz	.Lint_step
	addl	$-TI_OUT_WRAP,%ecx
	testl	%esi,%ebx
	jz	.Lint_step
	negl	20(%esp)			/* flip the sign of scaleval */
.Lint_step:
	addl	%esi,%ecx
	addl	(%esp),%edi
	incl	%ebx
	cmpl	$intwinbase,%edi
	jz	.Lint_done
	cmpl	$TI_INTWIN_TURN,%ebx
	jnz	.Lint_loop
	negl	(%esp)
	jmp	.Lint_loop
.Lint_done:
	popl	%eax				/* drop the step */

	popl	%ebx
	popl	%esi
	popl	%edi
	ret

/* Mark non-executable stack. */
#if defined(__linux__) && defined(__ELF__)
.section .note.GNU-stack,"",%progbits
#endif