view decoders/libmpg123/tabinit_mmx.S @ 562:7e08477b0fc1

MP3 decoder upgrade work. Ripped out SMPEG and mpglib support, replaced it with "mpg123.c" and libmpg123. libmpg123 is a much better version of mpglib, so it should solve all the problems about MP3's not seeking, or most modern MP3's not playing at all, etc. Since you no longer have to make a tradeoff with SMPEG for features, and SMPEG is basically rotting, I removed it from the project. There is still work to be done with libmpg123...there are MMX, 3DNow, SSE, Altivec, etc decoders which we don't have enabled at the moment, and the build system could use some work to make this compile more cleanly, etc. Still: huge win.
author Ryan C. Gordon <icculus@icculus.org>
date Fri, 30 Jan 2009 02:44:47 -0500
parents
children
line wrap: on
line source

/*
	tabinit_mmx: make_decode_tables_mmx

	copyright ?-2006 by the mpg123 project - free software under the terms of the LGPL 2.1
	see COPYING and AUTHORS files in distribution or http://mpg123.org
	initially written by the mysterious higway (apparently)
*/

#include "mangle.h"

.data
	ALIGN32
.globl ASM_NAME(costab_mmxsse)
ASM_NAME(costab_mmxsse):
	.long 1056974725
	.long 1057056395
	.long 1057223771
	.long 1057485416
	.long 1057855544
	.long 1058356026
	.long 1059019886
	.long 1059897405
	.long 1061067246
	.long 1062657950
	.long 1064892987
	.long 1066774581
	.long 1069414683
	.long 1073984175
	.long 1079645762
	.long 1092815430
	.long 1057005197
	.long 1057342072
	.long 1058087743
	.long 1059427869
	.long 1061799040
	.long 1065862217
	.long 1071413542
	.long 1084439708
	.long 1057128951
	.long 1058664893
	.long 1063675095
	.long 1076102863
	.long 1057655764
	.long 1067924853
	.long 1060439283
	ALIGN32
intwinbase:
	.value      0,    -1,    -1,    -1,    -1,    -1,    -1,    -2
	.value     -2,    -2,    -2,    -3,    -3,    -4,    -4,    -5
	.value     -5,    -6,    -7,    -7,    -8,    -9,   -10,   -11
	.value    -13,   -14,   -16,   -17,   -19,   -21,   -24,   -26
	.value    -29,   -31,   -35,   -38,   -41,   -45,   -49,   -53
	.value    -58,   -63,   -68,   -73,   -79,   -85,   -91,   -97
	.value   -104,  -111,  -117,  -125,  -132,  -139,  -147,  -154
	.value   -161,  -169,  -176,  -183,  -190,  -196,  -202,  -208
	.value   -213,  -218,  -222,  -225,  -227,  -228,  -228,  -227
	.value   -224,  -221,  -215,  -208,  -200,  -189,  -177,  -163
	.value   -146,  -127,  -106,   -83,   -57,   -29,     2,    36
	.value     72,   111,   153,   197,   244,   294,   347,   401
	.value    459,   519,   581,   645,   711,   779,   848,   919
	.value    991,  1064,  1137,  1210,  1283,  1356,  1428,  1498
	.value   1567,  1634,  1698,  1759,  1817,  1870,  1919,  1962
	.value   2001,  2032,  2057,  2075,  2085,  2087,  2080,  2063
	.value   2037,  2000,  1952,  1893,  1822,  1739,  1644,  1535
	.value   1414,  1280,  1131,   970,   794,   605,   402,   185
	.value    -45,  -288,  -545,  -814, -1095, -1388, -1692, -2006
	.value  -2330, -2663, -3004, -3351, -3705, -4063, -4425, -4788
	.value  -5153, -5517, -5879, -6237, -6589, -6935, -7271, -7597
	.value  -7910, -8209, -8491, -8755, -8998, -9219, -9416, -9585
	.value  -9727, -9838, -9916, -9959, -9966, -9935, -9863, -9750
	.value  -9592, -9389, -9139, -8840, -8492, -8092, -7640, -7134
	.value  -6574, -5959, -5288, -4561, -3776, -2935, -2037, -1082
	.value    -70,   998,  2122,  3300,  4533,  5818,  7154,  8540
	.value   9975, 11455, 12980, 14548, 16155, 17799, 19478, 21189
	.value  22929, 24694, 26482, 28289, 30112, 31947,-26209,-24360
	.value -22511,-20664,-18824,-16994,-15179,-13383,-11610, -9863
	.value  -8147, -6466, -4822, -3222, -1667,  -162,  1289,  2684
	.value   4019,  5290,  6494,  7629,  8692,  9679, 10590, 11420
	.value  12169, 12835, 13415, 13908, 14313, 14630, 14856, 14992
	.value  15038

intwindiv:
	.long 0x47800000			# 65536.0
.text
	ALIGN32
/* void make_decode_tables_mmx_asm(long scaleval, float* decwin_mmx, float *decwins); */
.globl ASM_NAME(make_decode_tables_mmx_asm)
ASM_NAME(make_decode_tables_mmx_asm):
	pushl %edi
	pushl %esi
	pushl %ebx
/* stack: 0=ebx, 4=esi, 8=edi, 12=back, 16=scaleval, 20=decwin_mmx, 24=decwins */

	xorl %ecx,%ecx
	xorl %ebx,%ebx
	movl $32,%esi
	movl $intwinbase,%edi
	negl 16(%esp)	/* scaleval */
	pushl $2	/* intwinbase step */
/* stack: 20=scaleval 24=decwin_mmx, 28=decwins */
.L00:
	cmpl $528,%ecx
	jnc .L02
	movswl (%edi),%eax
	cmpl $intwinbase+444,%edi
	jc .L01
	addl $60000,%eax
.L01:
	pushl %eax
/* stack: 24=scaleval 28=decwin_mmx, 32=decwins */
	fildl (%esp)
	fdivs intwindiv
	fimull 24(%esp) /* scaleval */
/* eax used to be popped the line before... I'll just use it here a bit */
	movl 28(%esp),%eax /* decwin_mmx */
	fsts    (%eax,%ecx,4)
	fstps 64(%eax,%ecx,4)
	popl %eax
/* stack: 20=scaleval 24=decwin_mmx, 28=decwins */
.L02:
	leal -1(%esi),%edx
	and %ebx,%edx
	cmp $31,%edx
	jnz .L03
	addl $-1023,%ecx
	test %esi,%ebx
	jz  .L03
	negl 20(%esp)
.L03:
	addl %esi,%ecx
	addl (%esp),%edi
	incl %ebx
	cmpl $intwinbase,%edi
	jz .L04
	cmp $256,%ebx
	jnz .L00
	negl (%esp)
	jmp .L00
.L04:
	popl %eax

	xorl %ecx,%ecx
	xorl %ebx,%ebx
	pushl $2 /* paired with popl above */
.L05:
	cmpl $528,%ecx
	jnc .L11
	movswl (%edi),%eax
	cmpl $intwinbase+444,%edi
	jc .L06
	addl $60000,%eax
.L06:
	cltd
	imull 20(%esp)
	shrdl $17,%edx,%eax
	cmpl $32767,%eax
	movl $1055,%edx
	jle .L07
	movl $32767,%eax
	jmp .L08
.L07:
	cmpl $-32767,%eax
	jge .L08
	movl $-32767,%eax
.L08:
/* going to use ebx for decwins, watch the jumps */
	pushl %ebx 
/* stack: 24=scaleval 28=decwin_mmx, 32=decwins */
	movl 32(%esp),%ebx
	cmpl $512,%ecx
	jnc .L09
	subl %ecx,%edx
	movw %ax,(%ebx,%edx,2) /* decwins */
	movw %ax,-32(%ebx,%edx,2)
.L09:
	testl $1,%ecx
	jnz .L10
	negl %eax
.L10:
	movw %ax,(%ebx,%ecx,2)
	movw %ax,32(%ebx,%ecx,2)
	popl %ebx /* that has to match the pushl before */
.L11:
	leal -1(%esi),%edx
	and %ebx,%edx
	cmp $31,%edx
	jnz .L12
	addl $-1023,%ecx
	test %esi,%ebx
	jz  .L12
	negl 20(%esp)
.L12:
	addl %esi,%ecx
	addl (%esp),%edi
	incl %ebx
	cmpl $intwinbase,%edi
	jz .L13
	cmp $256,%ebx
	jnz .L05
	negl (%esp)
	jmp .L05
.L13:
	popl %eax
	
	popl %ebx
	popl %esi
	popl %edi
	ret

/* Mark non-executable stack. */
#if defined(__linux__) && defined(__ELF__)
.section .note.GNU-stack,"",%progbits
#endif