/shark/trunk/ports/mesa/src/x86/common_x86_macros.h |
---|
File deleted |
/shark/trunk/ports/mesa/src/x86/x86_xform3.s |
---|
File deleted |
/shark/trunk/ports/mesa/src/x86/x86_xform2.s |
---|
File deleted |
/shark/trunk/ports/mesa/src/x86/x86_xform4.s |
---|
File deleted |
/shark/trunk/ports/mesa/src/x86/common_x86_features.h |
---|
File deleted |
/shark/trunk/ports/mesa/src/x86/common_x86_asm.s |
---|
File deleted |
/shark/trunk/ports/mesa/src/x86/common_x86_asm.h |
---|
1,4 → 1,4 |
/* $Id: common_x86_asm.h,v 1.1 2003-03-13 12:11:48 giacomo Exp $ */ |
/* $Id: common_x86_asm.h,v 1.2 2003-04-24 13:36:03 giacomo Exp $ */ |
/* |
* Mesa 3-D graphics library |
41,7 → 41,7 |
/* Do not reference mtypes.h from this file. |
*/ |
#include "common_x86_features.h" |
#include "features_common_x86.h" |
#ifdef HAVE_CONFIG_H |
#include "conf.h" |
/shark/trunk/ports/mesa/src/x86/macros_common_x86.h |
---|
0,0 → 1,107 |
/* $Id: macros_common_x86.h,v 1.1 2003-04-24 13:36:03 giacomo Exp $ */ |
/* |
* Mesa 3-D graphics library |
* Version: 3.5 |
* |
* Copyright (C) 1999-2001 Brian Paul All Rights Reserved. |
* |
* Permission is hereby granted, free of charge, to any person obtaining a |
* copy of this software and associated documentation files (the "Software"), |
* to deal in the Software without restriction, including without limitation |
* the rights to use, copy, modify, merge, publish, distribute, sublicense, |
* and/or sell copies of the Software, and to permit persons to whom the |
* Software is furnished to do so, subject to the following conditions: |
* |
* The above copyright notice and this permission notice shall be included |
* in all copies or substantial portions of the Software. |
* |
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS |
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
* BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN |
* AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN |
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
* |
* Authors: |
* Gareth Hughes |
*/ |
#ifndef __COMMON_X86_MACROS_H__ |
#define __COMMON_X86_MACROS_H__ |
/* ============================================================= |
* Transformation function declarations: |
*/ |
/* Parameter list shared by every point-transform prototype generated by
 * DECLARE_XFORM_GROUP: destination vector, 16-float matrix, source vector.
 */
#define XFORM_ARGS GLvector4f *to_vec, \ |
const GLfloat m[16], \ |
const GLvector4f *from_vec |
/* Declares the seven extern transform routines
 * _mesa_<pfx>_transform_points<sz>_<kind>, one per kind: general,
 * identity, 3d_no_rot, perspective, 2d, 2d_no_rot and 3d.  Each takes
 * XFORM_ARGS and returns void.  _ASMAPI is not defined in this header.
 */
#define DECLARE_XFORM_GROUP( pfx, sz ) \ |
extern void _ASMAPI _mesa_##pfx##_transform_points##sz##_general( XFORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_points##sz##_identity( XFORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_points##sz##_3d_no_rot( XFORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_points##sz##_perspective( XFORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_points##sz##_2d( XFORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_points##sz##_2d_no_rot( XFORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_points##sz##_3d( XFORM_ARGS ); |
/* Stores the seven _mesa_<pfx>_transform_points<sz>_<kind> routines into
 * _mesa_transform_tab[sz][MATRIX_<KIND>].
 *
 * The expansion is seven separate statements, each already terminated by
 * ';', so it must not be used as the unbraced body of an if/else or loop.
 * _mesa_transform_tab and the MATRIX_* indices are defined elsewhere.
 */
#define ASSIGN_XFORM_GROUP( pfx, sz ) \ |
_mesa_transform_tab[sz][MATRIX_GENERAL] = \ |
_mesa_##pfx##_transform_points##sz##_general; \ |
_mesa_transform_tab[sz][MATRIX_IDENTITY] = \ |
_mesa_##pfx##_transform_points##sz##_identity; \ |
_mesa_transform_tab[sz][MATRIX_3D_NO_ROT] = \ |
_mesa_##pfx##_transform_points##sz##_3d_no_rot; \ |
_mesa_transform_tab[sz][MATRIX_PERSPECTIVE] = \ |
_mesa_##pfx##_transform_points##sz##_perspective; \ |
_mesa_transform_tab[sz][MATRIX_2D] = \ |
_mesa_##pfx##_transform_points##sz##_2d; \ |
_mesa_transform_tab[sz][MATRIX_2D_NO_ROT] = \ |
_mesa_##pfx##_transform_points##sz##_2d_no_rot; \ |
_mesa_transform_tab[sz][MATRIX_3D] = \ |
_mesa_##pfx##_transform_points##sz##_3d; |
/* ============================================================= |
* Normal transformation function declarations: |
*/ |
/* Parameter list shared by every normal-transform prototype generated by
 * DECLARE_NORM_GROUP: matrix, scale factor, input vector, per-normal
 * lengths array, destination vector.
 */
#define NORM_ARGS const GLmatrix *mat, \ |
GLfloat scale, \ |
const GLvector4f *in, \ |
const GLfloat *lengths, \ |
GLvector4f *dest |
/* Declares the eight extern normal-processing routines _mesa_<pfx>_*:
 * rescale, normalize, transform, transform_no_rot, and the
 * transform+rescale / transform+normalize variants with and without
 * rotation.  Each takes NORM_ARGS and returns void.
 */
#define DECLARE_NORM_GROUP( pfx ) \ |
extern void _ASMAPI _mesa_##pfx##_rescale_normals( NORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_normalize_normals( NORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_normals( NORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_normals_no_rot( NORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_rescale_normals( NORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_rescale_normals_no_rot( NORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_normalize_normals( NORM_ARGS ); \ |
extern void _ASMAPI _mesa_##pfx##_transform_normalize_normals_no_rot( NORM_ARGS ); |
/* Stores the eight _mesa_<pfx>_* normal routines into _mesa_normal_tab,
 * indexed by a NORM_* flag or by the bitwise OR of two NORM_* flags.
 *
 * The expansion is eight separate statements, each already terminated by
 * ';', so it must not be used as the unbraced body of an if/else or loop.
 * _mesa_normal_tab and the NORM_* flags are defined elsewhere.
 */
#define ASSIGN_NORM_GROUP( pfx ) \ |
_mesa_normal_tab[NORM_RESCALE] = \ |
_mesa_##pfx##_rescale_normals; \ |
_mesa_normal_tab[NORM_NORMALIZE] = \ |
_mesa_##pfx##_normalize_normals; \ |
_mesa_normal_tab[NORM_TRANSFORM] = \ |
_mesa_##pfx##_transform_normals; \ |
_mesa_normal_tab[NORM_TRANSFORM_NO_ROT] = \ |
_mesa_##pfx##_transform_normals_no_rot; \ |
_mesa_normal_tab[NORM_TRANSFORM | NORM_RESCALE] = \ |
_mesa_##pfx##_transform_rescale_normals; \ |
_mesa_normal_tab[NORM_TRANSFORM_NO_ROT | NORM_RESCALE] = \ |
_mesa_##pfx##_transform_rescale_normals_no_rot; \ |
_mesa_normal_tab[NORM_TRANSFORM | NORM_NORMALIZE] = \ |
_mesa_##pfx##_transform_normalize_normals; \ |
_mesa_normal_tab[NORM_TRANSFORM_NO_ROT | NORM_NORMALIZE] = \ |
_mesa_##pfx##_transform_normalize_normals_no_rot; |
#endif |
/shark/trunk/ports/mesa/src/x86/asm_common_x86.s |
---|
0,0 → 1,239 |
/* $Id: asm_common_x86.s,v 1.1 2003-04-24 13:36:02 giacomo Exp $ */ |
/* |
* Mesa 3-D graphics library |
* Version: 4.0.3 |
* |
* Copyright (C) 1999-2002 Brian Paul All Rights Reserved. |
* |
* Permission is hereby granted, free of charge, to any person obtaining a |
* copy of this software and associated documentation files (the "Software"), |
* to deal in the Software without restriction, including without limitation |
* the rights to use, copy, modify, merge, publish, distribute, sublicense, |
* and/or sell copies of the Software, and to permit persons to whom the |
* Software is furnished to do so, subject to the following conditions: |
* |
* The above copyright notice and this permission notice shall be included |
* in all copies or substantial portions of the Software. |
* |
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS |
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
* BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN |
* AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN |
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
*/ |
/* |
* Check extended CPU capabilities. Now just returns the raw CPUID |
* feature information, allowing the higher level code to interpret the |
* results. |
* |
* Written by Holger Waechtler <holger@akaflieg.extern.tu-berlin.de> |
* |
* Cleaned up and simplified by Gareth Hughes <gareth@valinux.com> |
*/ |
/* |
* NOTE: Avoid using spaces in between '(' ')' and arguments, especially |
* with macros like CONST, LLBL that expand to CONCAT(...). Putting spaces |
* in there will break the build on some platforms. |
*/ |
#include "matypes.h" |
#include "features_common_x86.h" |
/* Intel vendor string "GenuineIntel", split into the three 32-bit |
* words that _mesa_identify_x86_cpu_features compares against EBX, |
* EDX and ECX (in that order) after CPUID with EAX = 0. |
*/ |
#define GENU 0x756e6547 /* "Genu" */ |
#define INEI 0x49656e69 /* "ineI" */ |
#define NTEL 0x6c65746e /* "ntel" */ |
/* AMD vendor string "AuthenticAMD", split the same way and compared |
* against EBX, EDX and ECX (in that order). |
*/ |
#define AUTH 0x68747541 /* "Auth" */ |
#define ENTI 0x69746e65 /* "enti" */ |
#define CAMD 0x444d4163 /* "cAMD" */ |
SEG_DATA |
/* We might want to print out some useful messages. |
* NOTE(review): neither label below is referenced by the code visible |
* in this file - confirm whether anything else still uses them. |
*/ |
GLNAME( found_intel ): STRING( "Genuine Intel processor found\n\0" ) |
GLNAME( found_amd ): STRING( "Authentic AMD processor found\n\0" ) |
SEG_TEXT |
/* _mesa_identify_x86_cpu_features |
* |
* Returns the raw CPUID feature word in EAX, or zero when it cannot be |
* determined (no CPUID instruction, unrecognised vendor, or a failed |
* AMD query). |
* |
* Intel: EDX from CPUID function 1, with bit 31 cleared. |
* AMD: EDX from CPUID function 0x80000001, with the SSE bit |
* (0x02000000) from CPUID function 1 OR'ed in. |
* |
* No stack arguments are read. EBX and ESI are saved and restored; |
* ECX and EDX may be overwritten. The ID flag toggled during the |
* CPUID probe is not restored. |
*/ |
ALIGNTEXT4 |
GLOBL GLNAME( _mesa_identify_x86_cpu_features ) |
GLNAME( _mesa_identify_x86_cpu_features ): |
PUSH_L ( EBX ) |
PUSH_L ( ESI ) |
/* Test for the CPUID command. If the ID Flag bit in EFLAGS |
* (bit 21) is writable, the CPUID command is present. ECX keeps |
* the original EFLAGS image for the comparison below. |
*/ |
PUSHF_L |
POP_L ( EAX ) |
MOV_L ( EAX, ECX ) |
XOR_L ( CONST(0x00200000), EAX ) |
PUSH_L ( EAX ) |
POPF_L |
PUSHF_L |
POP_L ( EAX ) |
/* Verify the ID Flag bit has been written. If it did not change |
* there is no CPUID: take the failure path so that zero is |
* returned, not the EFLAGS image still held in EAX. |
*/ |
CMP_L ( ECX, EAX ) |
JZ ( LLBL(cpuid_failed) ) |
/* Get the CPU vendor info. |
*/ |
XOR_L ( EAX, EAX ) |
CPUID |
/* Test for Intel processors. We must look for the |
* "GenuineIntel" string in EBX, ECX and EDX. |
*/ |
CMP_L ( CONST(GENU), EBX ) |
JNE ( LLBL(cpuid_amd) ) |
CMP_L ( CONST(INEI), EDX ) |
JNE ( LLBL(cpuid_amd) ) |
CMP_L ( CONST(NTEL), ECX ) |
JNE ( LLBL(cpuid_amd) ) |
/* We have an Intel processor, so we can get the feature |
* information with a CPUID input value of 1. |
*/ |
MOV_L ( CONST(0x1), EAX ) |
CPUID |
MOV_L ( EDX, EAX ) |
/* Mask out highest bit, which is used by AMD for 3dnow |
* Newer Intel have this bit set, but do not support 3dnow |
*/ |
AND_L ( CONST(0X7FFFFFFF), EAX) |
JMP ( LLBL(cpuid_done) ) |
LLBL(cpuid_amd): |
/* Test for AMD processors. We must look for the |
* "AuthenticAMD" string in EBX, ECX and EDX. |
*/ |
CMP_L ( CONST(AUTH), EBX ) |
JNE ( LLBL(cpuid_other) ) |
CMP_L ( CONST(ENTI), EDX ) |
JNE ( LLBL(cpuid_other) ) |
CMP_L ( CONST(CAMD), ECX ) |
JNE ( LLBL(cpuid_other) ) |
/* We have an AMD processor, so we can get the feature |
* information after we verify that the extended functions are |
* supported. |
*/ |
/* The features we need are almost all in the extended set. The |
* exception is SSE enable, which is in the standard set (0x1). |
* ESI holds the standard-set EDX across the extended queries. |
*/ |
MOV_L ( CONST(0x1), EAX ) |
CPUID |
TEST_L ( EAX, EAX ) |
JZ ( LLBL(cpuid_failed) ) |
MOV_L ( EDX, ESI ) |
MOV_L ( CONST(0x80000000), EAX ) |
CPUID |
TEST_L ( EAX, EAX ) |
JZ ( LLBL(cpuid_failed) ) |
MOV_L ( CONST(0x80000001), EAX ) |
CPUID |
MOV_L ( EDX, EAX ) |
AND_L ( CONST(0x02000000), ESI ) /* OR in the SSE bit */ |
OR_L ( ESI, EAX ) |
JMP ( LLBL(cpuid_done) ) |
LLBL(cpuid_other): |
/* Test for other processors here when required. |
*/ |
LLBL(cpuid_failed): |
/* If we can't determine the feature information, we must |
* return zero to indicate that no platform-specific |
* optimizations can be used. |
*/ |
MOV_L ( CONST(0), EAX ) |
LLBL(cpuid_done): |
POP_L ( ESI ) |
POP_L ( EBX ) |
RET |
#ifdef USE_SSE_ASM |
/* Execute an SSE instruction to see if the operating system correctly |
* supports SSE. A signal handler for SIGILL should have been set |
* before calling this function, otherwise this could kill the client |
* application. |
* |
* The routine only zeroes XMM0 and returns; no result is placed in a |
* general-purpose register, so presumably the caller infers success |
* from the absence of SIGILL - confirm against the caller. |
*/ |
ALIGNTEXT4 |
GLOBL GLNAME( _mesa_test_os_sse_support ) |
GLNAME( _mesa_test_os_sse_support ): |
XORPS ( XMM0, XMM0 ) |
RET |
/* Perform an SSE divide-by-zero to see if the operating system |
* correctly supports unmasked SIMD FPU exceptions. Signal handlers for |
* SIGILL and SIGFPE should have been set before calling this function, |
* otherwise this could kill the client application. |
* |
* Stack frame: -4(EBP) holds the caller's MXCSR, -8(EBP) the modified |
* copy with the divide-by-zero exception unmasked. No arguments are |
* read and no result is placed in a general-purpose register. |
*/ |
ALIGNTEXT4 |
GLOBL GLNAME( _mesa_test_os_sse_exception_support ) |
GLNAME( _mesa_test_os_sse_exception_support ): |
PUSH_L ( EBP ) |
MOV_L ( ESP, EBP ) |
SUB_L ( CONST(8), ESP ) |
/* Save the original MXCSR register value. |
*/ |
STMXCSR ( REGOFF(-4, EBP) ) |
/* Unmask the divide-by-zero exception (clear MXCSR bit 9) and |
* perform one. |
*/ |
STMXCSR ( REGOFF(-8, EBP) ) |
AND_L ( CONST(0xfffffdff), REGOFF(-8, EBP) ) |
LDMXCSR ( REGOFF(-8, EBP) ) |
XORPS ( XMM0, XMM0 ) |
/* Build four copies of 0x3f800000 (1.0f) on the stack and load |
* them into XMM1. |
*/ |
PUSH_L ( CONST(0x3f800000) ) |
PUSH_L ( CONST(0x3f800000) ) |
PUSH_L ( CONST(0x3f800000) ) |
PUSH_L ( CONST(0x3f800000) ) |
MOVUPS ( REGIND(ESP), XMM1 ) |
/* Release exactly the 16 bytes pushed above. ESP must be back at |
* -8(EBP) before the faulting divide: anything a signal handler |
* pushes then lands below the saved MXCSR, the saved EBP and the |
* return address instead of on top of them. |
*/ |
ADD_L ( CONST(16), ESP ) |
DIVPS ( XMM0, XMM1 ) |
/* Restore the original MXCSR register value. |
*/ |
LDMXCSR ( REGOFF(-4, EBP) ) |
LEAVE |
RET |
#endif |
/shark/trunk/ports/mesa/src/x86/features_common_x86.h |
---|
0,0 → 1,80 |
/* $Id: features_common_x86.h,v 1.1 2003-04-24 13:36:03 giacomo Exp $ */ |
/* |
* Mesa 3-D graphics library |
* Version: 3.5 |
* |
* Copyright (C) 1999-2001 Brian Paul All Rights Reserved. |
* |
* Permission is hereby granted, free of charge, to any person obtaining a |
* copy of this software and associated documentation files (the "Software"), |
* to deal in the Software without restriction, including without limitation |
* the rights to use, copy, modify, merge, publish, distribute, sublicense, |
* and/or sell copies of the Software, and to permit persons to whom the |
* Software is furnished to do so, subject to the following conditions: |
* |
* The above copyright notice and this permission notice shall be included |
* in all copies or substantial portions of the Software. |
* |
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS |
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
* BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN |
* AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN |
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
*/ |
/* |
* x86 CPUID feature information. The raw data is returned by |
* _mesa_identify_x86_cpu_features() and interpreted with the cpu_has_* |
* helper macros. |
* |
* Gareth Hughes |
*/ |
#ifndef __COMMON_X86_FEATURES_H__ |
#define __COMMON_X86_FEATURES_H__ |
/* Capabilities of CPUs |
* |
* One single-bit mask per bit (0 through 31) of the feature word |
* returned by _mesa_identify_x86_cpu_features(). Names of the form |
* X86_FEATURE_<number> are placeholders for bits that are given no |
* symbolic name here. |
*/ |
#define X86_FEATURE_FPU 0x00000001 |
#define X86_FEATURE_VME 0x00000002 |
#define X86_FEATURE_DE 0x00000004 |
#define X86_FEATURE_PSE 0x00000008 |
#define X86_FEATURE_TSC 0x00000010 |
#define X86_FEATURE_MSR 0x00000020 |
#define X86_FEATURE_PAE 0x00000040 |
#define X86_FEATURE_MCE 0x00000080 |
#define X86_FEATURE_CX8 0x00000100 |
#define X86_FEATURE_APIC 0x00000200 |
#define X86_FEATURE_10 0x00000400 |
#define X86_FEATURE_SEP 0x00000800 |
#define X86_FEATURE_MTRR 0x00001000 |
#define X86_FEATURE_PGE 0x00002000 |
#define X86_FEATURE_MCA 0x00004000 |
#define X86_FEATURE_CMOV 0x00008000 |
#define X86_FEATURE_PAT 0x00010000 |
#define X86_FEATURE_PSE36 0x00020000 |
#define X86_FEATURE_18 0x00040000 |
#define X86_FEATURE_19 0x00080000 |
#define X86_FEATURE_20 0x00100000 |
#define X86_FEATURE_21 0x00200000 |
#define X86_FEATURE_MMXEXT 0x00400000 |
#define X86_FEATURE_MMX 0x00800000 |
#define X86_FEATURE_FXSR 0x01000000 |
#define X86_FEATURE_XMM 0x02000000 |
#define X86_FEATURE_XMM2 0x04000000 |
#define X86_FEATURE_27 0x08000000 |
#define X86_FEATURE_28 0x10000000 |
#define X86_FEATURE_29 0x20000000 |
#define X86_FEATURE_3DNOWEXT 0x40000000 |
#define X86_FEATURE_3DNOW 0x80000000 |
/* Feature tests. Each expands to the masked bit itself, so the result
 * is zero or the mask value, not a normalised 0/1.
 * _mesa_x86_cpu_features is not declared in this header and must be
 * visible wherever these macros are used.
 */
#define cpu_has_mmx (_mesa_x86_cpu_features & X86_FEATURE_MMX) |
#define cpu_has_mmxext (_mesa_x86_cpu_features & X86_FEATURE_MMXEXT) |
#define cpu_has_xmm (_mesa_x86_cpu_features & X86_FEATURE_XMM) |
#define cpu_has_xmm2 (_mesa_x86_cpu_features & X86_FEATURE_XMM2) |
#define cpu_has_3dnow (_mesa_x86_cpu_features & X86_FEATURE_3DNOW) |
#define cpu_has_3dnowext (_mesa_x86_cpu_features & X86_FEATURE_3DNOWEXT) |
#endif |
/shark/trunk/ports/mesa/src/x86/xform2_x86.s |
---|
0,0 → 1,563 |
/* $Id: xform2_x86.s,v 1.1 2003-04-24 13:36:03 giacomo Exp $ */ |
/* |
* Mesa 3-D graphics library |
* Version: 3.5 |
* |
* Copyright (C) 1999-2001 Brian Paul All Rights Reserved. |
* |
* Permission is hereby granted, free of charge, to any person obtaining a |
* copy of this software and associated documentation files (the "Software"), |
* to deal in the Software without restriction, including without limitation |
* the rights to use, copy, modify, merge, publish, distribute, sublicense, |
* and/or sell copies of the Software, and to permit persons to whom the |
* Software is furnished to do so, subject to the following conditions: |
* |
* The above copyright notice and this permission notice shall be included |
* in all copies or substantial portions of the Software. |
* |
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS |
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
* BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN |
* AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN |
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
*/ |
/* |
* NOTE: Avoid using spaces in between '(' ')' and arguments, especially |
* with macros like CONST, LLBL that expand to CONCAT(...). Putting spaces |
* in there will break the build on some platforms. |
*/ |
#include "matypes.h" |
#include "xform_args.h" |
SEG_TEXT |
/* Bit patterns stored directly as 32-bit words: 1065353216 is
 * 0x3f800000 (IEEE-754 single 1.0f) and 0 is 0.0f.
 */
#define FP_ONE 1065353216 |
#define FP_ZERO 0 |
/* Memory operands for the transform loops below.  SRCn / DSTn / MATn is
 * the 32-bit word at byte offset 4*n from ESI (current source point),
 * EDI (current destination point) and EDX (matrix) respectively.
 */
#define SRC0 REGOFF(0, ESI) |
#define SRC1 REGOFF(4, ESI) |
#define SRC2 REGOFF(8, ESI) |
#define SRC3 REGOFF(12, ESI) |
#define DST0 REGOFF(0, EDI) |
#define DST1 REGOFF(4, EDI) |
#define DST2 REGOFF(8, EDI) |
#define DST3 REGOFF(12, EDI) |
#define MAT0 REGOFF(0, EDX) |
#define MAT1 REGOFF(4, EDX) |
#define MAT2 REGOFF(8, EDX) |
#define MAT3 REGOFF(12, EDX) |
#define MAT4 REGOFF(16, EDX) |
#define MAT5 REGOFF(20, EDX) |
#define MAT6 REGOFF(24, EDX) |
#define MAT7 REGOFF(28, EDX) |
#define MAT8 REGOFF(32, EDX) |
#define MAT9 REGOFF(36, EDX) |
#define MAT10 REGOFF(40, EDX) |
#define MAT11 REGOFF(44, EDX) |
#define MAT12 REGOFF(48, EDX) |
#define MAT13 REGOFF(52, EDX) |
#define MAT14 REGOFF(56, EDX) |
#define MAT15 REGOFF(60, EDX) |
/* _mesa_x86_transform_points2_general
 *
 * For each source point (x = SRC0, y = SRC1) writes four floats:
 *     DSTi = x * MAT[i] + y * MAT[4+i] + MAT[12+i],   i = 0..3
 *
 * The destination vector gets VEC_SIZE_4 OR'ed into its flags, its count
 * set to the source count and its size set to 4.  Returns without
 * writing anything when the source count is zero.  The source pointer
 * advances by the source stride, the destination by 16 bytes per point.
 * ESI and EDI are saved and restored.
 *
 * ARG_SOURCE / ARG_DEST / ARG_MATRIX and the V4F_* offsets are defined
 * outside this file (presumably xform_args.h and matypes.h - confirm).
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points2_general ) |
GLNAME( _mesa_x86_transform_points2_general ): |
/* 8 = the two 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 8 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p2_gr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p2_gr_loop): |
/* Trailing comments track the x87 stack, top of stack first. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
FLD_S( SRC0 ) /* F6 F5 F4 */ |
FMUL_S( MAT2 ) |
FLD_S( SRC0 ) /* F7 F6 F5 F4 */ |
FMUL_S( MAT3 ) |
FLD_S( SRC1 ) /* F0 F7 F6 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC1 ) /* F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT6 ) |
FLD_S( SRC1 ) /* F3 F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT7 ) |
/* Fold the y products F0..F3 into the x products F4..F7. */
FXCH( ST(3) ) /* F0 F2 F1 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(7) ) /* F2 F1 F3 F7 F6 F5 F4 */ |
FXCH( ST(1) ) /* F1 F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F7 F6 F5 F4 */ |
/* Add the constant terms MAT12..MAT15. */
FXCH( ST(3) ) /* F4 F6 F5 F7 */ |
FADD_S( MAT12 ) |
FXCH( ST(2) ) /* F5 F6 F4 F7 */ |
FADD_S( MAT13 ) |
FXCH( ST(1) ) /* F6 F5 F4 F7 */ |
FADD_S( MAT14 ) |
FXCH( ST(3) ) /* F7 F5 F4 F6 */ |
FADD_S( MAT15 ) |
FXCH( ST(2) ) /* F4 F5 F7 F6 */ |
FSTP_S( DST0 ) /* F5 F7 F6 */ |
FSTP_S( DST1 ) /* F7 F6 */ |
FXCH( ST(1) ) /* F6 F7 */ |
FSTP_S( DST2 ) /* F7 */ |
FSTP_S( DST3 ) /* */ |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p2_gr_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p2_gr_loop) ) |
LLBL(x86_p2_gr_done): |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/* _mesa_x86_transform_points2_perspective
 *
 * For each source point (x = SRC0, y = SRC1) writes:
 *     DST0 = x * MAT0
 *     DST1 = y * MAT5
 *     DST2 = MAT14   (copied as a raw 32-bit word through EBX)
 *     DST3 = FP_ZERO
 *
 * The destination vector gets VEC_SIZE_4 OR'ed into its flags, its count
 * set to the source count and its size set to 4.  Returns without
 * writing anything when the source count is zero.  ESI, EDI and EBX are
 * saved and restored.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points2_perspective ) |
GLNAME( _mesa_x86_transform_points2_perspective ): |
/* 12 = the three 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p2_pr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
/* MAT14 is loop-invariant: load it once. */
MOV_L( MAT14, EBX ) |
ALIGNTEXT16 |
LLBL(x86_p2_pr_loop): |
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F1 F4 */ |
FMUL_S( MAT5 ) |
FXCH( ST(1) ) /* F4 F1 */ |
FSTP_S( DST0 ) /* F1 */ |
FSTP_S( DST1 ) /* */ |
MOV_L( EBX, DST2 ) |
MOV_L( CONST(FP_ZERO), DST3 ) |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p2_pr_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p2_pr_loop) ) |
LLBL(x86_p2_pr_done): |
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/* _mesa_x86_transform_points2_3d
 *
 * For each source point (x = SRC0, y = SRC1) writes three floats:
 *     DSTi = x * MAT[i] + y * MAT[4+i] + MAT[12+i],   i = 0..2
 * DST3 is not written.
 *
 * The destination vector gets VEC_SIZE_3 OR'ed into its flags, its count
 * set to the source count and its size set to 3.  Returns without
 * writing anything when the source count is zero.  ESI and EDI are saved
 * and restored.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points2_3d ) |
GLNAME( _mesa_x86_transform_points2_3d ): |
/* 8 = the two 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 8 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p2_3dr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_3), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(3), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p2_3dr_loop): |
/* Trailing comments track the x87 stack, top of stack first. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
FLD_S( SRC0 ) /* F6 F5 F4 */ |
FMUL_S( MAT2 ) |
FLD_S( SRC1 ) /* F0 F6 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F6 F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC1 ) /* F2 F1 F0 F6 F5 F4 */ |
FMUL_S( MAT6 ) |
/* Fold the y products F0..F2 into the x products F4..F6. */
FXCH( ST(2) ) /* F0 F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F2 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* Add the constant terms MAT12..MAT14. */
FXCH( ST(2) ) /* F4 F5 F6 */ |
FADD_S( MAT12 ) |
FXCH( ST(1) ) /* F5 F4 F6 */ |
FADD_S( MAT13 ) |
FXCH( ST(2) ) /* F6 F4 F5 */ |
FADD_S( MAT14 ) |
FXCH( ST(1) ) /* F4 F6 F5 */ |
FSTP_S( DST0 ) /* F6 F5 */ |
FXCH( ST(1) ) /* F5 F6 */ |
FSTP_S( DST1 ) /* F6 */ |
FSTP_S( DST2 ) /* */ |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p2_3dr_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p2_3dr_loop) ) |
LLBL(x86_p2_3dr_done): |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/* _mesa_x86_transform_points2_3d_no_rot
 *
 * For each source point (x = SRC0, y = SRC1) writes:
 *     DST0 = x * MAT0 + MAT12
 *     DST1 = y * MAT5 + MAT13
 *     DST2 = MAT14   (copied as a raw 32-bit word through EBX)
 * DST3 is not written.
 *
 * The destination vector gets VEC_SIZE_3 OR'ed into its flags, its count
 * set to the source count and its size set to 3.  Returns without
 * writing anything when the source count is zero.  ESI, EDI and EBX are
 * saved and restored.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points2_3d_no_rot ) |
GLNAME( _mesa_x86_transform_points2_3d_no_rot ): |
/* 12 = the three 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p2_3dnrr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_3), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(3), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
/* MAT14 is loop-invariant: load it once. */
MOV_L( MAT14, EBX ) |
ALIGNTEXT16 |
LLBL(x86_p2_3dnrr_loop): |
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F1 F4 */ |
FMUL_S( MAT5 ) |
FXCH( ST(1) ) /* F4 F1 */ |
FADD_S( MAT12 ) |
FLD_S( MAT13 ) /* F5 F4 F1 */ |
FXCH( ST(2) ) /* F1 F4 F5 */ |
/* F5 (= MAT13) += F1 (= y * MAT5). */
FADDP( ST0, ST(2) ) /* F4 F5 */ |
FSTP_S( DST0 ) /* F5 */ |
FSTP_S( DST1 ) /* */ |
MOV_L( EBX, DST2 ) |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p2_3dnrr_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p2_3dnrr_loop) ) |
LLBL(x86_p2_3dnrr_done): |
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/* _mesa_x86_transform_points2_2d
 *
 * For each source point (x = SRC0, y = SRC1) writes two floats:
 *     DST0 = x * MAT0 + y * MAT4 + MAT12
 *     DST1 = x * MAT1 + y * MAT5 + MAT13
 * DST2 and DST3 are not written.
 *
 * The destination vector gets VEC_SIZE_2 OR'ed into its flags, its count
 * set to the source count and its size set to 2.  Returns without
 * writing anything when the source count is zero.  ESI and EDI are saved
 * and restored.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points2_2d ) |
GLNAME( _mesa_x86_transform_points2_2d ): |
/* 8 = the two 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 8 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p2_2dr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_2), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(2), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p2_2dr_loop): |
/* Trailing comments track the x87 stack, top of stack first. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
FLD_S( SRC1 ) /* F0 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F5 F4 */ |
FMUL_S( MAT5 ) |
/* Fold the y products F0, F1 into the x products F4, F5. */
FXCH( ST(1) ) /* F0 F1 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F1 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F5 F4 */ |
FXCH( ST(1) ) /* F4 F5 */ |
FADD_S( MAT12 ) |
FXCH( ST(1) ) /* F5 F4 */ |
FADD_S( MAT13 ) |
FXCH( ST(1) ) /* F4 F5 */ |
FSTP_S( DST0 ) /* F5 */ |
FSTP_S( DST1 ) /* */ |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p2_2dr_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p2_2dr_loop) ) |
LLBL(x86_p2_2dr_done): |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/* _mesa_x86_transform_points2_2d_no_rot
 *
 * For each source point (x = SRC0, y = SRC1) writes two floats:
 *     DST0 = x * MAT0 + MAT12
 *     DST1 = y * MAT5 + MAT13
 * DST2 and DST3 are not written.
 *
 * The destination vector gets VEC_SIZE_2 OR'ed into its flags, its count
 * set to the source count and its size set to 2.  Returns without
 * writing anything when the source count is zero.  ESI and EDI are saved
 * and restored.
 *
 * NOTE(review): this entry point uses ALIGNTEXT4 while the other
 * points2 routines in this file use ALIGNTEXT16 - confirm whether that
 * is intentional.
 */
ALIGNTEXT4 |
GLOBL GLNAME( _mesa_x86_transform_points2_2d_no_rot ) |
GLNAME( _mesa_x86_transform_points2_2d_no_rot ): |
/* 8 = the two 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 8 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p2_2dnrr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_2), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(2), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p2_2dnrr_loop): |
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F1 F4 */ |
FMUL_S( MAT5 ) |
FXCH( ST(1) ) /* F4 F1 */ |
FADD_S( MAT12 ) |
FLD_S( MAT13 ) /* F5 F4 F1 */ |
FXCH( ST(2) ) /* F1 F4 F5 */ |
/* F5 (= MAT13) += F1 (= y * MAT5). */
FADDP( ST0, ST(2) ) /* F4 F5 */ |
FSTP_S( DST0 ) /* F5 */ |
FSTP_S( DST1 ) /* */ |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p2_2dnrr_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p2_2dnrr_loop) ) |
LLBL(x86_p2_2dnrr_done): |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/* _mesa_x86_transform_points2_identity
 *
 * Copies the first two 32-bit words of each source point (SRC0, SRC1)
 * to DST0, DST1 using integer moves.  DST2 and DST3 are not written.
 *
 * The destination vector gets VEC_SIZE_2 OR'ed into its flags, its count
 * set to the source count and its size set to 2.  Returns without
 * writing anything when the source count is zero.  The copy loop is
 * skipped when the source and destination data pointers are equal; the
 * flags, count and size are still updated in that case.  ESI, EDI and
 * EBX are saved and restored.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points2_identity ) |
GLNAME( _mesa_x86_transform_points2_identity ): |
/* 12 = the three 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
/* The matrix pointer is loaded but never dereferenced here; EDX is
 * reused as a scratch register inside the loop. */
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p2_ir_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_2), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(2), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
/* Nothing to copy when source and destination data coincide. */
CMP_L( ESI, EDI ) |
JE( LLBL(x86_p2_ir_done) ) |
ALIGNTEXT16 |
LLBL(x86_p2_ir_loop): |
MOV_L( SRC0, EBX ) |
MOV_L( SRC1, EDX ) |
MOV_L( EBX, DST0 ) |
MOV_L( EDX, DST1 ) |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p2_ir_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p2_ir_loop) ) |
LLBL(x86_p2_ir_done): |
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/shark/trunk/ports/mesa/src/x86/xform3_x86.s |
---|
0,0 → 1,633 |
/* $Id: xform3_x86.s,v 1.1 2003-04-24 13:36:03 giacomo Exp $ */ |
/* |
* Mesa 3-D graphics library |
* Version: 3.5 |
* |
* Copyright (C) 1999-2001 Brian Paul All Rights Reserved. |
* |
* Permission is hereby granted, free of charge, to any person obtaining a |
* copy of this software and associated documentation files (the "Software"), |
* to deal in the Software without restriction, including without limitation |
* the rights to use, copy, modify, merge, publish, distribute, sublicense, |
* and/or sell copies of the Software, and to permit persons to whom the |
* Software is furnished to do so, subject to the following conditions: |
* |
* The above copyright notice and this permission notice shall be included |
* in all copies or substantial portions of the Software. |
* |
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS |
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
* BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN |
* AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN |
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
*/ |
/* |
* NOTE: Avoid using spaces in between '(' ')' and arguments, especially |
* with macros like CONST, LLBL that expand to CONCAT(...). Putting spaces |
* in there will break the build on some platforms. |
*/ |
#include "matypes.h" |
#include "xform_args.h" |
SEG_TEXT |
/* Bit patterns stored directly as 32-bit words: 1065353216 is
 * 0x3f800000 (IEEE-754 single 1.0f) and 0 is 0.0f.
 */
#define FP_ONE 1065353216 |
#define FP_ZERO 0 |
/* Memory operands for the transform loops below.  SRCn / DSTn / MATn is
 * the 32-bit word at byte offset 4*n from ESI (current source point),
 * EDI (current destination point) and EDX (matrix) respectively.
 */
#define SRC0 REGOFF(0, ESI) |
#define SRC1 REGOFF(4, ESI) |
#define SRC2 REGOFF(8, ESI) |
#define SRC3 REGOFF(12, ESI) |
#define DST0 REGOFF(0, EDI) |
#define DST1 REGOFF(4, EDI) |
#define DST2 REGOFF(8, EDI) |
#define DST3 REGOFF(12, EDI) |
#define MAT0 REGOFF(0, EDX) |
#define MAT1 REGOFF(4, EDX) |
#define MAT2 REGOFF(8, EDX) |
#define MAT3 REGOFF(12, EDX) |
#define MAT4 REGOFF(16, EDX) |
#define MAT5 REGOFF(20, EDX) |
#define MAT6 REGOFF(24, EDX) |
#define MAT7 REGOFF(28, EDX) |
#define MAT8 REGOFF(32, EDX) |
#define MAT9 REGOFF(36, EDX) |
#define MAT10 REGOFF(40, EDX) |
#define MAT11 REGOFF(44, EDX) |
#define MAT12 REGOFF(48, EDX) |
#define MAT13 REGOFF(52, EDX) |
#define MAT14 REGOFF(56, EDX) |
#define MAT15 REGOFF(60, EDX) |
/* _mesa_x86_transform_points3_general
 *
 * For each source point (x = SRC0, y = SRC1, z = SRC2) writes four
 * floats:
 *     DSTi = x * MAT[i] + y * MAT[4+i] + z * MAT[8+i] + MAT[12+i],
 *     i = 0..3
 *
 * The destination vector gets VEC_SIZE_4 OR'ed into its flags, its count
 * set to the source count and its size set to 4.  Returns without
 * writing anything when the source count is zero.  The source pointer
 * advances by the source stride, the destination by 16 bytes per point.
 * ESI and EDI are saved and restored.
 *
 * ARG_SOURCE / ARG_DEST / ARG_MATRIX and the V4F_* offsets are defined
 * outside this file (presumably xform_args.h and matypes.h - confirm).
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points3_general ) |
GLNAME( _mesa_x86_transform_points3_general ): |
/* 8 = the two 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 8 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p3_gr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p3_gr_loop): |
/* Trailing comments track the x87 stack, top of stack first. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
FLD_S( SRC0 ) /* F6 F5 F4 */ |
FMUL_S( MAT2 ) |
FLD_S( SRC0 ) /* F7 F6 F5 F4 */ |
FMUL_S( MAT3 ) |
FLD_S( SRC1 ) /* F0 F7 F6 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC1 ) /* F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT6 ) |
FLD_S( SRC1 ) /* F3 F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT7 ) |
/* Fold the y products F0..F3 into the x products F4..F7. */
FXCH( ST(3) ) /* F0 F2 F1 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(7) ) /* F2 F1 F3 F7 F6 F5 F4 */ |
FXCH( ST(1) ) /* F1 F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F7 F6 F5 F4 */ |
/* Same pattern for the z products (MAT8..MAT11). */
FLD_S( SRC2 ) /* F0 F7 F6 F5 F4 */ |
FMUL_S( MAT8 ) |
FLD_S( SRC2 ) /* F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT9 ) |
FLD_S( SRC2 ) /* F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT10 ) |
FLD_S( SRC2 ) /* F3 F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT11 ) |
FXCH( ST(3) ) /* F0 F2 F1 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(7) ) /* F2 F1 F3 F7 F6 F5 F4 */ |
FXCH( ST(1) ) /* F1 F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F7 F6 F5 F4 */ |
/* Add the constant terms MAT12..MAT15. */
FXCH( ST(3) ) /* F4 F6 F5 F7 */ |
FADD_S( MAT12 ) |
FXCH( ST(2) ) /* F5 F6 F4 F7 */ |
FADD_S( MAT13 ) |
FXCH( ST(1) ) /* F6 F5 F4 F7 */ |
FADD_S( MAT14 ) |
FXCH( ST(3) ) /* F7 F5 F4 F6 */ |
FADD_S( MAT15 ) |
FXCH( ST(2) ) /* F4 F5 F7 F6 */ |
FSTP_S( DST0 ) /* F5 F7 F6 */ |
FSTP_S( DST1 ) /* F7 F6 */ |
FXCH( ST(1) ) /* F6 F7 */ |
FSTP_S( DST2 ) /* F7 */ |
FSTP_S( DST3 ) /* */ |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p3_gr_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p3_gr_loop) ) |
LLBL(x86_p3_gr_done): |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/* _mesa_x86_transform_points3_perspective
 *
 * For each source point (x = SRC0, y = SRC1, z = SRC2) writes:
 *     DST0 = x * MAT0  + z * MAT8
 *     DST1 = y * MAT5  + z * MAT9
 *     DST2 = z * MAT10 + MAT14
 *     DST3 = -z   (the 32-bit word of z with its top bit flipped)
 *
 * The destination vector gets VEC_SIZE_4 OR'ed into its flags, its count
 * set to the source count and its size set to 4.  Returns without
 * writing anything when the source count is zero.  ESI, EDI and EBX are
 * saved and restored.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points3_perspective ) |
GLNAME( _mesa_x86_transform_points3_perspective ): |
/* 12 = the three 4-byte pushes below; presumably consumed by the ARG_*
 * macros - confirm in xform_args.h. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p3_pr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX becomes the end address of the output: dest start + count * 16. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p3_pr_loop): |
/* Trailing comments track the x87 stack, top of stack first. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC2 ) /* F0 F5 F4 */ |
FMUL_S( MAT8 ) |
FLD_S( SRC2 ) /* F1 F0 F5 F4 */ |
FMUL_S( MAT9 ) |
FLD_S( SRC2 ) /* F2 F1 F0 F5 F4 */ |
FMUL_S( MAT10 ) |
/* Fold z*MAT8 into F4 and z*MAT9 into F5; F2 (z*MAT10) stays on top. */
FXCH( ST(2) ) /* F0 F1 F2 F5 F4 */ |
FADDP( ST0, ST(4) ) /* F1 F2 F5 F4 */ |
FADDP( ST0, ST(2) ) /* F2 F5 F4 */ |
FLD_S( MAT14 ) /* F6 F2 F5 F4 */ |
FXCH( ST(1) ) /* F2 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* Negate z in an integer register: -2147483648 is 0x80000000, the
 * top bit of the 32-bit word. */
MOV_L( SRC2, EBX ) |
XOR_L( CONST(-2147483648), EBX )/* change sign */ |
FXCH( ST(2) ) /* F4 F5 F6 */ |
FSTP_S( DST0 ) /* F5 F6 */ |
FSTP_S( DST1 ) /* F6 */ |
FSTP_S( DST2 ) /* */ |
MOV_L( EBX, DST3 ) |
/* The _skip label is not a jump target in this routine. */
LLBL(x86_p3_pr_skip): |
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p3_pr_loop) ) |
LLBL(x86_p3_pr_done): |
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points3_3d
 *
 * Transforms a run of 3-component points and writes 3-component results.
 * Per point, with x/y/z = SRC0/SRC1/SRC2 and m[n] = MATn:
 *     dst0 = x*m[0] + y*m[4] + z*m[8]  + m[12]
 *     dst1 = x*m[1] + y*m[5] + z*m[9]  + m[13]
 *     dst2 = x*m[2] + y*m[6] + z*m[10] + m[14]
 * DST3 is not written by this routine.
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_3 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 3 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_*, VEC_SIZE_3 and the SRCn/DSTn/MATn operand
 * macros are defined outside this excerpt; the register setup suggests they
 * address ESI, EDI and EDX respectively - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points3_3d ) |
GLNAME( _mesa_x86_transform_points3_3d ): |
/* Two 32-bit registers are pushed below: 2 * 4 = 8 bytes. */
#define FRAME_OFFSET 8 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p3_3dr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_3), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(3), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p3_3dr_loop): |
/* x products start the three accumulators F4, F5, F6. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
FLD_S( SRC0 ) /* F6 F5 F4 */ |
FMUL_S( MAT2 ) |
/* y products, added into F4/F5/F6. */
FLD_S( SRC1 ) /* F0 F6 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F6 F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC1 ) /* F2 F1 F0 F6 F5 F4 */ |
FMUL_S( MAT6 ) |
FXCH( ST(2) ) /* F0 F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F2 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* z products, added into F4/F5/F6. */
FLD_S( SRC2 ) /* F0 F6 F5 F4 */ |
FMUL_S( MAT8 ) |
FLD_S( SRC2 ) /* F1 F0 F6 F5 F4 */ |
FMUL_S( MAT9 ) |
FLD_S( SRC2 ) /* F2 F1 F0 F6 F5 F4 */ |
FMUL_S( MAT10 ) |
FXCH( ST(2) ) /* F0 F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F2 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* Add the constant terms m[12], m[13], m[14], rotating each accumulator
 * to the top of the stack in turn. */
FXCH( ST(2) ) /* F4 F5 F6 */ |
FADD_S( MAT12 ) |
FXCH( ST(1) ) /* F5 F4 F6 */ |
FADD_S( MAT13 ) |
FXCH( ST(2) ) /* F6 F4 F5 */ |
FADD_S( MAT14 ) |
FXCH( ST(1) ) /* F4 F6 F5 */ |
FSTP_S( DST0 ) /* F6 F5 */ |
FXCH( ST(1) ) /* F5 F6 */ |
FSTP_S( DST1 ) /* F6 */ |
FSTP_S( DST2 ) /* */ |
LLBL(x86_p3_3dr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p3_3dr_loop) ) |
LLBL(x86_p3_3dr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points3_3d_no_rot
 *
 * Transforms a run of 3-component points using only the matrix entries
 * 0, 5, 10 and 12..14, and writes 3-component results.
 * Per point, with x/y/z = SRC0/SRC1/SRC2 and m[n] = MATn:
 *     dst0 = x*m[0]  + m[12]
 *     dst1 = y*m[5]  + m[13]
 *     dst2 = z*m[10] + m[14]
 * DST3 is not written by this routine.
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_3 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 3 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_*, VEC_SIZE_3 and the SRCn/DSTn/MATn operand
 * macros are defined outside this excerpt; the register setup suggests they
 * address ESI, EDI and EDX respectively - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points3_3d_no_rot ) |
GLNAME( _mesa_x86_transform_points3_3d_no_rot ): |
/* Two 32-bit registers are pushed below: 2 * 4 = 8 bytes. */
#define FRAME_OFFSET 8 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p3_3dnrr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_3), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(3), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p3_3dnrr_loop): |
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F1 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC2 ) /* F2 F1 F4 */ |
FMUL_S( MAT10 ) |
/* F4 = x*m[0] + m[12]. */
FXCH( ST(2) ) /* F4 F1 F2 */ |
FADD_S( MAT12 ) |
/* F5 = m[13] + y*m[5]: the constant is loaded first, then F1 is added in. */
FLD_S( MAT13 ) /* F5 F4 F1 F2 */ |
FXCH( ST(2) ) /* F1 F4 F5 F2 */ |
FADDP( ST0, ST(2) ) /* F4 F5 F2 */ |
/* F6 = m[14] + z*m[10], same pattern. */
FLD_S( MAT14 ) /* F6 F4 F5 F2 */ |
FXCH( ST(3) ) /* F2 F4 F5 F6 */ |
FADDP( ST0, ST(3) ) /* F4 F5 F6 */ |
FSTP_S( DST0 ) /* F5 F6 */ |
FSTP_S( DST1 ) /* F6 */ |
FSTP_S( DST2 ) /* */ |
LLBL(x86_p3_3dnrr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p3_3dnrr_loop) ) |
LLBL(x86_p3_3dnrr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points3_2d
 *
 * Transforms the first two components of a run of 3-component points and
 * passes the third through unchanged.
 * Per point, with x/y/z = SRC0/SRC1/SRC2 and m[n] = MATn:
 *     dst0 = x*m[0] + y*m[4] + m[12]
 *     dst1 = x*m[1] + y*m[5] + m[13]
 *     dst2 = z               (raw 32-bit copy through EBX)
 * DST3 is not written by this routine.
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_3 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 3 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_*, VEC_SIZE_3 and the SRCn/DSTn/MATn operand
 * macros are defined outside this excerpt; the register setup suggests they
 * address ESI, EDI and EDX respectively - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points3_2d ) |
GLNAME( _mesa_x86_transform_points3_2d ): |
/* Three 32-bit registers are pushed below: 3 * 4 = 12 bytes. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p3_2dr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_3), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(3), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p3_2dr_loop): |
/* x products start the two accumulators F4 and F5. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
/* y products, added into F4/F5. */
FLD_S( SRC1 ) /* F0 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F5 F4 */ |
FMUL_S( MAT5 ) |
FXCH( ST(1) ) /* F0 F1 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F1 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F5 F4 */ |
/* Add the constant terms m[12] and m[13]. */
FXCH( ST(1) ) /* F4 F5 */ |
FADD_S( MAT12 ) |
FXCH( ST(1) ) /* F5 F4 */ |
FADD_S( MAT13 ) |
/* The third component is carried through the integer unit untouched. */
MOV_L( SRC2, EBX ) |
FXCH( ST(1) ) /* F4 F5 */ |
FSTP_S( DST0 ) /* F5 */ |
FSTP_S( DST1 ) /* */ |
MOV_L( EBX, DST2 ) |
LLBL(x86_p3_2dr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p3_2dr_loop) ) |
LLBL(x86_p3_2dr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points3_2d_no_rot
 *
 * Transforms the first two components of a run of 3-component points using
 * only matrix entries 0, 5, 12 and 13, and passes the third through.
 * Per point, with x/y/z = SRC0/SRC1/SRC2 and m[n] = MATn:
 *     dst0 = x*m[0] + m[12]
 *     dst1 = y*m[5] + m[13]
 *     dst2 = z               (raw 32-bit copy through EBX)
 * DST3 is not written by this routine.
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_3 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 3 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_*, VEC_SIZE_3 and the SRCn/DSTn/MATn operand
 * macros are defined outside this excerpt; the register setup suggests they
 * address ESI, EDI and EDX respectively - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points3_2d_no_rot ) |
GLNAME( _mesa_x86_transform_points3_2d_no_rot ): |
/* Three 32-bit registers are pushed below: 3 * 4 = 12 bytes. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p3_2dnrr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_3), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(3), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p3_2dnrr_loop): |
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F1 F4 */ |
FMUL_S( MAT5 ) |
/* F4 = x*m[0] + m[12]. */
FXCH( ST(1) ) /* F4 F1 */ |
FADD_S( MAT12 ) |
/* F5 = m[13] + y*m[5]: the constant is loaded first, then F1 is added in. */
FLD_S( MAT13 ) /* F5 F4 F1 */ |
FXCH( ST(2) ) /* F1 F4 F5 */ |
FADDP( ST0, ST(2) ) /* F4 F5 */ |
/* The third component is carried through the integer unit untouched. */
MOV_L( SRC2, EBX ) |
FSTP_S( DST0 ) /* F5 */ |
FSTP_S( DST1 ) /* */ |
MOV_L( EBX, DST2 ) |
LLBL(x86_p3_2dnrr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p3_2dnrr_loop) ) |
LLBL(x86_p3_2dnrr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points3_identity
 *
 * Copies the first three 32-bit components of each source point to the
 * destination without any arithmetic (dst0..dst2 = src0..src2 as raw
 * 32-bit moves).  DST3 is not written.
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_3 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 3 is stored in its
 * V4F_SIZE.  If the two V4F_START pointers are equal the copy loop is
 * skipped (the flags/count/size updates above have already happened).
 * The loop walks the source by its V4F_STRIDE value and the destination by
 * a fixed 16 bytes per point.
 *
 * The matrix pointer in EDX is never dereferenced; EDX is reused as a
 * scratch register inside the loop.
 *
 * NOTE(review): ARG_*, V4F_*, VEC_SIZE_3 and the SRCn/DSTn operand macros
 * are defined outside this excerpt; the register setup suggests SRCn/DSTn
 * address ESI and EDI respectively - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points3_identity ) |
GLNAME(_mesa_x86_transform_points3_identity ): |
/* Four 32-bit registers are pushed below: 4 * 4 = 16 bytes. */
#define FRAME_OFFSET 16 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
PUSH_L( EBP ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p3_ir_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_3), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(3), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
/* Source and destination data start at the same address: no copy needed. */
CMP_L( ESI, EDI ) |
JE( LLBL(x86_p3_ir_done) ) |
ALIGNTEXT16 |
LLBL(x86_p3_ir_loop): |
/* The integer-register copy is the active path; the x87 variant in the
 * #else branch is compiled out. */
#if 1 |
MOV_L( SRC0, EBX ) |
MOV_L( SRC1, EBP ) |
MOV_L( SRC2, EDX ) |
MOV_L( EBX, DST0 ) |
MOV_L( EBP, DST1 ) |
MOV_L( EDX, DST2 ) |
#else |
FLD_S( SRC0 ) |
FLD_S( SRC1 ) |
FLD_S( SRC2 ) |
FSTP_S( DST2 ) |
FSTP_S( DST1 ) |
FSTP_S( DST0 ) |
#endif |
LLBL(x86_p3_ir_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p3_ir_loop) ) |
LLBL(x86_p3_ir_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBP ) |
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
/shark/trunk/ports/mesa/src/x86/xform4_x86.s |
---|
0,0 → 1,666 |
/* $Id: xform4_x86.s,v 1.1 2003-04-24 13:36:03 giacomo Exp $ */ |
/* |
* Mesa 3-D graphics library |
* Version: 3.5 |
* |
* Copyright (C) 1999-2001 Brian Paul All Rights Reserved. |
* |
* Permission is hereby granted, free of charge, to any person obtaining a |
* copy of this software and associated documentation files (the "Software"), |
* to deal in the Software without restriction, including without limitation |
* the rights to use, copy, modify, merge, publish, distribute, sublicense, |
* and/or sell copies of the Software, and to permit persons to whom the |
* Software is furnished to do so, subject to the following conditions: |
* |
* The above copyright notice and this permission notice shall be included |
* in all copies or substantial portions of the Software. |
* |
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS |
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
* BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN |
* AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN |
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
*/ |
/* |
* NOTE: Avoid using spaces in between '(' ')' and arguments, especially |
* with macros like CONST, LLBL that expand to CONCAT(...). Putting spaces |
* in there will break the build on some platforms. |
*/ |
#include "matypes.h" |
#include "xform_args.h" |
SEG_TEXT |
/* Integer bit patterns of single-precision constants:
 * 1065353216 == 0x3F800000, the IEEE-754 single-precision encoding of 1.0;
 * an all-zero word encodes 0.0. */
#define FP_ONE 1065353216 |
#define FP_ZERO 0 |
/* SRCn: n-th 32-bit component of the current source point (base ESI). */
#define SRC0 REGOFF(0, ESI) |
#define SRC1 REGOFF(4, ESI) |
#define SRC2 REGOFF(8, ESI) |
#define SRC3 REGOFF(12, ESI) |
/* DSTn: n-th 32-bit component of the current destination point (base EDI). */
#define DST0 REGOFF(0, EDI) |
#define DST1 REGOFF(4, EDI) |
#define DST2 REGOFF(8, EDI) |
#define DST3 REGOFF(12, EDI) |
/* MATn: n-th 32-bit entry of the 16-entry matrix (base EDX, byte offset 4*n). */
#define MAT0 REGOFF(0, EDX) |
#define MAT1 REGOFF(4, EDX) |
#define MAT2 REGOFF(8, EDX) |
#define MAT3 REGOFF(12, EDX) |
#define MAT4 REGOFF(16, EDX) |
#define MAT5 REGOFF(20, EDX) |
#define MAT6 REGOFF(24, EDX) |
#define MAT7 REGOFF(28, EDX) |
#define MAT8 REGOFF(32, EDX) |
#define MAT9 REGOFF(36, EDX) |
#define MAT10 REGOFF(40, EDX) |
#define MAT11 REGOFF(44, EDX) |
#define MAT12 REGOFF(48, EDX) |
#define MAT13 REGOFF(52, EDX) |
#define MAT14 REGOFF(56, EDX) |
#define MAT15 REGOFF(60, EDX) |
/*
 * _mesa_x86_transform_points4_general
 *
 * Transforms a run of 4-component points by the full 16-entry matrix.
 * Per point, with x/y/z/w = SRC0..SRC3 and m[n] = MATn, for i = 0..3:
 *     dst[i] = x*m[i] + y*m[4+i] + z*m[8+i] + w*m[12+i]
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_4 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 4 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.  F4..F7 are the four running sums; F0..F3 are the
 * products of the component currently being folded in.
 *
 * NOTE(review): ARG_*, V4F_* and VEC_SIZE_4 come from the included headers,
 * not shown here; ARG_* presumably use FRAME_OFFSET to reach the stack
 * arguments - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points4_general ) |
GLNAME( _mesa_x86_transform_points4_general ): |
/* Two 32-bit registers are pushed below: 2 * 4 = 8 bytes. */
#define FRAME_OFFSET 8 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p4_gr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p4_gr_loop): |
/* x products start the four accumulators F4..F7. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
FLD_S( SRC0 ) /* F6 F5 F4 */ |
FMUL_S( MAT2 ) |
FLD_S( SRC0 ) /* F7 F6 F5 F4 */ |
FMUL_S( MAT3 ) |
/* y products; this fills all eight x87 registers before they are folded in. */
FLD_S( SRC1 ) /* F0 F7 F6 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC1 ) /* F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT6 ) |
FLD_S( SRC1 ) /* F3 F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT7 ) |
FXCH( ST(3) ) /* F0 F2 F1 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(7) ) /* F2 F1 F3 F7 F6 F5 F4 */ |
FXCH( ST(1) ) /* F1 F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F7 F6 F5 F4 */ |
/* z products, folded in the same way. */
FLD_S( SRC2 ) /* F0 F7 F6 F5 F4 */ |
FMUL_S( MAT8 ) |
FLD_S( SRC2 ) /* F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT9 ) |
FLD_S( SRC2 ) /* F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT10 ) |
FLD_S( SRC2 ) /* F3 F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT11 ) |
FXCH( ST(3) ) /* F0 F2 F1 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(7) ) /* F2 F1 F3 F7 F6 F5 F4 */ |
FXCH( ST(1) ) /* F1 F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F7 F6 F5 F4 */ |
/* w products, folded in the same way. */
FLD_S( SRC3 ) /* F0 F7 F6 F5 F4 */ |
FMUL_S( MAT12 ) |
FLD_S( SRC3 ) /* F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT13 ) |
FLD_S( SRC3 ) /* F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT14 ) |
FLD_S( SRC3 ) /* F3 F2 F1 F0 F7 F6 F5 F4 */ |
FMUL_S( MAT15 ) |
FXCH( ST(3) ) /* F0 F2 F1 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(7) ) /* F2 F1 F3 F7 F6 F5 F4 */ |
FXCH( ST(1) ) /* F1 F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F2 F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F3 F7 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F7 F6 F5 F4 */ |
/* Store F4..F7 to dst0..dst3, exchanging so each pops in order. */
FXCH( ST(3) ) /* F4 F6 F5 F7 */ |
FSTP_S( DST0 ) /* F6 F5 F7 */ |
FXCH( ST(1) ) /* F5 F6 F7 */ |
FSTP_S( DST1 ) /* F6 F7 */ |
FSTP_S( DST2 ) /* F7 */ |
FSTP_S( DST3 ) /* */ |
LLBL(x86_p4_gr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p4_gr_loop) ) |
LLBL(x86_p4_gr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points4_perspective
 *
 * Transforms a run of 4-component points with a perspective-shaped matrix;
 * only entries 0, 5, 8, 9, 10 and 14 are read.
 * Per point, with x/y/z/w = SRC0..SRC3 and m[n] = MATn:
 *     dst0 = x*m[0]  + z*m[8]
 *     dst1 = y*m[5]  + z*m[9]
 *     dst2 = z*m[10] + w*m[14]
 *     dst3 = -z            (sign bit of the raw 32-bit value is flipped)
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_4 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 4 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_* and VEC_SIZE_4 come from the included headers,
 * not shown here; ARG_* presumably use FRAME_OFFSET to reach the stack
 * arguments - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points4_perspective ) |
GLNAME( _mesa_x86_transform_points4_perspective ): |
/* Three 32-bit registers are pushed below: 3 * 4 = 12 bytes. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p4_pr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p4_pr_loop): |
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC2 ) /* F0 F5 F4 */ |
FMUL_S( MAT8 ) |
FLD_S( SRC2 ) /* F1 F0 F5 F4 */ |
FMUL_S( MAT9 ) |
FLD_S( SRC2 ) /* F6 F1 F0 F5 F4 */ |
FMUL_S( MAT10 ) |
/* Fold the z products into the x and y accumulators (F4 += F0, F5 += F1). */
FXCH( ST(2) ) /* F0 F1 F6 F5 F4 */ |
FADDP( ST0, ST(4) ) /* F1 F6 F5 F4 */ |
FADDP( ST0, ST(2) ) /* F6 F5 F4 */ |
/* Third output: F6 = z*m[10] + w*m[14]. */
FLD_S( SRC3 ) /* F2 F6 F5 F4 */ |
FMUL_S( MAT14 ) |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* Fourth output is -z, produced with integer ops: -2147483648 is
 * 0x80000000, i.e. only the top (sign) bit of the 32-bit value. */
MOV_L( SRC2, EBX ) |
XOR_L( CONST(-2147483648), EBX )/* change sign */ |
FXCH( ST(2) ) /* F4 F5 F6 */ |
FSTP_S( DST0 ) /* F5 F6 */ |
FSTP_S( DST1 ) /* F6 */ |
FSTP_S( DST2 ) /* */ |
MOV_L( EBX, DST3 ) |
LLBL(x86_p4_pr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p4_pr_loop) ) |
LLBL(x86_p4_pr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points4_3d
 *
 * Transforms the first three components of a run of 4-component points and
 * passes the fourth through unchanged; matrix entries 3, 7, 11 and 15 are
 * not read.
 * Per point, with x/y/z/w = SRC0..SRC3 and m[n] = MATn:
 *     dst0 = x*m[0] + y*m[4] + z*m[8]  + w*m[12]
 *     dst1 = x*m[1] + y*m[5] + z*m[9]  + w*m[13]
 *     dst2 = x*m[2] + y*m[6] + z*m[10] + w*m[14]
 *     dst3 = w               (raw 32-bit copy through EBX)
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_4 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 4 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_* and VEC_SIZE_4 come from the included headers,
 * not shown here; ARG_* presumably use FRAME_OFFSET to reach the stack
 * arguments - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points4_3d ) |
GLNAME( _mesa_x86_transform_points4_3d ): |
/* Three 32-bit registers are pushed below: 3 * 4 = 12 bytes. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p4_3dr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p4_3dr_loop): |
/* x products start the three accumulators F4, F5, F6. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
FLD_S( SRC0 ) /* F6 F5 F4 */ |
FMUL_S( MAT2 ) |
/* y products, added into F4/F5/F6. */
FLD_S( SRC1 ) /* F0 F6 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F6 F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC1 ) /* F2 F1 F0 F6 F5 F4 */ |
FMUL_S( MAT6 ) |
FXCH( ST(2) ) /* F0 F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F2 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* z products, added into F4/F5/F6. */
FLD_S( SRC2 ) /* F0 F6 F5 F4 */ |
FMUL_S( MAT8 ) |
FLD_S( SRC2 ) /* F1 F0 F6 F5 F4 */ |
FMUL_S( MAT9 ) |
FLD_S( SRC2 ) /* F2 F1 F0 F6 F5 F4 */ |
FMUL_S( MAT10 ) |
FXCH( ST(2) ) /* F0 F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F2 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* w products, added into F4/F5/F6. */
FLD_S( SRC3 ) /* F0 F6 F5 F4 */ |
FMUL_S( MAT12 ) |
FLD_S( SRC3 ) /* F1 F0 F6 F5 F4 */ |
FMUL_S( MAT13 ) |
FLD_S( SRC3 ) /* F2 F1 F0 F6 F5 F4 */ |
FMUL_S( MAT14 ) |
FXCH( ST(2) ) /* F0 F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F2 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* The fourth component is carried through the integer unit untouched. */
MOV_L( SRC3, EBX ) |
FXCH( ST(2) ) /* F4 F5 F6 */ |
FSTP_S( DST0 ) /* F5 F6 */ |
FSTP_S( DST1 ) /* F6 */ |
FSTP_S( DST2 ) /* */ |
MOV_L( EBX, DST3 ) |
LLBL(x86_p4_3dr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p4_3dr_loop) ) |
LLBL(x86_p4_3dr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points4_3d_no_rot
 *
 * Transforms the first three components of a run of 4-component points
 * using only matrix entries 0, 5, 10 and 12..14, and passes the fourth
 * through unchanged.
 * Per point, with x/y/z/w = SRC0..SRC3 and m[n] = MATn:
 *     dst0 = x*m[0]  + w*m[12]
 *     dst1 = y*m[5]  + w*m[13]
 *     dst2 = z*m[10] + w*m[14]
 *     dst3 = w               (raw 32-bit copy through EBX)
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_4 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 4 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_* and VEC_SIZE_4 come from the included headers,
 * not shown here; ARG_* presumably use FRAME_OFFSET to reach the stack
 * arguments - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME(_mesa_x86_transform_points4_3d_no_rot) |
GLNAME(_mesa_x86_transform_points4_3d_no_rot): |
/* Three 32-bit registers are pushed below: 3 * 4 = 12 bytes. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p4_3dnrr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p4_3dnrr_loop): |
/* One product per axis starts the accumulators F4, F5, F6. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F5 F4 */ |
FMUL_S( MAT5 ) |
FLD_S( SRC2 ) /* F6 F5 F4 */ |
FMUL_S( MAT10 ) |
/* w products, added into F4/F5/F6. */
FLD_S( SRC3 ) /* F0 F6 F5 F4 */ |
FMUL_S( MAT12 ) |
FLD_S( SRC3 ) /* F1 F0 F6 F5 F4 */ |
FMUL_S( MAT13 ) |
FLD_S( SRC3 ) /* F2 F1 F0 F6 F5 F4 */ |
FMUL_S( MAT14 ) |
FXCH( ST(2) ) /* F0 F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(5) ) /* F1 F2 F6 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F2 F6 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F6 F5 F4 */ |
/* The fourth component is carried through the integer unit untouched. */
MOV_L( SRC3, EBX ) |
FXCH( ST(2) ) /* F4 F5 F6 */ |
FSTP_S( DST0 ) /* F5 F6 */ |
FSTP_S( DST1 ) /* F6 */ |
FSTP_S( DST2 ) /* */ |
MOV_L( EBX, DST3 ) |
LLBL(x86_p4_3dnrr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p4_3dnrr_loop) ) |
LLBL(x86_p4_3dnrr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points4_2d
 *
 * Transforms the first two components of a run of 4-component points and
 * passes the third and fourth through unchanged.
 * Per point, with x/y/z/w = SRC0..SRC3 and m[n] = MATn:
 *     dst0 = x*m[0] + y*m[4] + w*m[12]
 *     dst1 = x*m[1] + y*m[5] + w*m[13]
 *     dst2 = z               (raw 32-bit copy through EBX)
 *     dst3 = w               (raw 32-bit copy through EBP)
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_4 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 4 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_* and VEC_SIZE_4 come from the included headers,
 * not shown here; ARG_* presumably use FRAME_OFFSET to reach the stack
 * arguments - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points4_2d ) |
GLNAME( _mesa_x86_transform_points4_2d ): |
/* Four 32-bit registers are pushed below: 4 * 4 = 16 bytes. */
#define FRAME_OFFSET 16 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
PUSH_L( EBP ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p4_2dr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p4_2dr_loop): |
/* x products start the two accumulators F4 and F5. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC0 ) /* F5 F4 */ |
FMUL_S( MAT1 ) |
/* y products, added into F4/F5. */
FLD_S( SRC1 ) /* F0 F5 F4 */ |
FMUL_S( MAT4 ) |
FLD_S( SRC1 ) /* F1 F0 F5 F4 */ |
FMUL_S( MAT5 ) |
FXCH( ST(1) ) /* F0 F1 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F1 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F5 F4 */ |
/* w products, added into F4/F5. */
FLD_S( SRC3 ) /* F0 F5 F4 */ |
FMUL_S( MAT12 ) |
FLD_S( SRC3 ) /* F1 F0 F5 F4 */ |
FMUL_S( MAT13 ) |
FXCH( ST(1) ) /* F0 F1 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F1 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F5 F4 */ |
/* Third and fourth components are carried through the integer unit. */
MOV_L( SRC2, EBX ) |
MOV_L( SRC3, EBP ) |
FXCH( ST(1) ) /* F4 F5 */ |
FSTP_S( DST0 ) /* F5 */ |
FSTP_S( DST1 ) /* */ |
MOV_L( EBX, DST2 ) |
MOV_L( EBP, DST3 ) |
LLBL(x86_p4_2dr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p4_2dr_loop) ) |
LLBL(x86_p4_2dr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBP ) |
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points4_2d_no_rot
 *
 * Transforms the first two components of a run of 4-component points using
 * only matrix entries 0, 5, 12 and 13, and passes the third and fourth
 * through unchanged.
 * Per point, with x/y/z/w = SRC0..SRC3 and m[n] = MATn:
 *     dst0 = x*m[0] + w*m[12]
 *     dst1 = y*m[5] + w*m[13]
 *     dst2 = z               (raw 32-bit copy through EBX)
 *     dst3 = w               (raw 32-bit copy through EBP)
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_4 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 4 is stored in its
 * V4F_SIZE.  The loop walks the source by its V4F_STRIDE value and the
 * destination by a fixed 16 bytes per point.
 *
 * The trailing comments on the FPU lines list the x87 register stack, top
 * of stack first.
 *
 * NOTE(review): ARG_*, V4F_* and VEC_SIZE_4 come from the included headers,
 * not shown here; ARG_* presumably use FRAME_OFFSET to reach the stack
 * arguments - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points4_2d_no_rot ) |
GLNAME( _mesa_x86_transform_points4_2d_no_rot ): |
/* Four 32-bit registers are pushed below: 4 * 4 = 16 bytes. */
#define FRAME_OFFSET 16 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
PUSH_L( EBP ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p4_2dnrr_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
ALIGNTEXT16 |
LLBL(x86_p4_2dnrr_loop): |
/* One product per axis starts the accumulators F4 and F5. */
FLD_S( SRC0 ) /* F4 */ |
FMUL_S( MAT0 ) |
FLD_S( SRC1 ) /* F5 F4 */ |
FMUL_S( MAT5 ) |
/* w products, added into F4/F5. */
FLD_S( SRC3 ) /* F0 F5 F4 */ |
FMUL_S( MAT12 ) |
FLD_S( SRC3 ) /* F1 F0 F5 F4 */ |
FMUL_S( MAT13 ) |
FXCH( ST(1) ) /* F0 F1 F5 F4 */ |
FADDP( ST0, ST(3) ) /* F1 F5 F4 */ |
FADDP( ST0, ST(1) ) /* F5 F4 */ |
/* Third and fourth components are carried through the integer unit. */
MOV_L( SRC2, EBX ) |
MOV_L( SRC3, EBP ) |
FXCH( ST(1) ) /* F4 F5 */ |
FSTP_S( DST0 ) /* F5 */ |
FSTP_S( DST1 ) /* */ |
MOV_L( EBX, DST2 ) |
MOV_L( EBP, DST3 ) |
LLBL(x86_p4_2dnrr_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p4_2dnrr_loop) ) |
LLBL(x86_p4_2dnrr_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBP ) |
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
#undef FRAME_OFFSET |
/*
 * _mesa_x86_transform_points4_identity
 *
 * Copies all four 32-bit components of each source point to the
 * destination without any arithmetic (dst0..dst3 = src0..src3 as raw
 * 32-bit moves).
 *
 * Flow: ESI/EDI/EDX are loaded from ARG_SOURCE/ARG_DEST/ARG_MATRIX.  A zero
 * V4F_COUNT in the source returns immediately without touching the
 * destination.  Otherwise VEC_SIZE_4 is OR-ed into the destination's
 * V4F_FLAGS, the count is copied to its V4F_COUNT and 4 is stored in its
 * V4F_SIZE.  If the two V4F_START pointers are equal the copy loop is
 * skipped (the flags/count/size updates above have already happened).
 * The loop walks the source by its V4F_STRIDE value and the destination by
 * a fixed 16 bytes per point.
 *
 * The matrix pointer in EDX is never dereferenced; EDX is reused as a
 * scratch register inside the loop.
 *
 * NOTE(review): ARG_*, V4F_* and VEC_SIZE_4 come from the included headers,
 * not shown here; ARG_* presumably use FRAME_OFFSET to reach the stack
 * arguments - confirm.
 */
ALIGNTEXT16 |
GLOBL GLNAME( _mesa_x86_transform_points4_identity ) |
GLNAME( _mesa_x86_transform_points4_identity ): |
/* Three 32-bit registers are pushed below: 3 * 4 = 12 bytes. */
#define FRAME_OFFSET 12 |
PUSH_L( ESI ) |
PUSH_L( EDI ) |
PUSH_L( EBX ) |
MOV_L( ARG_SOURCE, ESI ) |
MOV_L( ARG_DEST, EDI ) |
MOV_L( ARG_MATRIX, EDX ) |
MOV_L( REGOFF(V4F_COUNT, ESI), ECX ) |
/* Nothing to do for an empty source. */
TEST_L( ECX, ECX ) |
JZ( LLBL(x86_p4_ir_done) ) |
MOV_L( REGOFF(V4F_STRIDE, ESI), EAX ) |
OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) ) |
MOV_L( ECX, REGOFF(V4F_COUNT, EDI) ) |
MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) ) |
/* ECX = count * 16, then + destination start = end-of-output pointer. */
SHL_L( CONST(4), ECX ) |
MOV_L( REGOFF(V4F_START, ESI), ESI ) |
MOV_L( REGOFF(V4F_START, EDI), EDI ) |
ADD_L( EDI, ECX ) |
/* Source and destination data start at the same address: no copy needed. */
CMP_L( ESI, EDI ) |
JE( LLBL(x86_p4_ir_done) ) |
ALIGNTEXT16 |
LLBL(x86_p4_ir_loop): |
/* Copy two components at a time through EBX and EDX. */
MOV_L( SRC0, EBX ) |
MOV_L( SRC1, EDX ) |
MOV_L( EBX, DST0 ) |
MOV_L( EDX, DST1 ) |
MOV_L( SRC2, EBX ) |
MOV_L( SRC3, EDX ) |
MOV_L( EBX, DST2 ) |
MOV_L( EDX, DST3 ) |
LLBL(x86_p4_ir_skip): |
/* Advance: destination by 16 bytes, source by its stride; stop at the end pointer. */
ADD_L( CONST(16), EDI ) |
ADD_L( EAX, ESI ) |
CMP_L( ECX, EDI ) |
JNE( LLBL(x86_p4_ir_loop) ) |
LLBL(x86_p4_ir_done): |
/* Restore the saved registers in reverse push order. */
POP_L( EBX ) |
POP_L( EDI ) |
POP_L( ESI ) |
RET |
/shark/trunk/ports/mesa/src/x86/x86.c |
---|
1,4 → 1,4 |
/* $Id: x86.c,v 1.1 2003-03-13 12:11:49 giacomo Exp $ */ |
/* $Id: x86.c,v 1.2 2003-04-24 13:36:03 giacomo Exp $ */ |
/* |
* Mesa 3-D graphics library |
34,7 → 34,7 |
#include "tnl/t_context.h" |
#include "x86.h" |
#include "common_x86_macros.h" |
#include "macros_common_x86.h" |
#ifdef DEBUG |
#include "math/m_debug.h" |