Subversion Repositories shark

Rev

Rev 70 | Details | Compare with Previous | Last modification | View Log | RSS feed

Rev Author Line No. Line
70 giacomo 1
/* $Id: x86_cliptest.s,v 1.1 2003-03-13 12:11:49 giacomo Exp $ */
2
 
3
/*
4
 * Mesa 3-D graphics library
5
 * Version:  3.5
6
 *
7
 * Copyright (C) 1999-2001  Brian Paul   All Rights Reserved.
8
 *
9
 * Permission is hereby granted, free of charge, to any person obtaining a
10
 * copy of this software and associated documentation files (the "Software"),
11
 * to deal in the Software without restriction, including without limitation
12
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
13
 * and/or sell copies of the Software, and to permit persons to whom the
14
 * Software is furnished to do so, subject to the following conditions:
15
 *
16
 * The above copyright notice and this permission notice shall be included
17
 * in all copies or substantial portions of the Software.
18
 *
19
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
22
 * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
23
 * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
24
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
 */
26
 
27
/*
28
 * NOTE: Avoid using spaces in between '(' ')' and arguments, especially
29
 * with macros like CONST, LLBL that expand to CONCAT(...).  Putting spaces
30
 * in there will break the build on some platforms.
31
 */
32
 
33
#include "matypes.h"
34
#include "clip_args.h"
35
 
36
/*
 * Operand shorthands for one element of four 32-bit words.  SRCn, DSTn and
 * MATn name the n-th word (byte offsets 0, 4, 8, 12) relative to ESI, EDI
 * and EDX respectively.
 *
 * REGOFF is not defined in this file; presumably it builds an
 * offset(register) memory operand -- confirm against its definition.
 * MAT0..MAT3 are not referenced by the code visible in this file.
 */
#define SRC0		REGOFF(0, ESI)
37
#define SRC1		REGOFF(4, ESI)
38
#define SRC2		REGOFF(8, ESI)
39
#define SRC3		REGOFF(12, ESI)
40
#define DST0		REGOFF(0, EDI)
41
#define DST1		REGOFF(4, EDI)
42
#define DST2		REGOFF(8, EDI)
43
#define DST3		REGOFF(12, EDI)
44
#define MAT0		REGOFF(0, EDX)
45
#define MAT1		REGOFF(4, EDX)
46
#define MAT2		REGOFF(8, EDX)
47
#define MAT3		REGOFF(12, EDX)
48
 
49
 
50
/*
 * Table for clip test.
 *
 * 128 one-byte entries (16 rows of 8).  The table is indexed by the 7-bit
 * value that the cliptest loops below accumulate in ECX from the raw 32-bit
 * patterns of one source element (S(n) = SRCn).  The index layout is:
 *
 * 	bit6 = SRC3 < 0
 * 	bit5 = SRC2 < 0
 * 	bit4 = abs(S(2)) > abs(S(3))
 * 	bit3 = SRC1 < 0
 * 	bit2 = abs(S(1)) > abs(S(3))
 * 	bit1 = SRC0 < 0
 * 	bit0 = abs(S(0)) > abs(S(3))
 *
 * The byte read from the table is the clip mask for that element: it is
 * stored into the clipmask array and merged into the running or/and masks.
 * In _mesa_x86_cliptest_points4 a zero entry selects the projection path.
 * Every entry whose index has bit6 set (indices 0x40..0x7f) is non-zero.
 */
61
 
62
	SEG_DATA
63
 
64
clip_table:
65
	D_BYTE 0x00, 0x01, 0x00, 0x02, 0x04, 0x05, 0x04, 0x06	/* index 0x00..0x07 */
66
	D_BYTE 0x00, 0x01, 0x00, 0x02, 0x08, 0x09, 0x08, 0x0a	/* index 0x08..0x0f */
67
	D_BYTE 0x20, 0x21, 0x20, 0x22, 0x24, 0x25, 0x24, 0x26	/* index 0x10..0x17 */
68
	D_BYTE 0x20, 0x21, 0x20, 0x22, 0x28, 0x29, 0x28, 0x2a	/* index 0x18..0x1f */
69
	D_BYTE 0x00, 0x01, 0x00, 0x02, 0x04, 0x05, 0x04, 0x06	/* index 0x20..0x27 */
70
	D_BYTE 0x00, 0x01, 0x00, 0x02, 0x08, 0x09, 0x08, 0x0a	/* index 0x28..0x2f */
71
	D_BYTE 0x10, 0x11, 0x10, 0x12, 0x14, 0x15, 0x14, 0x16	/* index 0x30..0x37 */
72
	D_BYTE 0x10, 0x11, 0x10, 0x12, 0x18, 0x19, 0x18, 0x1a	/* index 0x38..0x3f */
73
	D_BYTE 0x3f, 0x3d, 0x3f, 0x3e, 0x37, 0x35, 0x37, 0x36	/* index 0x40..0x47 */
74
	D_BYTE 0x3f, 0x3d, 0x3f, 0x3e, 0x3b, 0x39, 0x3b, 0x3a	/* index 0x48..0x4f */
75
	D_BYTE 0x2f, 0x2d, 0x2f, 0x2e, 0x27, 0x25, 0x27, 0x26	/* index 0x50..0x57 */
76
	D_BYTE 0x2f, 0x2d, 0x2f, 0x2e, 0x2b, 0x29, 0x2b, 0x2a	/* index 0x58..0x5f */
77
	D_BYTE 0x3f, 0x3d, 0x3f, 0x3e, 0x37, 0x35, 0x37, 0x36	/* index 0x60..0x67 */
78
	D_BYTE 0x3f, 0x3d, 0x3f, 0x3e, 0x3b, 0x39, 0x3b, 0x3a	/* index 0x68..0x6f */
79
	D_BYTE 0x1f, 0x1d, 0x1f, 0x1e, 0x17, 0x15, 0x17, 0x16	/* index 0x70..0x77 */
80
	D_BYTE 0x1f, 0x1d, 0x1f, 0x1e, 0x1b, 0x19, 0x1b, 0x1a	/* index 0x78..0x7f */
81
 
82
 
83
	SEG_TEXT
84
 
85
/*
 * _mesa_x86_cliptest_points4
 *
 * Clip-tests each 4-word element of the source vector, records one clip
 * mask byte per element, and writes a projected element to the destination
 * vector.
 *
 * Arguments are read through the ARG_* macros.  These are not defined in
 * this file; presumably they come from clip_args.h and are stack offsets
 * based on FRAME_OFFSET -- confirm there.
 *
 *   ARG_SOURCE  source vector descriptor; V4F_START, V4F_COUNT and
 *               V4F_STRIDE are read from it
 *   ARG_DEST    destination vector descriptor; VEC_SIZE_4 is OR'ed into
 *               V4F_FLAGS, V4F_SIZE is set to 4, V4F_COUNT is set to the
 *               source count, and V4F_START is read as the output pointer
 *   ARG_CLIP    byte array that receives one clip mask per element
 *   ARG_OR      pointer to a byte: read on entry, then every mask is OR'ed
 *               in and the result is stored back
 *   ARG_AND     pointer to a byte: read on entry, then every mask is AND'ed
 *               in and the result is stored back
 *
 * For each element (x, y, z, w) = (SRC0, SRC1, SRC2, SRC3):
 *   mask == 0:  dest = (x * (1/w), y * (1/w), z * (1/w), 1/w)
 *   mask != 0:  dest = (0, 0, 0, 1.0f)
 *
 * When the count is zero the loop is skipped and the bytes behind ARG_OR
 * and ARG_AND are not rewritten.
 *
 * Returns the ARG_DEST pointer in EAX.
 *
 * Register roles inside the loop:
 *
 *   AL:  ormask
 *   AH:  andmask
 *   EBX: temp0
 *   ECX: temp1
 *   EDX: clipmask[]
 *   ESI: clip[]
 *   EDI: proj[]
 *   EBP: temp2
 */
97
 
98
/*
 * ELFPIC selects the position-independent way of reaching clip_table:
 * the routines below then fetch its address through the GOT and keep it on
 * the stack.  It is enabled for ELF + PIC builds using the GNU assembler
 * syntax, unless ELFPIC was already defined.
 */
#if defined(__ELF__) && defined(__PIC__) && defined(GNU_ASSEMBLER) && !defined(ELFPIC)
99
#define ELFPIC
100
#endif
101
 
102
ALIGNTEXT16
103
GLOBL GLNAME( _mesa_x86_cliptest_points4 )
104
GLNAME( _mesa_x86_cliptest_points4 ):
105
 
106
/*
 * FRAME_OFFSET matches the number of bytes pushed below before the ARG_*
 * macros are used: four registers (16 bytes), plus the clip_table pointer
 * (4 more bytes) in the ELFPIC build.
 */
#ifdef ELFPIC
107
#define FRAME_OFFSET 20
108
#else
109
#define FRAME_OFFSET 16
110
#endif
111
	/* save the registers that are restored in the epilogue */
	PUSH_L( ESI )
112
	PUSH_L( EDI )
113
	PUSH_L( EBP )
114
	PUSH_L( EBX )
115
 
116
#ifdef ELFPIC
117
	/*
	 * Store pointer to clip_table on stack.  The CALL leaves its return
	 * address (the address of the ADD_L below) in EBX; adding
	 * _GLOBAL_OFFSET_TABLE_ turns that into the GOT address, from which
	 * the clip_table entry is loaded.
	 */
118
	CALL( LLBL(ctp4_get_eip) )
119
	ADD_L( CONST(_GLOBAL_OFFSET_TABLE_), EBX )
120
	MOV_L( REGOFF(clip_table@GOT, EBX), EBX )
121
	PUSH_L( EBX )
122
	JMP( LLBL(ctp4_clip_table_ready) )
123
 
124
LLBL(ctp4_get_eip):
125
	/* store eip in ebx: copy the return address without popping it */
126
	MOV_L( REGIND(ESP), EBX )
127
	RET
128
 
129
LLBL(ctp4_clip_table_ready):
130
#endif
131
 
132
	/* load the argument pointers */
	MOV_L( ARG_SOURCE, ESI )
133
	MOV_L( ARG_DEST, EDI )
134
 
135
	MOV_L( ARG_CLIP, EDX )
136
	MOV_L( ARG_OR, EBX )
137
 
138
	MOV_L( ARG_AND, EBP )
139
	/* EAX = source stride, ECX = source count, ESI = first source element */
	MOV_L( REGOFF(V4F_STRIDE, ESI), EAX )
140
 
141
	MOV_L( REGOFF(V4F_COUNT, ESI), ECX )
142
	MOV_L( REGOFF(V4F_START, ESI), ESI )
143
 
144
	/* mark the destination as a 4-component vector */
	OR_L( CONST(VEC_SIZE_4), REGOFF(V4F_FLAGS, EDI) )
145
	MOV_L( EAX, ARG_SOURCE )	/* put stride in ARG_SOURCE (argument slot reused) */
146
 
147
	MOV_L( CONST(4), REGOFF(V4F_SIZE, EDI) )
148
	MOV_L( ECX, REGOFF(V4F_COUNT, EDI) )	/* dest count = source count */
149
 
150
	MOV_L( REGOFF(V4F_START, EDI), EDI )	/* EDI = first dest element */
151
	ADD_L( EDX, ECX )			/* ECX = clipmask + count (end pointer) */
152
 
153
	MOV_L( ECX, ARG_CLIP )		/* put clipmask + count in ARG_CLIP */
154
	CMP_L( ECX, EDX )		/* equal when count == 0; tested by the JZ below */
155
 
156
	/* initial or/and masks; MOV does not disturb the flags from CMP_L */
	MOV_B( REGIND(EBX), AL )
157
	MOV_B( REGIND(EBP), AH )
158
 
159
	JZ( LLBL(ctp4_finish) )		/* nothing to do for an empty vector */
160
 
161
ALIGNTEXT16
162
LLBL(ctp4_top):
163
 
164
	/* start computing 1 / SRC3 on the FPU; it is used or discarded below */
	FLD1				/* F3 */
165
	FDIV_S( SRC3 )		/* GH: don't care about div-by-zero */
166
 
167
	/*
	 * Build the clip_table index in ECX from the raw 32-bit patterns.
	 * ADD reg,reg moves the sign bit into carry and leaves the remaining
	 * bits shifted left by one; those are compared as unsigned integers.
	 * Each ADC_L( ECX, ECX ) shifts ECX left and appends the carry.
	 */
	MOV_L( SRC3, EBP )
168
	MOV_L( SRC2, EBX )
169
 
170
	XOR_L( ECX, ECX )
171
	ADD_L( EBP, EBP )	/* ebp = abs(S(3))*2 ; carry = sign of S(3) */
172
 
173
	ADC_L( ECX, ECX )
174
	ADD_L( EBX, EBX )	/* ebx = abs(S(2))*2 ; carry = sign of S(2) */
175
 
176
	ADC_L( ECX, ECX )
177
	CMP_L( EBX, EBP )	/* carry = abs(S(2))*2 > abs(S(3))*2 */
178
 
179
	ADC_L( ECX, ECX )
180
	MOV_L( SRC1, EBX )
181
 
182
	ADD_L( EBX, EBX )	/* ebx = abs(S(1))*2 ; carry = sign of S(1) */
183
 
184
	ADC_L( ECX, ECX )
185
	CMP_L( EBX, EBP )	/* carry = abs(S(1))*2 > abs(S(3))*2 */
186
 
187
	ADC_L( ECX, ECX )
188
	MOV_L( SRC0, EBX )
189
 
190
	ADD_L( EBX, EBX )	/* ebx = abs(S(0))*2 ; carry = sign of S(0) */
191
 
192
	ADC_L( ECX, ECX )
193
	CMP_L( EBX, EBP )	/* carry = abs(S(0))*2 > abs(S(3))*2 */
194
 
195
	ADC_L( ECX, ECX )
196
 
197
	/* CL = clip_table[ECX] */
#ifdef ELFPIC
198
	MOV_L( REGIND(ESP), EBP )	/* clip_table pointer pushed in the prologue */
199
 
200
	MOV_B( REGBI(EBP, ECX), CL )
201
#else
202
	MOV_B( REGOFF(clip_table,ECX), CL )
203
#endif
204
 
205
	/* fold the mask into the running or/and masks */
	OR_B( CL, AL )
206
	AND_B( CL, AH )
207
 
208
	TEST_B( CL, CL )		/* zero flag for the JZ below */
209
	MOV_B( CL, REGIND(EDX) )	/* clipmask[i] = mask; MOV keeps the flags */
210
 
211
	JZ( LLBL(ctp4_proj) )		/* mask == 0: project this element */
212
 
213
LLBL(ctp4_noproj):
214
 
215
	/* mask != 0: discard 1 / SRC3 and write (0, 0, 0, 1.0f) */
	FSTP( ST(0) )			/* */
216
 
217
	MOV_L( CONST(0), DST0 )
218
	MOV_L( CONST(0), DST1 )
219
	MOV_L( CONST(0), DST2 )
220
	MOV_L( CONST(0x3f800000), DST3 )	/* bit pattern of 1.0f */
221
 
222
	JMP( LLBL(ctp4_next) )
223
 
224
LLBL(ctp4_proj):
225
 
226
	/*
	 * Multiply SRC0..SRC2 by the 1 / SRC3 value already on the FPU stack.
	 * The trailing comments list the stack from ST(0) outwards, with F3
	 * being 1 / SRC3.
	 */
	FLD_S( SRC0 )			/* F0 F3 */
227
	FMUL2( ST(1), ST0 )
228
 
229
	FLD_S( SRC1 )			/* F1 F0 F3 */
230
	FMUL2( ST(2), ST0 )
231
 
232
	FLD_S( SRC2 )			/* F2 F1 F0 F3 */
233
	FMUL2( ST(3), ST0 )
234
 
235
	/* swap so the results pop in DST0..DST3 order */
	FXCH( ST(2) )			/* F0 F1 F2 F3 */
236
	FSTP_S( DST0 )		/* F1 F2 F3 */
237
	FSTP_S( DST1 )		/* F2 F3 */
238
	FSTP_S( DST2 )		/* F3 */
239
	FSTP_S( DST3 )		/* */
240
 
241
LLBL(ctp4_next):
242
 
243
	INC_L( EDX )			/* next clipmask byte */
244
	ADD_L( CONST(16), EDI )		/* next dest element (16 bytes each) */
245
 
246
	ADD_L( ARG_SOURCE, ESI )	/* next source element: add the saved stride */
247
	CMP_L( EDX, ARG_CLIP )		/* reached clipmask + count? */
248
 
249
	JNZ( LLBL(ctp4_top) )
250
 
251
	/* write the accumulated masks back through the caller's pointers */
	MOV_L( ARG_OR, ECX )
252
	MOV_L( ARG_AND, EDX )
253
 
254
	MOV_B( AL, REGIND(ECX) )
255
	MOV_B( AH, REGIND(EDX) )
256
 
257
LLBL(ctp4_finish):
258
 
259
	MOV_L( ARG_DEST, EAX )		/* return value: the ARG_DEST pointer */
260
#ifdef ELFPIC
261
	POP_L( ESI )			/* discard ptr to clip_table; ESI is restored below */
262
#endif
263
	/* restore in reverse order of the pushes */
	POP_L( EBX )
264
	POP_L( EBP )
265
	POP_L( EDI )
266
	POP_L( ESI )
267
 
268
	RET
269
 
270
 
271
 
272
 
273
 
274
 
275
 
276
/*
 * _mesa_x86_cliptest_points4_np
 *
 * Variant of _mesa_x86_cliptest_points4 that only computes clip masks: it
 * performs no FPU work and writes no destination elements ("np" presumably
 * stands for "no projection" -- confirm against the callers).
 *
 * Arguments are read through the ARG_* macros, which are not defined in
 * this file:
 *
 *   ARG_SOURCE  source vector descriptor; V4F_START, V4F_COUNT and
 *               V4F_STRIDE are read from it
 *   ARG_DEST    not read as a pointer here; its argument slot is reused to
 *               hold the source stride
 *   ARG_CLIP    byte array that receives one clip mask per element
 *   ARG_OR      pointer to a byte: read on entry, then every mask is OR'ed
 *               in and the result is stored back
 *   ARG_AND     pointer to a byte: read on entry, then every mask is AND'ed
 *               in and the result is stored back
 *
 * When the count is zero the loop is skipped and the bytes behind ARG_OR
 * and ARG_AND are not rewritten.
 *
 * Returns the ARG_SOURCE pointer in EAX.
 *
 * Register roles inside the loop:
 *
 *   AL:  ormask
 *   AH:  andmask
 *   EBX: temp
 *   ECX: table index, then the mask byte in CL
 *   EDX: current clipmask byte
 *   ESI: current source element
 *   EDI: clipmask + count (end pointer)
 *   EBP: temp
 */
ALIGNTEXT16
277
GLOBL GLNAME( _mesa_x86_cliptest_points4_np )
278
GLNAME( _mesa_x86_cliptest_points4_np ):
279
 
280
/*
 * FRAME_OFFSET matches the number of bytes pushed below before the ARG_*
 * macros are used: four registers (16 bytes), plus the clip_table pointer
 * (4 more bytes) in the ELFPIC build.
 */
#ifdef ELFPIC
281
#define FRAME_OFFSET 20
282
#else
283
#define FRAME_OFFSET 16
284
#endif
285
	/* save the registers that are restored in the epilogue */
	PUSH_L( ESI )
286
	PUSH_L( EDI )
287
	PUSH_L( EBP )
288
	PUSH_L( EBX )
289
 
290
#ifdef ELFPIC
291
	/*
	 * Store pointer to clip_table on stack.  The CALL leaves its return
	 * address (the address of the ADD_L below) in EBX; adding
	 * _GLOBAL_OFFSET_TABLE_ turns that into the GOT address, from which
	 * the clip_table entry is loaded.
	 */
292
	CALL( LLBL(ctp4_np_get_eip) )
293
	ADD_L( CONST(_GLOBAL_OFFSET_TABLE_), EBX )
294
	MOV_L( REGOFF(clip_table@GOT, EBX), EBX )
295
	PUSH_L( EBX )
296
	JMP( LLBL(ctp4_np_clip_table_ready) )
297
 
298
LLBL(ctp4_np_get_eip):
299
	/* store eip in ebx: copy the return address without popping it */
300
	MOV_L( REGIND(ESP), EBX )
301
	RET
302
 
303
LLBL(ctp4_np_clip_table_ready):
304
#endif
305
 
306
	/* load the argument pointers */
	MOV_L( ARG_SOURCE, ESI )
307
	/* slot -- presumably an intentionally empty instruction-pairing slot */
308
 
309
	MOV_L( ARG_CLIP, EDX )
310
	MOV_L( ARG_OR, EBX )
311
 
312
	MOV_L( ARG_AND, EBP )
313
	/* EAX = source stride, ECX = source count, ESI = first source element */
	MOV_L( REGOFF(V4F_STRIDE, ESI), EAX )
314
 
315
	MOV_L( REGOFF(V4F_COUNT, ESI), ECX )
316
	MOV_L( REGOFF(V4F_START, ESI), ESI )
317
 
318
	MOV_L( EAX, ARG_DEST )   	/* put stride in ARG_DEST (argument slot reused) */
319
	ADD_L( EDX, ECX )		/* ECX = clipmask + count (end pointer) */
320
 
321
	MOV_L( ECX, EDI )		/* put clipmask + count in EDI */
322
	CMP_L( ECX, EDX )		/* equal when count == 0; tested by the JZ below */
323
 
324
	/* initial or/and masks; MOV does not disturb the flags from CMP_L */
	MOV_B( REGIND(EBX), AL )
325
	MOV_B( REGIND(EBP), AH )
326
 
327
	JZ( LLBL(ctp4_np_finish) )	/* nothing to do for an empty vector */
328
 
329
ALIGNTEXT16
330
LLBL(ctp4_np_top):
331
 
332
	/*
	 * Build the clip_table index in ECX from the raw 32-bit patterns.
	 * ADD reg,reg moves the sign bit into carry and leaves the remaining
	 * bits shifted left by one; those are compared as unsigned integers.
	 * Each ADC_L( ECX, ECX ) shifts ECX left and appends the carry.
	 */
	MOV_L( SRC3, EBP )
333
	MOV_L( SRC2, EBX )
334
 
335
	XOR_L( ECX, ECX )
336
	ADD_L( EBP, EBP )	/* ebp = abs(S(3))*2 ; carry = sign of S(3) */
337
 
338
	ADC_L( ECX, ECX )
339
	ADD_L( EBX, EBX )	/* ebx = abs(S(2))*2 ; carry = sign of S(2) */
340
 
341
	ADC_L( ECX, ECX )
342
	CMP_L( EBX, EBP )	/* carry = abs(S(2))*2 > abs(S(3))*2 */
343
 
344
	ADC_L( ECX, ECX )
345
	MOV_L( SRC1, EBX )
346
 
347
	ADD_L( EBX, EBX )	/* ebx = abs(S(1))*2 ; carry = sign of S(1) */
348
 
349
	ADC_L( ECX, ECX )
350
	CMP_L( EBX, EBP )	/* carry = abs(S(1))*2 > abs(S(3))*2 */
351
 
352
	ADC_L( ECX, ECX )
353
	MOV_L( SRC0, EBX )
354
 
355
	ADD_L( EBX, EBX )	/* ebx = abs(S(0))*2 ; carry = sign of S(0) */
356
 
357
	ADC_L( ECX, ECX )
358
	CMP_L( EBX, EBP )	/* carry = abs(S(0))*2 > abs(S(3))*2 */
359
 
360
	ADC_L( ECX, ECX )
361
 
362
	/* CL = clip_table[ECX] */
#ifdef ELFPIC
363
	MOV_L( REGIND(ESP), EBP )	/* clip_table pointer pushed in the prologue */
364
 
365
	MOV_B( REGBI(EBP, ECX), CL )
366
#else
367
	MOV_B( REGOFF(clip_table,ECX), CL )
368
#endif
369
 
370
	/* fold the mask into the running or/and masks */
	OR_B( CL, AL )
371
	AND_B( CL, AH )
372
 
373
	/*
	 * NOTE(review): no branch consumes the flags set by this TEST_B; the
	 * INC_L / ADD_L / CMP_L below overwrite them before the JNZ.  It looks
	 * like a leftover from the projecting variant -- confirm before
	 * removing, since it may have been kept for instruction pairing.
	 */
	TEST_B( CL, CL )
374
	MOV_B( CL, REGIND(EDX) )	/* clipmask[i] = mask */
375
 
376
	INC_L( EDX )			/* next clipmask byte */
377
	/* slot -- presumably an intentionally empty instruction-pairing slot */
378
 
379
	ADD_L( ARG_DEST, ESI )		/* next source element: add the saved stride */
380
	CMP_L( EDX, EDI )		/* reached clipmask + count? */
381
 
382
	JNZ( LLBL(ctp4_np_top) )
383
 
384
	/* write the accumulated masks back through the caller's pointers */
	MOV_L( ARG_OR, ECX )
385
	MOV_L( ARG_AND, EDX )
386
 
387
	MOV_B( AL, REGIND(ECX) )
388
	MOV_B( AH, REGIND(EDX) )
389
 
390
LLBL(ctp4_np_finish):
391
 
392
	MOV_L( ARG_SOURCE, EAX )	/* return value: the ARG_SOURCE pointer */
393
#ifdef ELFPIC
394
	POP_L( ESI )			/* discard ptr to clip_table; ESI is restored below */
395
#endif
396
	/* restore in reverse order of the pushes */
	POP_L( EBX )
397
	POP_L( EBP )
398
	POP_L( EDI )
399
	POP_L( ESI )
400
 
401
	RET