2
* Mesa 3-D graphics library
4
* Copyright (C) 1999-2005 Brian Paul All Rights Reserved.
6
* Permission is hereby granted, free of charge, to any person obtaining a
7
* copy of this software and associated documentation files (the "Software"),
8
* to deal in the Software without restriction, including without limitation
9
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
10
* and/or sell copies of the Software, and to permit persons to whom the
11
* Software is furnished to do so, subject to the following conditions:
13
* The above copyright notice and this permission notice shall be included
14
* in all copies or substantial portions of the Software.
16
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
17
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
20
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22
* OTHER DEALINGS IN THE SOFTWARE.
28
#include "main/glheader.h"
29
#include "main/context.h"
30
#include "main/macros.h"
37
#include "m_debug_util.h"
40
/* The linker doesn't like empty files */
44
#ifdef DEBUG_MATH /* This code only used for debugging */
46
// Lookup tables with one slot per clip-test variant. Later code in this file
// indexes all three with np = 0 or 1.
// NOTE(review): the initializer entries (apart from one string) and the
// closing braces are absent from this listing - confirm against the full file.
// clip_tab: per-variant tables of clip functions, read as clip_tab[np][psize].
static clip_func *clip_tab[2] = {
50
// cnames: printable table names, used when reporting a failed test.
static char *cnames[2] = {
54
#ifdef RUN_DEBUG_BENCHMARK
55
// cstrings: row labels printed next to the benchmark cycle counts.
static char *cstrings[2] = {
56
"clip, perspective divide",
62
/* =============================================================
66
// Reference clip test for points that carry x, y, z and w.
// For each of clip_vec->count points it compares x and y (and z when
// viewport_z_clip is set) against +w and -w, collects CLIP_*_BIT flags in
// mask, and writes the perspective-divided coordinates to proj_vec.
// NOTE(review): this listing is missing several lines of the function - the
// remaining parameters (proj_vec, orMask and andMask are used below), the
// declarations of i, mask and c, the per-point mask bookkeeping, the closing
// braces and the return statement. Confirm against the full file.
static GLvector4f *ref_cliptest_points4( GLvector4f *clip_vec,
71
GLboolean viewport_z_clip )
73
const GLuint stride = clip_vec->stride;
74
const GLuint count = clip_vec->count;
75
const GLfloat *from = (GLfloat *)clip_vec->start;
77
// View the output storage as an array of 4-float rows.
GLfloat (*vProj)[4] = (GLfloat (*)[4])proj_vec->start;
78
// Work on local copies of the caller-supplied masks.
GLubyte tmpAndMask = *andMask;
79
GLubyte tmpOrMask = *orMask;
81
// STRIDE_F presumably advances from by stride bytes per point - verify
// against the macro definition.
for ( i = 0 ; i < count ; i++, STRIDE_F(from, stride) ) {
82
const GLfloat cx = from[0];
83
const GLfloat cy = from[1];
84
const GLfloat cz = from[2];
85
const GLfloat cw = from[3];
87
// A point is flagged when a coordinate lies beyond +w or below -w.
if ( -cx + cw < 0 ) mask |= CLIP_RIGHT_BIT;
88
if ( cx + cw < 0 ) mask |= CLIP_LEFT_BIT;
89
if ( -cy + cw < 0 ) mask |= CLIP_TOP_BIT;
90
if ( cy + cw < 0 ) mask |= CLIP_BOTTOM_BIT;
91
// Near and far planes are only tested when z clipping is requested.
if (viewport_z_clip) {
92
if ( -cz + cw < 0 ) mask |= CLIP_FAR_BIT;
93
if ( cz + cw < 0 ) mask |= CLIP_NEAR_BIT;
105
// Perspective divide: scale x, y and z by 1/w.
// NOTE(review): the condition guarding this divide is not visible here.
GLfloat oow = 1.0F / cw;
106
vProj[i][0] = cx * oow;
107
vProj[i][1] = cy * oow;
108
vProj[i][2] = cz * oow;
114
// The and-mask is reported as 0 whenever c is smaller than count.
// NOTE(review): c is not declared in the visible lines; presumably it counts
// the points that received a non-zero mask - confirm.
*andMask = (GLubyte) (c < count ? 0 : tmpAndMask);
116
// Mark the output vector as 4-component and give it the input point count.
proj_vec->flags |= VEC_SIZE_4;
118
proj_vec->count = clip_vec->count;
122
/* Keep these here for now, even though we don't use them...
124
// Reference clip test for points that carry x, y and z only.
// Each coordinate is compared against the fixed range -1.0 .. 1.0 and the
// matching CLIP_*_BIT is added to mask; z is only tested when
// viewport_z_clip is set.
// NOTE(review): this listing is missing several lines of the function - some
// parameters (orMask and andMask are used below), the declarations of i and
// mask, the per-point mask bookkeeping, the closing braces and the return
// statement. Confirm against the full file.
static GLvector4f *ref_cliptest_points3( GLvector4f *clip_vec,
125
GLvector4f *proj_vec,
129
GLboolean viewport_z_clip )
131
const GLuint stride = clip_vec->stride;
132
const GLuint count = clip_vec->count;
133
const GLfloat *from = (GLfloat *)clip_vec->start;
135
// Work on local copies of the caller-supplied masks.
GLubyte tmpOrMask = *orMask;
136
GLubyte tmpAndMask = *andMask;
138
for ( i = 0 ; i < count ; i++, STRIDE_F(from, stride) ) {
139
const GLfloat cx = from[0], cy = from[1], cz = from[2];
141
// The two sides of an axis are mutually exclusive, hence the else-if.
if ( cx > 1.0 ) mask |= CLIP_RIGHT_BIT;
142
else if ( cx < -1.0 ) mask |= CLIP_LEFT_BIT;
143
if ( cy > 1.0 ) mask |= CLIP_TOP_BIT;
144
else if ( cy < -1.0 ) mask |= CLIP_BOTTOM_BIT;
145
if (viewport_z_clip) {
146
if ( cz > 1.0 ) mask |= CLIP_FAR_BIT;
147
else if ( cz < -1.0 ) mask |= CLIP_NEAR_BIT;
155
// Hand the accumulated and-mask back to the caller.
*andMask = tmpAndMask;
159
// Reference clip test for points that carry x and y only.
// Each coordinate is compared against the fixed range -1.0 .. 1.0 and the
// matching CLIP_*_BIT is added to mask. No z test is performed here.
// NOTE(review): this listing is missing several lines of the function - some
// parameters (orMask and andMask are used below), the declarations of i and
// mask, the per-point mask bookkeeping, the closing braces and the return
// statement. Confirm against the full file.
static GLvector4f * ref_cliptest_points2( GLvector4f *clip_vec,
160
GLvector4f *proj_vec,
164
GLboolean viewport_z_clip )
166
const GLuint stride = clip_vec->stride;
167
const GLuint count = clip_vec->count;
168
const GLfloat *from = (GLfloat *)clip_vec->start;
170
// Work on local copies of the caller-supplied masks.
GLubyte tmpOrMask = *orMask;
171
GLubyte tmpAndMask = *andMask;
174
// The parameter is intentionally unused; the cast silences the warning.
(void) viewport_z_clip;
176
for ( i = 0 ; i < count ; i++, STRIDE_F(from, stride) ) {
177
const GLfloat cx = from[0], cy = from[1];
179
// The two sides of an axis are mutually exclusive, hence the else-if.
if ( cx > 1.0 ) mask |= CLIP_RIGHT_BIT;
180
else if ( cx < -1.0 ) mask |= CLIP_LEFT_BIT;
181
if ( cy > 1.0 ) mask |= CLIP_TOP_BIT;
182
else if ( cy < -1.0 ) mask |= CLIP_BOTTOM_BIT;
189
// Hand the accumulated and-mask back to the caller.
*andMask = tmpAndMask;
193
// Reference implementations, looked up by point size as ref_cliptest[psize].
// NOTE(review): only two of the five entries are visible in this listing, so
// which slot each function occupies cannot be confirmed from here.
static clip_func ref_cliptest[5] = {
196
ref_cliptest_points2,
197
ref_cliptest_points3,
202
/* =============================================================
206
// Static storage for the test vectors, one 4-float row per test point.
// s backs the source vector handed to both implementations.
ALIGN16 static GLfloat s[TEST_COUNT][4];
207
// d backs the destination vector written by the function under test.
ALIGN16 static GLfloat d[TEST_COUNT][4];
208
// r backs the vector written by the reference implementation.
ALIGN16 static GLfloat r[TEST_COUNT][4];
212
* Check if X, Y or Z component of the coordinate is close to W, in terms
216
// Reports whether any of x, y or z (c[0], c[1], c[2]) lies within k of +w or
// of -w, where w is c[3].
// NOTE(review): the return type line, the opening brace and the definition of
// the tolerance k are absent from this listing - confirm against the full file.
xyz_close_to_w(const GLfloat c[4])
219
// First three terms: distance of x, y, z from +w.
return (fabs(c[0] - c[3]) < k ||
220
fabs(c[1] - c[3]) < k ||
221
fabs(c[2] - c[3]) < k ||
222
// Last three terms: distance of x, y, z from -w.
fabs(-c[0] - c[3]) < k ||
223
fabs(-c[1] - c[3]) < k ||
224
fabs(-c[2] - c[3]) < k);
229
// Runs one clip function and the matching reference implementation over the
// same TEST_COUNT source points, then compares the per-point clip masks and,
// for one configuration, the projected coordinates.
//   func   - clip function under test
//   np     - table variant index supplied by the caller
//   psize  - number of components per source point
//   cycles - receives the benchmark cycle count via BEGIN_RACE
// The caller treats a return value of 0 as a failed test.
// NOTE(review): many lines of this function are absent from this listing,
// including the declarations of i and j, several conditions, every return
// statement and most closing braces. Confirm against the full file.
static int test_cliptest_function( clip_func func, int np,
230
int psize, long *cycles )
232
// One-element arrays so the vectors can be used with pointer syntax.
GLvector4f source[1], dest[1], ref[1];
233
// dm, dco, dca: per-point masks, or-mask and and-mask from func.
GLubyte dm[TEST_COUNT], dco, dca;
234
// rm, rco, rca: the same three results from the reference implementation.
GLubyte rm[TEST_COUNT], rco, rca;
236
#ifdef RUN_DEBUG_BENCHMARK
237
int cycle_i; /* the counter for the benchmarks we run */
239
GLboolean viewport_z_clip = GL_TRUE;
244
// NOTE(review): the condition guarding this report is not visible; the
// message indicates it fires when psize exceeds 4.
_mesa_problem( NULL, "test_cliptest_function called with psize > 4\n" );
248
// Reset every destination and source row to (0, 0, 0, 1).
for ( i = 0 ; i < TEST_COUNT ; i++) {
249
ASSIGN_4V( d[i], 0.0, 0.0, 0.0, 1.0 );
250
ASSIGN_4V( s[i], 0.0, 0.0, 0.0, 1.0 );
251
// NOTE(review): the body of this inner loop is not visible; presumably it
// fills the first psize components of s[i] with test values - confirm.
for ( j = 0 ; j < psize ; j++ )
255
// Point the three vectors at the static buffers s, d and r.
source->data = (GLfloat(*)[4])s;
256
source->start = (GLfloat *)s;
257
source->count = TEST_COUNT;
258
source->stride = sizeof(s[0]);
262
dest->data = (GLfloat(*)[4])d;
263
dest->start = (GLfloat *)d;
264
dest->count = TEST_COUNT;
265
dest->stride = sizeof(float[4]);
269
ref->data = (GLfloat(*)[4])r;
270
ref->start = (GLfloat *)r;
271
ref->count = TEST_COUNT;
272
ref->stride = sizeof(float[4]);
277
// Both and-masks start out with every frustum bit set.
dca = rca = CLIP_FRUSTUM_BITS;
279
// Produce the expected results with the reference implementation.
ref_cliptest[psize]( source, ref, rm, &rco, &rca, viewport_z_clip );
281
// When profiling is enabled the call under test is timed into *cycles.
if ( mesa_profile ) {
282
BEGIN_RACE( *cycles );
283
func( source, dest, dm, &dco, &dca, viewport_z_clip );
287
// NOTE(review): presumably the untimed call taken when profiling is off;
// the else line is not visible in this listing.
func( source, dest, dm, &dco, &dca, viewport_z_clip );
291
// Diagnostic output for the or-masks.
// NOTE(review): the comparison guarding it is not visible.
printf( "\n-----------------------------\n" );
292
printf( "dco = 0x%02x rco = 0x%02x\n", dco, rco );
296
// Diagnostic output for the and-masks.
// NOTE(review): the comparison guarding it is not visible.
printf( "\n-----------------------------\n" );
297
printf( "dca = 0x%02x rca = 0x%02x\n", dca, rca );
300
// Compare the per-point clip masks.
for ( i = 0 ; i < TEST_COUNT ; i++ ) {
301
if ( dm[i] != rm[i] ) {
302
// Locate source point i so it can be inspected and printed.
GLfloat *c = source->start;
303
STRIDE_F(c, source->stride * i);
304
// A mismatch is tolerated for 4-component points lying near a clip plane.
if (psize == 4 && xyz_close_to_w(c)) {
305
/* The coordinate is very close to the clip plane. The clipmask
306
* may vary depending on code path, but that's OK.
310
printf( "\n-----------------------------\n" );
311
printf( "mask[%d] = 0x%02x ref mask[%d] = 0x%02x\n", i, dm[i], i,rm[i] );
312
printf(" coord = %f, %f, %f, %f\n",
313
c[0], c[1], c[2], c[3]);
318
/* Only verify output on projected points4 case. FIXME: Do we need
319
* to test other cases?
321
// NOTE(review): the statement controlled by this test is not visible;
// presumably an early return that skips the coordinate comparison - confirm.
if ( np || psize < 4 )
324
// Compare every output component against the reference; on a precision
// shortfall all four components of the point are printed.
for ( i = 0 ; i < TEST_COUNT ; i++ ) {
325
for ( j = 0 ; j < 4 ; j++ ) {
326
if ( significand_match( d[i][j], r[i][j] ) < REQUIRED_PRECISION ) {
327
printf( "\n-----------------------------\n" );
328
printf( "(i = %i, j = %i) dm = 0x%02x rm = 0x%02x\n",
329
i, j, dm[i], rm[i] );
330
printf( "%f \t %f \t [diff = %e - %i bit missed]\n",
331
d[i][0], r[i][0], r[i][0]-d[i][0],
332
MAX_PRECISION - significand_match( d[i][0], r[i][0] ) );
333
printf( "%f \t %f \t [diff = %e - %i bit missed]\n",
334
d[i][1], r[i][1], r[i][1]-d[i][1],
335
MAX_PRECISION - significand_match( d[i][1], r[i][1] ) );
336
printf( "%f \t %f \t [diff = %e - %i bit missed]\n",
337
d[i][2], r[i][2], r[i][2]-d[i][2],
338
MAX_PRECISION - significand_match( d[i][2], r[i][2] ) );
339
printf( "%f \t %f \t [diff = %e - %i bit missed]\n",
340
d[i][3], r[i][3], r[i][3]-d[i][3],
341
MAX_PRECISION - significand_match( d[i][3], r[i][3] ) );
350
// Entry point: tests every clip function in clip_tab for both variants
// (np = 0, 1) and point sizes 2 to 4, reporting failures via _mesa_problem.
// With RUN_DEBUG_BENCHMARK defined and MESA_PROFILE set in the environment
// it also prints a table of cycle counts.
//   description - label inserted into the results header and failure messages
// NOTE(review): this listing is missing several lines of the function,
// including the declarations of np, psize and buf, the matching endif lines
// and most closing braces. Confirm against the full file.
void _math_test_all_cliptest_functions( char *description )
353
// Cycle counts, written and read as benchmark_tab[np][psize-1].
long benchmark_tab[2][4];
354
static int first_time = 1;
358
// Profiling is switched on through the MESA_PROFILE environment variable.
mesa_profile = getenv( "MESA_PROFILE" );
361
#ifdef RUN_DEBUG_BENCHMARK
362
if ( mesa_profile ) {
363
// NOTE(review): the body that measures counter_overhead is not visible.
if ( !counter_overhead ) {
365
printf( "counter overhead: %ld cycles\n\n", counter_overhead );
367
printf( "cliptest results after hooking in %s functions:\n", description );
371
#ifdef RUN_DEBUG_BENCHMARK
372
// Column headings for the benchmark table, one per point size.
if ( mesa_profile ) {
374
for ( psize = 2 ; psize <= 4 ; psize++ ) {
375
printf( " p%d\t", psize );
377
printf( "\n--------------------------------------------------------\n\t" );
381
// Test each variant against each point size.
for ( np = 0 ; np < 2 ; np++ ) {
382
for ( psize = 2 ; psize <= 4 ; psize++ ) {
383
clip_func func = clip_tab[np][psize];
384
long *cycles = &(benchmark_tab[np][psize-1]);
386
// A zero result marks a failed comparison.
if ( test_cliptest_function( func, np, psize, cycles ) == 0 ) {
388
// NOTE(review): unbounded sprintf into buf, whose declaration and size are
// not visible here; a bounded snprintf would be safer once the size is known.
sprintf( buf, "%s[%d] failed test (%s)",
389
cnames[np], psize, description );
390
_mesa_problem( NULL, "%s", buf );
392
#ifdef RUN_DEBUG_BENCHMARK
394
printf( " %li\t", benchmark_tab[np][psize-1] );
397
#ifdef RUN_DEBUG_BENCHMARK
399
// Finish the table row with the label for this variant.
printf( " | [%s]\n\t", cstrings[np] );
402
#ifdef RUN_DEBUG_BENCHMARK
409
#endif /* DEBUG_MATH */