[3598] | 1 | /* $Id: mmath.c,v 1.2 2000-05-23 20:40:41 jeroen Exp $ */
|
---|
[2938] | 2 |
|
---|
| 3 | /*
|
---|
| 4 | * Mesa 3-D graphics library
|
---|
[3598] | 5 | * Version: 3.3
|
---|
[2938] | 6 | *
|
---|
| 7 | * Copyright (C) 1999 Brian Paul All Rights Reserved.
|
---|
| 8 | *
|
---|
| 9 | * Permission is hereby granted, free of charge, to any person obtaining a
|
---|
| 10 | * copy of this software and associated documentation files (the "Software"),
|
---|
| 11 | * to deal in the Software without restriction, including without limitation
|
---|
| 12 | * the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
---|
| 13 | * and/or sell copies of the Software, and to permit persons to whom the
|
---|
| 14 | * Software is furnished to do so, subject to the following conditions:
|
---|
| 15 | *
|
---|
| 16 | * The above copyright notice and this permission notice shall be included
|
---|
| 17 | * in all copies or substantial portions of the Software.
|
---|
| 18 | *
|
---|
| 19 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
---|
| 20 | * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
---|
| 21 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
---|
| 22 | * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
|
---|
| 23 | * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
|
---|
| 24 | * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
---|
| 25 | */
|
---|
| 26 |
|
---|
| 27 |
|
---|
| 28 | #ifdef PC_HEADER
|
---|
| 29 | #include "all.h"
|
---|
| 30 | #else
|
---|
[3598] | 31 | #include "glheader.h"
|
---|
[2938] | 32 | #include "mmath.h"
|
---|
| 33 | #endif
|
---|
| 34 |
|
---|
| 35 |
|
---|
| 36 | static int in_fast_math;
|
---|
| 37 |
|
---|
| 38 | /*
|
---|
| 39 | * A High Speed, Low Precision Square Root
|
---|
| 40 | * by Paul Lalonde and Robert Dawson
|
---|
| 41 | * from "Graphics Gems", Academic Press, 1990
|
---|
| 42 | */
|
---|
| 43 |
|
---|
| 44 | /*
|
---|
| 45 | * SPARC implementation of a fast square root by table
|
---|
| 46 | * lookup.
|
---|
| 47 | * SPARC floating point format is as follows:
|
---|
| 48 | *
|
---|
[3598] | 49 | * BIT 31 30 23 22 0
|
---|
| 50 | * sign exponent mantissa
|
---|
[2938] | 51 | */
|
---|
| 52 | static short sqrttab[0x100]; /* declare table of square roots */
|
---|
| 53 |
|
---|
| 54 | static void init_sqrt(void)
|
---|
| 55 | {
|
---|
| 56 | #ifdef FAST_MATH
|
---|
| 57 | unsigned short i;
|
---|
| 58 | float f;
|
---|
| 59 | unsigned int *fi = (unsigned int *)&f;
|
---|
| 60 | /* to access the bits of a float in */
|
---|
| 61 | /* C quickly we must misuse pointers */
|
---|
| 62 |
|
---|
| 63 | for(i=0; i<= 0x7f; i++) {
|
---|
| 64 | *fi = 0;
|
---|
| 65 |
|
---|
| 66 | /*
|
---|
| 67 | * Build a float with the bit pattern i as mantissa
|
---|
| 68 | * and an exponent of 0, stored as 127
|
---|
| 69 | */
|
---|
| 70 |
|
---|
| 71 | *fi = (i << 16) | (127 << 23);
|
---|
| 72 | f = sqrt(f);
|
---|
| 73 |
|
---|
| 74 | /*
|
---|
| 75 | * Take the square root then strip the first 7 bits of
|
---|
| 76 | * the mantissa into the table
|
---|
| 77 | */
|
---|
| 78 |
|
---|
| 79 | sqrttab[i] = (*fi & 0x7fffff) >> 16;
|
---|
| 80 |
|
---|
| 81 | /*
|
---|
| 82 | * Repeat the process, this time with an exponent of
|
---|
| 83 | * 1, stored as 128
|
---|
| 84 | */
|
---|
| 85 |
|
---|
| 86 | *fi = 0;
|
---|
| 87 | *fi = (i << 16) | (128 << 23);
|
---|
| 88 | f = sqrt(f);
|
---|
| 89 | sqrttab[i+0x80] = (*fi & 0x7fffff) >> 16;
|
---|
| 90 | }
|
---|
| 91 | #else
|
---|
[3598] | 92 | (void) sqrttab; /* silence compiler warnings */
|
---|
| 93 | #endif /*FAST_MATH*/
|
---|
[2938] | 94 | }
|
---|
| 95 |
|
---|
| 96 |
|
---|
| 97 | float gl_sqrt( float x )
|
---|
| 98 | {
|
---|
| 99 | #ifdef FAST_MATH
|
---|
| 100 | unsigned int *num = (unsigned int *)&x;
|
---|
| 101 | /* to access the bits of a float in C
|
---|
| 102 | * we must misuse pointers */
|
---|
| 103 |
|
---|
| 104 | short e; /* the exponent */
|
---|
| 105 | if (x == 0.0F) return 0.0F; /* check for square root of 0 */
|
---|
| 106 | e = (*num >> 23) - 127; /* get the exponent - on a SPARC the */
|
---|
| 107 | /* exponent is stored with 127 added */
|
---|
| 108 | *num &= 0x7fffff; /* leave only the mantissa */
|
---|
| 109 | if (e & 0x01) *num |= 0x800000;
|
---|
| 110 | /* the exponent is odd so we have to */
|
---|
| 111 | /* look it up in the second half of */
|
---|
| 112 | /* the lookup table, so we set the */
|
---|
| 113 | /* high bit */
|
---|
| 114 | e >>= 1; /* divide the exponent by two */
|
---|
| 115 | /* note that in C the shift */
|
---|
| 116 | /* operators are sign preserving */
|
---|
| 117 | /* for signed operands */
|
---|
| 118 | /* Do the table lookup, based on the quaternary mantissa,
|
---|
| 119 | * then reconstruct the result back into a float
|
---|
| 120 | */
|
---|
| 121 | *num = ((sqrttab[*num >> 16]) << 16) | ((e + 127) << 23);
|
---|
| 122 | return x;
|
---|
| 123 | #else
|
---|
| 124 | return sqrt(x);
|
---|
| 125 | #endif
|
---|
| 126 | }
|
---|
| 127 |
|
---|
| 128 | float gl_ubyte_to_float_color_tab[256];
|
---|
| 129 | float gl_ubyte_to_float_255_color_tab[256];
|
---|
| 130 |
|
---|
| 131 | static void
|
---|
| 132 | init_ubyte_color_tab(void)
|
---|
| 133 | {
|
---|
| 134 | int i;
|
---|
| 135 | for (i = 0 ; i < 256 ; i++) {
|
---|
| 136 | gl_ubyte_to_float_color_tab[i] = (float) i * (1.0/255.0);
|
---|
| 137 | gl_ubyte_to_float_255_color_tab[i] = (float) i;
|
---|
| 138 | }
|
---|
| 139 | }
|
---|
| 140 |
|
---|
| 141 | /*
|
---|
| 142 | * Initialize tables, etc for fast math functions.
|
---|
| 143 | */
|
---|
[3598] | 144 | void _mesa_init_math(void)
|
---|
[2938] | 145 | {
|
---|
| 146 | static GLboolean initialized = GL_FALSE;
|
---|
| 147 |
|
---|
| 148 | if (!initialized) {
|
---|
| 149 | init_sqrt();
|
---|
| 150 | init_ubyte_color_tab();
|
---|
| 151 |
|
---|
| 152 | initialized = GL_TRUE;
|
---|
| 153 | in_fast_math = 0;
|
---|
[3598] | 154 |
|
---|
| 155 | #if defined(_FPU_GETCW) && defined(_FPU_SETCW)
|
---|
| 156 | {
|
---|
| 157 | const char *debug = getenv("MESA_DEBUG");
|
---|
| 158 | if (debug && strcmp(debug, "FP")==0) {
|
---|
| 159 | /* die on FP exceptions */
|
---|
| 160 | fpu_control_t mask;
|
---|
| 161 | _FPU_GETCW(mask);
|
---|
| 162 | mask &= ~(_FPU_MASK_IM | _FPU_MASK_DM | _FPU_MASK_ZM
|
---|
| 163 | | _FPU_MASK_OM | _FPU_MASK_UM);
|
---|
| 164 | _FPU_SETCW(mask);
|
---|
| 165 | }
|
---|
| 166 | }
|
---|
| 167 | #endif
|
---|
[2938] | 168 | }
|
---|
| 169 | }
|
---|