dxx-rebirth/maths/fixc.c
Bradley Bell 9bd1ba7c47 This commit was generated by cvs2svn to compensate for changes in r2,
which included commits to RCS files with non-trunk default branches.
2001-01-19 03:30:16 +00:00

559 lines
11 KiB
C

/*
THE COMPUTER CODE CONTAINED HEREIN IS THE SOLE PROPERTY OF PARALLAX
SOFTWARE CORPORATION ("PARALLAX"). PARALLAX, IN DISTRIBUTING THE CODE TO
END-USERS, AND SUBJECT TO ALL OF THE TERMS AND CONDITIONS HEREIN, GRANTS A
ROYALTY-FREE, PERPETUAL LICENSE TO SUCH END-USERS FOR USE BY SUCH END-USERS
IN USING, DISPLAYING, AND CREATING DERIVATIVE WORKS THEREOF, SO LONG AS
SUCH USE, DISPLAY OR CREATION IS FOR NON-COMMERCIAL, ROYALTY OR REVENUE
FREE PURPOSES. IN NO EVENT SHALL THE END-USER USE THE COMPUTER CODE
CONTAINED HEREIN FOR REVENUE-BEARING PURPOSES. THE END-USER UNDERSTANDS
AND AGREES TO THE TERMS HEREIN AND ACCEPTS THE SAME BY USE OF THIS FILE.
COPYRIGHT 1993-1998 PARALLAX SOFTWARE CORPORATION. ALL RIGHTS RESERVED.
*/
/*
* $Source: /cvs/cvsroot/d2x/maths/fixc.c,v $
* $Revision: 1.1.1.1 $
* $Author: bradleyb $
* $Date: 2001-01-19 03:29:58 $
*
* C version of fixed point library
*
* $Log: not supported by cvs2svn $
* Revision 1.3 1999/10/18 00:31:01 donut
* more alpha fixes from Falk Hueffner
*
* Revision 1.2 1999/08/05 22:53:41 sekmu
*
* D3D patch(es) from ADB
*
* Revision 1.1.1.1 1999/06/14 22:13:35 donut
* Import of d1x 1.37 source.
*
* Revision 1.7 1995/09/22 14:08:16 allender
* fixed fix_atan2 to work correctly with doubles
*
* Revision 1.6 1995/08/31 15:43:49 allender
* *** empty log message ***
*
* Revision 1.5 1995/07/05 16:15:15 allender
* make fixmuldiv use doubles for PPC implementation
*
* Revision 1.4 1995/05/15 13:57:36 allender
* make fixmuldiv compile when compiling under 68k
*
* Revision 1.3 1995/05/11 13:02:59 allender
* some routines are now in assembly
*
* Revision 1.2 1995/05/04 20:04:45 allender
* use MPW fixdiv if compiling with MPW (why did I do this?)
*
* Revision 1.1 1995/04/17 11:37:54 allender
* Initial revision
*
*
* --- PC RCS Info ---
* Revision 1.1 1995/03/08 18:55:09 matt
* Initial revision
*
*
*/
#ifdef RCS
static char rcsid[] = "$Id: fixc.c,v 1.1.1.1 2001-01-19 03:29:58 bradleyb Exp $";
#endif
#include <conf.h>
#include "maths.h"
#ifdef NO_ASM
#include <stdlib.h>
#include <math.h>
#include "error.h"
#include "maths.h"
#ifdef NO_FIX_INLINE
#ifdef _MSC_VER
#pragma message ("warning: FIX NOT INLINED")
#else
#warning "FIX NOT INLINED"
#endif
#endif
//Lookup tables used by the routines below; their contents are defined
//outside this part of the file.
//guess_table: read by long_sqrt() and quad_sqrt() to seed the square root iteration
extern ubyte guess_table[];
//sincos_table: read by fix_sincos()/fix_fastsincos(); sine at index i, cosine at index i+64
extern short sincos_table[];
//asin_table: read by fix_asin() at entries i and i+1, where i is bits 8..15 of |v|
extern ushort asin_table[];
//acos_table: read by fix_acos() at entries i and i+1, where i is bits 8..15 of |v|
extern ushort acos_table[];
//isqrt_guess_table: read by fix_isqrt() to seed its iteration
extern fix isqrt_guess_table[];
//negate a quad in place
//the low word is negated first; whenever the negated low word is non-zero
//one extra is subtracted from the negated high word
void fixquadnegate(quad *q)
{
	int borrow;

	q->low = -q->low;
	borrow = (q->low != 0);
	q->high = -q->high - borrow;
}
//multiply two ints & add 64-bit result to 64-bit sum
//The product is formed from the magnitudes of a and b, split into 16-bit
//halves. When the signs differ the sum is negated before and after the
//addition, which amounts to subtracting the magnitude product from it.
void fixmulaccum(quad *q,fix a,fix b)
{
	const int negative = ((a^b) < 0);
	const u_int32_t abs_a = labs(a);
	const u_int32_t abs_b = labs(b);
	const u_int32_t a_hi = abs_a>>16, a_lo = abs_a&0xffff;
	const u_int32_t b_hi = abs_b>>16, b_lo = abs_b&0xffff;
	const u_int32_t cross = a_hi*b_lo + b_hi*a_lo;	//the two middle partial products
	u_int32_t before;

	if (negative)
		fixquadnegate(q);

	//low partial product; a wrapped low word carries into the high word
	before = q->low;
	q->low += a_lo*b_lo;
	if (q->low < before)
		q->high++;

	//lower half of the cross terms, with the same carry check
	before = q->low;
	q->low += (cross<<16);
	if (q->low < before)
		q->high++;

	//high partial product plus the upper half of the cross terms
	q->high += a_hi*b_hi + (cross>>16);

	if (negative)
		fixquadnegate(q);
}
//extract a fix from a quad product
//returns the low 16 bits of q->high followed by the top 16 bits of q->low
fix fixquadadjust(quad *q)
{
	//shift an unsigned copy of the high word: left-shifting a negative
	//signed value is undefined behavior in C
	return (fix)(((u_int32_t)q->high << 16) + (q->low >> 16));
}
//EPSILON is F1_0/100 (F1_0 is not defined in this file); nothing in this part of the file references it
#define EPSILON (F1_0/100)
//QLONG: compiler-specific spelling of the wide integer type (__int64 or
//long long) that fixmul/fixdiv/fixmuldiv use for their intermediate values
#ifdef _MSC_VER
#define QLONG __int64
#else
#define QLONG long long
#endif
#ifdef NO_FIX_INLINE
//multiply two fixes: (a * b) >> 16
//the product is formed in a QLONG so no bits are lost before the shift
fix fixmul(fix a, fix b) {
	QLONG product = (QLONG)a * b;

	return (fix)(product >> 16);
}
//divide two fixes: (a * 65536) / b, computed in a QLONG
//b must be non-zero; dividing by zero is undefined. The quotient is
//truncated to a fix on return.
fix fixdiv(fix a, fix b)
{
	//scale by multiplying rather than shifting: left-shifting a negative
	//signed value is undefined behavior in C
	QLONG scaled = (QLONG)a * 65536;

	return (fix)(scaled / b);
}
//multiply two fixes, then divide by a third: (a * b) / c
//the product is kept in a QLONG so it is not truncated before the divide
//c must be non-zero; dividing by zero is undefined
fix fixmuldiv(fix a, fix b, fix c)
{
	QLONG product = (QLONG)a * b;

	return (fix)(product / c);
}
#endif
//given cos & sin of an angle, return that angle.
//The parms need not be normalized: only their ratio has to match the ratio
//of the true cos & sin, because both are divided by the length of the
//(cos,sin) vector before the table lookup. Returns 0 if both are zero.
//NOTE: this is different from the standard C atan2, since it is left-handed.
fixang fix_atan2(fix cos,fix sin)
{
	const double dcos = (double)cos;
	const double dsin = (double)sin;
	const double len = sqrt((dsin * dsin) + (dcos * dcos));
	fixang angle;

	if (len == 0.0)
		return 0;

	//look up whichever component has the smaller magnitude
	if (labs(sin) >= labs(cos)) {
		//cos is smaller (or equal): use arccos, mirrored for negative sin
		angle = fix_acos((fix)((dcos / len) * 65536.0));
		if (sin < 0)
			angle = -angle;
	}
	else {
		//sin is smaller: use arcsin, reflected about 0x4000 for negative cos
		angle = fix_asin((fix)((dsin / len) * 65536.0));
		if (cos < 0)
			angle = 0x8000 - angle;
	}

	return angle;
}
#ifdef NO_FIX_INLINE
//divide a quad by a fix, returning a fix
//
//nl and nh are the low and high 32 bits of the dividend, d is the divisor.
//The quotient is built one bit per loop pass (32 passes) using only shifts,
//adds and subtracts:
//  Q - sign/carry state of the running partial remainder (starts as the top bit of nh)
//  M - top bit of the divisor, fixed for the whole divide
//  T - the quotient bit produced by the previous step
//Each pass shifts the next dividend bit into nh and then either adds or
//subtracts d, chosen by Q and M.
//NOTE(review): this looks like a signed non-restoring division, with a step
//structure resembling the SuperH DIV0S/DIV1 instruction pair - confirm
//before relying on that description. There is no check for d == 0 or for a
//quotient that does not fit in 32 bits.
int32_t fixdivquadlong(u_int32_t nl,u_int32_t nh,u_int32_t d)
{
int i;
u_int32_t tmp0;
ubyte tmp1;
u_int32_t r;
ubyte T,Q,M;
r = 0;
//initial state taken from the sign bits of dividend and divisor
Q = ((nh&0x80000000)!=0);
M = ((d&0x80000000)!=0);
T = (M!=Q);
//the two branches below are the same loop specialised for M == 0 and M == 1
if (M == 0)
{
for (i=0; i<32; i++ ) {
//append the previous step's bit to the quotient
r <<= 1;
r |= T;
//T now carries the next dividend bit from nl into nh
T = ((nl&0x80000000L)!=0);
nl <<= 1;
switch( Q ) {
case 0:
//remember the bit about to be shifted out of nh
Q = (unsigned char)((0x80000000L & nh) != 0 );
nh = (nh << 1) | (u_int32_t)T;
tmp0 = nh;
nh -= d;
//tmp1 is set when the subtraction wrapped (borrow)
tmp1 = (nh>tmp0);
if (Q == 0)
Q = tmp1;
else
Q = (unsigned char)(tmp1 == 0);
break;
case 1:
Q = (unsigned char)((0x80000000L & nh) != 0 );
nh = (nh << 1) | (u_int32_t)T;
tmp0 = nh;
nh += d;
//tmp1 is set when the addition wrapped (carry)
tmp1 = (nh<tmp0);
if (Q == 0)
Q = tmp1;
else
Q = (unsigned char)(tmp1 == 0);
break;
}
//quotient bit for this step
T = (Q==M);
}
}
else
{
for (i=0; i<32; i++ ) {
r <<= 1;
r |= T;
T = ((nl&0x80000000L)!=0);
nl <<= 1;
switch( Q ) {
case 0:
Q = (unsigned char)((0x80000000L & nh) != 0 );
nh = (nh << 1) | (u_int32_t)T;
tmp0 = nh;
//with M set the add/subtract choice is the reverse of the M == 0 loop
nh += d;
tmp1 = (nh<tmp0);
if (Q == 1)
Q = tmp1;
else
Q = (unsigned char)(tmp1 == 0);
break;
case 1:
Q = (unsigned char)((0x80000000L & nh) != 0 );
nh = (nh << 1) | (u_int32_t)T;
tmp0 = nh;
nh = nh - d;
tmp1 = (nh>tmp0);
if (Q == 1)
Q = tmp1;
else
Q = (unsigned char)(tmp1 == 0);
break;
}
T = (Q==M);
}
}
//append the bit from the last step; 33 bits have been shifted into r in
//total, so the initial T has dropped off the top of the 32-bit result
r = (r << 1) | T;
return r;
}
//"unsigned" quad divide for the portable build: it simply forwards to
//fixdivquadlong() and returns that routine's result converted to unsigned
unsigned int fixdivquadlongu(uint nl, uint nh, uint d)
{
	int32_t quotient = fixdivquadlong((u_int32_t) nl,(u_int32_t) nh,(u_int32_t) d);

	return quotient;
}
#else
//divide the 64-bit value nh:nl by d with the x86 idivl instruction and
//return the quotient (signed divide)
//idivl takes the dividend in edx:eax and leaves the quotient in eax and the
//remainder in edx. It faults if d is zero or the quotient does not fit in
//32 bits.
int32_t fixdivquadlong(u_int32_t nl,u_int32_t nh,u_int32_t d) {
	int32_t quotient;
	u_int32_t rem;	//receives edx; not used

	//edx is overwritten by idivl, so it is declared as an output operand.
	//Listing "ax"/"dx" as clobbers is rejected by GCC because clobbers may
	//not overlap registers already used by input or output operands.
	__asm__("idivl %4"
		:"=a" (quotient), "=d" (rem)
		:"a" (nl), "d" (nh), "r" (d)
		:"cc"
		);
	(void)rem;
	return quotient;
}
//divide the 64-bit value nh:nl by d with the x86 divl instruction and
//return the quotient (unsigned divide)
//divl takes the dividend in edx:eax and leaves the quotient in eax and the
//remainder in edx. It faults if d is zero or the quotient does not fit in
//32 bits.
static inline u_int32_t fixdivquadlongu(u_int32_t nl,u_int32_t nh,u_int32_t d) {
	u_int32_t quotient;
	u_int32_t rem;	//receives edx; not used

	//edx is overwritten by divl, so it is declared as an output operand.
	//Listing "ax"/"dx" as clobbers is rejected by GCC because clobbers may
	//not overlap registers already used by input or output operands.
	__asm__("divl %4"
		:"=a" (quotient), "=d" (rem)
		:"a" (nl), "d" (nh), "r" (d)
		:"cc"
		);
	(void)rem;
	return quotient;
}
#endif
//computes the square root of the quad high:low, returning a 32-bit value
//A negative quad yields 0, and a value that fits in a positive int32_t is
//handed to long_sqrt(). Otherwise the root is refined by repeatedly
//averaging the estimate with (value / estimate).
u_int32_t quad_sqrt(u_int32_t low,int32_t high)
{
	int pass, shift, index;
	u_int32_t root, prev_root, quot;
	quad check;

	if (high<0)
		return 0;

	if (high==0 && (int32_t)low>=0)
		return long_sqrt((int32_t)low);

	//pick the most significant non-zero byte of high as the table index;
	//the shift is half that byte's bit position within high
	if (high & 0xff000000) {
		shift = 12; index = high >> 24;
	} else if (high & 0xff0000) {
		shift = 8; index = high >> 16;
	} else if (high & 0xff00) {
		shift = 4; index = high >> 8;
	} else {
		shift = 0; index = high;
	}
	shift += 16;	//half of the 32 bits contributed by the low word

	root = guess_table[index]<<shift;

	//quad loop usually executed 4 times, so three steps run unchecked
	for (pass = 0; pass < 3; pass++)
		root = (fixdivquadlongu(low,high,root)+root)/2;

	for (;;) {
		prev_root = root;
		quot = fixdivquadlongu(low,high,root);

		if (quot==root)	//got it!
			return root;

		root = (quot+root)/2;

		if (root==quot || root==prev_root)
			break;
	}

	//multiply the root by the matching quotient; if that does not
	//reproduce the input exactly, bump the root by one
	quot = fixdivquadlongu(low,high,root);
	//fixmulaccum() adds into its destination, so it has to start at zero
	check.high = 0;
	check.low = 0;
	fixmulaccum(&check,root,quot);
	if (check.low!=low || check.high!=high)
		root++;

	return root;
}
//computes the square root of a long, returning a short
//returns 0 for a <= 0. If the final estimate does not divide a evenly it is
//bumped by one before being returned.
ushort long_sqrt(int32_t a)
{
	int cnt,r,old_r,t;

	if (a<=0)
		return 0;

	//cnt is half the bit position of the most significant non-zero byte
	//of a, so that sqrt(byte << (2*cnt)) == sqrt(byte) << cnt
	if (a & 0xff000000)
		cnt=12;
	else if (a & 0xff0000)
		cnt=8;
	else if (a & 0xff00)
		cnt=4;
	else
		cnt=0;

	//seed from that most significant byte itself, i.e. a >> (2*cnt), the
	//same way quad_sqrt() indexes the table with high >> 24 for a shift of
	//12. Indexing with a >> cnt picks unrelated middle bits and gives a
	//poor first estimate. The index is never 0 here because the selected
	//byte is non-zero.
	r = guess_table[(a>>(2*cnt))&0xff]<<cnt;

	//the loop nearly always executes 3 times, so we'll unroll it 2 times and
	//not do any checking until after the third time. By my calculations, the
	//loop is executed 2 times in 99.97% of cases, 3 times in 93.65% of cases,
	//four times in 16.18% of cases, and five times in 0.44% of cases. It never
	//executes more than five times. By timing, I determined that it is faster
	//to always execute three times and not check for termination the first two
	//times through. This means that in 93.65% of cases, we save 6 cmp/jcc pairs,
	//and in 6.35% of cases we do an extra divide. In real life, these numbers
	//might not be the same.
	r = ((a/r)+r)/2;
	r = ((a/r)+r)/2;

	do {
		old_r = r;
		t = a/r;

		if (t==r)	//got it!
			return r;

		r = (t+r)/2;
	} while (!(r==t || r==old_r));

	if (a % r)
		r++;

	return r;
}
//computes the square root of a fix, returning a fix
//takes the integer root of the raw value with long_sqrt() and shifts it
//left by 8 bits (half of 16) to rescale it as a fix
fix fix_sqrt(fix a)
{
	fix root = (fix) long_sqrt(a);

	return root << 8;
}
//compute sine and cosine of an angle, filling in the variables
//either of the pointers can be NULL
//with interpolation
//Bits 8..15 of a select the table entry and the low 8 bits interpolate
//linearly toward the next entry. Cosine is read 64 entries after sine.
void fix_sincos(fix a,fix *s,fix *c)
{
	const int i = (a>>8)&0xff;	//table index
	const int f = a&0xff;		//fraction between entries i and i+1

	//the interpolated value is scaled by 4 with a multiply rather than
	//"<<2": left-shifting a negative value is undefined behavior in C
	if (s) {
		const fix ss = sincos_table[i];

		*s = (ss + (((sincos_table[i+1] - ss) * f)>>8)) * 4;
	}

	if (c) {
		const fix cc = sincos_table[i+64];

		*c = (cc + (((sincos_table[i+64+1] - cc) * f)>>8)) * 4;
	}
}
//compute sine and cosine of an angle, filling in the variables
//either of the pointers can be NULL
//no interpolation
//Bits 8..15 of a select the table entry; the low 8 bits are ignored.
//Cosine is read 64 entries after sine.
void fix_fastsincos(fix a,fix *s,fix *c)
{
	const int i = (a>>8)&0xff;

	//scale by 4 with a multiply rather than "<<2": left-shifting a
	//negative table entry is undefined behavior in C
	if (s) *s = sincos_table[i] * 4;
	if (c) *c = sincos_table[i+64] * 4;
}
//compute inverse sine
//Inputs at or beyond +/-f1_0 saturate to +/-0x4000. In between, bits 8..15
//of |v| select the table entry and the low 8 bits interpolate linearly
//toward the next entry; the result takes the sign of v.
fixang fix_asin(fix v)
{
	fix vv;
	int i,f,aa;

	//check for out of range, keeping the sign of v: a negative input must
	//not come back as +0x4000. Testing v directly also avoids taking the
	//absolute value of the most negative fix.
	if (v >= f1_0)
		return 0x4000;
	if (v <= -f1_0)
		return -0x4000;

	vv = (v < 0) ? -v : v;

	i = (vv>>8)&0xff;
	f = vv&0xff;

	aa = asin_table[i];
	aa = aa + (((asin_table[i+1] - aa) * f)>>8);

	if (v < 0)
		aa = -aa;

	return aa;
}
//compute inverse cosine
//Inputs >= f1_0 give 0 and inputs <= -f1_0 give 0x8000. In between, bits
//8..15 of |v| select the table entry and the low 8 bits interpolate
//linearly toward the next entry; a negative v is reflected as 0x8000 - angle.
fixang fix_acos(fix v)
{
	fix vv;
	int i,f,aa;

	//check for out of range, keeping the sign of v: a negative input must
	//end up at 0x8000, matching the reflection applied below. Testing v
	//directly also avoids taking the absolute value of the most negative fix.
	if (v >= f1_0)
		return 0;
	if (v <= -f1_0)
		return 0x8000;

	vv = (v < 0) ? -v : v;

	i = (vv>>8)&0xff;
	f = vv&0xff;

	aa = acos_table[i];
	aa = aa + (((acos_table[i+1] - aa) * f)>>8);

	if (v < 0)
		aa = 0x8000 - aa;

	return aa;
}
#define TABLE_SIZE 1024
//for passed value a, returns 1/sqrt(a)
//returns 0 when a is zero or negative
//a is halved until it is below TABLE_SIZE to pick a starting guess from
//isqrt_guess_table, which is then refined by up to three steps of
//r = r * (3 - a*r*r) / 2
fix fix_isqrt( fix a )
{
	int i, b = a;
	int cnt = 0;
	int r;

	//zero has no reciprocal root, and a negative value would be used
	//unchanged as a negative index into isqrt_guess_table below
	if ( a <= 0 ) return 0;

	while( b >= TABLE_SIZE ) {
		b >>= 1;
		cnt++;
	}

	//each halving pair of a scales 1/sqrt(a) by two, hence (cnt+1)/2
	r = isqrt_guess_table[b] >> ((cnt+1)/2);

	for (i=0; i<3; i++ ) {
		int old_r = r;
		r = fixmul( ( (3*65536) - fixmul(fixmul(r,r),a) ), r) / 2;
		//stop once the estimate no longer grows; return the midpoint
		if ( old_r >= r ) return (r+old_r)/2;
	}

	return r;
}
#endif // NO_ASM