|
|
/***
*tenpow.c - multiply a _LDBL12 by a power of 10 * * Copyright (c) 1991-2001, Microsoft Corporation. All rights reserved. * *Purpose: * *Revision History: * 07-17-91 GDP Initial version (ported from assembly) * 11-15-93 GJF Merged in NT SDK verions. Replaced MIPS and _ALPHA_ * by _M_MRX000 and _M_ALPHA (resp.). * 10-02-94 BWT PPC changes * 07-15-96 GJF Added parantheses to fix precedence problem in expr. * Also, detab-ed. * 05-05-99 RDL Added _M_IA64 to #if def's for alignment. * 07-15-01 PML Remove all ALPHA, MIPS, and PPC code * *******************************************************************************/
#include <cv.h>
extern _LDBL12 _pow10pos[]; extern _LDBL12 _pow10neg[];
/***
*void _CALLTYPE5 __ld12mul(_LDBL12 *px, _LDBL12 *py) - * _LDBL12 multiplication * *Purpose: multiply two _LDBL12 numbers * *Entry: px,py: pointers to the _LDBL12 operands * *Exit: *px contains the product * *Exceptions: * *******************************************************************************/
void _CALLTYPE5 __ld12mul(_LDBL12 *px, _LDBL12 *py) { u_short sign = 0; _LDBL12 tempman; /*this is actually a 12-byte mantissa,
not a 12-byte long double */ int i; u_short expx, expy, expsum; int roffs,poffs,qoffs; int sticky = 0;
*UL_LO_12(&tempman) = 0; *UL_MED_12(&tempman) = 0; *UL_HI_12(&tempman) = 0;
expx = *U_EXP_12(px); expy = *U_EXP_12(py);
sign = (expx ^ expy) & (u_short)0x8000; expx &= 0x7fff; expy &= 0x7fff; expsum = expx+expy; if (expx >= LD_MAXEXP || expy >= LD_MAXEXP || expsum > LD_MAXEXP+ LD_BIASM1){ /* overflow to infinity */ PUT_INF_12(px,sign); return; } if (expsum <= LD_BIASM1-63) { /* underflow to zero */ PUT_ZERO_12(px); return; } if (expx == 0) { /*
* If this is a denormal temp real then the mantissa * was shifted right once to set bit 63 to zero. */ expsum++; /* Correct for this */ if (ISZERO_12(px)) { /* put positive sign */ *U_EXP_12(px) = 0; return; } } if (expy == 0) { expsum++; /* because arg2 is denormal */ if (ISZERO_12(py)) { PUT_ZERO_12(px); return; } }
roffs = 0; for (i=0;i<5;i++) { int j; poffs = i<<1; qoffs = 8; for (j=5-i;j>0;j--) { u_long prod; #if defined(_M_IA64) || defined(_M_AMD64)
/* a variable to hold temprary sums */ u_long sum; #endif
int carry; u_short *p, *q; u_long *r; p = USHORT_12(px,poffs); q = USHORT_12(py,qoffs); r = ULONG_12(&tempman,roffs); prod = (u_long)*p * (u_long)*q; #if defined(_M_IA64) || defined(_M_AMD64)
/* handle misalignment problems */ if (i&0x1){ /* i is odd */ carry = __addl(*ALIGN(r), prod, &sum); *ALIGN(r) = sum; } else /* i is even */ carry = __addl(*r, prod, r); #else
carry = __addl(*r,prod,r); #endif
if (carry) { /* roffs should be less than 8 in this case */ (*USHORT_12(&tempman,roffs+4))++; } poffs+=2; qoffs-=2; } roffs+=2; }
expsum -= LD_BIASM1;
/* normalize */ while ((s_short)expsum > 0 && ((*UL_HI_12(&tempman) & MSB_ULONG) == 0)) { __shl_12(&tempman); expsum--; }
if ((s_short)expsum <= 0) { expsum--; while ((s_short)expsum < 0) { if (*U_XT_12(&tempman) & 0x1) sticky++; __shr_12(&tempman); expsum++; } if (sticky) *U_XT_12(&tempman) |= 0x1; }
if (*U_XT_12(&tempman) > 0x8000 || ((*UL_LO_12(&tempman) & 0x1ffff) == 0x18000)) { /* round up */ if (*UL_MANLO_12(&tempman) == MAX_ULONG) { *UL_MANLO_12(&tempman) = 0; if (*UL_MANHI_12(&tempman) == MAX_ULONG) { *UL_MANHI_12(&tempman) = 0; if (*U_EXP_12(&tempman) == MAX_USHORT) { /* 12-byte mantissa overflow */ *U_EXP_12(&tempman) = MSB_USHORT; expsum++; } else (*U_EXP_12(&tempman))++; } else (*UL_MANHI_12(&tempman))++; } else (*UL_MANLO_12(&tempman))++; }
/* check for exponent overflow */ if (expsum >= 0x7fff){ PUT_INF_12(px, sign); return; }
/* put result in px */ *U_XT_12(px) = *USHORT_12(&tempman,2); *UL_MANLO_12(px) = *UL_MED_12(&tempman); *UL_MANHI_12(px) = *UL_HI_12(&tempman); *U_EXP_12(px) = expsum | sign; }
void _CALLTYPE5 __multtenpow12(_LDBL12 *pld12, int pow, unsigned mult12) { _LDBL12 *pow_10p = _pow10pos-8; if (pow == 0) return; if (pow < 0) { pow = -pow; pow_10p = _pow10neg-8; }
if (!mult12) *U_XT_12(pld12) = 0;
while (pow) { int last3; /* the 3 LSBits of pow */ _LDBL12 unround; _LDBL12 *py;
pow_10p += 7; last3 = pow & 0x7; pow >>= 3; if (last3 == 0) continue; py = pow_10p + last3;
#ifdef _LDSUPPORT
if (mult12) { #endif
/* do an exact 12byte multiplication */ if (*U_XT_12(py) >= 0x8000) { /* copy number */ unround = *py; /* unround adjacent byte */ (*UL_MANLO_12(&unround))--; /* point to new operand */ py = &unround; } __ld12mul(pld12,py); #ifdef _LDSUPPORT
} else { /* do a 10byte multiplication */ py = (_LDBL12 *)TEN_BYTE_PART(py); *(long double *)TEN_BYTE_PART(pld12) *= *(long double *)py; } #endif
} }
|