mirror of https://github.com/yasm/yasm.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
716 lines
21 KiB
716 lines
21 KiB
/* |
|
* Floating point number functions. |
|
* |
|
* Copyright (C) 2001 Peter Johnson |
|
* |
|
* Based on public-domain x86 assembly code by Randall Hyde (8/28/91). |
|
* |
|
* This file is part of YASM. |
|
* |
|
* YASM is free software; you can redistribute it and/or modify |
|
* it under the terms of the GNU General Public License as published by |
|
* the Free Software Foundation; either version 2 of the License, or |
|
* (at your option) any later version. |
|
* |
|
* YASM is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|
* GNU General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU General Public License |
|
* along with this program; if not, write to the Free Software |
|
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
|
*/ |
|
#include "util.h" |
|
/*@unused@*/ RCSID("$IdPath$"); |
|
|
|
#include <ctype.h> |
|
|
|
#include "bitvect.h" |
|
#include "file.h" |
|
|
|
#include "errwarn.h" |
|
#include "floatnum.h" |
|
|
|
|
|
/* 97-bit internal floating point format: |
|
* 0000000s eeeeeeee eeeeeeee m.....................................m |
|
* Sign exponent mantissa (80 bits) |
|
* 79 0 |
|
* |
|
* Only L.O. bit of Sign byte is significant. The rest is zero. |
|
* Exponent is bias 32767. |
|
* Mantissa does NOT have an implied one bit (it's explicit). |
|
*/ |
|
struct floatnum { |
|
/*@only@*/ wordptr mantissa; /* Allocated to MANT_BITS bits */ |
|
unsigned short exponent; |
|
unsigned char sign; |
|
unsigned char flags; |
|
}; |
|
|
|
/* constants describing parameters of internal floating point format */ |
|
#define MANT_BITS 80 |
|
#define MANT_BYTES 10 |
|
#define MANT_SIGDIGITS 24 |
|
#define EXP_BIAS 0x7FFF |
|
#define EXP_INF 0xFFFF |
|
#define EXP_MAX 0xFFFE |
|
#define EXP_MIN 1 |
|
#define EXP_ZERO 0 |
|
|
|
/* Flag settings for flags field */ |
|
#define FLAG_ISZERO 1<<0 |
|
|
|
/* Note this structure integrates the floatnum structure */ |
|
typedef struct POT_Entry_s { |
|
floatnum f; |
|
int dec_exponent; |
|
} POT_Entry; |
|
|
|
/* "Source" for POT_Entry. */ |
|
typedef struct POT_Entry_Source_s { |
|
unsigned char mantissa[MANT_BYTES]; /* little endian mantissa */ |
|
unsigned short exponent; /* Bias 32767 exponent */ |
|
} POT_Entry_Source; |
|
|
|
/* Power of ten tables used by the floating point I/O routines. |
|
* The POT_Table? arrays are built from the POT_Table?_Source arrays at |
|
* runtime by POT_Table_Init(). |
|
*/ |
|
|
|
/* This table contains the powers of ten raised to negative powers of two: |
|
* |
|
* entry[12-n] = 10 ** (-2 ** n) for 0 <= n <= 12. |
|
* entry[13] = 1.0 |
|
*/ |
|
/*@-nullassign@*/ |
|
static /*@only@*/ POT_Entry *POT_TableN = (POT_Entry *)NULL; |
|
/*@=nullassign@*/ |
|
static POT_Entry_Source POT_TableN_Source[] = { |
|
{{0xe3,0x2d,0xde,0x9f,0xce,0xd2,0xc8,0x04,0xdd,0xa6},0x4ad8}, /* 1e-4096 */ |
|
{{0x25,0x49,0xe4,0x2d,0x36,0x34,0x4f,0x53,0xae,0xce},0x656b}, /* 1e-2048 */ |
|
{{0xa6,0x87,0xbd,0xc0,0x57,0xda,0xa5,0x82,0xa6,0xa2},0x72b5}, /* 1e-1024 */ |
|
{{0x33,0x71,0x1c,0xd2,0x23,0xdb,0x32,0xee,0x49,0x90},0x795a}, /* 1e-512 */ |
|
{{0x91,0xfa,0x39,0x19,0x7a,0x63,0x25,0x43,0x31,0xc0},0x7cac}, /* 1e-256 */ |
|
{{0x7d,0xac,0xa0,0xe4,0xbc,0x64,0x7c,0x46,0xd0,0xdd},0x7e55}, /* 1e-128 */ |
|
{{0x24,0x3f,0xa5,0xe9,0x39,0xa5,0x27,0xea,0x7f,0xa8},0x7f2a}, /* 1e-64 */ |
|
{{0xde,0x67,0xba,0x94,0x39,0x45,0xad,0x1e,0xb1,0xcf},0x7f94}, /* 1e-32 */ |
|
{{0x2f,0x4c,0x5b,0xe1,0x4d,0xc4,0xbe,0x94,0x95,0xe6},0x7fc9}, /* 1e-16 */ |
|
{{0xc2,0xfd,0xfc,0xce,0x61,0x84,0x11,0x77,0xcc,0xab},0x7fe4}, /* 1e-8 */ |
|
{{0xc3,0xd3,0x2b,0x65,0x19,0xe2,0x58,0x17,0xb7,0xd1},0x7ff1}, /* 1e-4 */ |
|
{{0x71,0x3d,0x0a,0xd7,0xa3,0x70,0x3d,0x0a,0xd7,0xa3},0x7ff8}, /* 1e-2 */ |
|
{{0xcd,0xcc,0xcc,0xcc,0xcc,0xcc,0xcc,0xcc,0xcc,0xcc},0x7ffb}, /* 1e-1 */ |
|
{{0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x80},0x7fff}, /* 1e-0 */ |
|
}; |
|
|
|
/* This table contains the powers of ten raised to positive powers of two: |
|
* |
|
* entry[12-n] = 10 ** (2 ** n) for 0 <= n <= 12. |
|
* entry[13] = 1.0 |
|
* entry[-1] = entry[0]; |
|
* |
|
* There is a -1 entry since it is possible for the algorithm to back up |
|
* before the table. This -1 entry is created at runtime by duplicating the |
|
* 0 entry. |
|
*/ |
|
static /*@only@*/ POT_Entry *POT_TableP; |
|
static POT_Entry_Source POT_TableP_Source[] = { |
|
{{0x4c,0xc9,0x9a,0x97,0x20,0x8a,0x02,0x52,0x60,0xc4},0xb525}, /* 1e+4096 */ |
|
{{0x4d,0xa7,0xe4,0x5d,0x3d,0xc5,0x5d,0x3b,0x8b,0x9e},0x9a92}, /* 1e+2048 */ |
|
{{0x0d,0x65,0x17,0x0c,0x75,0x81,0x86,0x75,0x76,0xc9},0x8d48}, /* 1e+1024 */ |
|
{{0x65,0xcc,0xc6,0x91,0x0e,0xa6,0xae,0xa0,0x19,0xe3},0x86a3}, /* 1e+512 */ |
|
{{0xbc,0xdd,0x8d,0xde,0xf9,0x9d,0xfb,0xeb,0x7e,0xaa},0x8351}, /* 1e+256 */ |
|
{{0x6f,0xc6,0xdf,0x8c,0xe9,0x80,0xc9,0x47,0xba,0x93},0x81a8}, /* 1e+128 */ |
|
{{0xbf,0x3c,0xd5,0xa6,0xcf,0xff,0x49,0x1f,0x78,0xc2},0x80d3}, /* 1e+64 */ |
|
{{0x20,0xf0,0x9d,0xb5,0x70,0x2b,0xa8,0xad,0xc5,0x9d},0x8069}, /* 1e+32 */ |
|
{{0x00,0x00,0x00,0x00,0x00,0x04,0xbf,0xc9,0x1b,0x8e},0x8034}, /* 1e+16 */ |
|
{{0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x20,0xbc,0xbe},0x8019}, /* 1e+8 */ |
|
{{0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x40,0x9c},0x800c}, /* 1e+4 */ |
|
{{0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0xc8},0x8005}, /* 1e+2 */ |
|
{{0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0xa0},0x8002}, /* 1e+1 */ |
|
{{0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x80},0x7fff}, /* 1e+0 */ |
|
}; |
|
|
|
static void |
|
POT_Table_Init_Entry(/*@out@*/ POT_Entry *e, POT_Entry_Source *s, int dec_exp) |
|
{ |
|
/* Save decimal exponent */ |
|
e->dec_exponent = dec_exp; |
|
|
|
/* Initialize mantissa */ |
|
e->f.mantissa = BitVector_Create(MANT_BITS, FALSE); |
|
BitVector_Block_Store(e->f.mantissa, s->mantissa, MANT_BYTES); |
|
|
|
/* Initialize exponent */ |
|
e->f.exponent = s->exponent; |
|
|
|
/* Set sign to 0 (positive) */ |
|
e->f.sign = 0; |
|
|
|
/* Clear flags */ |
|
e->f.flags = 0; |
|
} |
|
|
|
/*@-compdef@*/ |
|
static void |
|
POT_Table_Init(void) |
|
/*@globals undef POT_TableN, undef POT_TableP @*/ |
|
{ |
|
int dec_exp = 1; |
|
int i; |
|
|
|
/* Allocate space for two POT tables */ |
|
POT_TableN = xmalloc(14*sizeof(POT_Entry)); |
|
POT_TableP = xmalloc(15*sizeof(POT_Entry)); /* note 1 extra for -1 */ |
|
|
|
/* Initialize entry[0..12] */ |
|
for (i=12; i>=0; i--) { |
|
POT_Table_Init_Entry(&POT_TableN[i], &POT_TableN_Source[i], 0-dec_exp); |
|
POT_Table_Init_Entry(&POT_TableP[i+1], &POT_TableP_Source[i], dec_exp); |
|
dec_exp *= 2; /* Update decimal exponent */ |
|
} |
|
|
|
/* Initialize entry[13] */ |
|
POT_Table_Init_Entry(&POT_TableN[13], &POT_TableN_Source[13], 0); |
|
POT_Table_Init_Entry(&POT_TableP[14], &POT_TableP_Source[13], 0); |
|
|
|
/* Initialize entry[-1] for POT_TableP */ |
|
POT_Table_Init_Entry(&POT_TableP[0], &POT_TableP_Source[0], 4096); |
|
|
|
/* Offset POT_TableP so that [0] becomes [-1] */ |
|
POT_TableP++; |
|
} |
|
/*@=compdef@*/ |
|
|
|
/*@-globstate@*/ |
|
void |
|
floatnum_shutdown(void) |
|
{ |
|
int i; |
|
|
|
if (!POT_TableN) |
|
return; |
|
|
|
/* Un-offset POT_TableP */ |
|
POT_TableP--; |
|
|
|
for (i=0; i<14; i++) { |
|
BitVector_Destroy(POT_TableN[i].f.mantissa); |
|
BitVector_Destroy(POT_TableP[i].f.mantissa); |
|
} |
|
BitVector_Destroy(POT_TableP[14].f.mantissa); |
|
|
|
xfree(POT_TableN); |
|
xfree(POT_TableP); |
|
} |
|
/*@=globstate@*/ |
|
|
|
static void |
|
floatnum_normalize(floatnum *flt) |
|
{ |
|
long norm_amt; |
|
|
|
if (BitVector_is_empty(flt->mantissa)) { |
|
flt->exponent = 0; |
|
return; |
|
} |
|
|
|
/* Look for the highest set bit, shift to make it the MSB, and adjust |
|
* exponent. Don't let exponent go negative. */ |
|
norm_amt = (MANT_BITS-1)-Set_Max(flt->mantissa); |
|
if (norm_amt > (long)flt->exponent) |
|
norm_amt = (long)flt->exponent; |
|
BitVector_Move_Left(flt->mantissa, (N_int)norm_amt); |
|
flt->exponent -= norm_amt; |
|
} |
|
|
|
/* acc *= op */ |
|
static void |
|
floatnum_mul(floatnum *acc, const floatnum *op) |
|
{ |
|
long exp; |
|
wordptr product, op1, op2; |
|
long norm_amt; |
|
|
|
/* Compute the new sign */ |
|
acc->sign ^= op->sign; |
|
|
|
/* Check for multiply by 0 */ |
|
if (BitVector_is_empty(acc->mantissa) || BitVector_is_empty(op->mantissa)) { |
|
BitVector_Empty(acc->mantissa); |
|
acc->exponent = EXP_ZERO; |
|
return; |
|
} |
|
|
|
/* Add exponents, checking for overflow/underflow. */ |
|
exp = (((int)acc->exponent)-EXP_BIAS) + (((int)op->exponent)-EXP_BIAS); |
|
exp += EXP_BIAS; |
|
if (exp > EXP_MAX) { |
|
/* Overflow; return infinity. */ |
|
BitVector_Empty(acc->mantissa); |
|
acc->exponent = EXP_INF; |
|
return; |
|
} else if (exp < EXP_MIN) { |
|
/* Underflow; return zero. */ |
|
BitVector_Empty(acc->mantissa); |
|
acc->exponent = EXP_ZERO; |
|
return; |
|
} |
|
|
|
/* Add one to the final exponent, as the multiply shifts one extra time. */ |
|
acc->exponent = (unsigned short)(exp+1); |
|
|
|
/* Allocate space for the multiply result */ |
|
product = BitVector_Create((N_int)((MANT_BITS+1)*2), FALSE); |
|
|
|
/* Allocate 1-bit-longer fields to force the operands to be unsigned */ |
|
op1 = BitVector_Create((N_int)(MANT_BITS+1), FALSE); |
|
op2 = BitVector_Create((N_int)(MANT_BITS+1), FALSE); |
|
|
|
/* Make the operands unsigned after copying from original operands */ |
|
BitVector_Copy(op1, acc->mantissa); |
|
BitVector_MSB(op1, 0); |
|
BitVector_Copy(op2, op->mantissa); |
|
BitVector_MSB(op2, 0); |
|
|
|
/* Compute the product of the mantissas */ |
|
BitVector_Multiply(product, op1, op2); |
|
|
|
/* Normalize the product. Note: we know the product is non-zero because |
|
* both of the original operands were non-zero. |
|
* |
|
* Look for the highest set bit, shift to make it the MSB, and adjust |
|
* exponent. Don't let exponent go negative. |
|
*/ |
|
norm_amt = (MANT_BITS*2-1)-Set_Max(product); |
|
if (norm_amt > (long)acc->exponent) |
|
norm_amt = (long)acc->exponent; |
|
BitVector_Move_Left(product, (N_int)norm_amt); |
|
acc->exponent -= norm_amt; |
|
|
|
/* Store the highest bits of the result */ |
|
BitVector_Interval_Copy(acc->mantissa, product, 0, MANT_BITS, MANT_BITS); |
|
|
|
/* Free allocated variables */ |
|
BitVector_Destroy(product); |
|
BitVector_Destroy(op1); |
|
BitVector_Destroy(op2); |
|
} |
|
|
|
floatnum * |
|
floatnum_new(const char *str) |
|
{ |
|
floatnum *flt; |
|
int dec_exponent, dec_exp_add; /* decimal (powers of 10) exponent */ |
|
int POT_index; |
|
wordptr operand[2]; |
|
int sig_digits; |
|
int decimal_pt; |
|
boolean carry; |
|
|
|
/* Initialize POT tables if necessary */ |
|
if (!POT_TableN) |
|
POT_Table_Init(); |
|
|
|
flt = xmalloc(sizeof(floatnum)); |
|
|
|
flt->mantissa = BitVector_Create(MANT_BITS, TRUE); |
|
|
|
/* allocate and initialize calculation variables */ |
|
operand[0] = BitVector_Create(MANT_BITS, TRUE); |
|
operand[1] = BitVector_Create(MANT_BITS, TRUE); |
|
dec_exponent = 0; |
|
sig_digits = 0; |
|
decimal_pt = 1; |
|
|
|
/* set initial flags to 0 */ |
|
flt->flags = 0; |
|
|
|
/* check for + or - character and skip */ |
|
if (*str == '-') { |
|
flt->sign = 1; |
|
str++; |
|
} else if (*str == '+') { |
|
flt->sign = 0; |
|
str++; |
|
} else |
|
flt->sign = 0; |
|
|
|
/* eliminate any leading zeros (which do not count as significant digits) */ |
|
while (*str == '0') |
|
str++; |
|
|
|
/* When we reach the end of the leading zeros, first check for a decimal |
|
* point. If the number is of the form "0---0.0000" we need to get rid |
|
* of the zeros after the decimal point and not count them as significant |
|
* digits. |
|
*/ |
|
if (*str == '.') { |
|
str++; |
|
while (*str == '0') { |
|
str++; |
|
dec_exponent--; |
|
} |
|
} else { |
|
/* The number is of the form "yyy.xxxx" (where y <> 0). */ |
|
while (isdigit(*str)) { |
|
/* See if we've processed more than the max significant digits: */ |
|
if (sig_digits < MANT_SIGDIGITS) { |
|
/* Multiply mantissa by 10 [x = (x<<1)+(x<<3)] */ |
|
BitVector_shift_left(flt->mantissa, 0); |
|
BitVector_Copy(operand[0], flt->mantissa); |
|
BitVector_Move_Left(flt->mantissa, 2); |
|
carry = 0; |
|
BitVector_add(operand[1], operand[0], flt->mantissa, &carry); |
|
|
|
/* Add in current digit */ |
|
BitVector_Empty(operand[0]); |
|
BitVector_Chunk_Store(operand[0], 4, 0, (N_long)(*str-'0')); |
|
carry = 0; |
|
BitVector_add(flt->mantissa, operand[1], operand[0], &carry); |
|
} else { |
|
/* Can't integrate more digits with mantissa, so instead just |
|
* raise by a power of ten. |
|
*/ |
|
dec_exponent++; |
|
} |
|
sig_digits++; |
|
str++; |
|
} |
|
|
|
if (*str == '.') |
|
str++; |
|
else |
|
decimal_pt = 0; |
|
} |
|
|
|
if (decimal_pt) { |
|
/* Process the digits to the right of the decimal point. */ |
|
while (isdigit(*str)) { |
|
/* See if we've processed more than 19 significant digits: */ |
|
if (sig_digits < 19) { |
|
/* Raise by a power of ten */ |
|
dec_exponent--; |
|
|
|
/* Multiply mantissa by 10 [x = (x<<1)+(x<<3)] */ |
|
BitVector_shift_left(flt->mantissa, 0); |
|
BitVector_Copy(operand[0], flt->mantissa); |
|
BitVector_Move_Left(flt->mantissa, 2); |
|
carry = 0; |
|
BitVector_add(operand[1], operand[0], flt->mantissa, &carry); |
|
|
|
/* Add in current digit */ |
|
BitVector_Empty(operand[0]); |
|
BitVector_Chunk_Store(operand[0], 4, 0, (N_long)(*str-'0')); |
|
carry = 0; |
|
BitVector_add(flt->mantissa, operand[1], operand[0], &carry); |
|
} |
|
sig_digits++; |
|
str++; |
|
} |
|
} |
|
|
|
if (*str == 'e' || *str == 'E') { |
|
str++; |
|
/* We just saw the "E" character, now read in the exponent value and |
|
* add it into dec_exponent. |
|
*/ |
|
dec_exp_add = 0; |
|
sscanf(str, "%d", &dec_exp_add); |
|
dec_exponent += dec_exp_add; |
|
} |
|
|
|
/* Free calculation variables. */ |
|
BitVector_Destroy(operand[1]); |
|
BitVector_Destroy(operand[0]); |
|
|
|
/* Normalize the number, checking for 0 first. */ |
|
if (BitVector_is_empty(flt->mantissa)) { |
|
/* Mantissa is 0, zero exponent too. */ |
|
flt->exponent = 0; |
|
/* Set zero flag so output functions don't see 0 value as underflow. */ |
|
flt->flags |= FLAG_ISZERO; |
|
/* Return 0 value. */ |
|
return flt; |
|
} |
|
/* Exponent if already norm. */ |
|
flt->exponent = (unsigned short)(0x7FFF+(MANT_BITS-1)); |
|
floatnum_normalize(flt); |
|
|
|
/* The number is normalized. Now multiply by 10 the number of times |
|
* specified in DecExponent. This uses the power of ten tables to speed |
|
* up this operation (and make it more accurate). |
|
*/ |
|
if (dec_exponent > 0) { |
|
POT_index = 0; |
|
/* Until we hit 1.0 or finish exponent or overflow */ |
|
while ((POT_index < 14) && (dec_exponent != 0) && |
|
(flt->exponent != EXP_INF)) { |
|
/* Find the first power of ten in the table which is just less than |
|
* the exponent. |
|
*/ |
|
while (dec_exponent < POT_TableP[POT_index].dec_exponent) |
|
POT_index++; |
|
|
|
if (POT_index < 14) { |
|
/* Subtract out what we're multiplying in from exponent */ |
|
dec_exponent -= POT_TableP[POT_index].dec_exponent; |
|
|
|
/* Multiply by current power of 10 */ |
|
floatnum_mul(flt, &POT_TableP[POT_index].f); |
|
} |
|
} |
|
} else if (dec_exponent < 0) { |
|
POT_index = 0; |
|
/* Until we hit 1.0 or finish exponent or underflow */ |
|
while ((POT_index < 14) && (dec_exponent != 0) && |
|
(flt->exponent != EXP_ZERO)) { |
|
/* Find the first power of ten in the table which is just less than |
|
* the exponent. |
|
*/ |
|
while (dec_exponent > POT_TableN[POT_index].dec_exponent) |
|
POT_index++; |
|
|
|
if (POT_index < 14) { |
|
/* Subtract out what we're multiplying in from exponent */ |
|
dec_exponent -= POT_TableN[POT_index].dec_exponent; |
|
|
|
/* Multiply by current power of 10 */ |
|
floatnum_mul(flt, &POT_TableN[POT_index].f); |
|
} |
|
} |
|
} |
|
|
|
/* Round the result. (Don't round underflow or overflow). */ |
|
if ((flt->exponent != EXP_INF) && (flt->exponent != EXP_ZERO)) |
|
BitVector_increment(flt->mantissa); |
|
|
|
return flt; |
|
} |
|
|
|
floatnum * |
|
floatnum_copy(const floatnum *flt) |
|
{ |
|
floatnum *f = xmalloc(sizeof(floatnum)); |
|
|
|
f->mantissa = BitVector_Clone(flt->mantissa); |
|
f->exponent = flt->exponent; |
|
f->sign = flt->sign; |
|
f->flags = flt->flags; |
|
|
|
return f; |
|
} |
|
|
|
void |
|
floatnum_delete(floatnum *flt) |
|
{ |
|
BitVector_Destroy(flt->mantissa); |
|
xfree(flt); |
|
} |
|
|
|
void |
|
floatnum_calc(floatnum *acc, ExprOp op, /*@unused@*/ floatnum *operand) |
|
{ |
|
if (op != EXPR_NEG) |
|
Error(_("Unsupported floating-point arithmetic operation")); |
|
else |
|
acc->sign ^= 1; |
|
} |
|
|
|
int |
|
floatnum_get_int(const floatnum *flt, unsigned long *ret_val) |
|
{ |
|
unsigned char t[4]; |
|
|
|
if (floatnum_get_sized(flt, t, 4)) |
|
return 1; |
|
|
|
LOAD_LONG(*ret_val, &t[0]); |
|
return 0; |
|
} |
|
|
|
/* Function used by conversion routines to actually perform the conversion. |
|
* |
|
* ptr -> the array to return the little-endian floating point value into. |
|
* flt -> the floating point value to convert. |
|
* byte_size -> the size in bytes of the output format. |
|
* mant_bits -> the size in bits of the output mantissa. |
|
* implicit1 -> does the output format have an implicit 1? 1=yes, 0=no. |
|
* exp_bits -> the size in bits of the output exponent. |
|
* |
|
* Returns 0 on success, 1 if overflow, -1 if underflow. |
|
*/ |
|
static int |
|
floatnum_get_common(const floatnum *flt, /*@out@*/ unsigned char *ptr, |
|
N_int byte_size, N_int mant_bits, int implicit1, |
|
N_int exp_bits) |
|
{ |
|
long exponent = (long)flt->exponent; |
|
wordptr output; |
|
charptr buf; |
|
unsigned int len; |
|
unsigned int overflow = 0, underflow = 0; |
|
int retval = 0; |
|
long exp_bias = (1<<(exp_bits-1))-1; |
|
long exp_inf = (1<<exp_bits)-1; |
|
|
|
output = BitVector_Create(byte_size*8, TRUE); |
|
|
|
/* copy mantissa */ |
|
BitVector_Interval_Copy(output, flt->mantissa, 0, |
|
(N_int)((MANT_BITS-implicit1)-mant_bits), |
|
mant_bits); |
|
|
|
/* round mantissa */ |
|
if (BitVector_bit_test(flt->mantissa, (MANT_BITS-implicit1)-(mant_bits+1))) |
|
BitVector_increment(output); |
|
|
|
if (BitVector_bit_test(output, mant_bits)) { |
|
/* overflowed, so zero mantissa (and set explicit bit if necessary) */ |
|
BitVector_Empty(output); |
|
BitVector_Bit_Copy(output, mant_bits-1, !implicit1); |
|
/* and up the exponent (checking for overflow) */ |
|
if (exponent+1 >= EXP_INF) |
|
overflow = 1; |
|
else |
|
exponent++; |
|
} |
|
|
|
/* adjust the exponent to the output bias, checking for overflow */ |
|
exponent -= EXP_BIAS-exp_bias; |
|
if (exponent >= exp_inf) |
|
overflow = 1; |
|
else if (exponent <= 0) |
|
underflow = 1; |
|
|
|
/* underflow and overflow both set!? */ |
|
if (underflow && overflow) |
|
InternalError(_("Both underflow and overflow set")); |
|
|
|
/* check for underflow or overflow and set up appropriate output */ |
|
if (underflow) { |
|
BitVector_Empty(output); |
|
exponent = 0; |
|
if (!(flt->flags & FLAG_ISZERO)) |
|
retval = -1; |
|
} else if (overflow) { |
|
BitVector_Empty(output); |
|
exponent = exp_inf; |
|
retval = 1; |
|
} |
|
|
|
/* move exponent into place */ |
|
BitVector_Chunk_Store(output, exp_bits, mant_bits, (N_long)exponent); |
|
|
|
/* merge in sign bit */ |
|
BitVector_Bit_Copy(output, byte_size*8-1, flt->sign); |
|
|
|
/* get little-endian bytes */ |
|
buf = BitVector_Block_Read(output, &len); |
|
if (len < byte_size) |
|
InternalError(_("Byte length of BitVector does not match bit length")); |
|
|
|
/* copy to output */ |
|
memcpy(ptr, buf, byte_size*sizeof(unsigned char)); |
|
|
|
/* free allocated resources */ |
|
xfree(buf); |
|
|
|
BitVector_Destroy(output); |
|
|
|
return retval; |
|
} |
|
|
|
/* IEEE-754 (Intel) "single precision" format: |
|
* 32 bits: |
|
* Bit 31 Bit 22 Bit 0 |
|
* | | | |
|
* seeeeeee emmmmmmm mmmmmmmm mmmmmmmm |
|
* |
|
* e = bias 127 exponent |
|
* s = sign bit |
|
* m = mantissa bits, bit 23 is an implied one bit. |
|
* |
|
* IEEE-754 (Intel) "double precision" format: |
|
* 64 bits: |
|
* bit 63 bit 51 bit 0 |
|
* | | | |
|
* seeeeeee eeeemmmm mmmmmmmm mmmmmmmm mmmmmmmm mmmmmmmm mmmmmmmm mmmmmmmm |
|
* |
|
* e = bias 1023 exponent. |
|
* s = sign bit. |
|
* m = mantissa bits. Bit 52 is an implied one bit. |
|
* |
|
* IEEE-754 (Intel) "extended precision" format: |
|
* 80 bits: |
|
* bit 79 bit 63 bit 0 |
|
* | | | |
|
* seeeeeee eeeeeeee mmmmmmmm m...m m...m m...m m...m m...m |
|
* |
|
* e = bias 16383 exponent |
|
* m = 64 bit mantissa with NO implied bit! |
|
* s = sign (for mantissa) |
|
*/ |
|
int |
|
floatnum_get_sized(const floatnum *flt, unsigned char *ptr, size_t size) |
|
{ |
|
switch (size) { |
|
case 4: |
|
return floatnum_get_common(flt, ptr, 4, 23, 1, 8); |
|
case 8: |
|
return floatnum_get_common(flt, ptr, 8, 52, 1, 11); |
|
case 10: |
|
return floatnum_get_common(flt, ptr, 10, 64, 0, 15); |
|
default: |
|
InternalError(_("Invalid float conversion size")); |
|
/*@notreached@*/ |
|
return 1; /* never reached, but silence GCC warning */ |
|
} |
|
} |
|
|
|
/* 1 if the size is valid, 0 if it isn't */ |
|
int |
|
floatnum_check_size(/*@unused@*/ const floatnum *flt, size_t size) |
|
{ |
|
switch (size) { |
|
case 4: |
|
case 8: |
|
case 10: |
|
return 1; |
|
default: |
|
return 0; |
|
} |
|
} |
|
|
|
void |
|
floatnum_print(FILE *f, const floatnum *flt) |
|
{ |
|
unsigned char out[10]; |
|
unsigned char *str; |
|
int i; |
|
|
|
/* Internal format */ |
|
str = BitVector_to_Hex(flt->mantissa); |
|
fprintf(f, "%c %s *2^%04x\n", flt->sign?'-':'+', (char *)str, |
|
flt->exponent); |
|
xfree(str); |
|
|
|
/* 32-bit (single precision) format */ |
|
fprintf(f, "32-bit: %d: ", floatnum_get_sized(flt, out, 4)); |
|
for (i=0; i<4; i++) |
|
fprintf(f, "%02x ", out[i]); |
|
fprintf(f, "\n"); |
|
|
|
/* 64-bit (double precision) format */ |
|
fprintf(f, "64-bit: %d: ", floatnum_get_sized(flt, out, 8)); |
|
for (i=0; i<8; i++) |
|
fprintf(f, "%02x ", out[i]); |
|
fprintf(f, "\n"); |
|
|
|
/* 80-bit (extended precision) format */ |
|
fprintf(f, "80-bit: %d: ", floatnum_get_sized(flt, out, 10)); |
|
for (i=0; i<10; i++) |
|
fprintf(f, "%02x ", out[i]); |
|
fprintf(f, "\n"); |
|
}
|
|
|