A Question Of Rounding

sprintf() · ^s

printf("%.0f", 2.5)
  printf("%.2f", 5000.525); 
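/* 
 * Compile with: gcc -std=c99 -o filename filename.c -lm
 * (the math library is listed after the source file that uses it, so that
 * linkers which resolve libraries in order can find its symbols)
 * 
 * Definition of _GNU_SOURCE is required only when the code calls the GNU
 * extension pow10(): with the GNU C Compiler it disables the warning about
 * an implicit definition of pow10().
 */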
#define _GNU_SOURCE

#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <math.h>

// Utility function converts an IEEE double precision number to a
// fixed precision decimal format stored in a buffer.
void tobuf(size_t max, int *len, char *buf, 
           double x, int precision, double max_prec, double carry)
{
  int    sign  = x < 0;                             // remember the sign
  double q     = pow10(-precision);                 // current mask
  double y     = x==0?0:fmod(fabs(x), q);           // modulus
  double l_div = round(y*max_prec)/max_prec+carry;  // significant digit
  int    l_dec = (int)round(l_div*10/q);            // round to decimal
  
  carry = l_dec>=10?l_div:0;                        // carry forward?
  l_dec = l_dec % 10;                               // this decimal
  x = x>0?x-y:x+y;                                  // subtract modulus
  
  if (fabs(x) > 0)                                  // recurse while |x| > 0
    tobuf(max, len, buf, x, precision-1, max_prec, carry);
  else {                                            // x == 0 - first digit
    if (*len >= max) return;
    if (sign) { buf[*len] = '-'; *len = *len + 1; }
    if (*len+1 <= max && precision >= 0) { 
      buf[*len] = '0'; *len = *len + 1; 
      buf[*len] = '.'; *len = *len + 1; 
    }
    while (precision-- > 0) {
      buf[*len] = '0'; *len = *len + 1;
      if (*len >= max) return;
    }
    precision = -1;  // don't place another period
  }
  if (*len <= max && precision == 0) { 
    buf[*len] = '.'; *len = *len + 1; 
  }
  
  // for first and subsequent digits, add the digit to the buffer
  if (*len >= max) return;
  if (l_dec < 0) l_dec = 0;
  buf[*len] = '0' + l_dec;
  *len = *len + 1;
}

// Convert the value x to a decimal representation stored in a buffer.
//
//   max        total size of buf in bytes, including the terminating NUL
//   buf        destination buffer; always NUL-terminated when max > 0
//   x          value to convert
//   precision  number of digits wanted after the decimal point
//
// Returns the number of characters stored, not counting the NUL. NaN and
// infinities are stored as "NAN" / "INF" (the sign of an infinity is not
// reported) and 0 is returned for them. Output that does not fit is
// truncated to max-1 characters.
int dbl2buf(size_t max, char *buf, double x, int precision) {
  const int DECIMALS=15;                // significant decimal digits kept
  int    len = 0;                       // buffer length init

  if (max == 0) return 0;               // no room, not even for the NUL

  // Classify first: the arithmetic below is meaningless for these values.
  if (isnan(x)) { snprintf(buf, max, "%s", "NAN"); return 0; }
  if (isinf(x)) { snprintf(buf, max, "%s", "INF"); return 0; }

  // log10(0) is -infinity, which cannot be converted to int, so zero is
  // treated as having no digits in front of the decimal point.
  int    int_digits = x==0?0:(int)(trunc(log10(fabs(x)))+1);
  int    max_dec  = DECIMALS-int_digits;              // max significant digits
  double max_prec = pow(10.0, max_dec);               // magnitude for precision loss

  double y       = x==0?0:fmod(fabs(x), 1/max_prec);  // determine error
  double l_carry = round(y*max_prec)/max_prec;        // error is carried forward

  // Reserve one byte for the terminator, then clamp defensively in case the
  // helper advanced len past the limit it was given.
  tobuf(max-1, &len, buf, x, precision-1, max_prec, l_carry); // fill in buffer
  if (len < 0) len = 0;
  if ((size_t)len > max-1) len = (int)(max-1);
  buf[len] = 0;                                    // terminate buffer
  return len;                                      // return buffer length used
}

//  Example driver: formats one sample value with two decimals through
//  dbl2buf() and prints it next to printf()'s own 15-decimal rendering.
int main (void)
{
  const double sample = 5000.525;
  char text[64];

  dbl2buf(sizeof text, text, sample, 2);
  printf("%.15f = %s\n", sample, text);
  return 0;
}

Home Main Site FAQ Site Map Mirrors Translations Search Archives Authors Mailing Lists Join Us! Contact Us
The Free International Online Linux Monthly	ISSN: 1934-371X	Main site: http://linuxgazette.net

Double-Format Bit Pattern	Value
0 < `e` < 2047	$(-1)^s \times 2^{e-1023} \times 1.f$ (normal numbers)
`e` = 0; `f` ≠ 0 (at least one bit in `f` is nonzero)	$(-1)^s \times 2^{-1022} \times 0.f$ (subnormal numbers)
`e` = 0; `f` = 0 (all bits in `f` are zero)	$(-1)^s \times 0.0$ (signed zero)
`s` = 0; `e` = 2047; `f` = 0 (all bits in `f` are zero)	+INF (positive infinity)
`s` = 1; `e` = 2047; `f` = 0 (all bits in `f` are zero)	-INF (negative infinity)
`s` = u; `e` = 2047; `f` ≠ 0 (at least one bit in `f` is nonzero)	NaN (Not-a-Number)

A Question Of Rounding

Introduction

The sign, mantissa and exponent

Values Represented by Bit Patterns in IEEE Double Format

The problem; GlibC & sprintf()

Conclusion

Late Addendum