ntp/libparse/mfp_mul.c

228753Smm/*
228753Smm * /src/NTP/ntp4-dev/libparse/mfp_mul.c,v 4.9 2005/07/17 20:34:40 kardel RELEASE_20050717_A
228753Smm *
228753Smm * mfp_mul.c,v 4.9 2005/07/17 20:34:40 kardel RELEASE_20050717_A
228753Smm *
228753Smm * $Created: Sat Aug 16 20:35:08 1997 $
228753Smm *
228753Smm * Copyright (c) 1997-2005 by Frank Kardel <kardel <AT> ntp.org>
228753Smm *
228753Smm * Redistribution and use in source and binary forms, with or without
228753Smm * modification, are permitted provided that the following conditions
228753Smm * are met:
228753Smm * 1. Redistributions of source code must retain the above copyright
228753Smm *    notice, this list of conditions and the following disclaimer.
228753Smm * 2. Redistributions in binary form must reproduce the above copyright
228753Smm *    notice, this list of conditions and the following disclaimer in the
228753Smm *    documentation and/or other materials provided with the distribution.
228753Smm * 3. Neither the name of the author nor the names of its contributors
228753Smm *    may be used to endorse or promote products derived from this software
228753Smm *    without specific prior written permission.
228753Smm *
228753Smm * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
228753Smm * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
228753Smm * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
228753Smm * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
228753Smm * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
228753Smm * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
228753Smm * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
228763Smm * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
228753Smm * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
228753Smm * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
228753Smm * SUCH DAMAGE.
228753Smm *
228753Smm */
228753Smm#include <config.h>
228753Smm#include <stdio.h>
228753Smm#include "ntp_stdlib.h"
228753Smm#include "ntp_types.h"
228753Smm#include "ntp_fp.h"
228753Smm
/*
 * Half word masks used to split a word into two halves of
 * FRACTION_PREC/2 bits each.  The shift is done in u_int32 so it never
 * happens in a (possibly narrower or signed) int, and each expansion is
 * fully parenthesized so it can be used inside any expression.
 */
#define LOW_MASK  ((u_int32)(((u_int32)1 << (FRACTION_PREC/2)) - 1))	/* low half set */
#define HIGH_MASK ((u_int32)(LOW_MASK << (FRACTION_PREC/2)))		/* high half set */
228753Smm
/*
 * For those who worry about overflows (possibly triggered by static analysis tools):
 *
 * The largest value of an n-bit number is 2^n-1.
 * Thus the largest possible product is: (2^n-1)*(2^n-1) = 2^2n - 2^n - 2^n + 1 < 2^2n
 * Here overflow cannot happen for 2 reasons:
 * 1) the code actually multiplies the absolute values of two signed
 *    64-bit quantities, thus effectively multiplying two 63-bit quantities.
 * 2) Carry propagation is from low to high, building principle is
 *    addition, so no storage for the 2^2n term from above is needed.
 */
228753Smm
228753Smmvoid
228753Smmmfp_mul(
228753Smm	int32   *o_i,
228753Smm	u_int32 *o_f,
228753Smm	int32    a_i,
228753Smm	u_int32  a_f,
228753Smm	int32    b_i,
228753Smm	u_int32  b_f
248616Smm	)
228753Smm{
305192Smm  int32 i, j;
232153Smm  u_int32  f;
228753Smm  u_long a[4];			/* operand a */
228753Smm  u_long b[4];			/* operand b */
228753Smm  u_long c[5];			/* result c - 5 items for performance - see below */
248616Smm  u_long carry;
228753Smm
228753Smm  int neg = 0;
228753Smm
228753Smm  if (a_i < 0)			/* examine sign situation */
248616Smm    {
302001Smm      neg = 1;
228753Smm      M_NEG(a_i, a_f);
248616Smm    }
228753Smm
228753Smm  if (b_i < 0)			/* examine sign situation */
228753Smm    {
228753Smm      neg = !neg;
228753Smm      M_NEG(b_i, b_f);
302001Smm    }
228753Smm
228753Smm  a[0] = a_f & LOW_MASK;	/* prepare a operand */
228753Smm  a[1] = (a_f & HIGH_MASK) >> (FRACTION_PREC/2);
228753Smm  a[2] = a_i & LOW_MASK;
228753Smm  a[3] = (a_i & HIGH_MASK) >> (FRACTION_PREC/2);
248616Smm
228753Smm  b[0] = b_f & LOW_MASK;	/* prepare b operand */
228753Smm  b[1] = (b_f & HIGH_MASK) >> (FRACTION_PREC/2);
228753Smm  b[2] = b_i & LOW_MASK;
324418Smm  b[3] = (b_i & HIGH_MASK) >> (FRACTION_PREC/2);
228753Smm
228753Smm  c[0] = c[1] = c[2] = c[3] = c[4] = 0;
228753Smm
228753Smm  for (i = 0; i < 4; i++)	/* we do assume 32 * 32 = 64 bit multiplication */
228753Smm    for (j = 0; j < 4; j++)
228753Smm      {
228753Smm	u_long result_low, result_high;
228753Smm	int low_index = (i+j)/2;      /* formal [0..3]  - index for low long word */
228753Smm	int mid_index = 1+low_index;  /* formal [1..4]! - index for high long word
228753Smm					 will generate unecessary add of 0 to c[4]
228753Smm					 but save 15 'if (result_high) expressions' */
228753Smm	int high_index = 1+mid_index; /* formal [2..5]! - index for high word overflow
228753Smm					 - only assigned on overflow (limits range to 2..3) */
228753Smm
228753Smm	result_low = (u_long)a[i] * (u_long)b[j];	/* partial product */
228753Smm
228753Smm	if ((i+j) & 1)		/* splits across two result registers */
228753Smm	  {
228753Smm	    result_high   = result_low >> (FRACTION_PREC/2);
228753Smm	    result_low  <<= FRACTION_PREC/2;
228753Smm	    carry         = (unsigned)1<<(FRACTION_PREC/2);
228753Smm	  }
228753Smm	else
228753Smm	  {			/* stays in a result register - except for overflows */
228753Smm	    result_high = 0;
228753Smm	    carry       = 1;
232153Smm	  }
228753Smm
228753Smm	if (((c[low_index] >> 1) + (result_low >> 1) + ((c[low_index] & result_low & carry) != 0)) &
228753Smm	    (u_int32)((unsigned)1<<(FRACTION_PREC - 1))) {
228753Smm	  result_high++;	/* propagate overflows */
228753Smm        }
228753Smm
228753Smm	c[low_index]   += result_low; /* add up partial products */
228753Smm
228753Smm	if (((c[mid_index] >> 1) + (result_high >> 1) + ((c[mid_index] & result_high & 1) != 0)) &
228753Smm	    (u_int32)((unsigned)1<<(FRACTION_PREC - 1))) {
228753Smm	  c[high_index]++;		/* propagate overflows of high word sum */
228753Smm        }
228753Smm
228753Smm	c[mid_index] += result_high;  /* will add a 0 to c[4] once but saves 15 if conditions */
228753Smm      }
228753Smm
228753Smm#ifdef DEBUG
228753Smm  if (debug > 6)
228753Smm    printf("mfp_mul: 0x%04lx%04lx%04lx%04lx * 0x%04lx%04lx%04lx%04lx = 0x%08lx%08lx%08lx%08lx\n",
228753Smm	 a[3], a[2], a[1], a[0], b[3], b[2], b[1], b[0], c[3], c[2], c[1], c[0]);
228753Smm#endif
228753Smm
228753Smm  if (c[3])			/* overflow */
228753Smm    {
228753Smm      i = ((unsigned)1 << (FRACTION_PREC-1)) - 1;
228753Smm      f = ~(unsigned)0;
228753Smm    }
228753Smm  else
228753Smm    {				/* take produkt - discarding extra precision */
228753Smm      i = c[2];
228753Smm      f = c[1];
228753Smm    }
228753Smm
228753Smm  if (neg)			/* recover sign */
228753Smm    {
228753Smm      M_NEG(i, f);
228753Smm    }
228753Smm
228753Smm  *o_i = i;
228753Smm  *o_f = f;
228753Smm
228753Smm#ifdef DEBUG
228753Smm  if (debug > 6)
228753Smm    printf("mfp_mul: %s * %s => %s\n",
228753Smm	   mfptoa((u_long)a_i, a_f, 6),
228753Smm	   mfptoa((u_long)b_i, b_f, 6),
228753Smm	   mfptoa((u_long)i, f, 6));
228753Smm#endif
228753Smm}
228753Smm
/*
 * History:
 *
 * mfp_mul.c,v
 * Revision 4.9  2005/07/17 20:34:40  kardel
 * correct carry propagation implementation
 *
 * Revision 4.8  2005/07/12 16:17:26  kardel
 * add explanation why we do not write into c[4]
 *
 * Revision 4.7  2005/04/16 17:32:10  kardel
 * update copyright
 *
 * Revision 4.6  2004/11/14 15:29:41  kardel
 * support PPSAPI, upgrade Copyright to Berkeley style
 *
 * Revision 4.3  1999/02/21 12:17:37  kardel
 * 4.91f reconciliation
 *
 * Revision 4.2  1998/12/20 23:45:28  kardel
 * fix types and warnings
 *
 * Revision 4.1  1998/05/24 07:59:57  kardel
 * conditional debug support
 *
 * Revision 4.0  1998/04/10 19:46:38  kardel
 * Start 4.0 release version numbering
 *
 * Revision 1.1  1998/04/10 19:27:47  kardel
 * initial NTP VERSION 4 integration of PARSE with GPS166 binary support
 *
 * Revision 1.1  1997/10/06 21:05:46  kardel
 * new parse structure
 *
 */
228753Smm