2005-09-08 Martin Hunt <hunt@redhat.com>

* arith.c (_stp_div64): For 64-bit cpus, just use native division. Otherwise call _div64(). (_stp_mod64): Call _mod64() isf necessary. (_div64): 64-bit division for 32-bit cpus. (_mod64): 64-bit modulo for 32-bit cpus.
author: hunt <hunt> 2005-09-08 18:22:52 +0000
committer: hunt <hunt> 2005-09-08 18:22:52 +0000
commit: 367e790dff1d5940e0e4ffa6fa4ce116d425626f (patch)
tree: 209270b33004f53bd3b3459ad89416c8b36d5ca1 /runtime/arith.c
parent: 284b7f2aab4828b34afafb5b19136e53522849e5 (diff)
download: systemtap-steved-367e790dff1d5940e0e4ffa6fa4ce116d425626f.tar.gz
systemtap-steved-367e790dff1d5940e0e4ffa6fa4ce116d425626f.tar.xz
systemtap-steved-367e790dff1d5940e0e4ffa6fa4ce116d425626f.zip
1 files changed, 275 insertions, 63 deletions
diff --git a/runtime/arith.c b/runtime/arith.c
index b1759e2a..e9977718 100644
--- a/runtime/arith.c
+++ b/runtime/arith.c
@@ -1,4 +1,14 @@
-#ifndef _ARITH_C_ /* -*- linux-c -*- */
+/* -*- linux-c -*- */
+/* Math functions
+ * Copyright (C) 2005 Red Hat Inc.
+ *
+ * This file is part of systemtap, and is free software.  You can
+ * redistribute it and/or modify it under the terms of the GNU General
+ * Public License (GPL); either version 2, or (at your option) any
+ * later version.
+ */
+
+#ifndef _ARITH_C_ 
 #define _ARITH_C_
 
 /** @file arith.
@@ -6,73 +16,71 @@
  */
 
 
-struct context;
-void _stp_divmod64 (const char **error, int64_t x, int64_t y,
-                    int64_t *quo, int64_t *rem);
+/* 64-bit division for 64-bit cpus and i386 */
+/* Other 32-bit cpus will need to modify this file. */
 
+#ifdef __i386__
+long long _div64 (long long u, long long v);
+long long _mod64 (long long u, long long v);
+#endif
 
 /** Divide x by y.  In case of overflow or division-by-zero,
  * set context error string, and return any old value.
  */
-inline int64_t _stp_div64 (const char **error, int64_t x, int64_t y)
+int64_t _stp_div64 (const char **error, int64_t x, int64_t y)
 {
-  if (likely ((x >= LONG_MIN && x <= LONG_MAX) &&
-              (y >= LONG_MIN && y <= LONG_MAX)))
-    {
-      long xx = (long) x;
-      long yy = (long) y;
-      // check for division-by-zero and overflow
-      if (unlikely (yy == 0 || (xx == LONG_MIN && yy == -1)))
-        {
-          *error = "divisor out of range";
-          return 0;
-        }
-      return xx / yy;
-    }
-  else
-    {
-      int64_t quo = 0;
-      _stp_divmod64 (error, x, y, &quo, NULL);
-      return quo;
-    }
+#ifdef __LP64__
+	if (unlikely (y == 0)) {	
+		*error = "attempt to divide by 0";
+		return 0;
+	}
+	return x/y;
+#else
+	if (likely ((x >= LONG_MIN && x <= LONG_MAX) && (y >= LONG_MIN && y <= LONG_MAX))) {
+		long xx = (long) x;
+		long yy = (long) y;
+
+		// check for division-by-zero and overflow
+		if (unlikely (yy == 0 || (xx == LONG_MIN && yy == -1))) {
+			*error = "divisor out of range";
+			return 0;
+		}
+		return xx / yy;
+	} else {
+		return _div64 (x, y);
+	}
+#endif
 }
 
 
 /** Modulo x by y.  In case of overflow or division-by-zero,
  * set context error string, and return any old value.
  */
-inline int64_t _stp_mod64 (const char **error, int64_t x, int64_t y)
+int64_t _stp_mod64 (const char **error, int64_t x, int64_t y)
 {
-  if (likely ((x >= LONG_MIN && x <= LONG_MAX) &&
-              (y >= LONG_MIN && y <= LONG_MAX)))
-    {
-      long xx = (long) x;
-      long yy = (long) y;
-      // check for division-by-zero and overflow
-      if (unlikely (yy == 0 || (xx == LONG_MIN && yy == -1)))
-        {
-          *error = "divisor out of range";
-          return 0;
-        }
-      return xx % yy;
-    }
-  else
-    {
-      int64_t rem = 0;
-      _stp_divmod64 (error, x, y, NULL, &rem);
-      return rem;
-    }
-}
+#ifdef __LP64__
+	if (unlikely (y == 0)) {	
+		*error = "attempt to divide by 0";
+		return 0;
+	}
+	return x%y;
 
+#else
 
-/** Perform general long division/modulus. */
-void _stp_divmod64 (const char **error, int64_t x, int64_t y,
-                    int64_t *quo, int64_t *rem)
-{
-  // XXX: wimp out for now
-  *error = "general division unsupported";
-  if (quo) *quo = 0;
-  if (rem) *rem = 0;
+	if (likely ((x >= LONG_MIN && x <= LONG_MAX) && (y >= LONG_MIN && y <= LONG_MAX))) {
+		long xx = (long) x;
+		long yy = (long) y;
+
+		// check for division-by-zero and overflow
+		if (unlikely (yy == 0 || (xx == LONG_MIN && yy == -1))) {
+			*error = "divisor out of range";
+			return 0;
+		}
+		return xx % yy;
+	} else {
+		return _mod64 (x,y);
+	}
+#endif
 }
 
 
@@ -81,21 +89,225 @@ void _stp_divmod64 (const char **error, int64_t x, int64_t y,
  */
 int _stp_random_pm (int n)
 {
-  static unsigned long seed;
-  static int initialized_p = 0;
+	static unsigned long seed;
+	static int initialized_p = 0;
+	
+	if (unlikely (! initialized_p)) {
+		seed = (unsigned long) jiffies;
+		initialized_p = 1;
+	}
+	
+	/* from glibc rand man page */
+	seed = seed * 1103515245 + 12345;
+	
+	return (seed % (2*n+1)-n);
+}
+
+#ifdef __i386__
+
+/* 64-bit division functions extracted from libgcc */
+typedef long long DWtype;
+typedef unsigned long long UDWtype;
+typedef unsigned long UWtype;
+typedef long Wtype;
+typedef unsigned int USItype;
+
+#ifdef _BIG_ENDIAN
+struct DWstruct {Wtype high, low;};
+#else
+struct DWstruct {Wtype low, high;};
+#endif
+
+#define W_TYPE_SIZE 32
+
+typedef union
+{
+  struct DWstruct s;
+  DWtype ll;
+} DWunion;
+
+
+/* these are the i386 versions of these macros from gcc/longlong.h */
+
+#define umul_ppmm(w1, w0, u, v) \
+  __asm__ ("mull %3"							\
+	   : "=a" ((USItype) (w0)),					\
+	     "=d" ((USItype) (w1))					\
+	   : "%0" ((USItype) (u)),					\
+	     "rm" ((USItype) (v)))
+
+#define sub_ddmmss(sh, sl, ah, al, bh, bl) \
+  __asm__ ("subl %5,%1\n\tsbbl %3,%0"					\
+	   : "=r" ((USItype) (sh)),					\
+	     "=&r" ((USItype) (sl))					\
+	   : "0" ((USItype) (ah)),					\
+	     "g" ((USItype) (bh)),					\
+	     "1" ((USItype) (al)),					\
+	     "g" ((USItype) (bl)))
 
-  if (unlikely (! initialized_p))
-    {
-      seed = (unsigned long) jiffies;
-      initialized_p = 1;
-    }
+#define udiv_qrnnd(q, r, n1, n0, dv) \
+  __asm__ ("divl %4"							\
+	   : "=a" ((USItype) (q)),					\
+	     "=d" ((USItype) (r))					\
+	   : "0" ((USItype) (n0)),					\
+	     "1" ((USItype) (n1)),					\
+	     "rm" ((USItype) (dv)))
 
-  /* from glibc rand man page */
-  seed = seed * 1103515245 + 12345;
+#define count_leading_zeros(count, x) \
+  do {									\
+    USItype __cbtmp;							\
+    __asm__ ("bsrl %1,%0"						\
+	     : "=r" (__cbtmp) : "rm" ((USItype) (x)));			\
+    (count) = __cbtmp ^ 31;						\
+  } while (0)
 
-  return (seed % (2*n+1)-n);
+inline UDWtype _stp_udivmoddi4 (UDWtype n, UDWtype d, UDWtype *rp)
+{
+	const DWunion nn = {.ll = n};
+	const DWunion dd = {.ll = d};
+	DWunion ww,rr;
+	UWtype d0, d1, n0, n1, n2;
+	UWtype q0, q1;
+	UWtype b, bm;
+	
+	d0 = dd.s.low;
+	d1 = dd.s.high;
+	n0 = nn.s.low;
+	n1 = nn.s.high;
+	
+	if (d1 == 0) {
+		if (d0 > n1)	{
+			/* 0q = nn / 0D */
+			udiv_qrnnd (q0, n0, n1, n0, d0);
+			q1 = 0;
+			/* Remainder in n0.  */
+		} else {
+			/* qq = NN / 0d */
+			if (d0 == 0)
+				d0 = 1 / d0;	/* Divide intentionally by zero.  */
+			udiv_qrnnd (q1, n1, 0, n1, d0);
+			udiv_qrnnd (q0, n0, n1, n0, d0);
+			/* Remainder in n0.  */
+		}
+		
+		if (rp != 0)	{
+			rr.s.low = n0;
+			rr.s.high = 0;
+			*rp = rr.ll;
+		}
+	} else {
+		if (d1 > n1) {
+			/* 00 = nn / DD */
+			q0 = 0;
+			q1 = 0;
+			
+			/* Remainder in n1n0.  */
+			if (rp != 0) {
+				rr.s.low = n0;
+				rr.s.high = n1;
+				*rp = rr.ll;
+			}
+		} else {
+			/* 0q = NN / dd */
+			count_leading_zeros (bm, d1);
+			if (bm == 0) {
+				/* From (n1 >= d1) /\ (the most significant bit of d1 is set),
+				   conclude (the most significant bit of n1 is set) /\ (the
+				   quotient digit q0 = 0 or 1).
+				   This special case is necessary, not an optimization.  */
+				
+				/* The condition on the next line takes advantage of that
+				   n1 >= d1 (true due to program flow).  */
+				if (n1 > d1 || n0 >= d0) {
+					q0 = 1;
+					sub_ddmmss (n1, n0, n1, n0, d1, d0);
+				} else
+					q0 = 0;
+				
+				q1 = 0;
+				
+				if (rp != 0) {
+					rr.s.low = n0;
+					rr.s.high = n1;
+					*rp = rr.ll;
+				}
+			} else {
+				UWtype m1, m0;
+				/* Normalize.  */
+				
+				b = W_TYPE_SIZE - bm;
+				
+				d1 = (d1 << bm) | (d0 >> b);
+				d0 = d0 << bm;
+				n2 = n1 >> b;
+				n1 = (n1 << bm) | (n0 >> b);
+				n0 = n0 << bm;
+		      
+				udiv_qrnnd (q0, n1, n2, n1, d1);
+				umul_ppmm (m1, m0, q0, d0);
+		      
+				if (m1 > n1 || (m1 == n1 && m0 > n0)) {
+					q0--;
+					sub_ddmmss (m1, m0, m1, m0, d1, d0);
+				}
+		      
+				q1 = 0;
+		      
+				/* Remainder in (n1n0 - m1m0) >> bm.  */
+				if (rp != 0) {
+					sub_ddmmss (n1, n0, n1, n0, m1, m0);
+					rr.s.low = (n1 << b) | (n0 >> bm);
+					rr.s.high = n1 >> bm;
+					*rp = rr.ll;
+				}
+			}
+		}
+	}
+  
+	ww.s.low = q0; ww.s.high = q1;
+	return ww.ll;
 }
 
+long long _div64 (long long u, long long v)
+{
+	long c = 0;
+	DWunion uu = {.ll = u};
+	DWunion vv = {.ll = v};
+	DWtype w;
+	
+	if (uu.s.high < 0)
+		c = ~c,
+			uu.ll = -uu.ll;
+	if (vv.s.high < 0)
+		c = ~c,
+			vv.ll = -vv.ll;
+	
+	w = _stp_udivmoddi4 (uu.ll, vv.ll, (UDWtype *) 0);
+	if (c)
+		w = -w;
+	
+	return w;
+}
 
+long long _mod64 (long long u, long long v)
+{
+	long c = 0;
+	DWunion uu = {.ll = u};
+	DWunion vv = {.ll = v};
+	DWtype w;
+	
+	if (uu.s.high < 0)
+		c = ~c,
+			uu.ll = -uu.ll;
+	if (vv.s.high < 0)
+		vv.ll = -vv.ll;
+	
+	(void) _stp_udivmoddi4 (uu.ll, vv.ll, (UDWtype*)&w);
+	if (c)
+		w = -w;
+	
+	return w;
+}
+#endif /* __i386__ */
 
 #endif /* _ARITH_C_ */
author	hunt <hunt>	2005-09-08 18:22:52 +0000
committer	hunt <hunt>	2005-09-08 18:22:52 +0000
commit	367e790dff1d5940e0e4ffa6fa4ce116d425626f (patch)
tree	209270b33004f53bd3b3459ad89416c8b36d5ca1 /runtime/arith.c
parent	284b7f2aab4828b34afafb5b19136e53522849e5 (diff)
download	systemtap-steved-367e790dff1d5940e0e4ffa6fa4ce116d425626f.tar.gz systemtap-steved-367e790dff1d5940e0e4ffa6fa4ce116d425626f.tar.xz systemtap-steved-367e790dff1d5940e0e4ffa6fa4ce116d425626f.zip