Speed up exp()

author: Erik Schnetter <schnetter@gmail.com> 2013-02-15 09:56:50 -0500
committer: Erik Schnetter <schnetter@gmail.com> 2013-02-15 09:56:50 -0500
commit: d05b06b7d7cd39d586f1df7e8452967e4d675691 (patch)
tree: 3681492ef12c9a3b8b2235c0d75fa4db7e9579c5 /mathfuncs_exp.h
parent: b384855d67f7e1afbeb8d193086bbe0ad7d94108 (diff)
download: vecmathlib-d05b06b7d7cd39d586f1df7e8452967e4d675691.zip
vecmathlib-d05b06b7d7cd39d586f1df7e8452967e4d675691.tar.gz
1 files changed, 21 insertions, 3 deletions
diff --git a/mathfuncs_exp.h b/mathfuncs_exp.h
index 46b3f2d..dd7b23e 100644
--- a/mathfuncs_exp.h
+++ b/mathfuncs_exp.h
@@ -17,7 +17,18 @@ namespace vecmathlib {
   {
     // Rescale
     realvec_t x0 = x;
-    realvec_t round_x = round(x);
+    
+    // realvec_t round_x = round(x);
+    // intvec_t iround_x = convert_int(round_x);
+    // r = scalbn(r, iround_x);
+    
+    // Round by adding, then subtracting again a large number
+    // Add a large number to move the mantissa bits to the right
+    int_t large = (U(1) << FP::mantissa_bits) + FP::exponent_offset;
+    realvec_t tmp = x + RV(R(large));
+    tmp.barrier();
+    
+    realvec_t round_x = tmp - RV(R(large));
     x -= round_x;
     assert(all(x >= RV(-0.5) && x <= RV(0.5)));
     
@@ -54,8 +65,15 @@ namespace vecmathlib {
     }
     
     // Undo rescaling
-    intvec_t iround_x = convert_int(round_x);
-    r = ifthen(x0 < RV(R(FP::min_exponent)), RV(0.0), scalbn(r, iround_x));
+    // Extract integer as lowest mantissa bits (highest bits still
+    // contain offset, exponent, and sign)
+    intvec_t itmp = as_int(tmp);
+    // Construct scale factor by setting exponent (this shifts out the
+    // highest bits)
+    realvec_t scale = as_float(itmp << I(FP::mantissa_bits));
+    scale = ifthen(x0 < RV(R(FP::min_exponent)), RV(0.0), scale);
+    
+    r *= scale;
     
     return r;
   }
author	Erik Schnetter <schnetter@gmail.com>	2013-02-15 09:56:50 -0500
committer	Erik Schnetter <schnetter@gmail.com>	2013-02-15 09:56:50 -0500
commit	d05b06b7d7cd39d586f1df7e8452967e4d675691 (patch)
tree	3681492ef12c9a3b8b2235c0d75fa4db7e9579c5 /mathfuncs_exp.h
parent	b384855d67f7e1afbeb8d193086bbe0ad7d94108 (diff)
download	vecmathlib-d05b06b7d7cd39d586f1df7e8452967e4d675691.zip vecmathlib-d05b06b7d7cd39d586f1df7e8452967e4d675691.tar.gz