buffer: speed up ascii character scanning

Speed up ASCII character scanning and conversion by 25% to 30% by scanning and converting whole words instead of individual bytes.
author: Ben Noordhuis <info@bnoordhuis.nl> 2012-12-06 05:26:35 +0100
committer: isaacs <i@izs.me> 2013-03-08 14:42:15 -0800
commit: e325ace53c83a89c94b24247c810ccdfa46f35df (patch)
tree: e371ad43cdb358183028e1968ff2b152e51c55ec /src/node_buffer.cc
parent: 96a314b68b19277cc71ccac06b6517956b8f8a22 (diff)
download: android-node-v8-e325ace53c83a89c94b24247c810ccdfa46f35df.tar.gz
android-node-v8-e325ace53c83a89c94b24247c810ccdfa46f35df.tar.bz2
android-node-v8-e325ace53c83a89c94b24247c810ccdfa46f35df.zip
1 files changed, 90 insertions, 2 deletions
diff --git a/src/node_buffer.cc b/src/node_buffer.cc
index af53c98efb..21960f8852 100644
--- a/src/node_buffer.cc
+++ b/src/node_buffer.cc
@@ -28,6 +28,7 @@
 
 #include <assert.h>
 #include <string.h> // memcpy
+#include <limits.h>
 
 #define MIN(a,b) ((a) < (b) ? (a) : (b))
 
@@ -247,7 +248,7 @@ Handle<Value> Buffer::BinarySlice(const Arguments &args) {
 }
 
 
-static bool contains_non_ascii(const char* buf, size_t len) {
+static bool contains_non_ascii_slow(const char* buf, size_t len) {
   for (size_t i = 0; i < len; ++i) {
     if (buf[i] & 0x80) return true;
   }
@@ -255,13 +256,100 @@ static bool contains_non_ascii(const char* buf, size_t len) {
 }
 
 
-static void force_ascii(const char* src, char* dst, size_t len) {
+static bool contains_non_ascii(const char* src, size_t len) {
+  if (len < 16) {
+    return contains_non_ascii_slow(src, len);
+  }
+
+  const unsigned bytes_per_word = BITS_PER_LONG / CHAR_BIT;
+  const unsigned align_mask = bytes_per_word - 1;
+  const unsigned unaligned = reinterpret_cast<uintptr_t>(src) & align_mask;
+
+  if (unaligned > 0) {
+    const unsigned n = bytes_per_word - unaligned;
+    if (contains_non_ascii_slow(src, n)) return true;
+    src += n;
+    len -= n;
+  }
+
+#if BITS_PER_LONG == 64
+  typedef uint64_t word;
+  const uint64_t mask = 0x8080808080808080ll;
+#else
+  typedef uint32_t word;
+  const uint32_t mask = 0x80808080l;
+#endif
+
+  const word* srcw = reinterpret_cast<const word*>(src);
+
+  for (size_t i = 0, n = len / bytes_per_word; i < n; ++i) {
+    if (srcw[i] & mask) return true;
+  }
+
+  const unsigned remainder = len & align_mask;
+  if (remainder > 0) {
+    const size_t offset = len - remainder;
+    if (contains_non_ascii_slow(src + offset, remainder)) return true;
+  }
+
+  return false;
+}
+
+
+static void force_ascii_slow(const char* src, char* dst, size_t len) {
   for (size_t i = 0; i < len; ++i) {
     dst[i] = src[i] & 0x7f;
   }
 }
 
 
+static void force_ascii(const char* src, char* dst, size_t len) {
+  if (len < 16) {
+    force_ascii_slow(src, dst, len);
+    return;
+  }
+
+  const unsigned bytes_per_word = BITS_PER_LONG / CHAR_BIT;
+  const unsigned align_mask = bytes_per_word - 1;
+  const unsigned src_unalign = reinterpret_cast<uintptr_t>(src) & align_mask;
+  const unsigned dst_unalign = reinterpret_cast<uintptr_t>(dst) & align_mask;
+
+  if (src_unalign > 0) {
+    if (src_unalign == dst_unalign) {
+      const unsigned unalign = bytes_per_word - src_unalign;
+      force_ascii_slow(src, dst, unalign);
+      src += unalign;
+      dst += unalign;
+      len -= src_unalign;
+    } else {
+      force_ascii_slow(src, dst, len);
+      return;
+    }
+  }
+
+#if BITS_PER_LONG == 64
+  typedef uint64_t word;
+  const uint64_t mask = ~0x8080808080808080ll;
+#else
+  typedef uint32_t word;
+  const uint32_t mask = ~0x80808080l;
+#endif
+
+  const word* srcw = reinterpret_cast<const word*>(src);
+  word* dstw = reinterpret_cast<word*>(dst);
+
+  for (size_t i = 0, n = len / bytes_per_word; i < n; ++i) {
+    dstw[i] = srcw[i] & mask;
+  }
+
+  const unsigned remainder = len & align_mask;
+  if (remainder > 0) {
+    const size_t offset = len - remainder;
+    force_ascii_slow(src + offset, dst + offset, remainder);
+  }
+}
+
+
 Handle<Value> Buffer::AsciiSlice(const Arguments &args) {
   HandleScope scope;
   Buffer *parent = ObjectWrap::Unwrap<Buffer>(args.This());
author	Ben Noordhuis <info@bnoordhuis.nl>	2012-12-06 05:26:35 +0100
committer	isaacs <i@izs.me>	2013-03-08 14:42:15 -0800
commit	e325ace53c83a89c94b24247c810ccdfa46f35df (patch)
tree	e371ad43cdb358183028e1968ff2b152e51c55ec /src/node_buffer.cc
parent	96a314b68b19277cc71ccac06b6517956b8f8a22 (diff)
download	android-node-v8-e325ace53c83a89c94b24247c810ccdfa46f35df.tar.gz android-node-v8-e325ace53c83a89c94b24247c810ccdfa46f35df.tar.bz2 android-node-v8-e325ace53c83a89c94b24247c810ccdfa46f35df.zip