simd-lite
diff --git a/‎.circleci/config.yml
Lines changed: 21 additions & 5 deletions b/‎.circleci/config.yml
Lines changed: 21 additions & 5 deletions
diff --git a/‎data/crash/crash000030.json
Lines changed: 1 addition & 0 deletions b/‎data/crash/crash000030.json
Lines changed: 1 addition & 0 deletions
diff --git a/‎data/crash/crash000031.json
Lines changed: 1 addition & 0 deletions b/‎data/crash/crash000031.json
Lines changed: 1 addition & 0 deletions
diff --git a/‎data/crash/crash000032.json
Lines changed: 1 addition & 0 deletions b/‎data/crash/crash000032.json
Lines changed: 1 addition & 0 deletions
diff --git a/‎data/crash/crash000033.json
Lines changed: 1 addition & 0 deletions b/‎data/crash/crash000033.json
Lines changed: 1 addition & 0 deletions
diff --git a/‎data/crash/crash000034.json
Lines changed: 9 additions & 0 deletions b/‎data/crash/crash000034.json
Lines changed: 9 additions & 0 deletions
diff --git a/‎data/crash/crash000035.json
Lines changed: 1 addition & 0 deletions b/‎data/crash/crash000035.json
Lines changed: 1 addition & 0 deletions
diff --git a/‎data/crash/crash000036.json
Lines changed: 5 additions & 0 deletions b/‎data/crash/crash000036.json
Lines changed: 5 additions & 0 deletions
diff --git a/‎simd-fuzz-target/Makefile
Lines changed: 5 additions & 1 deletion b/‎simd-fuzz-target/Makefile
Lines changed: 5 additions & 1 deletion
diff --git a/‎src/avx2/deser.rs
Lines changed: 207 additions & 0 deletions b/‎src/avx2/deser.rs
Lines changed: 207 additions & 0 deletions
@@ -3,11 +3,10 @@ version: 2.1
 #orbs:
 #  codecov: codecov/codecov@1.0.4
 
-jobs:
-  test:
-    docker:
-      - image: rust:1
-    steps:
+commands:
+  run_tests:
+    description: "A very simple command for demonstration purposes"
+    steps:     
       - checkout
         # - run:
         #   name: Install CMAKE
@@ -55,8 +54,25 @@ jobs:
       #    name: Run cycle benchmarks
       #     command: make perf
 
+jobs:
+  test:
+    docker:
+      - image: rust:1
+    environment:
+      RUSTFLAGS: '-C target-cpu=native'
+    steps:
+      - run_tests: {}
+  test-sse:
+    docker:
+      - image: rust:1
+    environment:
+      RUSTFLAGS: '-C target-cpu=native -C target-feature=-avx2'
+    steps:
+      - run_tests: {}
+
 workflows:
   version: 2
   workflow:
     jobs:
     - test
+    - test-sse
@@ -0,0 +1 @@
+{"Neh":-333333333333333333333333333333.3}
@@ -0,0 +1 @@
+[  -9265394459000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000.0p003]
@@ -0,0 +1 @@
+[348253421170671280348253421170679.6171,-]
@@ -0,0 +1 @@
+[3,28033333333333333333333333333333333348253421170679.6170-]
@@ -0,0 +1,9 @@
+[3,2825342119.61701e-0,1,
+128253421170679.61701e-0,1,
+128253421170679.61701e-0,1,
+0.1e1,-1e-1,-128253421170679.61701e3,28253421170679.61701e-0,1,
+48253421170679.61701e-0,1,
+1266666666661,-128253421170679.61701e3,28253421170679.61701e-0,1,
+48253421170679.61701e-0,1,
+12666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666661170679.61701e3,28253421170679.61701e-0,1,
+48253421170679.61701e-0,16666666666666666666666666666666666666666666666666666666666666666666666679.6111-]
@@ -0,0 +1 @@
+-9223372036854775808
@@ -0,0 +1,5 @@
+[
+ 1066,
+1e1,
+0.1e1,
+1e-1,-1e-0, -88888888888888888888888888888888.1,"rod"]
@@ -1,7 +1,11 @@
 run: build
-	RUSTFLAGS='-C codegen-units=1' cargo +nightly afl fuzz -i in -o out target/debug/simd-fuzz-target
+	RUSTFLAGS='-C codegen-units=1 -C target-cpu=native' cargo +nightly afl fuzz -i in -o out target/debug/simd-fuzz-target
 build: 
 	RUSTFLAGS='-C codegen-units=1' cargo +nightly afl build
+run-sse: build-sse
+	RUSTFLAGS='-C codegen-units=1 -C target-cpu=native -C target-feature=-avx2' cargo +nightly afl fuzz -i in -o out target/debug/simd-fuzz-target
+build-sse:
+	RUSTFLAGS='-C codegen-units=1 -C target-cpu=native -C target-feature=-avx2' cargo +nightly afl build
 
 copy:
 	for from in `ls out/crashes/id*`; do to=`echo $$from | sed -e 's;out/crashes/id:;crash;' -e 's;,.*;.json;'`; cp $$from ../simdjson-rs/data/crash/$$to; done
@@ -0,0 +1,207 @@
+#[cfg(target_arch = "x86")]
+use std::arch::x86::*;
+#[cfg(target_arch = "x86_64")]
+use std::arch::x86_64::*;
+
+use std::mem;
+
+pub use crate::error::{Error, ErrorType};
+pub use crate::Deserializer;
+pub use crate::Result;
+pub use crate::avx2::utf8check::*;
+pub use crate::stringparse::*;
+
+use crate::portability::trailingzeroes;
+
+
+impl<'de> Deserializer<'de> {
+    /// Parses the JSON string whose opening `"` sits at `self.input[self.iidx]`
+    /// and returns its contents, without the surrounding quotes, as a `&str`.
+    ///
+    /// The input is scanned in 32-byte AVX2 blocks in two phases:
+    ///
+    /// 1. **Fast path** - look for the first `"` or `\`. If the closing quote
+    ///    comes first the string contains no escapes and a slice of `self.input`
+    ///    is returned directly.
+    /// 2. **Escape path** - starting at the first backslash, blocks are copied
+    ///    into `self.strings`, escapes are decoded there, and once the closing
+    ///    quote is found the decoded bytes are copied back into `self.input`
+    ///    right behind the escape-free prefix. The returned slice therefore
+    ///    always points into `self.input`.
+    ///
+    /// # Errors
+    ///
+    /// * `ErrorType::InvlaidUnicodeCodepoint` - `handle_unicode_codepoint`
+    ///   failed or reported zero bytes written for a `\u` escape.
+    /// * `ErrorType::InvalidEscape` - the byte following a backslash maps to `0`
+    ///   in `ESCAPE_MAP`.
+    ///
+    /// # Review notes
+    ///
+    /// This method performs no bounds checks and no UTF-8 validation of its own.
+    /// It presumably relies on an earlier pass having verified that the string
+    /// is terminated and valid UTF-8, and on `self.strings` being large enough
+    /// for 32-byte stores - TODO confirm against the callers.
+    #[cfg_attr(not(feature = "no-inline"), inline(always))]
+    pub fn parse_str_(&mut self) -> Result<&'de str> {
+        // Add 1 to skip the initial "
+        let idx = self.iidx + 1;
+        // Scratch block used whenever fewer than 32 input bytes remain.
+        let mut padding = [0u8; 32];
+
+        // NOTE(review): unchecked slice; assumes `idx <= self.input.len()`,
+        // which is not verified in this function.
+        let src: &[u8] = unsafe { self.input.get_unchecked(idx..) };
+        let mut src_i: usize = 0;
+        // Number of bytes that belong to the escape-free prefix of the string.
+        let mut len = src_i;
+
+        // Phase 1: scan until the closing quote or the first backslash.
+        loop {
+            let v: __m256i = if src.len() >= src_i + 32 {
+                // The branch condition guarantees 32 readable bytes at `src_i`;
+                // the unaligned load has no alignment requirement.
+                #[allow(clippy::cast_ptr_alignment)]
+                unsafe {
+                    _mm256_loadu_si256(src.as_ptr().add(src_i) as *const __m256i)
+                }
+            } else {
+                // Fewer than 32 bytes are left: stage the tail in `padding` and
+                // load the block from there instead of reading past `src`.
+                // Bytes of `padding` beyond the copied tail keep whatever an
+                // earlier iteration left there (zero initially).
+                // NOTE(review): assumes `src_i <= src.len()`; otherwise the
+                // subtraction below wraps.
+                unsafe {
+                    padding
+                        .get_unchecked_mut(..src.len() - src_i)
+                        .copy_from_slice(src.get_unchecked(src_i..));
+                    // `padding` is exactly 32 bytes wide, so this load is in bounds.
+                    #[allow(clippy::cast_ptr_alignment)]
+                    _mm256_loadu_si256(padding.as_ptr() as *const __m256i)
+                }
+            };
+
+            // One bit per byte of the block: set where the byte is a backslash ...
+            let bs_bits: u32 = unsafe {
+                static_cast_u32!(_mm256_movemask_epi8(_mm256_cmpeq_epi8(
+                    v,
+                    _mm256_set1_epi8(b'\\' as i8)
+                )))
+            };
+            // ... and where it is a double quote.
+            let quote_mask = unsafe { _mm256_cmpeq_epi8(v, _mm256_set1_epi8(b'"' as i8)) };
+            let quote_bits = unsafe { static_cast_u32!(_mm256_movemask_epi8(quote_mask)) };
+            // `bs_bits - 1` has every bit below the first backslash set (all bits
+            // if there is none), so a non-zero result means a quote comes first.
+            if (bs_bits.wrapping_sub(1) & quote_bits) != 0 {
+                // we encountered quotes first: find out where the quote is
+                let quote_dist: u32 = trailingzeroes(u64::from(quote_bits));
+
+                // No overflow check on the length: per the original authors it is
+                // unneeded because documents of 4GB or more are refused.
+                len += quote_dist as usize;
+                unsafe {
+                    // The raw-pointer cast reinterprets the bytes as `str`
+                    // without validation and detaches the result from the
+                    // borrow of `self`.
+                    // NOTE(review): presumably sound because the input was
+                    // UTF-8 checked earlier and outlives `'de` - confirm.
+                    let v = self.input.get_unchecked(idx..idx + len) as *const [u8] as *const str;
+                    return Ok(&*v);
+                }
+            }
+            // Mirror test: a backslash comes before any quote in this block.
+            if (quote_bits.wrapping_sub(1) & bs_bits) != 0 {
+                // Move to the backslash and switch to the escape-handling loop.
+                let bs_dist: u32 = trailingzeroes(u64::from(bs_bits));
+                len += bs_dist as usize;
+                src_i += bs_dist as usize;
+                break;
+            } else {
+                // they are the same. Since they can't co-occur, it means we encountered
+                // neither.
+                src_i += 32;
+                len += 32;
+            }
+        }
+
+        // Phase 2: decode escapes into the scratch buffer `self.strings`.
+        let mut dst_i: usize = 0;
+        let dst: &mut [u8] = &mut self.strings;
+
+        loop {
+            let v: __m256i = if src.len() >= src_i + 32 {
+                // The branch condition guarantees 32 readable bytes at `src_i`;
+                // the unaligned load has no alignment requirement.
+                #[allow(clippy::cast_ptr_alignment)]
+                unsafe {
+                    _mm256_loadu_si256(src.as_ptr().add(src_i) as *const __m256i)
+                }
+            } else {
+                // Fewer than 32 bytes are left: stage the tail in `padding`.
+                // Bytes beyond the copied tail may be stale from an earlier
+                // iteration.
+                // NOTE(review): assumes `src_i <= src.len()`; otherwise the
+                // subtraction below wraps.
+                unsafe {
+                    padding
+                        .get_unchecked_mut(..src.len() - src_i)
+                        .copy_from_slice(src.get_unchecked(src_i..));
+                    // `padding` is exactly 32 bytes wide, so this load is in bounds.
+                    #[allow(clippy::cast_ptr_alignment)]
+                    _mm256_loadu_si256(padding.as_ptr() as *const __m256i)
+                }
+            };
+
+            // store to dest unconditionally - we can overwrite the bits we don't like
+            // later
+            // NOTE(review): assumes `self.strings` holds at least `dst_i + 32`
+            // bytes; nothing in this function checks that.
+            #[allow(clippy::cast_ptr_alignment)]
+            unsafe {
+                _mm256_storeu_si256(dst.as_mut_ptr().add(dst_i) as *mut __m256i, v)
+            };
+
+            // Same backslash / quote bit masks as in phase 1.
+            let bs_bits: u32 = unsafe {
+                static_cast_u32!(_mm256_movemask_epi8(_mm256_cmpeq_epi8(
+                    v,
+                    _mm256_set1_epi8(b'\\' as i8)
+                )))
+            };
+            let quote_mask = unsafe { _mm256_cmpeq_epi8(v, _mm256_set1_epi8(b'"' as i8)) };
+            let quote_bits = unsafe { static_cast_u32!(_mm256_movemask_epi8(quote_mask)) };
+            if (bs_bits.wrapping_sub(1) & quote_bits) != 0 {
+                // we encountered quotes first: find out where the quote is
+                let quote_dist: u32 = trailingzeroes(u64::from(quote_bits));
+
+                // No overflow check on the length: per the original authors it is
+                // unneeded because documents of 4GB or more are refused.
+                dst_i += quote_dist as usize;
+                unsafe {
+                    // Write the decoded bytes back into the input right behind
+                    // the escape-free prefix so the result is one contiguous
+                    // slice of `self.input`.
+                    self.input
+                        .get_unchecked_mut(idx + len..idx + len + dst_i)
+                        .copy_from_slice(self.strings.get_unchecked(..dst_i));
+                    // Unvalidated reinterpretation as `str`, see phase 1.
+                    let v = self.input.get_unchecked(idx..idx + len + dst_i) as *const [u8]
+                        as *const str;
+                    self.str_offset += dst_i;
+                    return Ok(&*v);
+                }
+            }
+            if (quote_bits.wrapping_sub(1) & bs_bits) != 0 {
+                // find out where the backslash is
+                let bs_dist: u32 = trailingzeroes(u64::from(bs_bits));
+                // NOTE(review): reads the byte after the backslash without a
+                // bounds check - assumes a backslash is never the last byte.
+                let escape_char: u8 = unsafe { *src.get_unchecked(src_i + bs_dist as usize + 1) };
+                // we encountered backslash first. Handle backslash
+                if escape_char == b'u' {
+                    // move src/dst up to the start; they will be further adjusted
+                    // within the unicode codepoint handling code.
+                    src_i += bs_dist as usize;
+                    dst_i += bs_dist as usize;
+                    let (o, s) = if let Ok(r) =
+                        handle_unicode_codepoint(unsafe { src.get_unchecked(src_i..) }, unsafe {
+                            dst.get_unchecked_mut(dst_i..)
+                        }) {
+                        r
+                    } else {
+                        return Err(self.error(ErrorType::InvlaidUnicodeCodepoint));
+                    };
+                    if o == 0 {
+                        return Err(self.error(ErrorType::InvlaidUnicodeCodepoint));
+                    };
+                    // Advance the destination by `o` and the source by `s`, the
+                    // two values reported by `handle_unicode_codepoint`.
+                    src_i += s;
+                    dst_i += o;
+                } else {
+                    // simple 1:1 conversion. Will eat bs_dist+2 characters in input and
+                    // write bs_dist+1 characters to output
+                    // note this may reach beyond the part of the buffer we've actually
+                    // seen. I think this is ok
+                    // NOTE(review): unchecked lookup; assumes `ESCAPE_MAP` has an
+                    // entry for every `u8` value.
+                    let escape_result: u8 =
+                        unsafe { *ESCAPE_MAP.get_unchecked(escape_char as usize) };
+                    if escape_result == 0 {
+                        return Err(self.error(ErrorType::InvalidEscape));
+                    }
+                    // Overwrite the copied backslash with the decoded byte.
+                    unsafe {
+                        *dst.get_unchecked_mut(dst_i + bs_dist as usize) = escape_result;
+                    }
+                    src_i += bs_dist as usize + 2;
+                    dst_i += bs_dist as usize + 1;
+                }
+            } else {
+                // they are the same. Since they can't co-occur, it means we encountered
+                // neither.
+                src_i += 32;
+                dst_i += 32;
+            }
+        }
+    }
+}
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+{"Neh":-333333333333333333333333333333.3}`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+[ -9265394459000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000.0p003]`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+[348253421170671280348253421170679.6171,-]`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+[3,28033333333333333333333333333333333348253421170679.6170-]`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,5 @@`
 +[
 + 1066,
 +1e1,
 +0.1e1,
 +1e-1,-1e-0, -88888888888888888888888888888888.1,"rod"]