@@ -2,10 +2,12 @@ use std::cmp::Ordering;
 #[cfg(feature = "legacy")]
 use std::fs::File;
 use std::io;
+use std::ops::Range;
 use std::path::Path;
 
 use bincode::{serialize, deserialize, Infinite};
 use mmap_bitvec::{BitVector, MmapBitVec, BitVecSlice};
+use mmap_bitvec::bitvec::BIT_VEC_SLICE_SIZE;
 use murmurhash3::murmurhash3_x64_128;
 use serde::Serialize;
 use serde::de::DeserializeOwned;
@@ -171,7 +173,7 @@ impl<T: Clone + DeserializeOwned + Serialize> BFieldMember<T> {
         let mut merged_marker = BitVecSlice::max_value();
         for marker_ix in 0usize..self.params.n_hashes as usize {
             let pos = marker_pos(hash, marker_ix, self.bitvec.size(), marker_width);
-            let marker = self.bitvec.get_range(pos..pos + marker_width);
+            let marker = get_range(&self.bitvec, pos..pos + marker_width);
             merged_marker &= marker;
             if merged_marker.count_ones().cmp(&k) == Ordering::Less {
                 return 0;
@@ -224,6 +226,50 @@ fn marker_pos(hash: (u64, u64), n: usize, total_size: usize, _: usize) -> usize
     i64::abs(mashed_hash % (total_size as i64 - 64)) as usize
 }
 
+/// This is totally messed up, but we get a speed bump by doing this
+/// instead of using the _exact same_ function on the struct.
+#[cfg(not(feature = "legacy"))]
+fn get_range(bitvec: &MmapBitVec, r: Range<usize>) -> BitVecSlice {
+    if r.end - r.start > BIT_VEC_SLICE_SIZE as usize {
+        panic!(format!("Range too large (>{})", BIT_VEC_SLICE_SIZE))
+    } else if r.end > bitvec.size {
+        panic!("Range ends outside of BitVec")
+    }
+    let byte_idx_st = (r.start >> 3) as usize;
+    let byte_idx_en = ((r.end - 1) >> 3) as usize;
+    let new_size: u8 = (r.end - r.start) as u8;
+
+    let mut v;
+    let ptr: *const u8 = bitvec.mmap.as_ptr();
+
+    // read the last byte first
+    unsafe {
+        v = BitVecSlice::from(*ptr.offset(byte_idx_en as isize));
+    }
+    // align the end of the data with the end of the u64/u128
+    v >>= 7 - ((r.end - 1) & 7);
+
+    let bit_offset = new_size + (r.start & 7) as u8;
+    // copy over byte by byte
+    // it would be faster to coerce into a u8 and a u64 (in case it spans 9 bytes) and then
+    // copy over, but this doesn't work if the start is <8 bytes from the end, so we're doing
+    // this for now and we can add a special case for that later
+    for (new_idx, old_idx) in (byte_idx_st..byte_idx_en).enumerate() {
+        unsafe {
+            v |= BitVecSlice::from(*ptr.offset(old_idx as isize)) <<
+                (bit_offset - 8u8 * (new_idx as u8 + 1));
+        }
+    }
+
+    // mask out the high bits in case we copied extra
+    v & BitVecSlice::max_value() >> (BIT_VEC_SLICE_SIZE - new_size)
+}
+
+#[cfg(feature = "legacy")]
+fn get_range(bitvec: &MmapBitVec, r: Range<usize>) -> BitVecSlice {
+    bitvec.get_range(r)
+}
+
 #[test]
 fn test_bfield() {
     let mut bfield: BFieldMember<usize> = BFieldMember::in_memory(1024, 3, 64, 4).unwrap();
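Not part of the diff above: a minimal, self-contained sketch of the byte-spanning bit extraction that the new `get_range` performs, operating on a plain `&[u8]` instead of the mmap'd buffer and assuming the same MSB-first bit order within each byte. The `extract_bits` name and the example values are illustrative only.

```rust
use std::ops::Range;

/// Illustrative only: pull the bits in `r` (MSB-first within each byte) out of a
/// byte slice and return them right-aligned in a u64, mirroring the approach the
/// non-legacy `get_range` takes against the memory-mapped buffer.
fn extract_bits(bytes: &[u8], r: Range<usize>) -> u64 {
    assert!(r.end - r.start <= 64, "range too large (>64 bits)");
    assert!(r.end <= bytes.len() * 8, "range ends outside the buffer");
    let byte_idx_st = r.start >> 3;
    let byte_idx_en = (r.end - 1) >> 3;
    let new_size = (r.end - r.start) as u8;

    // start with the last byte, shifted so the final requested bit lands at bit 0
    let mut v = u64::from(bytes[byte_idx_en]) >> (7 - ((r.end - 1) & 7));

    // OR each earlier byte into its slot above the bits already collected
    let bit_offset = new_size + (r.start & 7) as u8;
    for (new_idx, old_idx) in (byte_idx_st..byte_idx_en).enumerate() {
        v |= u64::from(bytes[old_idx]) << (bit_offset - 8 * (new_idx as u8 + 1));
    }

    // mask off any extra high bits picked up from the first byte
    v & (u64::max_value() >> (64 - new_size))
}

#[test]
fn test_extract_bits() {
    // bits 4..12 of [0b1010_1100, 0b0101_0011] are 1100 followed by 0101
    let bytes = [0b1010_1100u8, 0b0101_0011u8];
    assert_eq!(extract_bits(&bytes, 4..12), 0b1100_0101);
}
```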