├── .gitignore
├── graphs
    ├── String_lookup_hit.png
    ├── String_insert_remove.png
    ├── String_lookup_miss.png
    ├── dense_u64_sparse_u64_lookup_hit_16384.png
    ├── dense_u64_sparse_u64_insert_remove_16384.png
    ├── dense_u64_sparse_u64_lookup_hit_16777216.png
    ├── dense_u64_sparse_u64_lookup_miss_16384.png
    ├── dense_u64_sparse_u64_lookup_hit_268435456.png
    ├── dense_u64_sparse_u64_lookup_miss_16777216.png
    ├── dense_u64_sparse_u64_lookup_miss_268435456.png
    ├── dense_u64_sparse_u64_insert_remove_16777216.png
    ├── dense_u64_sparse_u64_insert_remove_268435456.png
    ├── make_csv
    └── make_graphs.r
├── Cargo.toml
├── src
    ├── lib.rs
    ├── macros.rs
    ├── common.rs
    ├── prefix_cache.rs
    ├── art_internal.rs
    └── art_impl.rs
├── Performance.md
├── README.md
├── benches
    └── set_bench.rs
└── LICENSE


/.gitignore:
--------------------------------------------------------------------------------
1 | 
2 | /target
3 | **/*.rs.bk
4 | Cargo.lock
5 | results.csv
6 | 


--------------------------------------------------------------------------------
/graphs/String_lookup_hit.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/String_lookup_hit.png


--------------------------------------------------------------------------------
/graphs/String_insert_remove.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/String_insert_remove.png


--------------------------------------------------------------------------------
/graphs/String_lookup_miss.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/String_lookup_miss.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_lookup_hit_16384.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_lookup_hit_16384.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_insert_remove_16384.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_insert_remove_16384.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_lookup_hit_16777216.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_lookup_hit_16777216.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_lookup_miss_16384.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_lookup_miss_16384.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_lookup_hit_268435456.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_lookup_hit_268435456.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_lookup_miss_16777216.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_lookup_miss_16777216.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_lookup_miss_268435456.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_lookup_miss_268435456.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_insert_remove_16777216.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_insert_remove_16777216.png


--------------------------------------------------------------------------------
/graphs/dense_u64_sparse_u64_insert_remove_268435456.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ezrosent/art-rs/HEAD/graphs/dense_u64_sparse_u64_insert_remove_268435456.png


--------------------------------------------------------------------------------
/Cargo.toml:
--------------------------------------------------------------------------------
 1 | [package]
 2 | name = "radix-tree"
 3 | version = "0.1.0"
 4 | authors = ["eli"]
 5 | 
 6 | [dependencies]
 7 | byteorder = "1.2.1"
 8 | simd = "0.2.1"
 9 | smallvec = "0.6.0"
10 | fnv = "1.0.3"
11 | 
12 | [features]
13 | default = []
14 | print_cache_stats = []
15 | 
16 | [dev-dependencies]
17 | quickcheck = "0.6.1"
18 | rand = "0.4"
19 | criterion = "0.2"
20 | 
21 | [[bench]]
22 | name = "set_bench"
23 | harness = false
24 | 


--------------------------------------------------------------------------------
/src/lib.rs:
--------------------------------------------------------------------------------
 1 | #![feature(swap_nonoverlapping)]
 2 | #![feature(cfg_target_feature)]
 3 | #![feature(stdsimd)]
 4 | #[macro_use]
 5 | mod macros;
 6 | mod common;
 7 | mod art_impl;
 8 | mod art_internal;
 9 | mod prefix_cache;
10 | 
11 | extern crate byteorder;
12 | extern crate smallvec;
13 | 
14 | pub use common::Digital;
15 | pub use art_impl::*;
16 | #[cfg(test)]
17 | #[macro_use]
18 | extern crate quickcheck;
19 | #[cfg(test)]
20 | extern crate rand;
21 | 
#[cfg(test)]
mod tests {
    // Placeholder smoke test: it only checks integer arithmetic and does not exercise
    // anything exported by this crate.
    #[test]
    fn it_works() {
        assert_eq!(2 + 2, 4);
    }
}
29 | 


--------------------------------------------------------------------------------
/graphs/make_csv:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | # First run `cargo bench` (beware: this takes a long time and it uses a lot of memory).
 4 | # Then run this script from the crate root and redirect output to graphs/results.csv.
 5 | # Then run Rscript make_graphs.r to regenerate graphs.
 6 | 
 7 | CATEGORIES="dense_u64 sparse_u64 String"
 8 | DATA_STRUCTURES="ARTSet CachingARTSet HashSet BTreeSet"
 9 | BENCHES="lookup_hit lookup_miss insert_remove"
10 | 
11 | echo "data structure,data type,workload,number of elements,str number of elements,mean time per operation ns"
12 | for c in $CATEGORIES; do
13 | 	for d in $DATA_STRUCTURES; do
14 | 		for b in $BENCHES; do
15 | 			for sz in $(ls "target/criterion/${d}/${c}/${b}" | grep -Ev 'report|new|base|change'); do
16 | 				st_elts=$(echo "$sz" | gawk '{
17 | 				r20=rshift($1, 20)
18 | 				r10=rshift($1, 10)
19 | 				if (r20 > 0) {
20 | 					print r20"M"
21 | 				} else if (r10 > 0) {
22 | 					print r10"K"
23 | 				} else if ($1 > 0) {
24 | 					print $1
25 | 				}}')
26 | 				avg_perf=$(cat "target/criterion/${d}/${c}/${b}/${sz}/report/index.html" |
27 | 					grep '<td>Mean</td>' -A3 |
28 | 					tail -n2 |
29 | 					head -n1 |
30 | 					cut -d'>' -f2 |
31 | 					cut -d'<' -f1 | 
32 | 					awk '{ if ($2 == "ns") { print $1 } if ($2 == "us") { print 1000 * $1 } }')
33 | 				echo "$d,$c,$b,$sz,$st_elts,$avg_perf"
34 | 			done
35 | 		done
36 | 	done
37 | done
38 | 


--------------------------------------------------------------------------------
/src/macros.rs:
--------------------------------------------------------------------------------
// Dispatches on the runtime type tag of a type-erased node reference.
//
// `$base_node` is evaluated once and bound as a `$r<()>`; its `typ` field is matched against
// the `NODE_4` / `NODE_16` / `NODE_48` / `NODE_256` constants. In the matching arm the reference
// is transmuted to `$r<NodeN<$ty>>`, bound to the identifier `$nod`, and `$body` is evaluated
// with that binding in scope. An unrecognized tag panics.
//
// `$r` is the reference wrapper to use (`with_node!` passes `RawRef`, `with_node_mut!` passes
// `RawMutRef`). The four-argument form leaves the node's type parameter to inference (`_`).
//
// The expansion names `mem`, the `NODE_*` constants and the `Node*` types unqualified, so they
// must be in scope wherever the macro is invoked.
macro_rules! with_node_inner {
    ($base_node: expr, $nod: ident, $body: expr, $r: tt) => {
        with_node_inner!($base_node, $nod, $body, $r, _)
    };
    ($base_node: expr, $nod: ident, $body: expr, $r: tt, $ty: tt) => {{
        let _b: $r<()> = $base_node;
        match _b.typ {
            NODE_4 => {
                // NOTE(review): presumably silences the lint when the macro is expanded inside
                // an existing `unsafe` block -- confirm against call sites.
                #[allow(unused_unsafe)]
                let $nod = unsafe { mem::transmute::<$r<_>, $r<Node4<$ty>>>(_b) };
                $body
            }
            NODE_16 => {
                #[allow(unused_unsafe)]
                let $nod = unsafe { mem::transmute::<$r<_>, $r<Node16<$ty>>>(_b) };
                $body
            }
            NODE_48 => {
                #[allow(unused_unsafe)]
                let $nod = unsafe { mem::transmute::<$r<_>, $r<Node48<$ty>>>(_b) };
                $body
            }
            NODE_256 => {
                #[allow(unused_unsafe)]
                let $nod = unsafe { mem::transmute::<$r<_>, $r<Node256<$ty>>>(_b) };
                $body
            }
            _ => panic!("Found unrecognized node type {:?}", _b.typ),
        }
    }};
}
32 | 
// Runs `$body` with `$nod` bound to the concretely-typed node behind `$base_node`, using the
// `RawMutRef` wrapper. Forwards to `with_node_inner!`; the three-argument form leaves the
// node's type parameter to inference (`_`).
macro_rules! with_node_mut {
    ($base_node: expr, $nod: ident, $body: expr) => {
        with_node_mut!($base_node, $nod, $body, _)
    };
    ($base_node: expr, $nod: ident, $body: expr, $ty: tt) => {
        with_node_inner!($base_node, $nod, $body, RawMutRef, $ty)
    };
}
41 | 
// Runs `$body` with `$nod` bound to the concretely-typed node behind `$base_node`, using the
// `RawRef` wrapper. Forwards to `with_node_inner!`; the three-argument form leaves the node's
// type parameter to inference (`_`).
macro_rules! with_node {
    ($base_node: expr, $nod: ident, $body: expr) => {
        with_node!($base_node, $nod, $body, _)
    };
    ($base_node: expr, $nod: ident, $body: expr, $ty: tt) => {
        with_node_inner!($base_node, $nod, $body, RawRef, $ty)
    };
}
50 | 
// Conditional debug logging.
//
// When `$b` evaluates to true, prints the current file, the current line and the formatted
// message to stderr. The whole expansion is gated on `debug_assertions`, so it is compiled out
// of builds without them.
//
// Forms: `trace!(cond, "fmt", args...)`, `trace!(cond, message)` and `trace!(cond)` (empty
// message).
macro_rules! trace {
    ($b:expr, $str:expr, $( $arg:expr ),+) => {
        #[cfg(debug_assertions)]
        {
            if $b { eprintln!("{} {} {}", file!(), line!(), format!($str, $( $arg ),*)) }
        }
    };
    // A lone message is printed through "{}" rather than being used as a format string.
    ($b:expr, $str:expr) => { trace!($b, "{}", $str) };
    ($b:expr) => { trace!($b, "") };
}
61 | 


--------------------------------------------------------------------------------
/Performance.md:
--------------------------------------------------------------------------------
 1 | # ART Performance
 2 | 
 3 | We benchmarked lookups (keys within the set and keys not in the set) and
 4 | insert/delete pairs for `ARTSet` (our ART implementation), `CachingARTSet` (an
 5 | ART with a prefix cache), rust's `BTreeSet` and rust's `HashSet`. We use random
 6 | integer keys where the keys are chosen from 0 to the size of the set ("dense")
 7 | and where they are chosen from all possible 64-bit integers ("sparse"). We also
 8 | include benchmarks for random UTF-8 strings.
 9 | 
10 | ### Integers
11 | 
12 | Here we see that the ART's performance generally falls somewhere between that of
13 | the BTree and the hash table. The cache is little help for small tables or
14 | dense keys. This makes sense, as the dense keys will often share a prefix,
15 | making the likely depth of the tree fairly short, while prefix compression will
16 | ensure the absolute depth of the tree is quite low when there are few elements.
17 | Prefix caching *does*, however, make a substantial difference for sparse
18 | integers in larger tables.
19 | 
20 | ![Integer Performance 16K](graphs/dense_u64_sparse_u64_lookup_miss_16384.png?raw=true)
21 | ![Integer Performance 16M](graphs/dense_u64_sparse_u64_lookup_miss_16777216.png?raw=true)
22 | ![Integer Performance 256M](graphs/dense_u64_sparse_u64_lookup_miss_268435456.png?raw=true)
23 | 
24 | ![Integer Performance 16K](graphs/dense_u64_sparse_u64_lookup_hit_16384.png?raw=true)
25 | ![Integer Performance 16M](graphs/dense_u64_sparse_u64_lookup_hit_16777216.png?raw=true)
26 | ![Integer Performance 256M](graphs/dense_u64_sparse_u64_lookup_hit_268435456.png?raw=true)
27 | 
28 | ![Integer Performance 16K](graphs/dense_u64_sparse_u64_insert_remove_16384.png?raw=true)
29 | ![Integer Performance 16M](graphs/dense_u64_sparse_u64_insert_remove_16777216.png?raw=true)
30 | ![Integer Performance 256M](graphs/dense_u64_sparse_u64_insert_remove_268435456.png?raw=true)
31 | 
32 | ### Strings
33 | 
34 | There is a similar story here as to the integer workloads above. The benefit of
35 | caching here is, however, more pronounced for both lookups and mutations.
36 | 
37 | ![String Hits](graphs/String_lookup_hit.png?raw=true)
38 | ![String Misses](graphs/String_lookup_miss.png?raw=true)
39 | ![String Mutates](graphs/String_insert_remove.png?raw=true)
40 | 


--------------------------------------------------------------------------------
/graphs/make_graphs.r:
--------------------------------------------------------------------------------
 1 | library(ggplot2)
 2 | alldata = read.csv('graphs/results.csv')
 3 | 
 4 | strgrapher <- function(exclude, ty, wl, title) {
 5 | 	ftab = subset(subset(subset(alldata, data.type == ty), workload == wl), number.of.elements != exclude)
 6 | 	tags=ftab$data.structure
 7 | 	sizes=ftab$str.number.of.elements
 8 | 	optimes=ftab$mean.time.per.operation.ns
 9 | 	btab = data.frame(Size=sizes, Data.Structure=tags, ns.Per.Op=optimes)
10 | 	# print(btab)
11 | 	png(filename=paste('graphs/', paste(ty,wl,sep='_'), '.png', sep=''), width=600, height=600)
12 | 	posns <- c("16K", "1M", "16M")
13 | 	ggplot(btab, aes(fill=Data.Structure,y=ns.Per.Op, x=Size)) + 
14 | 		scale_x_discrete(limits=posns) +
15 | 		geom_bar(position="dodge", stat="identity") +
16 | 		labs(title=title, x="Number of Elements", y="ns Per Operation")
17 | }
18 | 
# Draw a grouped bar chart comparing two integer data types (`ty1`, plotted as "dense", and
# `ty2`, plotted as "sparse") for one workload (`wl`) at one set size (`size`), with one
# group of bars per data structure, into graphs/<ty1>_<ty2>_<wl>_<size>.png.
# Reads the global `alldata`.
intgrapher <- function(size, ty1, ty2, wl, title) {
	ftab1 = subset(alldata, number.of.elements == size & data.type == ty1 & workload == wl)
	ftab2 = subset(alldata, number.of.elements == size & data.type == ty2 & workload == wl)
	png(filename=paste('graphs/', paste(ty1,ty2,wl,size,sep='_'), '.png', sep=''), width=600, height=600)
	# Each half of the table is labelled from its own rows, so the columns stay aligned
	# even when the two subsets differ in length or row order.
	tags = c(rep('dense', nrow(ftab1)),
		 rep('sparse', nrow(ftab2)))
	# as.character() keeps c() from collapsing factor columns to their integer codes.
	btab = data.frame(Data.Structure=c(as.character(ftab1$data.structure),
					   as.character(ftab2$data.structure)),
			  ns.Per.Operation=c(ftab1$mean.time.per.operation.ns, ftab2$mean.time.per.operation.ns),
			  workload=tags)
	ggplot(btab, aes(fill=workload, y=ns.Per.Operation, x=Data.Structure)) +
		geom_bar(position="dodge", stat="identity") +
		labs(title=title, x="Data Structure", y="ns Per Operation")
}
32 | 
# Integer graphs: one image per workload and set size, dense vs. sparse keys.

# Lookups of keys that are present.
intgrapher(16384,     'dense_u64', 'sparse_u64', 'lookup_hit',
	  'Lookups for elements in the set with integer keys, 16K elements')
intgrapher(16777216,  'dense_u64', 'sparse_u64', 'lookup_hit',
	  'Lookups for elements in the set with integer keys, 16M elements')
intgrapher(268435456, 'dense_u64', 'sparse_u64', 'lookup_hit',
	  'Lookups for elements in the set with integer keys, 256M elements')

# Lookups of keys that are absent.
intgrapher(16384,     'dense_u64', 'sparse_u64', 'lookup_miss',
	  'Lookups for elements not in the set with integer keys, 16K elements')
intgrapher(16777216,  'dense_u64', 'sparse_u64', 'lookup_miss',
	  'Lookups for elements not in the set with integer keys, 16M elements')
intgrapher(268435456, 'dense_u64', 'sparse_u64', 'lookup_miss',
	  'Lookups for elements not in the set with integer keys, 256M elements')

# Insert/remove pairs.
intgrapher(16384,     'dense_u64', 'sparse_u64', 'insert_remove',
	  'Insert/Remove pairs with integer keys, 16K elements')
intgrapher(16777216,  'dense_u64', 'sparse_u64', 'insert_remove',
	  'Insert/Remove pairs with integer keys, 16M elements')
intgrapher(268435456, 'dense_u64', 'sparse_u64', 'insert_remove',
	  'Insert/Remove pairs with integer keys, 256M elements')

# String graphs: one image per workload; rows with 67108864 elements are excluded.
strgrapher(67108864,'String', 'lookup_hit', 'Lookups in the set, UTF-8 Strings of mean length 10')
strgrapher(67108864,'String', 'lookup_miss', 'Lookups not in the set, UTF-8 Strings of mean length 10')
strgrapher(67108864,'String', 'insert_remove', 'Insert/Remove Pairs, UTF-8 Strings of mean length 10')
57 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # art-rs: Efficient ordered containers.
 2 | The adaptive radix tree (ART) is an efficient radix tree (aka trie) design introduced by [Leis, Kemper
 3 | and
 4 | Neumann](https://15721.courses.cs.cmu.edu/spring2018/papers/09-oltpindexes2/leis-icde2013.pdf) in 2013.
 5 | This includes an implementation of the ART data-structure described in that
 6 | work, along with experimental support for *prefix-caching*.
 7 | 
 8 | ## Overview
 9 | 
10 | ARTs operate on types that can be decomposed into sequences of bytes. If the
11 | types are ordered, and these byte sequences (with a lexicographic ordering)
12 | respect the ordering on the type, then ARTs also support efficient range scans.
13 | Because most ordered types can also be efficiently decomposed to byte
14 | sequences[1], this makes them a potential alternative to ordered tree
15 | data-structures, like Rust's `BTreeSet` or `std::set` in C++ (often a Red-Black
16 | Tree).
17 | 
18 | Compared to the classic [Trie datastructure](https://en.wikipedia.org/wiki/Trie),
19 | the ART paper details lots of intricate optimizations to speed up lookups and
20 | insertions. The most important of these are:
21 | 
22 |   * *Prefix Compression*: A sequence of interior nodes that do not point directly to a
23 |     leaf can be compressed into a single node, thus reducing the length of the
24 |     path that must be traversed.
25 | 
26 |   * *Lazy Expansion*: A sequence of interior nodes that only point to a single
27 |     leaf can be elided entirely.
28 | 
29 |   * *Specialized Interior Nodes*: Inner nodes in the tree have specialized
30 |     implementations for ones with up to 4, 16, 48 and 256 children. This
31 |     balances space efficiency with the speed of lookups.
32 | 
33 | See the ART paper for a more complete description of these features.
34 |   
35 | 
36 | ## Prefix-Caching
37 | 
38 | Keys for this data-structure can be decomposed into byte sequences. Short byte
39 | sequences can be hashed efficiently. This repo provides variants of the ART
40 | that store a hash table mapping from key prefixes to *interior nodes* within
41 | the tree. This allows traversals for either mutation operations or lookups to
42 | skip several levels of the tree in their traversal.  This sort of trick is much
43 | harder for ordered tree data-structures, as their keys do not necessarily have
44 | the needed structure, and they may have more complicated rebalancing operations
45 | which can make it more difficult to maintain the validity of the hash table.
46 | 
47 | The length of the cached prefixes can be customized, allowing you to limit the
48 | maximum size of the cache.
49 | 
50 | ## Performance
51 | 
52 | While not complete, we have a number of benchmarks that compare the ART-based
53 | data-structures to rust's `HashSet` and `BTreeSet`. They show promising
54 | performance for the vanilla ART implementation, and demonstrate that prefix
55 | caching can improve performance even further when the set is large. See
56 | `Performance.md` for more information and measurements.
57 | 
58 | ## TODOs
59 | 
60 | This implementation is very rough, and likely contains bugs. On top of general
61 | code improvements, there is also still a lot to do to get it to feature-parity
62 | with the standard Rust container types.
63 | 
64 | ### API Parity with `BTreeSet`
65 | This includes good implementations of set operations, as well as a proper
66 | iterator API. While we have a callback-based traversal API, we lack an idiomatic iterator
67 | implementation.
68 | 
69 | ### Bulk Insertions
70 | The ART paper describes a method for performing optimized bulk insertions of
71 | values, which is not yet implemented in this code-base.
72 | 
73 | ### Multithreading
74 | While [follow-up work](https://db.in.tum.de/~leis/papers/artsync.pdf)
75 | implemented synchronization for the ART, this repo only includes a
76 | single-threaded implementation. I am interested in implementing a multithreaded
77 | version at some point in the future.
78 | 
79 | ### Slab Allocation
80 | We currently do heap allocations for all new interior nodes and leaf nodes. At
81 | the very least interior nodes could probably benefit from slab allocation.
82 | 
83 | ### Space-optimized Prefix Caching
84 | Because real-world map workloads are often skewed towards a small subset of the
85 | keys, it should be possible to tune the prefix cache to store a small subset of
86 | keys. This would reduce the space overhead of the cache while still hopefully
87 | preserving most of the performance gains.
88 | 
89 | 
90 | [1]: See section 4 of the paper for more information on this. In this code, it
91 | is encapsulated by the `Digital` trait, which has implementations for common
92 | integer and string types.
93 | 


--------------------------------------------------------------------------------
/src/common.rs:
--------------------------------------------------------------------------------
  1 | use std::iter::Iterator;
  2 | use std::str;
  3 | use super::byteorder::{BigEndian, ByteOrder};
  4 | 
/// `Digital` describes types that can be expressed as sequences of bytes.
///
/// The type's `digits` should respect equality and ordering on the type.
/// Furthermore, if the `digits` of one value are a prefix of the `digits`
/// of another value of the same type, the two values must be equal.
///
/// The lifetime `'a` lets the returned iterator borrow from the value it was created from.
///
/// TODO implement floating point support. This is described in the ART paper but a couple details
/// are left out.
///
/// TODO implement macro/derive that will create a "digits" representation for any ordered type.
pub trait Digital<'a> {
    // TODO: consider providing a more efficient interface here (e.g. passing a slice directly)
    /// Iterator over the bytes ("digits") of a value.
    type I: Iterator<Item = u8> + 'a;
    /// Defaults to `None`. The `str` and `String` implementations set it to `Some(0)`, the
    /// byte their digit sequences end with.
    /// NOTE(review): presumably the byte that marks the end of every digit sequence of the
    /// type, when there is one -- confirm against the users of this constant.
    const STOP_CHARACTER: Option<u8> = None;
    /// Returns the byte sequence representing `self`.
    fn digits(&'a self) -> Self::I;
}
 21 | 
 22 | pub struct U32BytesIterator {
 23 |     cursor: usize,
 24 |     bytes: [u8; 4],
 25 | }
 26 | 
 27 | impl Iterator for U32BytesIterator {
 28 |     type Item = u8;
 29 |     fn next(&mut self) -> Option<u8> {
 30 |         if self.cursor < 4 {
 31 |             self.cursor += 1;
 32 |             Some(self.bytes[self.cursor - 1])
 33 |         } else {
 34 |             None
 35 |         }
 36 |     }
 37 | 
 38 |     fn nth(&mut self, n: usize) -> Option<u8> {
 39 |         self.cursor += n;
 40 |         self.next()
 41 |     }
 42 | }
 43 | 
 44 | impl<'a> Digital<'a> for u32 {
 45 |     type I = U32BytesIterator;
 46 |     fn digits(&self) -> U32BytesIterator {
 47 |         let mut res = U32BytesIterator {
 48 |             cursor: 0,
 49 |             bytes: [0; 4],
 50 |         };
 51 |         BigEndian::write_u32(&mut res.bytes, *self);
 52 |         res
 53 |     }
 54 | }
 55 | 
 56 | impl<'a> Digital<'a> for i32 {
 57 |     type I = U32BytesIterator;
 58 |     fn digits(&self) -> U32BytesIterator {
 59 |         let mut res = U32BytesIterator {
 60 |             cursor: 0,
 61 |             bytes: [0; 4],
 62 |         };
 63 |         BigEndian::write_i32(&mut res.bytes, *self ^ (1 << 31));
 64 |         res
 65 |     }
 66 | }
 67 | 
 68 | impl<'a> Digital<'a> for i64 {
 69 |     type I = U64BytesIterator;
 70 |     fn digits(&self) -> U64BytesIterator {
 71 |         let mut res = U64BytesIterator {
 72 |             cursor: 0,
 73 |             bytes: [0; 8],
 74 |         };
 75 |         BigEndian::write_i64(&mut res.bytes, *self ^ (1 << 63));
 76 |         res
 77 |     }
 78 | }
 79 | 
 80 | impl<'a> Digital<'a> for usize {
 81 |     // Just treat usize as u64. This should (inefficiently) support platforms with a smaller type,
 82 |     // and we debug-assert that usize <= u64 in size.
 83 |     type I = U64BytesIterator;
 84 |     fn digits(&self) -> Self::I {
 85 |         debug_assert!(::std::mem::size_of::<usize>() <= ::std::mem::size_of::<u64>());
 86 |         (*self as u64).digits()
 87 |     }
 88 | }
 89 | 
 90 | impl<'a> Digital<'a> for isize {
 91 |     type I = U64BytesIterator;
 92 |     fn digits(&self) -> Self::I {
 93 |         debug_assert!(::std::mem::size_of::<isize>() <= ::std::mem::size_of::<i64>());
 94 |         (*self as i64).digits()
 95 |     }
 96 | }
 97 | 
 98 | pub struct U64BytesIterator {
 99 |     cursor: usize,
100 |     bytes: [u8; 8],
101 | }
102 | 
103 | impl Iterator for U64BytesIterator {
104 |     type Item = u8;
105 |     fn next(&mut self) -> Option<u8> {
106 |         if self.cursor < 8 {
107 |             self.cursor += 1;
108 |             Some(self.bytes[self.cursor - 1])
109 |         } else {
110 |             None
111 |         }
112 |     }
113 | 
114 |     fn nth(&mut self, n: usize) -> Option<u8> {
115 |         self.cursor += n;
116 |         self.next()
117 |     }
118 | }
119 | 
120 | impl<'a> Digital<'a> for u64 {
121 |     type I = U64BytesIterator;
122 |     fn digits(&self) -> U64BytesIterator {
123 |         let mut res = U64BytesIterator {
124 |             cursor: 0,
125 |             bytes: [0; 8],
126 |         };
127 |         BigEndian::write_u64(&mut res.bytes, *self);
128 |         res
129 |     }
130 | }
131 | 
/// NullTerminate transforms an iterator over the bytes of a valid UTF-8 string into an
/// iterator suitable for use in a `Digital` implementation. This comes for free in languages using
/// C-style ASCII strings by convention, because null-termination guarantees the "prefixes"
/// property of the trait.
///
/// In Rust, strings are most commonly encoded as UTF-8. For such strings, NUL characters are
/// kosher in the middle of a string, and picking a different byte as a terminator character will
/// ruin the compatibility with Ord[0]. To ensure that a null terminator is valid, we increase the
/// value of all bytes emitted by `I` by 1. We are guaranteed no overflow by the fact that 255 is
/// an invalid byte for UTF-8 strings. Given no overflow, equality and ordering are clearly
/// conserved.
///
/// The emitted sequence is therefore every byte of `I` plus one, followed by a single `0`.
///
/// [0]: To see why this is the case, take the byte 255 as the terminator and consider "" and
/// "a". "" < "a", but the digits of "" (`[255]`) are greater than the digits of "a"
/// (`[b'a', 255]`).
pub struct NullTerminate<I> {
    /// Set once the terminating `0` has been emitted (or skipped past).
    done: bool,
    /// Source of the unshifted bytes.
    i: I,
}

impl<I> NullTerminate<I> {
    /// Wraps `i`; nothing has been consumed yet.
    fn new(i: I) -> Self {
        NullTerminate { done: false, i: i }
    }
}

impl<I: Iterator<Item = u8>> Iterator for NullTerminate<I> {
    type Item = u8;

    /// Yields the next shifted byte, then the `0` terminator exactly once, then `None`.
    fn next(&mut self) -> Option<u8> {
        if self.done {
            return None;
        }
        match self.i.next() {
            Some(s) => {
                debug_assert!(s < 255);
                Some(s + 1)
            }
            None => {
                self.done = true;
                Some(0)
            }
        }
    }

    /// Skips `n` elements and yields the one after them, matching what `n + 1` calls to `next`
    /// would return last.
    ///
    /// The wrapped iterator must report an exact `size_hint`; that is how the position of the
    /// terminator is found without stepping through the bytes one at a time.
    fn nth(&mut self, n: usize) -> Option<u8> {
        if self.done {
            return None;
        }
        let (remaining, _max) = self.i.size_hint();
        debug_assert_eq!(
            Some(remaining),
            _max,
            "must use iterator with exact length for NullTerminate"
        );
        if n < remaining {
            // Still inside the wrapped bytes (indices 0..remaining).
            self.i.nth(n).map(|x| {
                debug_assert!(x < 255);
                x + 1
            })
        } else {
            // Index `remaining` is the terminator itself; anything larger is past the end.
            // Either way the sequence is finished afterwards.
            self.done = true;
            if n == remaining {
                Some(0)
            } else {
                None
            }
        }
    }
}
191 | 
192 | impl<'a> Digital<'a> for str {
193 |     type I = NullTerminate<str::Bytes<'a>>;
194 |     const STOP_CHARACTER: Option<u8> = Some(0);
195 |     fn digits(&'a self) -> Self::I {
196 |         NullTerminate::new(self.bytes())
197 |     }
198 | }
199 | 
200 | impl<'a> Digital<'a> for String {
201 |     type I = NullTerminate<str::Bytes<'a>>;
202 |     const STOP_CHARACTER: Option<u8> = Some(0);
203 |     fn digits(&'a self) -> Self::I {
204 |         NullTerminate::new(self.as_str().bytes())
205 |     }
206 | }
207 | 
#[cfg(test)]
mod tests {
    use super::*;

    /// Checks that the digit sequences of `x` and `y` compare the same way the values do:
    /// strictly less when `x < y`, greater-or-equal otherwise.
    fn test_digits_obey_order<D: for<'a> Digital<'a> + PartialOrd>(x: D, y: D) -> bool {
        let vx: Vec<_> = x.digits().collect();
        let vy: Vec<_> = y.digits().collect();
        if x < y {
            vx < vy
        } else {
            vx >= vy
        }
    }

    // One property per `Digital` implementation. The integer properties scale their inputs
    // (shift or multiply) before comparing, so that more than the lowest byte is populated.
    quickcheck! {
        fn digits_strings(x: String, y: String) -> bool {
            test_digits_obey_order(x, y)
        }

        fn digits_u64(x: u64, y: u64) -> bool {
            // why shift left? the RNG seems to generate numbers <256, so endianness bugs do not
            // get caught!
            test_digits_obey_order(x.wrapping_shl(20), y.wrapping_shl(20))
        }

        fn digits_u32(x: u32, y: u32) -> bool {
            test_digits_obey_order(x.wrapping_shl(20), y.wrapping_shl(20))
        }

        fn digits_i32(x: i32, y: i32) -> bool {
            test_digits_obey_order(x.wrapping_mul(1 << 10), y.wrapping_mul(1 << 10))
        }

        fn digits_i64(x: i64, y: i64) -> bool {
            test_digits_obey_order(x.wrapping_mul(1 << 20), y.wrapping_mul(1 << 20))
        }

        fn digits_isize(x: isize, y: isize) -> bool {
            test_digits_obey_order(x.wrapping_mul(1 << 20), y.wrapping_mul(1 << 20))
        }

        fn digits_usize(x: usize, y: usize) -> bool {
            test_digits_obey_order(x.wrapping_shl(20), y.wrapping_shl(20))
        }
    }
}
254 | 


--------------------------------------------------------------------------------
/benches/set_bench.rs:
--------------------------------------------------------------------------------
  1 | #[macro_use]
  2 | extern crate criterion;
  3 | extern crate radix_tree;
  4 | extern crate rand;
  5 | 
  6 | use criterion::{Bencher, Criterion};
  7 | use rand::{Rng, SeedableRng, StdRng};
  8 | use std::collections::btree_set::BTreeSet;
  9 | use std::collections::HashSet;
 10 | use std::hash::Hash;
 11 | 
 12 | use radix_tree::{ARTSet, ArtElement, CachingARTSet, Digital, PrefixCache, RawART};
 13 | 
 14 | /// We use a deterministic seed when generating random data to cut down on variance between
 15 | /// different benchmark runs.
 16 | const RAND_SEED: [usize; 32] = [1; 32];
 17 | 
/// Barebones set trait to abstract over various collections.
///
/// Implemented in this file for the ART-based sets, `HashSet` and `BTreeSet`.
trait Set<T> {
    /// Creates an empty set.
    fn new() -> Self;
    /// Returns whether `t` is in the set.
    fn contains(&self, t: &T) -> bool;
    /// Adds `t` to the set.
    fn insert(&mut self, t: T);
    /// Removes `t` from the set, returning the `bool` reported by the underlying collection's
    /// removal method.
    fn delete(&mut self, t: &T) -> bool;
}
 25 | 
/// Per-key-type configuration for the ART-based sets under benchmark.
trait ARTArg {
    /// Value passed to `with_prefix_buckets` when a `RawART` is created through `Set::new`.
    const PREFIX_LEN: usize;
}

impl ARTArg for u64 {
    const PREFIX_LEN: usize = 3;
}

impl ARTArg for String {
    const PREFIX_LEN: usize = 8;
}
 37 | 
/// Adapts `RawART` (with any prefix cache `C`) to the benchmark's `Set` interface.
impl<T: ARTArg + for<'a> Digital<'a> + Ord, C: PrefixCache<ArtElement<T>>> Set<T>
    for RawART<ArtElement<T>, C>
{
    fn new() -> Self {
        // The prefix-bucket setting comes from the key type's `ARTArg` implementation.
        Self::with_prefix_buckets(T::PREFIX_LEN)
    }
    fn contains(&self, t: &T) -> bool {
        // NOTE(review): presumably resolves to an inherent `RawART::contains`, which would take
        // precedence over this trait method -- confirm; otherwise this call recurses.
        self.contains(t)
    }
    fn insert(&mut self, t: T) {
        // Whatever `replace` returns is deliberately discarded.
        self.replace(t);
    }
    fn delete(&mut self, t: &T) -> bool {
        self.remove(t)
    }
}
 54 | 
 55 | impl<T: Hash + Eq> Set<T> for HashSet<T> {
 56 |     fn new() -> Self {
 57 |         HashSet::new()
 58 |     }
 59 |     fn contains(&self, t: &T) -> bool {
 60 |         self.get(t).is_some()
 61 |     }
 62 |     fn insert(&mut self, t: T) {
 63 |         self.replace(t);
 64 |     }
 65 |     fn delete(&mut self, t: &T) -> bool {
 66 |         self.remove(t)
 67 |     }
 68 | }
 69 | 
 70 | impl<T: Ord> Set<T> for BTreeSet<T> {
 71 |     fn new() -> Self {
 72 |         BTreeSet::new()
 73 |     }
 74 |     fn contains(&self, t: &T) -> bool {
 75 |         self.get(t).is_some()
 76 |     }
 77 |     fn insert(&mut self, t: T) {
 78 |         self.replace(t);
 79 |     }
 80 |     fn delete(&mut self, t: &T) -> bool {
 81 |         self.remove(t)
 82 |     }
 83 | }
 84 | 
 85 | fn random_vec(len: usize, max_val: u64) -> Vec<u64> {
 86 |     let mut rng = StdRng::from_seed(&RAND_SEED[..]);
 87 |     (0..len.next_power_of_two())
 88 |         .map(|_| rng.gen_range::<u64>(0, max_val))
 89 |         .collect()
 90 | }
 91 | 
 92 | fn random_dense_vec(len: u64, bias: u64) -> Vec<u64> {
 93 |     let mut rng = StdRng::from_seed(&RAND_SEED[..]);
 94 |     let mut res = (0..len.next_power_of_two())
 95 |         .map(|x| x + bias)
 96 |         .collect::<Vec<u64>>();
 97 |     rng.shuffle(res.as_mut_slice());
 98 |     res
 99 | }
100 | 
101 | fn random_string_vec(max_len: usize, len: usize) -> Vec<String> {
102 |     let mut rng = StdRng::from_seed(&RAND_SEED[..]);
103 |     (0..len.next_power_of_two())
104 |         .map(|_| {
105 |             let mlen = max_len as isize;
106 |             let s_len = mlen + rng.gen_range::<isize>(-mlen / 2, mlen / 2);
107 |             rng.gen_iter::<char>()
108 |                 .take(s_len as usize)
109 |                 .collect::<String>()
110 |         })
111 |         .collect()
112 | }
113 | 
114 | fn bench_set_rand_int_lookup<T: for<'a> Digital<'a>, S: Set<T>>(
115 |     b: &mut Bencher,
116 |     contents: &S,
117 |     lookups: &Vec<T>,
118 | ) {
119 |     assert!(lookups.len().is_power_of_two());
120 |     let mut ix = 0;
121 |     b.iter(|| {
122 |         contents.contains(&lookups[ix]);
123 |         ix += 1;
124 |         ix = ix & (lookups.len() - 1);
125 |     })
126 | }
127 | 
128 | fn bench_set_insert_remove<T: Clone + for<'a> Digital<'a>, S: Set<T>>(
129 |     b: &mut Bencher,
130 |     contents: &mut S,
131 |     lookups: &Vec<T>,
132 | ) {
133 |     assert!(lookups.len().is_power_of_two());
134 |     let mut ix = 0;
135 |     b.iter(|| {
136 |         contents.insert(lookups[ix].clone());
137 |         ix += 1;
138 |         ix = ix & (lookups.len() - 1);
139 |         contents.delete(&lookups[ix]);
140 |         // Why += 2? lookups has an even length, but we don't want all inserts to converge to
141 |         // "replace" ops (similarly, deletes should sometimes succeed).
142 |         // TODO: There's probably a more principled way of doing this.
143 |         ix += 2;
144 |         ix = ix & (lookups.len() - 1);
145 |     })
146 | }
147 | 
148 | fn criterion_benchmark(c: &mut Criterion) {
149 |     use std::fmt::{Debug, Error, Formatter};
150 |     #[derive(Clone)]
151 |     struct SizeVec<T>(Vec<T>, Vec<T>);
152 |     impl<T> Debug for SizeVec<T> {
153 |         fn fmt(&self, f: &mut Formatter) -> Result<(), Error> {
154 |             write!(f, "{:?}", self.0.len())
155 |         }
156 |     }
157 |     fn make_bench<T: 'static + Clone + for<'a> Digital<'a>, S: Set<T> + 'static>(
158 |         c: &mut Criterion,
159 |         desc: String,
160 |         inp: &Vec<SizeVec<T>>,
161 |     ) {
162 |         eprintln!("Generating for {} (1/3)", desc);
163 |         struct Wrap<S, T>(SizeVec<S>, Box<T>);
164 |         impl<S, T> Debug for Wrap<S, T> {
165 |             fn fmt(&self, f: &mut Formatter) -> Result<(), Error> {
166 |                 write!(f, "{:?}", self.0)
167 |             }
168 |         }
169 |         let sets1 = inp.iter()
170 |             .map(|sv| {
171 |                 let mut s = S::new();
172 |                 for i in sv.0.iter() {
173 |                     s.insert(i.clone());
174 |                 }
175 |                 Wrap(sv.clone(), Box::new(s))
176 |             })
177 |             .collect::<Vec<Wrap<_, _>>>();
178 |         c.bench_function_over_inputs(
179 |             &format!("{}/lookup_hit", desc),
180 |             |b, &Wrap(ref sv, ref s)| bench_set_rand_int_lookup::<T, S>(b, &*s, &sv.0),
181 |             sets1,
182 |         );
183 |         eprintln!("Generating for {} (2/3)", desc);
184 |         let sets2 = inp.iter()
185 |             .map(|sv| {
186 |                 let mut s = S::new();
187 |                 for i in sv.0.iter() {
188 |                     s.insert(i.clone());
189 |                 }
190 |                 Wrap(sv.clone(), Box::new(s))
191 |             })
192 |             .collect::<Vec<Wrap<_, _>>>();
193 |         c.bench_function_over_inputs(
194 |             &format!("{}/lookup_miss", desc),
195 |             |b, &Wrap(ref sv, ref s)| bench_set_rand_int_lookup::<T, S>(b, &*s, &sv.1),
196 |             sets2,
197 |         );
198 |         eprintln!("Generating for {} (3/3)", desc);
199 |         use std::cell::UnsafeCell;
200 |         let sets3 = inp.iter()
201 |             .map(|sv| {
202 |                 let mut s = S::new();
203 |                 for i in sv.0.iter() {
204 |                     s.insert(i.clone());
205 |                 }
206 |                 Wrap(sv.clone(), Box::new(UnsafeCell::new(s)))
207 |             })
208 |             .collect::<Vec<Wrap<_, _>>>();
209 |         unsafe {
210 |             c.bench_function_over_inputs(
211 |                 &format!("{}/insert_remove", desc),
212 |                 |b, &Wrap(ref sv, ref s)| bench_set_insert_remove::<T, S>(b, &mut *s.get(), &sv.0),
213 |                 sets3,
214 |             );
215 |         }
216 |     }
217 |     macro_rules! bench_inner {
218 |         ($c: expr, $container: tt, $ivec: expr, $ivec2: expr, $svec: expr) => {{
219 |             make_bench::<u64, $container<u64>>($c, format!("{}/sparse_u64", stringify!($container)), $ivec);
220 |             make_bench::<u64, $container<u64>>($c, format!("{}/dense_u64", stringify!($container)), $ivec2);
221 |             make_bench::<String, $container<String>>(
222 |                 $c,
223 |                 format!("{}/String", stringify!($container)),
224 |                 $svec,
225 |             );
226 |         }};
227 |     }
228 |     macro_rules! bench_all {
229 |         ($c:expr, $ivec:expr, $ivec2:expr, $svec:expr, $( $container:tt ),+) => {
230 |             $(
231 |                 bench_inner!($c, $container, $ivec, $ivec2, $svec);
232 |             )+
233 |         }
234 |     }
235 |     eprintln!("Generating Ints");
236 |     let v1s: Vec<SizeVec<u64>> = [16 << 10, 16 << 20, 256 << 20]
237 |         .iter()
238 |         .map(|size: &usize| SizeVec(random_vec(*size, !0), random_vec(*size, !0)))
239 |         .collect();
240 |     let v1_dense: Vec<SizeVec<u64>> = [16 << 10, 16 << 20, 256 << 20]
241 |         .iter()
242 |         .map(|size: &usize| {
243 |             SizeVec(
244 |                 random_dense_vec(*size as u64, 0),
245 |                 random_dense_vec(*size as u64, *size as u64 * 2),
246 |             )
247 |         })
248 |         .collect();
249 |     eprintln!("Generating Strings");
250 |     let v2s: Vec<SizeVec<String>> = [16 << 10, 1 << 20, 16 << 20]
251 |         .iter()
252 |         // NB: random_string_vec will make random UTF8 strings, in practice asking for a string of
253 |         // length 10 can give you far more than 10 bytes.
254 |         .map(|size: &usize| SizeVec(random_string_vec(10, *size), random_string_vec(10, *size)))
255 |         .collect();
256 | 
257 |     bench_all!(
258 |         c,
259 |         &v1s,
260 |         &v1_dense,
261 |         &v2s,
262 |         ARTSet,
263 |         HashSet,
264 |         BTreeSet,
265 |         CachingARTSet
266 |     );
267 | }
268 | 
269 | criterion_group!(benches, criterion_benchmark);
270 | criterion_main!(benches);
271 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
  1 |                                  Apache License
  2 |                            Version 2.0, January 2004
  3 |                         http://www.apache.org/licenses/
  4 | 
  5 |    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
  6 | 
  7 |    1. Definitions.
  8 | 
  9 |       "License" shall mean the terms and conditions for use, reproduction,
 10 |       and distribution as defined by Sections 1 through 9 of this document.
 11 | 
 12 |       "Licensor" shall mean the copyright owner or entity authorized by
 13 |       the copyright owner that is granting the License.
 14 | 
 15 |       "Legal Entity" shall mean the union of the acting entity and all
 16 |       other entities that control, are controlled by, or are under common
 17 |       control with that entity. For the purposes of this definition,
 18 |       "control" means (i) the power, direct or indirect, to cause the
 19 |       direction or management of such entity, whether by contract or
 20 |       otherwise, or (ii) ownership of fifty percent (50%) or more of the
 21 |       outstanding shares, or (iii) beneficial ownership of such entity.
 22 | 
 23 |       "You" (or "Your") shall mean an individual or Legal Entity
 24 |       exercising permissions granted by this License.
 25 | 
 26 |       "Source" form shall mean the preferred form for making modifications,
 27 |       including but not limited to software source code, documentation
 28 |       source, and configuration files.
 29 | 
 30 |       "Object" form shall mean any form resulting from mechanical
 31 |       transformation or translation of a Source form, including but
 32 |       not limited to compiled object code, generated documentation,
 33 |       and conversions to other media types.
 34 | 
 35 |       "Work" shall mean the work of authorship, whether in Source or
 36 |       Object form, made available under the License, as indicated by a
 37 |       copyright notice that is included in or attached to the work
 38 |       (an example is provided in the Appendix below).
 39 | 
 40 |       "Derivative Works" shall mean any work, whether in Source or Object
 41 |       form, that is based on (or derived from) the Work and for which the
 42 |       editorial revisions, annotations, elaborations, or other modifications
 43 |       represent, as a whole, an original work of authorship. For the purposes
 44 |       of this License, Derivative Works shall not include works that remain
 45 |       separable from, or merely link (or bind by name) to the interfaces of,
 46 |       the Work and Derivative Works thereof.
 47 | 
 48 |       "Contribution" shall mean any work of authorship, including
 49 |       the original version of the Work and any modifications or additions
 50 |       to that Work or Derivative Works thereof, that is intentionally
 51 |       submitted to Licensor for inclusion in the Work by the copyright owner
 52 |       or by an individual or Legal Entity authorized to submit on behalf of
 53 |       the copyright owner. For the purposes of this definition, "submitted"
 54 |       means any form of electronic, verbal, or written communication sent
 55 |       to the Licensor or its representatives, including but not limited to
 56 |       communication on electronic mailing lists, source code control systems,
 57 |       and issue tracking systems that are managed by, or on behalf of, the
 58 |       Licensor for the purpose of discussing and improving the Work, but
 59 |       excluding communication that is conspicuously marked or otherwise
 60 |       designated in writing by the copyright owner as "Not a Contribution."
 61 | 
 62 |       "Contributor" shall mean Licensor and any individual or Legal Entity
 63 |       on behalf of whom a Contribution has been received by Licensor and
 64 |       subsequently incorporated within the Work.
 65 | 
 66 |    2. Grant of Copyright License. Subject to the terms and conditions of
 67 |       this License, each Contributor hereby grants to You a perpetual,
 68 |       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
 69 |       copyright license to reproduce, prepare Derivative Works of,
 70 |       publicly display, publicly perform, sublicense, and distribute the
 71 |       Work and such Derivative Works in Source or Object form.
 72 | 
 73 |    3. Grant of Patent License. Subject to the terms and conditions of
 74 |       this License, each Contributor hereby grants to You a perpetual,
 75 |       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
 76 |       (except as stated in this section) patent license to make, have made,
 77 |       use, offer to sell, sell, import, and otherwise transfer the Work,
 78 |       where such license applies only to those patent claims licensable
 79 |       by such Contributor that are necessarily infringed by their
 80 |       Contribution(s) alone or by combination of their Contribution(s)
 81 |       with the Work to which such Contribution(s) was submitted. If You
 82 |       institute patent litigation against any entity (including a
 83 |       cross-claim or counterclaim in a lawsuit) alleging that the Work
 84 |       or a Contribution incorporated within the Work constitutes direct
 85 |       or contributory patent infringement, then any patent licenses
 86 |       granted to You under this License for that Work shall terminate
 87 |       as of the date such litigation is filed.
 88 | 
 89 |    4. Redistribution. You may reproduce and distribute copies of the
 90 |       Work or Derivative Works thereof in any medium, with or without
 91 |       modifications, and in Source or Object form, provided that You
 92 |       meet the following conditions:
 93 | 
 94 |       (a) You must give any other recipients of the Work or
 95 |           Derivative Works a copy of this License; and
 96 | 
 97 |       (b) You must cause any modified files to carry prominent notices
 98 |           stating that You changed the files; and
 99 | 
100 |       (c) You must retain, in the Source form of any Derivative Works
101 |           that You distribute, all copyright, patent, trademark, and
102 |           attribution notices from the Source form of the Work,
103 |           excluding those notices that do not pertain to any part of
104 |           the Derivative Works; and
105 | 
106 |       (d) If the Work includes a "NOTICE" text file as part of its
107 |           distribution, then any Derivative Works that You distribute must
108 |           include a readable copy of the attribution notices contained
109 |           within such NOTICE file, excluding those notices that do not
110 |           pertain to any part of the Derivative Works, in at least one
111 |           of the following places: within a NOTICE text file distributed
112 |           as part of the Derivative Works; within the Source form or
113 |           documentation, if provided along with the Derivative Works; or,
114 |           within a display generated by the Derivative Works, if and
115 |           wherever such third-party notices normally appear. The contents
116 |           of the NOTICE file are for informational purposes only and
117 |           do not modify the License. You may add Your own attribution
118 |           notices within Derivative Works that You distribute, alongside
119 |           or as an addendum to the NOTICE text from the Work, provided
120 |           that such additional attribution notices cannot be construed
121 |           as modifying the License.
122 | 
123 |       You may add Your own copyright statement to Your modifications and
124 |       may provide additional or different license terms and conditions
125 |       for use, reproduction, or distribution of Your modifications, or
126 |       for any such Derivative Works as a whole, provided Your use,
127 |       reproduction, and distribution of the Work otherwise complies with
128 |       the conditions stated in this License.
129 | 
130 |    5. Submission of Contributions. Unless You explicitly state otherwise,
131 |       any Contribution intentionally submitted for inclusion in the Work
132 |       by You to the Licensor shall be under the terms and conditions of
133 |       this License, without any additional terms or conditions.
134 |       Notwithstanding the above, nothing herein shall supersede or modify
135 |       the terms of any separate license agreement you may have executed
136 |       with Licensor regarding such Contributions.
137 | 
138 |    6. Trademarks. This License does not grant permission to use the trade
139 |       names, trademarks, service marks, or product names of the Licensor,
140 |       except as required for reasonable and customary use in describing the
141 |       origin of the Work and reproducing the content of the NOTICE file.
142 | 
143 |    7. Disclaimer of Warranty. Unless required by applicable law or
144 |       agreed to in writing, Licensor provides the Work (and each
145 |       Contributor provides its Contributions) on an "AS IS" BASIS,
146 |       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
147 |       implied, including, without limitation, any warranties or conditions
148 |       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
149 |       PARTICULAR PURPOSE. You are solely responsible for determining the
150 |       appropriateness of using or redistributing the Work and assume any
151 |       risks associated with Your exercise of permissions under this License.
152 | 
153 |    8. Limitation of Liability. In no event and under no legal theory,
154 |       whether in tort (including negligence), contract, or otherwise,
155 |       unless required by applicable law (such as deliberate and grossly
156 |       negligent acts) or agreed to in writing, shall any Contributor be
157 |       liable to You for damages, including any direct, indirect, special,
158 |       incidental, or consequential damages of any character arising as a
159 |       result of this License or out of the use or inability to use the
160 |       Work (including but not limited to damages for loss of goodwill,
161 |       work stoppage, computer failure or malfunction, or any and all
162 |       other commercial damages or losses), even if such Contributor
163 |       has been advised of the possibility of such damages.
164 | 
165 |    9. Accepting Warranty or Additional Liability. While redistributing
166 |       the Work or Derivative Works thereof, You may choose to offer,
167 |       and charge a fee for, acceptance of support, warranty, indemnity,
168 |       or other liability obligations and/or rights consistent with this
169 |       License. However, in accepting such obligations, You may act only
170 |       on Your own behalf and on Your sole responsibility, not on behalf
171 |       of any other Contributor, and only if You agree to indemnify,
172 |       defend, and hold each Contributor harmless for any liability
173 |       incurred by, or claims asserted against, such Contributor by reason
174 |       of your accepting any such warranty or additional liability.
175 | 
176 |    END OF TERMS AND CONDITIONS
177 | 
178 |    APPENDIX: How to apply the Apache License to your work.
179 | 
180 |       To apply the Apache License to your work, attach the following
181 |       boilerplate notice, with the fields enclosed by brackets "[]"
182 |       replaced with your own identifying information. (Don't include
183 |       the brackets!)  The text should be enclosed in the appropriate
184 |       comment syntax for the file format. We also recommend that a
185 |       file or class name and description of purpose be included on the
186 |       same "printed page" as the copyright notice for easier
187 |       identification within third-party archives.
188 | 
189 |    Copyright [yyyy] [name of copyright owner]
190 | 
191 |    Licensed under the Apache License, Version 2.0 (the "License");
192 |    you may not use this file except in compliance with the License.
193 |    You may obtain a copy of the License at
194 | 
195 |        http://www.apache.org/licenses/LICENSE-2.0
196 | 
197 |    Unless required by applicable law or agreed to in writing, software
198 |    distributed under the License is distributed on an "AS IS" BASIS,
199 |    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
200 |    See the License for the specific language governing permissions and
201 |    limitations under the License.
202 | 


--------------------------------------------------------------------------------
/src/prefix_cache.rs:
--------------------------------------------------------------------------------
  1 | extern crate fnv;
  2 | #[cfg(feature = "print_cache_stats")]
  3 | use std::cell::UnsafeCell;
  4 | use std::cmp;
  5 | use std::marker::PhantomData;
  6 | use std::ptr;
  7 | 
  8 | use super::art_internal::MarkedPtr;
  9 | 
 10 | pub use self::dense_hash_set::HashSetPrefixCache;
 11 | 
 12 | /// PrefixCache describes types that can cache pointers interior to an ART.
 13 | pub trait PrefixCache<T> {
 14 |     /// If true, the cache is used during ART set operations. If false, the cache is ignored.
 15 |     const ENABLED: bool;
 16 |     /// If true, lookup returning None indicates that no nodes with prefix `bs` are in the set.
 17 |     const COMPLETE: bool;
 18 |     fn new() -> Self;
 19 |     fn lookup(&self, bs: &[u8]) -> Option<MarkedPtr<T>>;
 20 |     fn replace(&mut self, bs: &[u8], ptr: MarkedPtr<T>) -> Option<MarkedPtr<T>> {
 21 |         self.insert(bs, ptr);
 22 |         None
 23 |     }
 24 |     fn insert(&mut self, bs: &[u8], ptr: MarkedPtr<T>) {
 25 |         let _ = self.replace(bs, ptr);
 26 |     }
 27 |     #[inline(always)]
 28 |     fn debug_assert_unreachable(&self, _ptr: MarkedPtr<T>) {}
 29 | }
 30 | pub struct NullBuckets<T>(PhantomData<T>);
 31 | 
 32 | impl<T> PrefixCache<T> for NullBuckets<T> {
 33 |     const ENABLED: bool = false;
 34 |     const COMPLETE: bool = false;
 35 |     fn new() -> Self {
 36 |         NullBuckets(PhantomData)
 37 |     }
 38 |     fn lookup(&self, _: &[u8]) -> Option<MarkedPtr<T>> {
 39 |         None
 40 |     }
 41 |     fn insert(&mut self, _: &[u8], _ptr: MarkedPtr<T>) {}
 42 | }
 43 | 
 44 | mod dense_hash_set {
 45 |     use super::*;
 46 |     use super::fnv::FnvHasher;
 47 |     use super::super::Digital;
 48 |     use super::super::byteorder::{BigEndian, ByteOrder};
 49 | 
 50 |     use std::hash::{Hash, Hasher};
 51 |     use std::mem;
 52 | 
 53 |     fn read_u64(bs: &[u8]) -> u64 {
 54 |         debug_assert!(bs.len() <= 8);
 55 |         let mut arr = [0 as u8; 8];
 56 |         unsafe { ptr::copy_nonoverlapping(&bs[0], &mut arr[0], cmp::min(bs.len(), 8)) };
 57 |         BigEndian::read_u64(&arr[..])
 58 |     }
 59 | 
 60 |     pub struct HashSetPrefixCache<T>(DenseHashTable<MarkedElt<T>>);
 61 |     impl<T> PrefixCache<T> for HashSetPrefixCache<T> {
 62 |         const ENABLED: bool = true;
 63 |         const COMPLETE: bool = true;
 64 |         fn new() -> Self {
 65 |             HashSetPrefixCache(DenseHashTable::new())
 66 |         }
 67 | 
 68 |         #[cfg(debug_assertions)]
 69 |         fn debug_assert_unreachable(&self, ptr: MarkedPtr<T>) {
 70 |             for elt in self.0.buckets.iter() {
 71 |                 if elt.ptr == ptr {
 72 |                     assert!(
 73 |                         self.0.lookup(&elt.prefix).is_some(),
 74 |                         "attempted to look up {:?}:{:?} but failed",
 75 |                         elt.prefix,
 76 |                         elt.ptr
 77 |                     );
 78 |                     let l = self.0.lookup(&elt.prefix).unwrap();
 79 |                     assert!(l.ptr == elt.ptr, "got {:?} != elt {:?}", l, elt);
 80 |                     assert!(
 81 |                         elt.ptr != ptr,
 82 |                         "Found ptr {:?} in elt with prefix {:?} [{:?}]",
 83 |                         ptr,
 84 |                         elt.prefix,
 85 |                         elt.prefix.digits().collect::<Vec<u8>>().as_slice()
 86 |                     )
 87 |                 }
 88 |             }
 89 |         }
 90 | 
 91 |         fn lookup(&self, bs: &[u8]) -> Option<MarkedPtr<T>> {
 92 |             let prefix = read_u64(bs);
 93 |             let res = self.0.lookup(&prefix).map(|elt| elt.ptr.clone());
 94 |             #[cfg(debug_assertions)]
 95 |             unsafe {
 96 |                 if let Some(Err(inner)) = res.as_ref()
 97 |                     .map(|x| x.get().expect("stored pointer should be non-null"))
 98 |                 {
 99 |                     assert!(
100 |                         inner.children != !0,
101 |                         "Returning an expired node {:?} (ty={:?})",
102 |                         res,
103 |                         inner.typ
104 |                     );
105 |                 }
106 |             }
107 |             res
108 |         }
109 | 
110 |         fn insert(&mut self, bs: &[u8], ptr: MarkedPtr<T>) {
111 |             let prefix = read_u64(bs);
112 |             if ptr.is_null() {
113 |                 self.0.delete(&prefix);
114 |                 debug_assert!(self.lookup(bs).is_none());
115 |             } else {
116 |                 let _ = self.0.insert(MarkedElt {
117 |                     prefix: prefix,
118 |                     ptr: ptr,
119 |                 });
120 |             }
121 |         }
122 | 
123 |         fn replace(&mut self, bs: &[u8], ptr: MarkedPtr<T>) -> Option<MarkedPtr<T>> {
124 |             let prefix = read_u64(bs);
125 |             if ptr.is_null() {
126 |                 self.0.delete(&prefix)
127 |             } else {
128 |                 match self.0.insert(MarkedElt {
129 |                     prefix: prefix,
130 |                     ptr: ptr,
131 |                 }) {
132 |                     Ok(()) => None,
133 |                     Err(t) => Some(t),
134 |                 }
135 |             }.map(|t| t.ptr)
136 |         }
137 |     }
138 | 
139 |     trait DHTE {
140 |         type Key;
141 |         fn null() -> Self;
142 |         fn tombstone() -> Self;
143 |         fn is_null(&self) -> bool;
144 |         fn is_tombstone(&self) -> bool;
145 |         fn key(&self) -> &Self::Key;
146 |     }
147 | 
148 |     const MARKED_TOMBSTONE: usize = !0;
149 |     struct MarkedElt<T> {
150 |         prefix: u64,
151 |         ptr: MarkedPtr<T>,
152 |     }
153 |     impl<T> ::std::fmt::Debug for MarkedElt<T> {
154 |         fn fmt(&self, f: &mut ::std::fmt::Formatter) -> Result<(), ::std::fmt::Error> {
155 |             write!(
156 |                 f,
157 |                 "MarkedElt{{ {:?}, {:?} }}",
158 |                 self.prefix.digits().collect::<Vec<u8>>().as_slice(),
159 |                 self.ptr
160 |             )
161 |         }
162 |     }
163 | 
164 |     impl<T> DHTE for MarkedElt<T> {
165 |         type Key = u64;
166 |         fn null() -> Self {
167 |             MarkedElt {
168 |                 prefix: 0,
169 |                 ptr: MarkedPtr::null(),
170 |             }
171 |         }
172 |         fn tombstone() -> Self {
173 |             MarkedElt {
174 |                 prefix: 0,
175 |                 ptr: MarkedPtr::from_leaf(MARKED_TOMBSTONE as *mut T),
176 |             }
177 |         }
178 | 
179 |         fn is_null(&self) -> bool {
180 |             self.ptr.is_null()
181 |         }
182 |         fn is_tombstone(&self) -> bool {
183 |             self.ptr.raw_eq(MARKED_TOMBSTONE)
184 |         }
185 |         fn key(&self) -> &Self::Key {
186 |             &self.prefix
187 |         }
188 |     }
189 | 
190 |     /// A bare-bones implementation of Google's dense_hash_set. Not a full-featured map, but
191 |     /// contains sufficient functionality to be used as a PrefixCache
192 |     ///
193 |     /// TODO: explore optimizing this more (for time or for space).
194 |     struct DenseHashTable<T> {
195 |         buckets: Vec<T>,
196 |         len: usize,
197 |         set: usize,
198 |     }
199 | 
200 |     impl<T: DHTE> DenseHashTable<T>
201 |     where
202 |         T::Key: Eq + Hash,
203 |     {
204 |         fn next_probe(hash: usize, i: usize) -> usize {
205 |             // hash + i
206 |             hash + (i + i * i) / 2
207 |         }
208 | 
209 |         fn new() -> Self {
210 |             DenseHashTable {
211 |                 buckets: Vec::new(),
212 |                 len: 0,
213 |                 set: 0,
214 |             }
215 |         }
216 | 
217 |         fn seek(
218 |             &self,
219 |             k: &T::Key,
220 |         ) -> (
221 |             Option<*mut T>, /* first tombstone */
222 |             Option<*mut T>, /* matching or null */
223 |         ) {
224 |             let mut tombstone = None;
225 |             let l = self.buckets.len();
226 |             debug_assert!(l.is_power_of_two());
227 |             let hash = {
228 |                 let mut hasher = FnvHasher::default();
229 |                 k.hash(&mut hasher);
230 |                 hasher.finish() as usize
231 |             };
232 |             let mut ix = hash;
233 |             let mut times = 0;
234 |             while times < l {
235 |                 ix &= l - 1;
236 |                 debug_assert!(ix < self.buckets.len());
237 |                 times += 1;
238 |                 let bucket = unsafe { self.buckets.get_unchecked(ix) };
239 |                 let bucket_raw = bucket as *const T as *mut T;
240 |                 if tombstone.is_none() && bucket.is_tombstone() {
241 |                     tombstone = Some(bucket_raw);
242 |                 } else if bucket.is_null() || bucket.key() == k {
243 |                     return (tombstone, Some(bucket_raw));
244 |                 }
245 |                 ix = Self::next_probe(hash, times);
246 |             }
247 |             (tombstone, None)
248 |         }
249 | 
250 |         fn grow(&mut self) {
251 |             debug_assert!(self.set >= self.len);
252 |             let old_len = if self.buckets.len() == 0 {
253 |                 self.buckets.push(T::null());
254 |                 return;
255 |             } else if self.buckets.len() < 32
256 |                 || (self.set as i64) - (self.len as i64) < (self.buckets.len() as i64 / 4)
257 |             {
258 |                 // actually grow. If this condition is not met, then we just re-hash
259 |                 let l = self.buckets.len();
260 |                 self.buckets.extend((0..l).map(|_| T::null()));
261 |                 l
262 |             } else {
263 |                 self.buckets.len()
264 |             };
265 |             debug_assert!(self.buckets.len().is_power_of_two());
266 |             debug_assert!(old_len.is_power_of_two());
267 |             let mut v = Vec::with_capacity(self.len);
268 |             for i in &mut self.buckets[0..old_len] {
269 |                 if i.is_null() {
270 |                     continue;
271 |                 }
272 |                 if i.is_tombstone() {
273 |                     *i = T::null();
274 |                     continue;
275 |                 }
276 |                 let mut t = T::null();
277 |                 mem::swap(i, &mut t);
278 |                 v.push(t);
279 |             }
280 |             self.set = 0;
281 |             self.len = 0;
282 |             for elt in v.into_iter() {
283 |                 let _res = self.insert(elt);
284 |                 debug_assert!(_res.is_ok());
285 |             }
286 |         }
287 | 
288 |         fn lookup(&self, k: &T::Key) -> Option<&T> {
289 |             if self.buckets.len() == 0 {
290 |                 return None;
291 |             }
292 |             let (_, b_opt) = self.seek(k);
293 |             b_opt.and_then(|b| unsafe {
294 |                 if (*b).is_null() {
295 |                     None
296 |                 } else {
297 |                     Some(&*b)
298 |                 }
299 |             })
300 |         }
301 | 
302 |         fn delete(&mut self, k: &T::Key) -> Option<T> {
303 |             if self.buckets.len() == 0 {
304 |                 return None;
305 |             }
306 |             let (_, b_opt) = self.seek(k);
307 |             b_opt.and_then(|b| unsafe {
308 |                 if (*b).is_null() {
309 |                     None
310 |                 } else {
311 |                     let mut tomb = T::tombstone();
312 |                     mem::swap(&mut *b, &mut tomb);
313 |                     self.len -= 1;
314 |                     Some(tomb)
315 |                 }
316 |             })
317 |         }
318 | 
319 |         fn insert(&mut self, mut t: T) -> Result<(), T> {
320 |             if self.set >= self.buckets.len() / 2 {
321 |                 self.grow();
322 |             }
323 |             debug_assert!(!t.is_null());
324 |             debug_assert!(!t.is_tombstone());
325 |             let (tmb, b_opt) = self.seek(t.key());
326 |             unsafe {
327 |                 let bucket = b_opt.unwrap();
328 |                 if (*bucket).is_null() {
329 |                     // t is not already in the table. We insert it somewhere
330 |                     if let Some(tombstone_bucket) = tmb {
331 |                         // there was a tombstone earlier in the probe chain. We overwrite its
332 |                         // value.
333 |                         *tombstone_bucket = t;
334 |                     } else {
335 |                         // we insert it into the new slot
336 |                         *bucket = t;
337 |                         self.set += 1;
338 |                     }
339 |                     self.len += 1;
340 |                     Ok(())
341 |                 } else {
342 |                     // t is already in the table, we simply swap in the new value
343 |                     mem::swap(&mut *bucket, &mut t);
344 |                     Err(t)
345 |                 }
346 |             }
347 |         }
348 |     }
349 | 
    // Randomized smoke test for `DenseHashTable`.
    #[cfg(test)]
    mod tests {
        use super::*;
        use super::super::super::rand;
        use super::super::super::rand::Rng;
        /// Build a vector of `len` values, each produced by `gen_range(0, max_val)`.
        fn random_vec(max_val: usize, len: usize) -> Vec<usize> {
            let mut rng = rand::thread_rng();
            (0..len)
                .map(|_| rng.gen_range::<usize>(0, max_val))
                .collect()
        }

        /// Test element: field 0 is the key, field 1 is a state tag
        /// (0 = null, 1 = live, 2 = tombstone).
        #[derive(Debug)]
        struct UsizeElt(usize, usize);
        impl DHTE for UsizeElt {
            type Key = usize;
            fn null() -> Self {
                UsizeElt(0, 0)
            }
            fn tombstone() -> Self {
                UsizeElt(0, 2)
            }
            fn is_null(&self) -> bool {
                self.1 == 0
            }
            fn is_tombstone(&self) -> bool {
                self.1 == 2
            }
            fn key(&self) -> &Self::Key {
                &self.0
            }
        }

        impl UsizeElt {
            /// A live element with key `u`.
            fn new(u: usize) -> Self {
                UsizeElt(u, 1)
            }
        }

        #[test]
        fn dense_hash_set_smoke_test() {
            let mut s = DenseHashTable::<UsizeElt>::new();
            let mut v1 = random_vec(!0, 1 << 18);
            // Phase 1: every inserted key must be visible immediately...
            for item in v1.iter() {
                let _ = s.insert(UsizeElt::new(*item));
                assert!(
                    s.lookup(item).is_some(),
                    "lookup failed immediately for {:?}",
                    *item
                );
            }
            // ...and must still be visible once all inserts (and any growth) are done.
            let mut missing = Vec::new();
            for item in v1.iter() {
                if s.lookup(item).is_none() {
                    missing.push(*item)
                }
            }
            assert_eq!(missing.len(), 0, "missing={:?}", missing);
            // Phase 2: split the distinct keys; up to 2^17 of them move to `v2` for deletion.
            v1.sort();
            v1.dedup_by_key(|x| *x);
            let mut v2 = Vec::new();
            for _ in 0..(1 << 17) {
                if let Some(x) = v1.pop() {
                    v2.push(x)
                } else {
                    break;
                }
            }
            // Each key in `v2` must be present, delete successfully, and then be absent.
            let mut failures = 0;
            for i in v2.iter() {
                let mut fail = 0;
                if s.lookup(i).is_none() {
                    eprintln!("{:?} no longer in the set!", *i);
                    fail = 1;
                }
                let res = s.delete(i);
                if res.is_none() {
                    fail = 1;
                }
                if s.lookup(i).is_some() {
                    fail = 1;
                }
                failures += fail;
            }
            assert_eq!(failures, 0);
            // Phase 3: deleted keys stay deleted...
            let mut failed = false;
            for i in v2.iter() {
                if s.lookup(i).is_some() {
                    eprintln!("Deleted {:?}, but it's still there!", *i);
                    failed = true;
                };
            }
            assert!(!failed);
            // ...and the keys that were never deleted are all still reachable.
            for i in v1.iter() {
                assert!(
                    s.lookup(i).is_some(),
                    "Didn't delete {:?}, but it is gone!",
                    *i
                );
            }
        }
    }
452 | }
453 | 


--------------------------------------------------------------------------------
/src/art_internal.rs:
--------------------------------------------------------------------------------
   1 | use std::cmp;
   2 | use std::marker::PhantomData;
   3 | use std::mem;
   4 | use std::ptr;
   5 | use super::common::Digital;
   6 | 
   7 | extern crate simd;
   8 | 
   9 | #[cfg(target_arch = "x86")]
  10 | use std::arch::x86::_mm_movemask_epi8;
  11 | #[cfg(target_arch = "x86_64")]
  12 | use std::arch::x86_64::_mm_movemask_epi8;
  13 | use super::smallvec::{Array, SmallVec};
  14 | 
/// Number of prefix bytes stored inline in a `RawNode` (the length of its `prefix` array).
/// A node's logical prefix (`count`) may be longer than this; only the first `PREFIX_LEN`
/// bytes are kept in the node itself.
pub const PREFIX_LEN: usize = 8;
/// used by the `with_node_mut` macro
pub type RawMutRef<'a, T> = &'a mut RawNode<T>;

/// used by the `with_node` macro
pub type RawRef<'a, T> = &'a RawNode<T>;

/// a non-owning reference to a `ChildPtr<T>`
///
/// The wrapped word is a tagged address: `0` is null, a word with the low bit set refers to
/// a leaf (`T`), and any other value refers to an inner node (`RawNode`).
pub struct MarkedPtr<T>(usize, PhantomData<T>);
  24 | pub use self::node_variants::{NODE_16, NODE_256, NODE_4, NODE_48, Node16, Node256, Node48,
  25 |                               NodeType};
  26 | 
  27 | impl<T> PartialEq for MarkedPtr<T> {
  28 |     fn eq(&self, other: &MarkedPtr<T>) -> bool {
  29 |         self.0 == other.0
  30 |     }
  31 | }
  32 | 
  33 | impl<T> Eq for MarkedPtr<T> {}
  34 | 
/// Interface required of values stored in the tree.
pub trait Element {
    /// Key type; it must expose its digits through `Digital` and be comparable
    /// (`visit_leaf` uses the ordering to enforce range bounds).
    type Key: for<'a> Digital<'a> + PartialOrd;
    /// Borrow this element's key.
    fn key(&self) -> &Self::Key;
    /// Whether this element corresponds to key `k`.
    // NOTE(review): presumably plain key equality -- confirm against implementors.
    fn matches(&self, k: &Self::Key) -> bool;
    /// Replace the contents of `self` using `other`.
    // NOTE(review): the name suggests `other` has a matching key and receives the previous
    // contents -- confirm against implementors.
    fn replace_matching(&mut self, other: &mut Self);
}
  41 | 
  42 | impl<T> Clone for MarkedPtr<T> {
  43 |     fn clone(&self) -> Self {
  44 |         MarkedPtr(self.0, PhantomData)
  45 |     }
  46 | }
/// An owning tagged pointer to a leaf or inner node. Dropping a `ChildPtr` frees whatever
/// it points to (see its `Drop` impl); it dereferences to the non-owning `MarkedPtr`.
pub struct ChildPtr<T>(MarkedPtr<T>);
  48 | 
  49 | impl<T> ::std::ops::Deref for ChildPtr<T> {
  50 |     type Target = MarkedPtr<T>;
  51 |     fn deref(&self) -> &MarkedPtr<T> {
  52 |         &self.0
  53 |     }
  54 | }
  55 | 
  56 | impl<T> ::std::ops::DerefMut for ChildPtr<T> {
  57 |     fn deref_mut(&mut self) -> &mut MarkedPtr<T> {
  58 |         &mut self.0
  59 |     }
  60 | }
  61 | 
/// Frees the pointee: a null pointer is a no-op, a leaf is dropped as `Box<T>`, and an
/// inner node is first converted back to its concrete node type and then dropped as a `Box`.
impl<T> Drop for ChildPtr<T> {
    fn drop(&mut self) {
        unsafe {
            match self.get_mut() {
                None => return,
                // Leaf: rebuild the owning Box so `T` is dropped and its memory released.
                Some(Ok(x)) => mem::drop(Box::from_raw(x)),
                // with_node_mut! will "un-erase" the actual type of the RawNode. We want to call drop
                // on that to ensure all children are dropped
                // ... and to avoid undefined behavior, as we could wind up passing free the wrong size :)
                Some(Err(x)) => with_node_mut!(x, nod, mem::drop(Box::from_raw(nod)), T),
            }
        }
    }
}
  76 | 
  77 | impl<T> ::std::fmt::Debug for MarkedPtr<T> {
  78 |     fn fmt(&self, f: &mut ::std::fmt::Formatter) -> Result<(), ::std::fmt::Error> {
  79 |         unsafe {
  80 |             write!(
  81 |                 f,
  82 |                 "MarkedPtr({})",
  83 |                 match self.get_raw() {
  84 |                     None => String::from("null"),
  85 |                     Some(Ok(leaf_ptr)) => format!("leaf:{:?}", leaf_ptr),
  86 |                     Some(Err(inner)) => format!("inner:{:?}", *inner),
  87 |                 }
  88 |             )
  89 |         }
  90 |     }
  91 | }
  92 | 
  93 | impl<T> ::std::fmt::Debug for ChildPtr<T> {
  94 |     fn fmt(&self, f: &mut ::std::fmt::Formatter) -> Result<(), ::std::fmt::Error> {
  95 |         write!(f, "ChildPtr({:?})", (self.0).0 as *mut ())
  96 |     }
  97 | }
  98 | 
  99 | impl<T> ChildPtr<T> {
 100 |     pub fn null() -> Self {
 101 |         ChildPtr(MarkedPtr::null())
 102 |     }
 103 | 
 104 |     pub fn from_node<R>(p: *mut RawNode<R>) -> Self {
 105 |         ChildPtr(MarkedPtr::from_node(p))
 106 |     }
 107 | 
 108 |     pub fn from_leaf(p: *mut T) -> Self {
 109 |         ChildPtr(MarkedPtr::from_leaf(p))
 110 |     }
 111 | 
 112 |     pub fn swap_null(&mut self) -> Self {
 113 |         let mut self_ptr = ChildPtr::null();
 114 |         mem::swap(self, &mut self_ptr);
 115 |         self_ptr
 116 |     }
 117 | 
 118 |     pub unsafe fn to_marked(&self) -> MarkedPtr<T> {
 119 |         ptr::read(&self.0)
 120 |     }
 121 | }
 122 | 
 123 | impl<T> MarkedPtr<T> {
 124 |     pub fn null() -> Self {
 125 |         MarkedPtr(0, PhantomData)
 126 |     }
 127 | 
 128 |     pub fn from_node<R>(p: *mut RawNode<R>) -> Self {
 129 |         debug_assert!(!p.is_null());
 130 |         MarkedPtr(p as usize, PhantomData)
 131 |     }
 132 | 
 133 |     pub fn from_leaf(p: *mut T) -> Self {
 134 |         debug_assert!(!p.is_null());
 135 |         MarkedPtr((p as usize) | 1, PhantomData)
 136 |     }
 137 | 
 138 |     pub fn is_null(&self) -> bool {
 139 |         self.0 == 0
 140 |     }
 141 | 
 142 |     pub fn raw_eq(&self, other: usize) -> bool {
 143 |         self.0 == other
 144 |     }
 145 | 
 146 |     pub unsafe fn get(&self) -> Option<Result<&T, &RawNode<()>>> {
 147 |         if self.0 == 0 {
 148 |             None
 149 |         } else if self.0 & 1 == 1 {
 150 |             Some(Ok(&*((self.0 & !1) as *const T)))
 151 |         } else {
 152 |             Some(Err(&*(self.0 as *const RawNode<()>)))
 153 |         }
 154 |     }
 155 | 
 156 |     pub unsafe fn get_raw(&self) -> Option<Result<*mut T, *mut RawNode<()>>> {
 157 |         if self.0 == 0 {
 158 |             None
 159 |         } else if self.0 & 1 == 1 {
 160 |             Some(Ok((self.0 & !1) as *mut T))
 161 |         } else {
 162 |             Some(Err(self.0 as *mut RawNode<()>))
 163 |         }
 164 |     }
 165 | 
 166 |     pub unsafe fn get_mut(&mut self) -> Option<Result<&mut T, &mut RawNode<()>>> {
 167 |         if self.0 == 0 {
 168 |             None
 169 |         } else if self.0 & 1 == 1 {
 170 |             Some(Ok(&mut *((self.0 & !1) as *mut T)))
 171 |         } else {
 172 |             Some(Err(&mut *(self.0 as *mut RawNode<()>)))
 173 |         }
 174 |     }
 175 | }
 176 | 
 177 | unsafe fn place_in_hole_at<T>(slice: &mut [T], at: usize, v: T, buff_len: usize) {
 178 |     let raw_p = slice.get_unchecked_mut(0) as *mut T;
 179 |     let target = raw_p.offset(at as isize);
 180 |     ptr::copy(target, raw_p.offset(at as isize + 1), buff_len - at - 1);
 181 |     ptr::write(target, v);
 182 | }
 183 | 
 184 | #[cfg(test)]
 185 | mod place_test {
 186 |     use super::*;
 187 | 
 188 |     #[test]
 189 |     fn place_in_hole_test() {
 190 |         let mut v1 = vec![0, 1, 3, 4, 0];
 191 |         let len = v1.len();
 192 |         unsafe {
 193 |             place_in_hole_at(&mut v1[..], 2, 2, len);
 194 |         }
 195 |         assert_eq!(v1, vec![0, 1, 2, 3, 4]);
 196 |     }
 197 | }
 198 | 
/// Common header shared by every inner node, followed by a node-type-specific payload.
///
/// The layout is `repr(C)` with the payload last; other code in this file handles nodes
/// type-erased as `RawNode<()>` and recovers the concrete payload type via the `with_node`
/// macros.
#[repr(C)]
#[derive(Debug)]
pub struct RawNode<Footer> {
    /// Tag naming the concrete payload type (`NODE_4`, `NODE_16`, ...).
    pub typ: NodeType,
    /// Number of children currently stored in the payload.
    pub children: u16,
    /// Logical length of this node's prefix. May exceed `PREFIX_LEN`, in which case only
    /// the first `PREFIX_LEN` bytes are held in `prefix`.
    pub count: u32,
    /// Set from the `consumed` argument of `make_node_with_prefix`.
    // NOTE(review): presumably the number of key digits consumed above this node -- confirm.
    pub consumed: u32,
    /// Inline storage for the first `PREFIX_LEN` prefix bytes.
    pub prefix: [u8; PREFIX_LEN],
    /// Type-specific payload (`Node4<T>`, `Node16<T>`, ...), or `()` when type-erased.
    node: Footer,
}
 209 | 
 210 | impl<T> RawNode<T> {
 211 |     pub fn append_prefix(&mut self, d: &[u8], total_count: u32) {
 212 |         debug_assert!(d.len() <= PREFIX_LEN);
 213 |         unsafe {
 214 |             ptr::copy(
 215 |                 &self.prefix[0],
 216 |                 &mut self.prefix[d.len()],
 217 |                 PREFIX_LEN - d.len(),
 218 |             );
 219 |             ptr::copy(&d[0], &mut self.prefix[0], d.len());
 220 |         }
 221 |         self.count += total_count;
 222 |         self.consumed -= total_count;
 223 |     }
 224 | }
 225 | 
impl RawNode<()> {
    /// Count how many digits of this node's prefix match `digits`, starting at offset
    /// `consumed` within `digits`.
    ///
    /// Returns `(matched, leaf)`:
    /// * on a mismatch inside the inline prefix, `(index_of_mismatch, None)`;
    /// * if the whole prefix fits inline (`count <= PREFIX_LEN`) and matches, `(count, None)`;
    /// * if the prefix is longer than `PREFIX_LEN`, comparison continues against the key of
    ///   the node's minimum leaf, and the result carries a pointer to that leaf.
    ///
    /// `_marker` only selects the element type `T`.
    // NOTE(review): `digits[consumed + i]` is indexed without a length check beyond the
    // debug assertion; presumably callers guarantee `digits` covers the inline prefix.
    pub fn get_matching_prefix<T: Element>(
        &self,
        digits: &[u8],
        consumed: usize,
        _marker: PhantomData<T>,
    ) -> (usize, Option<*const T>) {
        debug_assert!(
            consumed < digits.len(),
            "consumed={}, digits={:?}",
            consumed,
            digits
        );
        // Only the first PREFIX_LEN bytes are stored in the node itself.
        let count = cmp::min(self.count as usize, PREFIX_LEN);
        for i in 0..count {
            if digits[consumed + i] != self.prefix[i] {
                return (i, None);
            }
        }
        if self.count as usize > PREFIX_LEN {
            // Implicit prefix: the remaining digits are recovered from the minimum leaf.
            let mut matches = PREFIX_LEN;
            with_node!(
                self,
                node,
                {
                    let min_node = node.get_min()
                        .expect("node with implicit prefix must be nonempty");
                    for (d, m) in digits[consumed + PREFIX_LEN..]
                        .iter()
                        .zip(min_node.key().digits().skip(consumed + PREFIX_LEN))
                    {
                        if *d != m {
                            break;
                        }
                        matches += 1;
                    }
                    (matches, Some(min_node as *const T))
                },
                T
            )
        } else {
            (count, None)
        }
    }
}
 271 | 
 272 | impl<T> RawNode<T> {
 273 |     pub fn prefix_matches_optimistic(&self, digits: &[u8]) -> Option<(bool, usize)> {
 274 |         let count = self.count as usize;
 275 |         if digits.len() < count {
 276 |             return None;
 277 |         }
 278 |         for i in 0..cmp::min(count, PREFIX_LEN) {
 279 |             if digits[i] != self.prefix[i] {
 280 |                 return None;
 281 |             }
 282 |         }
 283 |         Some((count <= PREFIX_LEN, count))
 284 |     }
 285 | }
 286 | 
/// Outcome of removing a child from a node.
pub enum DeleteResult<T> {
    /// No child was stored under the requested digit.
    Failure,
    /// The child was removed; the payload is the removed pointer.
    Success(ChildPtr<T>),
    /// The child was removed and exactly one child was left behind. That last child has
    /// also been taken out of the node and is returned together with its digit.
    Singleton {
        /// The pointer that was deleted.
        deleted: ChildPtr<T>,
        /// The only child that remained in the node.
        last: ChildPtr<T>,
        /// The digit under which `last` was stored.
        last_d: u8,
    },
}
 296 | 
/// Compile-time selector for traversal order, passed by value as a marker.
pub trait Direction: Copy {
    /// `true` to visit children from the lowest index upwards, `false` for the reverse.
    const LEFT_TO_RIGHT: bool;
}

/// Marker: left-to-right traversal.
#[derive(Copy, Clone)]
pub struct Increasing;
/// Marker: right-to-left traversal.
#[derive(Copy, Clone)]
pub struct Decreasing;

impl Direction for Increasing {
    const LEFT_TO_RIGHT: bool = true;
}

impl Direction for Decreasing {
    const LEFT_TO_RIGHT: bool = false;
}
 313 | 
/// Operations every concrete inner-node representation provides.
pub trait Node<T: Element>: Sized {
    /// Store `ptr` as the child for digit `d`.
    ///
    /// `insert` assumes that `d` is not present in the node. This is enforced in debug builds.
    ///
    /// `pptr`, when given, is handed to the implementation for use when the node is full
    /// (the `Node4` implementation allocates a larger node in that case).
    // NOTE(review): `pptr` presumably points at the parent's slot for this node so that a
    // replacement node can be installed there -- confirm against the implementations.
    ///
    /// On failure `ptr` is handed back unchanged as the `Err` value.
    unsafe fn insert(
        &mut self,
        d: u8,
        ptr: ChildPtr<T>,
        // Error == ptr, indicates there was no space _and_ could not upgrade
        pptr: Option<*mut ChildPtr<T>>,
    ) -> Result<(), ChildPtr<T>>;
    /// Remove the child stored for digit `d`; see `DeleteResult` for the outcomes.
    unsafe fn delete(&mut self, d: u8) -> DeleteResult<T>;
    /// Whether the node has no free child slot left.
    fn is_full(&self) -> bool;
    /// The minimum leaf below this node, or `None` if the node has no children.
    fn get_min(&self) -> Option<&T>;
    /// Raw pointer to the child slot for digit `d`, if present.
    fn find_raw(&self, d: u8) -> Option<*mut ChildPtr<T>>;
    /// Shared reference to the child slot for digit `d`, if present.
    fn find(&self, d: u8) -> Option<&ChildPtr<T>> {
        self.find_raw(d).map(|raw_ptr| unsafe { &*raw_ptr })
    }
    /// Mutable reference to the child slot for digit `d`, if present.
    // NOTE(review): this yields `&mut` from `&self`; callers must ensure the slot is not
    // otherwise borrowed.
    fn find_mut(&self, d: u8) -> Option<&mut ChildPtr<T>> {
        self.find_raw(d).map(|raw_ptr| unsafe {
            debug_assert!(!(*raw_ptr).is_null());
            &mut *raw_ptr
        })
    }

    // iterate over all non-null direct children of the node.
    fn local_foreach<F: FnMut(u8, MarkedPtr<T>)>(&self, f: F);

    /// Visit the leaves below this node in the order selected by `D`, restricted by the
    /// optional bounds: `lower`/`upper` are the remaining bound digits at this depth,
    /// `lval`/`rval` the complete bound keys.
    fn for_each<F: FnMut(&T), D: Direction>(
        &self,
        f: &mut F,
        lower: Option<&[u8]>,
        upper: Option<&[u8]>,
        lval: Option<&T::Key>,
        rval: Option<&T::Key>,
        _dir: D,
    );
}
 350 | 
 351 | fn get_matching_prefix_slice<'a, 'b, A, I1, I2>(d1: I1, d2: I2, v: &mut SmallVec<A>)
 352 | where
 353 |     A: Array<Item = u8>,
 354 |     I1: Iterator<Item = &'a u8>,
 355 |     I2: Iterator<Item = &'b u8>,
 356 | {
 357 |     for (d1, d2) in d1.zip(d2) {
 358 |         if *d1 != *d2 {
 359 |             return;
 360 |         }
 361 |         v.push(*d1)
 362 |     }
 363 | }
 364 | 
 365 | pub fn make_node_with_prefix<T>(prefix: &[u8], consumed: u32) -> Box<RawNode<Node4<T>>> {
 366 |     let mut new_node = Box::new(RawNode {
 367 |         typ: NODE_4,
 368 |         children: 0,
 369 |         consumed: consumed,
 370 |         count: prefix.len() as u32,
 371 |         prefix: [0; PREFIX_LEN],
 372 |         node: Node4 {
 373 |             keys: [0; 4],
 374 |             ptrs: unsafe { mem::transmute::<[usize; 4], [ChildPtr<T>; 4]>([0 as usize; 4]) },
 375 |         },
 376 |     });
 377 |     let new_len = cmp::min(prefix.len(), PREFIX_LEN);
 378 |     if prefix.len() > 0 {
 379 |         unsafe {
 380 |             ptr::copy_nonoverlapping(
 381 |                 &prefix[0] as *const _,
 382 |                 &mut new_node.prefix[0] as *mut _,
 383 |                 new_len,
 384 |             );
 385 |         }
 386 |     }
 387 |     new_node
 388 | }
 389 | 
 390 | pub fn make_node_from_common_prefix<T>(
 391 |     d1: &[u8],
 392 |     d2: &[u8],
 393 |     consumed: u32,
 394 | ) -> Box<RawNode<Node4<T>>> {
 395 |     let mut common_prefix_digits = SmallVec::<[u8; 32]>::new();
 396 |     get_matching_prefix_slice(d1.iter(), d2.iter(), &mut common_prefix_digits);
 397 |     make_node_with_prefix(&common_prefix_digits[..], consumed)
 398 | }
 399 | 
/// Payload of the smallest inner node: up to four children.
///
/// `keys[i]` is the digit for `ptrs[i]`; the first `children` entries are in use and are
/// kept sorted by digit.
pub struct Node4<T> {
    keys: [u8; 4],
    ptrs: [ChildPtr<T>; 4],
}
 404 | 
 405 | impl<T> ::std::fmt::Debug for Node4<T> {
 406 |     fn fmt(&self, f: &mut ::std::fmt::Formatter) -> Result<(), ::std::fmt::Error> {
 407 |         write!(f, "Node4({:?}, {:?})", self.keys, &self.ptrs[..])
 408 |     }
 409 | }
 410 | 
 411 | pub fn visit_leaf<T, F, D>(
 412 |     c: &ChildPtr<T>,
 413 |     f: &mut F,
 414 |     mut lower: Option<&[u8]>,
 415 |     mut upper: Option<&[u8]>,
 416 |     lval: Option<&T::Key>,
 417 |     rval: Option<&T::Key>,
 418 |     _dir: D,
 419 | ) where
 420 |     F: FnMut(&T),
 421 |     T: Element,
 422 |     D: Direction,
 423 | {
 424 |     fn advance_by(s: &mut Option<&[u8]>, by: usize) {
 425 |         if s.is_none() {
 426 |             return;
 427 |         }
 428 |         debug_assert!(s.unwrap().len() > 0);
 429 |         let slice = s.unwrap();
 430 |         if slice.len() <= by {
 431 |             *s = None;
 432 |         }
 433 |         *s = Some(&slice[by..]);
 434 |     }
 435 | 
 436 |     /// An over the prefix of a `RawNode`. This is used to encapsulate the tricky "implicit prefix"
 437 |     /// semantics which are occasionally required for large keys.
 438 |     struct PrefixIter<'a, T: Element + 'a> {
 439 |         ix: usize,
 440 |         len: usize,
 441 |         node: &'a RawNode<()>,
 442 |         _min: SmallVec<[u8; 2]>,
 443 |         _marker: PhantomData<T>,
 444 |     }
 445 | 
 446 |     impl<'a, T: Element + 'a> PrefixIter<'a, T> {
 447 |         fn new(node: &'a RawNode<()>) -> Self {
 448 |             PrefixIter {
 449 |                 ix: 0,
 450 |                 len: node.count as usize,
 451 |                 node: node,
 452 |                 _min: SmallVec::new(),
 453 |                 _marker: PhantomData,
 454 |             }
 455 |         }
 456 | 
 457 |         fn reset(&mut self) {
 458 |             self.ix = 0;
 459 |         }
 460 |     }
 461 | 
 462 |     impl<'a, T: 'a + Element> Iterator for PrefixIter<'a, T> {
 463 |         type Item = u8;
 464 | 
 465 |         fn next(&mut self) -> Option<u8> {
 466 |             if self.ix >= self.len {
 467 |                 return None;
 468 |             }
 469 |             if self.ix < PREFIX_LEN {
 470 |                 let res = self.node.prefix[self.ix];
 471 |                 self.ix += 1;
 472 |                 return Some(res);
 473 |             }
 474 |             None
 475 |         }
 476 |     }
 477 |     match unsafe { c.get() } {
 478 |         None => {}
 479 |         Some(Ok(ref leaf)) => {
 480 |             if let Some(up) = rval {
 481 |                 if up <= leaf.key() {
 482 |                     return;
 483 |                 }
 484 |             }
 485 |             // N.B: If we choose to fully handle implicit prefixes then this check should be
 486 |             // unnecessary.
 487 |             if let Some(low) = lval {
 488 |                 if low > leaf.key() {
 489 |                     return;
 490 |                 }
 491 |             }
 492 |             f(leaf)
 493 |         }
 494 |         Some(Err(inner)) => {
 495 |             let mut iter = PrefixIter::<T>::new(inner);
 496 |             if let Some(slice) = lower {
 497 |                 for (l, byte) in slice.iter().zip(&mut iter) {
 498 |                     if byte < *l {
 499 |                         return;
 500 |                     }
 501 |                 }
 502 |             }
 503 |             iter.reset();
 504 |             if let Some(slice) = upper {
 505 |                 for (h, byte) in slice.iter().zip(&mut iter) {
 506 |                     if byte > *h {
 507 |                         return;
 508 |                     }
 509 |                 }
 510 |             }
 511 |             advance_by(&mut lower, inner.count as usize);
 512 |             advance_by(&mut upper, inner.count as usize);
 513 |             with_node!(inner, node, {
 514 |                 node.for_each(f, lower, upper, lval, rval, _dir)
 515 |             })
 516 |         }
 517 |     }
 518 | }
 519 | 
 520 | mod node_variants {
 521 |     use super::*;
    /// Tag stored in `RawNode::typ` that identifies the concrete node payload.
    #[derive(Debug, Clone, Copy, PartialEq, Eq)]
    pub struct NodeType(u16);
    /// Tag for `Node4` payloads.
    pub const NODE_4: NodeType = NodeType(1);
    /// Tag for `Node16` payloads.
    pub const NODE_16: NodeType = NodeType(2);
    /// Tag for `Node48` payloads.
    pub const NODE_48: NodeType = NodeType(3);
    /// Tag for `Node256` payloads.
    pub const NODE_256: NodeType = NodeType(4);
 528 | 
 529 |     fn advance_or(s: &mut Option<&[u8]>, b: usize) -> usize {
 530 |         if s.is_none() {
 531 |             return b;
 532 |         }
 533 |         debug_assert!(s.unwrap().len() > 0);
 534 |         let slice = s.unwrap();
 535 |         let res = slice[0] as usize;
 536 |         if slice.len() == 1 {
 537 |             *s = None;
 538 |         } else {
 539 |             *s = Some(&slice[1..]);
 540 |         }
 541 |         res
 542 |     }
 543 | 
 544 |     // (very) ad-hoc polymorphism!
 545 |     macro_rules! n416_delete {
 546 |         ($slf: expr, $d: expr) => {{
 547 |             let _res = match $slf.find_internal($d) {
 548 |                 None => DeleteResult::Failure,
 549 |                 Some((ix, ptr)) => {
 550 |                     let deleted = (*ptr).swap_null();
 551 |                     //  trace!(true, "d={} slf={:?}", $d, $slf);
 552 |                     if ix + 1 < $slf.node.keys[..].len() {
 553 |                         ptr::copy(
 554 |                             &$slf.node.keys[ix + 1],
 555 |                             &mut $slf.node.keys[ix],
 556 |                             $slf.children as usize - ix,
 557 |                         );
 558 |                         ptr::copy(
 559 |                             &$slf.node.ptrs[ix + 1],
 560 |                             &mut $slf.node.ptrs[ix],
 561 |                             $slf.children as usize - ix,
 562 |                         );
 563 |                     }
 564 |                     debug_assert!($slf.children > 0);
 565 |                     $slf.children -= 1;
 566 |                     ptr::write(
 567 |                         &mut $slf.node.ptrs[$slf.children as usize],
 568 |                         ChildPtr::null(),
 569 |                     );
 570 |                     if $slf.children == 1 {
 571 |                         let mut c_ptr = ChildPtr::null();
 572 |                         debug_assert!(
 573 |                             !$slf.node.ptrs[0].is_null(),
 574 |                             "{:?} Uh oh! {:?}",
 575 |                             $slf as *const _,
 576 |                             $slf
 577 |                         );
 578 |                         mem::swap(&mut $slf.node.ptrs[0], &mut c_ptr);
 579 | 
 580 |                         debug_assert!(
 581 |                             Some($slf.node.keys[0]) != T::Key::STOP_CHARACTER
 582 |                                 || c_ptr.get().unwrap().is_ok(),
 583 |                             "Singleton is stop {:#?}",
 584 |                             $slf
 585 |                         );
 586 |                         DeleteResult::Singleton {
 587 |                             deleted: deleted,
 588 |                             last: c_ptr,
 589 |                             last_d: $slf.node.keys[0],
 590 |                         }
 591 |                     } else {
 592 |                         DeleteResult::Success(deleted)
 593 |                     }
 594 |                 }
 595 |             };
 596 |             debug_assert!($slf.find_internal($d).is_none());
 597 |             _res
 598 |         }};
 599 |     }
 600 |     impl<T> ::std::fmt::Debug for Node16<T> {
 601 |         fn fmt(&self, f: &mut ::std::fmt::Formatter) -> Result<(), ::std::fmt::Error> {
 602 |             write!(f, "Node16({:?}, {:?})", self.keys, &self.ptrs[..])
 603 |         }
 604 |     }
 605 | 
 606 |     fn is_sorted(slice: &[u8]) -> bool {
 607 |         let mut v: Vec<u8> = Vec::new();
 608 |         v.extend(slice);
 609 |         v.sort();
 610 |         let res = &v[..] == slice;
 611 |         if !res {
 612 |             eprintln!("Not sorted! {:?} != {:?}", slice, v);
 613 |         }
 614 |         res
 615 |     }
 616 | 
    // Run `$body` once for each value of `$rng`, bound to `$lvar`: in forward order when
    // `$ltr` is true, reversed otherwise. `$body` is expanded directly inside a `for` loop,
    // so `continue` and `break` within it act on that loop.
    macro_rules! do_foreach_dir {
        ($ltr:expr, $rng:expr, $lvar:ident, $body:expr) => {
            if $ltr {
                for $lvar in $rng {
                    $body
                }
            } else {
                for $lvar in ($rng).rev() {
                    $body
                }
            }
        };
    }
 630 | 
    // Shared body of `for_each` for nodes with sorted parallel `keys`/`ptrs` arrays.
    //
    // The next digit of each bound is popped (`0` / `255` when there is no bound) to give the
    // inclusive digit range `[low, high]` at this level. Children outside that range are
    // skipped; because the keys are sorted, the scan stops as soon as it walks off the far
    // end of the range. The remaining bound digits are only forwarded to a child whose digit
    // equals the bound digit -- every other child inside the range is unconstrained.
    macro_rules! n416_foreach {
        ($slf: expr, $f: expr, $lower: expr,
         $upper: expr, $lval: expr, $uval: expr,
         $dir:expr, $ltr:expr) => {{
            debug_assert!(is_sorted(&$slf.node.keys[..$slf.children as usize]));
            let low = advance_or(&mut $lower, 0);
            let high = advance_or(&mut $upper, 255);
            let children = $slf.children as usize;
            do_foreach_dir!($ltr, 0..children, i, {
                let k = $slf.node.keys[i] as usize;
                if $ltr {
                    // ascending: skip until inside the range, stop once past it
                    if k < low {
                        continue;
                    }
                    if k > high {
                        break;
                    }
                } else {
                    // descending: mirror image of the above
                    if k > high {
                        continue;
                    }
                    if k < low {
                        break;
                    }
                }
                let low = if k == low { $lower } else { None };
                let high = if k == high { $upper } else { None };
                visit_leaf(&$slf.node.ptrs[i], $f, low, high, $lval, $uval, $dir)
            })
        }};
    }
 662 | 
    // Shared body of `local_foreach` for nodes with parallel `keys`/`ptrs` arrays: calls
    // `$f(digit, pointer)` for each of the first `children` entries, in stored (sorted)
    // order. The pointer is passed as a non-owning `MarkedPtr` copy.
    macro_rules! n416_local_foreach {
        ($slf: expr, $f: expr) => {{
            debug_assert!(is_sorted(&$slf.node.keys[..$slf.children as usize]));
            let children = $slf.children as usize;
            for i in 0..children {
                let k = $slf.node.keys[i];
                let ptr = &$slf.node.ptrs[i];
                debug_assert!(!ptr.is_null());
                $f(k, unsafe { ptr.to_marked() });
            }
        }};
    }
 675 |     impl<T> RawNode<Node4<T>> {
 676 |         fn find_internal(&self, d: u8) -> Option<(usize, *mut ChildPtr<T>)> {
 677 |             debug_assert!(self.children <= 4);
 678 |             for i in 0..4 {
 679 |                 if i == self.children as usize {
 680 |                     break;
 681 |                 }
 682 |                 if self.node.keys[i] == d {
 683 |                     unsafe {
 684 |                         debug_assert!(
 685 |                             !self.node.ptrs[i].is_null(),
 686 |                             "Returning something null (i={}, d={}) (already-deleted node?)! keys={:?} ptrs={:?}",
 687 |                             i, d, &self.node.keys[..], &self.node.ptrs[..]);
 688 |                         return Some((i, self.node.ptrs.get_unchecked(i) as *const _ as *mut _));
 689 |                     };
 690 |                 }
 691 |             }
 692 |             None
 693 |         }
 694 |     }
 695 | 
 696 |     impl<T: Element> Node<T> for RawNode<Node4<T>> {
 697 |         fn find_raw(&self, d: u8) -> Option<*mut ChildPtr<T>> {
 698 |             self.find_internal(d).map(|(_slot, child)| child)
 699 |         }
 700 | 
 701 |         unsafe fn delete(&mut self, d: u8) -> DeleteResult<T> {
 702 |             n416_delete!(self, d)
 703 |         }
 704 | 
 705 |         fn local_foreach<F: FnMut(u8, MarkedPtr<T>)>(&self, mut f: F) {
 706 |             n416_local_foreach!(self, f)
 707 |         }
 708 | 
 709 |         fn get_min(&self) -> Option<&T> {
 710 |             debug_assert!(self.children <= 4);
 711 |             if self.children == 0 {
 712 |                 return None;
 713 |             }
 714 |             // Keys are kept sorted, so the minimum is found by following slot 0.
 715 |             match unsafe { self.node.ptrs[0].get().unwrap() } {
 716 |                 Ok(leaf) => Some(leaf),
 717 |                 Err(interior) => with_node!(interior, node, { node.get_min() }),
 718 |             }
 719 |         }
 720 | 
 721 |         fn is_full(&self) -> bool {
 722 |             self.children == 4
 723 |         }
 724 | 
 725 |         /// Adds child `ptr` under digit `d`, keeping keys sorted. A full node is replaced by a
 726 |         /// Node16 published through `pptr`; without `pptr` the child comes back as `Err(ptr)`.
 727 |         unsafe fn insert(
 728 |             &mut self,
 729 |             d: u8,
 730 |             ptr: ChildPtr<T>,
 731 |             pptr: Option<*mut ChildPtr<T>>,
 732 |         ) -> Result<(), ChildPtr<T>> {
 733 |             debug_assert!(self.find_raw(d).is_none());
 734 |             debug_assert!(Some(d) != T::Key::STOP_CHARACTER || ptr.get().unwrap().is_ok());
 735 |             if self.children == 4 {
 736 |                 let pp = match pptr {
 737 |                     Some(pp) => pp,
 738 |                     None => return Err(ptr),
 739 |                 };
 740 |                 let new_node = &mut *Box::into_raw(Box::new(RawNode {
 741 |                     typ: NODE_16,
 742 |                     children: self.children,
 743 |                     consumed: self.consumed,
 744 |                     count: self.count,
 745 |                     prefix: self.prefix,
 746 |                     node: Node16 {
 747 |                         keys: [0; 16],
 748 |                         ptrs: mem::transmute::<[usize; 16], [ChildPtr<T>; 16]>(
 749 |                             [0 as usize; 16],
 750 |                         ),
 751 |                     },
 752 |                 }));
 753 |                 // Trade our four entries for the zeroed ones of the freshly built node.
 754 |                 ptr::swap_nonoverlapping(&mut self.node.keys[0], &mut new_node.node.keys[0], 4);
 755 |                 ptr::swap_nonoverlapping(&mut self.node.ptrs[0], &mut new_node.node.ptrs[0], 4);
 756 |                 #[cfg(debug_assertions)]
 757 |                 {
 758 |                     self.children = !0;
 759 |                 }
 760 |                 *pp = ChildPtr::from_node(new_node);
 761 |                 let res = new_node.insert(d, ptr, None);
 762 |                 debug_assert!(res.is_ok());
 763 |                 return res;
 764 |             }
 765 |             for slot in 0..4 {
 766 |                 if slot == self.children as usize {
 767 |                     // No live key is larger than `d`: append in the first empty slot.
 768 |                     debug_assert!(self.node.ptrs[slot].is_null());
 769 |                     self.node.keys[slot] = d;
 770 |                     self.node.ptrs[slot] = ptr;
 771 |                 } else {
 772 |                     let cur_digit = self.node.keys[slot];
 773 |                     debug_assert!(
 774 |                         cur_digit != d,
 775 |                         "Found matching current digit! cur_digit={:?}, prefix={:?}, count={:?}, children={:?} keys={:?}",
 776 |                         cur_digit,
 777 |                         &self.prefix[..],
 778 |                         self.count,
 779 |                         self.children,
 780 |                         &self.node.keys[..],
 781 |                     );
 782 |                     if cur_digit <= d {
 783 |                         continue;
 784 |                     }
 785 |                     // First larger key: shift it and its successors up by one (node is not full).
 786 |                     place_in_hole_at(&mut self.node.keys[..], slot, d, 4);
 787 |                     place_in_hole_at(&mut self.node.ptrs[..], slot, ptr, 4);
 788 |                 }
 789 |                 self.children += 1;
 790 |                 debug_assert!(is_sorted(&self.node.keys[..self.children as usize]));
 791 |                 return Ok(());
 792 |             }
 793 |             unreachable!()
 794 |         }
 795 | 
 796 |         fn for_each<F: FnMut(&T), D: Direction>(
 797 |             &self,
 798 |             f: &mut F,
 799 |             mut lower: Option<&[u8]>,
 800 |             mut upper: Option<&[u8]>,
 801 |             lval: Option<&T::Key>,
 802 |             rval: Option<&T::Key>,
 803 |             _dir: D,
 804 |         ) {
 805 |             n416_foreach!(self, f, lower, upper, lval, rval, _dir, D::LEFT_TO_RIGHT)
 806 |         }
 807 |     }
 808 | 
 809 |     pub struct Node16<T> { // node body with room for 16 children
 810 |         keys: [u8; 16], // digit stored in each slot; the first `children` entries are kept sorted
 811 |         ptrs: [ChildPtr<T>; 16], // ptrs[i] is the child filed under keys[i]
 812 |     }
 813 | 
 814 |     impl<T> RawNode<Node16<T>> {
 815 |         /// Looks up digit `d` among the live key slots.
 816 |         ///
 817 |         /// On a hit, returns the slot index together with a raw mutable pointer to the child
 818 |         /// pointer stored in that slot. With SSE2 all 16 key bytes are compared at once and the
 819 |         /// result is restricted to slots below `children`; every other target scans the live
 820 |         /// slots one by one.
 821 |         fn find_internal(&self, d: u8) -> Option<(usize, *mut ChildPtr<T>)> {
 822 |             debug_assert!(self.children != !0, "This node has been upgraded");
 823 |             #[cfg(all(any(target_arch = "x86_64", target_arch = "x86"), target_feature = "sse2"))]
 824 |             {
 825 |                 // One bit per slot below `children`; matches in higher lanes are discarded.
 826 |                 let mask = (1 << (self.children as usize)) - 1;
 827 |                 let ks = simd::u8x16::load(&self.node.keys[..], 0);
 828 |                 let d_splat = simd::u8x16::splat(d);
 829 |                 let comps = d_splat.eq(ks);
 830 |                 let bits = unsafe { _mm_movemask_epi8(mem::transmute(comps)) } & mask;
 831 |                 return if bits == 0 {
 832 |                     None
 833 |                 } else {
 834 |                     debug_assert_eq!(bits.count_ones(), 1);
 835 |                     let target = bits.trailing_zeros() as usize;
 836 |                     debug_assert!(target < 16);
 837 |                     debug_assert!(
 838 |                         !self.node.ptrs[target].is_null(),
 839 |                         "children={} keys={:?} ptrs={:?}",
 840 |                         self.children,
 841 |                         &self.node.keys[..],
 842 |                         &self.node.ptrs[..]
 843 |                     );
 844 |                     Some((target, unsafe {
 845 |                         self.node.ptrs.get_unchecked(target) as *const _ as *mut _
 846 |                     }))
 847 |                 };
 848 |             }
 849 |             #[cfg(not(all(any(target_arch = "x86_64", target_arch = "x86"),
 850 |                           target_feature = "sse2")))]
 851 |             {
 852 |                 // Portable path: the same linear scan Node4 uses, over the live slots only.
 853 |                 let live = self.children as usize;
 854 |                 debug_assert!(live <= 16);
 855 |                 for i in 0..live {
 856 |                     if self.node.keys[i] == d {
 857 |                         debug_assert!(
 858 |                             !self.node.ptrs[i].is_null(),
 859 |                             "children={} keys={:?} ptrs={:?}",
 860 |                             self.children,
 861 |                             &self.node.keys[..],
 862 |                             &self.node.ptrs[..]
 863 |                         );
 864 |                         // `i` passed the bounds-checked key read above, so it is below 16.
 865 |                         return Some((i, unsafe {
 866 |                             self.node.ptrs.get_unchecked(i) as *const _ as *mut _
 867 |                         }));
 868 |                     }
 869 |                 }
 870 |                 return None;
 871 |             }
 872 |         }
 873 |     }
 850 | 
 851 |     impl<T: Element> Node<T> for RawNode<Node16<T>> {
 852 |         fn is_full(&self) -> bool {
 853 |             self.children == 16
 854 |         }
 855 |         fn find_raw(&self, d: u8) -> Option<*mut ChildPtr<T>> {
 856 |             self.find_internal(d).map(|(_, ptr)| ptr)
 857 |         }
 858 | 
 859 |         fn local_foreach<F: FnMut(u8, MarkedPtr<T>)>(&self, mut f: F) {
 860 |             n416_local_foreach!(self, f)
 861 |         }
 862 | 
 863 |         unsafe fn delete(&mut self, d: u8) -> DeleteResult<T> {
 864 |             n416_delete!(self, d)
 865 |         }
 866 | 
 867 |         fn get_min(&self) -> Option<&T> {
 868 |             debug_assert!(self.children <= 16);
 869 |             if self.children == 0 {
 870 |                 return None;
 871 |             }
 872 |             let min_key_ix = 0; // we keep the child list sorted
 873 |             match unsafe { self.node.ptrs[min_key_ix as usize].get().unwrap() } {
 874 |                 Ok(t) => Some(t),
 875 |                 Err(inner_node) => with_node!(inner_node, node, { node.get_min() }),
 876 |             }
 877 |         }
 878 | 
 879 |         /// Adds child `ptr` under digit `d`, keeping the live keys sorted.
 880 |         ///
 881 |         /// A full node (16 children) is replaced by a Node48 that is stored through `pptr` and
 882 |         /// then receives the child; a full node with no `pptr` hands the child back as
 883 |         /// `Err(ptr)`. The insertion slot is found with an SSE2 compare where available and
 884 |         /// with a plain scan of the live keys on every other target.
 885 |         unsafe fn insert(
 886 |             &mut self,
 887 |             d: u8,
 888 |             ptr: ChildPtr<T>,
 889 |             pptr: Option<*mut ChildPtr<T>>,
 890 |         ) -> Result<(), ChildPtr<T>> {
 891 |             debug_assert!(Some(d) != T::Key::STOP_CHARACTER || ptr.get().unwrap().is_ok());
 892 |             debug_assert!(self.find_raw(d).is_none());
 893 |             if self.children == 16 {
 894 |                 if let Some(pp) = pptr {
 895 |                     // upgrade
 896 |                     let new_node = &mut *Box::into_raw(Box::new(RawNode {
 897 |                         typ: NODE_48,
 898 |                         children: 16,
 899 |                         count: self.count,
 900 |                         consumed: self.consumed,
 901 |                         prefix: self.prefix,
 902 |                         node: Node48 {
 903 |                             keys: [0; 256],
 904 |                             ptrs: mem::transmute::<[usize; 48], [ChildPtr<T>; 48]>(
 905 |                                 [0 as usize; 48],
 906 |                             ),
 907 |                         },
 908 |                     }));
 909 |                     for i in 0..16 {
 910 |                         let ix = self.node.keys[i] as usize;
 911 |                         mem::swap(
 912 |                             self.node.ptrs.get_unchecked_mut(i),
 913 |                             new_node.node.ptrs.get_unchecked_mut(i),
 914 |                         );
 915 |                         // Node48 key bytes store slot index + 1, leaving 0 for "absent".
 916 |                         new_node.node.keys[ix] = i as u8 + 1;
 917 |                     }
 918 |                     #[cfg(debug_assertions)]
 919 |                     {
 920 |                         self.children = !0;
 921 |                     }
 922 |                     let new_cptr = ChildPtr::from_node(new_node);
 923 |                     *pp = new_cptr;
 924 |                     let res = new_node.insert(d, ptr, None);
 925 |                     debug_assert!(res.is_ok());
 926 |                     return Ok(());
 927 |                 } else {
 928 |                     return Err(ptr);
 929 |                 }
 930 |             }
 931 |             #[cfg(all(any(target_arch = "x86_64", target_arch = "x86"), target_feature = "sse2"))]
 932 |             {
 933 |                 // One bit per slot below `children`; comparisons in higher lanes are discarded.
 934 |                 let mask = (1 << (self.children as usize)) - 1;
 935 |                 let ks = simd::u8x16::load(&self.node.keys[..], 0);
 936 |                 let d_splat = simd::u8x16::splat(d);
 937 |                 let comps = d_splat.lt(ks);
 938 |                 let bits: i32 = _mm_movemask_epi8(mem::transmute(comps)) & mask;
 939 |                 let zeros = bits.trailing_zeros();
 940 |                 // No live key above `d` (bits == 0) means the new entry goes last.
 941 |                 let target = if zeros == 32 {
 942 |                     self.children as usize
 943 |                 } else {
 944 |                     zeros as usize
 945 |                 };
 946 |                 place_in_hole_at(&mut self.node.keys[..], target, d, 16);
 947 |                 place_in_hole_at(&mut self.node.ptrs[..], target, ptr, 16);
 948 |             }
 949 |             #[cfg(not(all(any(target_arch = "x86_64", target_arch = "x86"),
 950 |                           target_feature = "sse2")))]
 951 |             {
 952 |                 // Portable path: pick the slot of the first live key above `d`, or the first
 953 |                 // free slot when there is none -- the same target the SSE2 path computes.
 954 |                 let live = self.children as usize;
 955 |                 let target = self.node.keys[..live]
 956 |                     .iter()
 957 |                     .position(|&key| d < key)
 958 |                     .unwrap_or(live);
 959 |                 place_in_hole_at(&mut self.node.keys[..], target, d, 16);
 960 |                 place_in_hole_at(&mut self.node.ptrs[..], target, ptr, 16);
 961 |             }
 962 |             self.children += 1;
 963 |             debug_assert!(is_sorted(&self.node.keys[..self.children as usize]));
 964 |             Ok(())
 965 |         }
 966 | 
 967 |         fn for_each<F: FnMut(&T), D: Direction>(
 968 |             &self,
 969 |             f: &mut F,
 970 |             mut lower: Option<&[u8]>,
 971 |             mut upper: Option<&[u8]>,
 972 |             lval: Option<&T::Key>,
 973 |             rval: Option<&T::Key>,
 974 |             _dir: D,
 975 |         ) {
 976 |             n416_foreach!(self, f, lower, upper, lval, rval, _dir, D::LEFT_TO_RIGHT)
 977 |         }
 978 |     }
 963 | 
 964 |     pub struct Node48<T> { // node body with room for 48 children, reached through `keys`
 965 |         keys: [u8; 256], // keys[d] == 0: digit d absent; otherwise 1 + index of its child in `ptrs`
 966 |         ptrs: [ChildPtr<T>; 48], // child slots; insert reuses the first null entry
 967 |     }
 968 | 
 969 |     impl<T> RawNode<Node48<T>> {
 970 |         /// Returns the smallest digit that has a child, paired with a raw mutable pointer to
 971 |         /// that child's slot in `ptrs`; `None` when every key byte is zero.
 972 |         unsafe fn get_min_inner(&self) -> Option<(usize, *mut ChildPtr<T>)> {
 973 |             // A zero key byte means "absent"; anything else is 1 + the index into `ptrs`.
 974 |             let first = self.node.keys.iter().enumerate().find(|&(_, &ix)| ix != 0);
 975 |             first.map(|(d, &ix)| {
 976 |                 let slot = &self.node.ptrs[ix as usize - 1];
 977 |                 (d, slot as *const ChildPtr<T> as *mut ChildPtr<T>)
 978 |             })
 979 |             // potentially optimized solution below:
 980 |             // const KEYS_PER_WORD: usize = 8;
 981 |             // const N_WORDS: usize = 256 / KEYS_PER_WORD;
 982 |             // if self.children == 0 {
 983 |             //     return None;
 984 |             // }
 985 |             // let keys_words = mem::transmute::<&[u8; 256], &[u64; N_WORDS]>(&self.node.keys);
 986 |             // for i in 0..N_WORDS {
 987 |             //     let word = keys_words[i];
 988 |             //     if word == 0 {
 989 |             //         continue;
 990 |             //     }
 991 |             //     let word_bytes = mem::transmute::<u64, [u8; 8]>(word);
 992 |             //     for ii in 0..8 {
 993 |             //         let b = word_bytes[ii];
 994 |             //         if b != 0 {
 995 |             //             let ix = b - 1;
 996 |             //             return Some((
 997 |             //                 i * KEYS_PER_WORD + ii,
 998 |             //                 &self.node.ptrs[ix as usize] as *const _ as *mut _,
 999 |             //             ));
1000 |             //         }
1001 |             //     }
1002 |             // }
1003 |             // unreachable!()
1004 |         }
1005 | 
1006 |         /// Debug-build check that the number of non-zero key bytes equals `children`.
1007 |         #[inline(always)]
1008 |         fn state_valid(&self) {
1009 |             #[cfg(debug_assertions)]
1010 |             {
1011 |                 let occupied = self.node.keys.iter().fold(0, |seen, &ix| {
1012 |                     if ix != 0 { seen + 1 } else { seen }
1013 |                 });
1014 |                 assert_eq!(
1015 |                     occupied, self.children,
1016 |                     "Only see {:?} present but have {:?} children",
1017 |                     occupied, self.children
1018 |                 )
1019 |             }
1020 |         }
1021 |     }
1022 | 
1023 |     impl<T: Element> Node<T> for RawNode<Node48<T>> {
1024 |         fn find_raw(&self, d: u8) -> Option<*mut ChildPtr<T>> {
1025 |             self.state_valid();
1026 |             // A `u8` digit always lands inside the 256-entry key table; 0 there means "absent".
1027 |             match unsafe { *self.node.keys.get_unchecked(d as usize) as usize } {
1028 |                 0 => None,
1029 |                 slot_plus_one => {
1030 |                     debug_assert!(!self.node.ptrs[slot_plus_one - 1].is_null());
1031 |                     let child = unsafe { self.node.ptrs.get_unchecked(slot_plus_one - 1) };
1032 |                     Some(child as *const ChildPtr<T> as *mut ChildPtr<T>)
1033 |                 }
1034 |             }
1035 |         }
1036 | 
1037 |         /// Calls `f` once per digit that has a child, in ascending digit order.
1038 |         ///
1039 |         /// `f` receives the digit and the child's marked pointer.
1040 |         fn local_foreach<F: FnMut(u8, MarkedPtr<T>)>(&self, mut f: F) {
1041 |             for (d, &ix) in self.node.keys.iter().enumerate() {
1042 |                 if ix == 0 {
1043 |                     continue;
1044 |                 }
1045 |                 // Non-zero key bytes hold 1 + the index into `ptrs`.
1046 |                 let child = &self.node.ptrs[ix as usize - 1];
1047 |                 debug_assert!(!child.is_null());
1048 |                 debug_assert!(d < 256);
1049 |                 f(d as u8, unsafe { child.to_marked() });
1050 |             }
1051 |         }
1052 | 
1053 |         /// Follows the child of the smallest present digit down to the minimum element;
1054 |         /// `None` when `get_min_inner` finds no child.
1055 |         fn get_min(&self) -> Option<&T> {
1056 |             self.state_valid();
1057 |             let lowest = unsafe { self.get_min_inner() };
1058 |             lowest.and_then(|(_, child)| match unsafe { (*child).get().unwrap() } {
1059 |                 Ok(leaf) => Some(leaf),
1060 |                 Err(interior) => with_node!(interior, node, { node.get_min() }),
1061 |             })
1062 |         }
1063 |         fn is_full(&self) -> bool {
1064 |             self.children == 48
1065 |         }
1066 |         /// Removes the child stored under `d`. Reports `Singleton` (also detaching the survivor)
1067 |         /// when exactly one child is left afterwards, `Failure` when `d` has no child.
1068 |         unsafe fn delete(&mut self, d: u8) -> DeleteResult<T> {
1069 |             self.state_valid();
1070 |             let victim = match self.find_raw(d) {
1071 |                 Some(p) => p,
1072 |                 None => return DeleteResult::Failure,
1073 |             };
1074 |             // Found a pointer: swap a null ChildPtr into its slot and clear the key entry.
1075 |             let deleted = (*victim).swap_null();
1076 |             self.node.keys[d as usize] = 0;
1077 |             debug_assert!(self.children > 0);
1078 |             self.children -= 1;
1079 |             if self.children != 1 {
1080 |                 return DeleteResult::Success(deleted);
1081 |             }
1082 |             // TODO remove the first entry, it isn't required
1083 |             let (ix, or_ptr) = self.get_min_inner().expect("Should be one more child");
1084 |             debug_assert!(
1085 |                 Some(ix) != T::Key::STOP_CHARACTER.map(|x| x as usize)
1086 |                     || (*or_ptr).get().unwrap().is_ok(),
1087 |                 "Singleton is stop {:#?}",
1088 |                 self
1089 |             );
1090 |             self.node.keys[ix] = 0; // not really necessary
1091 |             DeleteResult::Singleton {
1092 |                 deleted: deleted,
1093 |                 last: (*or_ptr).swap_null(),
1094 |                 last_d: ix as u8,
1095 |             }
1096 |         }
1097 | 
1098 |         unsafe fn insert(
1099 |             &mut self,
1100 |             d: u8,
1101 |             ptr: ChildPtr<T>,
1102 |             pptr: Option<*mut ChildPtr<T>>,
1103 |         ) -> Result<(), ChildPtr<T>> {
1104 |             debug_assert!(Some(d) != T::Key::STOP_CHARACTER || ptr.get().unwrap().is_ok());
1105 |             debug_assert!(self.find_raw(d).is_none());
1106 |             self.state_valid();
1107 |             debug_assert!(self.children <= 48);
1108 |             if self.children == 48 {
1109 |                 let pp = match pptr {
1110 |                     Some(pp) => pp,
1111 |                     None => return Err(ptr),
1112 |                 };
1113 |                 let new_node = &mut *Box::into_raw(Box::new(RawNode {
1114 |                     typ: NODE_256,
1115 |                     children: 48,
1116 |                     count: self.count,
1117 |                     consumed: self.consumed,
1118 |                     prefix: self.prefix,
1119 |                     node: Node256 {
1120 |                         ptrs: mem::transmute::<[usize; 256], [ChildPtr<T>; 256]>(
1121 |                             [0 as usize; 256],
1122 |                         ),
1123 |                     },
1124 |                 }));
1125 |                 // Move every existing child into the slot indexed directly by its digit.
1126 |                 for i in 0..256 {
1127 |                     if let Some(node_ptr) = self.find_raw(i as u8) {
1128 |                         debug_assert!(i != d as usize, "{:?} == {:?}", i, d);
1129 |                         mem::swap(&mut *node_ptr, new_node.node.ptrs.get_unchecked_mut(i))
1130 |                     }
1131 |                 }
1132 |                 #[cfg(debug_assertions)]
1133 |                 {
1134 |                     self.children = !0;
1135 |                 }
1136 |                 *pp = ChildPtr::from_node(new_node);
1137 |                 let res = new_node.insert(d, ptr, None);
1138 |                 debug_assert!(res.is_ok());
1139 |                 return Ok(());
1140 |             }
1141 |             // Not full: claim the first null slot and record its index + 1 under `d`.
1142 |             match self.node.ptrs.iter().position(|slot| slot.is_null()) {
1143 |                 Some(free) => {
1144 |                     ptr::write(self.node.ptrs.get_unchecked_mut(free), ptr);
1145 |                     self.node.keys[d as usize] = free as u8 + 1;
1146 |                     self.children += 1;
1147 |                     Ok(())
1148 |                 }
1149 |                 None => unreachable!(),
1150 |             }
1151 |         }
1152 | 
1153 |         fn for_each<F: FnMut(&T), D: Direction>(
1154 |             &self,
1155 |             f: &mut F,
1156 |             mut lower: Option<&[u8]>,
1157 |             mut upper: Option<&[u8]>,
1158 |             lval: Option<&T::Key>,
1159 |             rval: Option<&T::Key>,
1160 |             _dir: D,
1161 |         ) {
1162 |             let low = advance_or(&mut lower, 0);
1163 |             let high = advance_or(&mut upper, 255);
1164 |             do_foreach_dir!(D::LEFT_TO_RIGHT, low..(high + 1), i, {
1165 |                 let ix = self.node.keys[i];
1166 |                 if ix == 0 {
1167 |                     continue;
1168 |                 }
1169 |                 visit_leaf(
1170 |                     &self.node.ptrs[ix as usize - 1],
1171 |                     f,
1172 |                     if i == low { lower } else { None },
1173 |                     if i == high { upper } else { None },
1174 |                     lval,
1175 |                     rval,
1176 |                     _dir,
1177 |                 );
1178 |             })
1179 |         }
1180 |     }
1181 | 
1182 |     pub struct Node256<T> { // node body with one child slot per possible digit
1183 |         ptrs: [ChildPtr<T>; 256], // ptrs[d] is the child for digit d; null when absent
1184 |     }
1185 |     impl<T> ::std::fmt::Debug for Node48<T> {
1186 |         /// Formats as `Node48(keys=[..],ptrs=[..])`.
1187 |         ///
1188 |         /// Both arrays are printed in full, through slices covering the whole array.
1189 |         fn fmt(&self, f: &mut ::std::fmt::Formatter) -> Result<(), ::std::fmt::Error> {
1190 |             let keys = &self.keys[..];
1191 |             let ptrs = &self.ptrs[..];
1192 |             write!(f, "Node48(keys={:?},ptrs={:?})", keys, ptrs)
1193 |         }
1194 |     }
1195 | 
1196 |     impl<T> ::std::fmt::Debug for Node256<T> {
1197 |         /// Formats as `Node256([..])`, listing `(digit, child)` pairs for the non-null slots
1198 |         /// only.
1199 |         fn fmt(&self, f: &mut ::std::fmt::Formatter) -> Result<(), ::std::fmt::Error> {
1200 |             // Pair every slot with its digit first, then drop the empty ones.
1201 |             let mut occupied: Vec<_> = self.ptrs.iter().enumerate().collect();
1202 |             occupied.retain(|&(_, child)| !child.is_null());
1203 |             write!(f, "Node256({:?})", occupied)
1204 |         }
1205 |     }
1206 | 
1207 |     impl<T: Element> Node<T> for RawNode<Node256<T>> {
1208 |         /// Raw mutable pointer to the slot for digit `d`, or `None` when that slot holds a
1209 |         /// null child pointer.
1210 |         fn find_raw(&self, d: u8) -> Option<*mut ChildPtr<T>> {
1211 |             // A `u8` digit is always a valid index into the 256-entry array.
1212 |             let slot = unsafe { self.node.ptrs.get_unchecked(d as usize) };
1213 |             if slot.is_null() {
1214 |                 None
1215 |             } else {
1216 |                 Some(slot as *const ChildPtr<T> as *mut ChildPtr<T>)
1217 |             }
1218 |         }
1219 | 
1220 |         fn is_full(&self) -> bool {
1221 |             self.children == 256
1222 |         }
1223 | 
1224 |         /// Calls `f` for every non-null slot, in ascending digit order, passing the digit and
1225 |         /// the child's marked pointer.
1226 |         fn local_foreach<F: FnMut(u8, MarkedPtr<T>)>(&self, mut f: F) {
1227 |             for (d, child) in self.node.ptrs.iter().enumerate() {
1228 |                 if child.is_null() {
1229 |                     continue;
1230 |                 }
1231 |                 // `d` indexes a 256-entry array, so the cast to `u8` cannot truncate.
1232 |                 f(d as u8, unsafe { child.to_marked() });
1233 |             }
1234 |         }
1235 | 
1236 |         /// Minimum element: descends through the first non-null slot; `None` for an empty node.
1237 |         fn get_min(&self) -> Option<&T> {
1238 |             // TODO benchmark with this vs. 0..256 + get_unchecked.
1239 |             // This search can also be sped up using simd to bulk-compare >0 for each cell.
1240 |             // While probably overkill, worth exploring if this sort of search becomes expensive.
1241 |             if self.children == 0 {
1242 |                 return None;
1243 |             }
1244 | 
1245 |             // Slots are indexed by digit, so the first non-null one has the smallest digit.
1246 |             let lowest = match self.node.ptrs.iter().find(|slot| !slot.is_null()) {
1247 |                 Some(slot) => slot,
1248 |                 None => unreachable!(),
1249 |             };
1250 |             match unsafe { lowest.get().unwrap() } {
1251 |                 Ok(leaf) => Some(leaf),
1252 |                 Err(interior) => with_node!(interior, node, { node.get_min() }),
1253 |             }
1254 |         }
1255 | 
1256 |         /// Removes the child under `d`; when one child remains afterwards it is detached too.
1257 |         unsafe fn delete(&mut self, d: u8) -> DeleteResult<T> {
1258 |             if self.children == 0 || self.node.ptrs[d as usize].is_null() {
1259 |                 return DeleteResult::Failure;
1260 |             }
1261 |             let deleted = self.node.ptrs[d as usize].swap_null();
1262 |             self.children -= 1;
1263 |             if self.children != 1 {
1264 |                 return DeleteResult::Success(deleted);
1265 |             }
1266 |             // Exactly one child is left: find it, null its slot and report both pointers.
1267 |             for i in 0..256 {
1268 |                 debug_assert!(
1269 |                     self.node.ptrs[i].is_null()
1270 |                         || Some(i) != T::Key::STOP_CHARACTER.map(|x| x as usize)
1271 |                         || self.node.ptrs[i].get().unwrap().is_ok(),
1272 |                     "Singleton is stop {:#?}",
1273 |                     self
1274 |                 );
1275 |                 let survivor = &mut self.node.ptrs[i];
1276 |                 if !survivor.is_null() {
1277 |                     return DeleteResult::Singleton {
1278 |                         deleted: deleted,
1279 |                         last: survivor.swap_null(),
1280 |                         last_d: i as u8,
1281 |                     };
1282 |                 }
1283 |             }
1284 |             panic!("Should have found a node!")
1285 |         }
1286 | 
1287 |         unsafe fn insert(
1288 |             &mut self,
1289 |             d: u8,
1290 |             ptr: ChildPtr<T>,
1291 |             _p: Option<*mut ChildPtr<T>>,
1292 |         ) -> Result<(), ChildPtr<T>> {
1293 |             debug_assert!(Some(d) != T::Key::STOP_CHARACTER || ptr.get().unwrap().is_ok());
1294 |             debug_assert!(self.find_raw(d).is_none(), "d={:?} IN {:?}", d, self);
1295 |             debug_assert!(self.children <= 256);
1296 |             debug_assert!(self.node.ptrs[d as usize].is_null());
1297 |             ptr::write(self.node.ptrs.get_unchecked_mut(d as usize), ptr);
1298 |             self.children += 1;
1299 |             Ok(())
1300 |         }
1301 | 
1302 |         fn for_each<F: FnMut(&T), D: Direction>(
1303 |             &self,
1304 |             f: &mut F,
1305 |             mut lower: Option<&[u8]>,
1306 |             mut upper: Option<&[u8]>,
1307 |             lval: Option<&T::Key>,
1308 |             rval: Option<&T::Key>,
1309 |             _dir: D,
1310 |         ) {
1311 |             let low = advance_or(&mut lower, 0);
1312 |             let high = advance_or(&mut upper, 255);
1313 |             do_foreach_dir!(
1314 |                 D::LEFT_TO_RIGHT,
1315 |                 low..(high + 1),
1316 |                 i,
1317 |                 visit_leaf(
1318 |                     &self.node.ptrs[i],
1319 |                     f,
1320 |                     if i == low { lower } else { None },
1321 |                     if i == high { upper } else { None },
1322 |                     lval,
1323 |                     rval,
1324 |                     _dir,
1325 |                 )
1326 |             );
1327 |         }
1328 |     }
1329 | }
1330 | 


--------------------------------------------------------------------------------
/src/art_impl.rs:
--------------------------------------------------------------------------------
   1 | //! Single-threaded radix tree implementation based on HyPer's ART
   2 | use std::borrow::Borrow;
   3 | use std::cmp;
   4 | use std::marker::PhantomData;
   5 | use std::mem;
   6 | use std::ptr;
   7 | 
   8 | use super::Digital;
   9 | use super::art_internal::*;
  10 | use super::prefix_cache::{HashSetPrefixCache, NullBuckets};
  11 | use super::smallvec::SmallVec;
  12 | pub use super::prefix_cache::PrefixCache;
  13 | 
  14 | pub struct ArtPair<K: for<'a> Digital<'a> + PartialOrd, V>(K, V); // map entry: key in .0, value in .1
  15 | 
  16 | impl<K: for<'a> Digital<'a> + PartialOrd, V> ArtPair<K, V> {
  17 |     pub fn new(k: K, v: V) -> ArtPair<K, V> { // plain wrapper around `k` and `v`, no validation
  18 |         ArtPair(k, v)
  19 |     }
  20 | }
  21 | 
  22 | pub struct ArtElement<T: for<'a> Digital<'a> + PartialOrd>(T); // set element: the value is its own key
  23 | 
  24 | impl<T: for<'a> Digital<'a> + PartialOrd> ArtElement<T> {
  25 |     pub fn new(t: T) -> ArtElement<T> { // plain wrapper around `t`, no validation
  26 |         ArtElement(t)
  27 |     }
  28 | }
  29 | 
  30 | impl<T: for<'a> Digital<'a> + PartialOrd> Element for ArtElement<T> {
  31 |     type Key = T;
  32 |     fn key(&self) -> &T {
  33 |         &self.0
  34 |     }
  35 |     fn matches(&self, k: &Self::Key) -> bool {
  36 |         k == &self.0
  37 |     }
  38 | 
  39 |     /// Exchanges the contents of `self` and `other`; both are expected to carry equal keys.
  40 |     fn replace_matching(&mut self, other: &mut ArtElement<T>) {
  41 |         debug_assert!(self.matches(other.key()));
  42 |         mem::swap(self, other);
  43 |     }
  44 | }
  45 | 
  46 | impl<K: for<'a> Digital<'a> + PartialOrd, V> Element for ArtPair<K, V> {
  47 |     type Key = K;
  48 |     fn key(&self) -> &K {
  49 |         &self.0
  50 |     }
  51 |     fn matches(&self, k: &Self::Key) -> bool {
  52 |         k == &self.0
  53 |     }
  54 | 
  55 |     /// Exchanges key and value of `self` and `other`; both are expected to carry equal keys.
  56 |     fn replace_matching(&mut self, other: &mut ArtPair<K, V>) {
  57 |         debug_assert!(self.matches(other.key()));
  58 |         mem::swap(self, other);
  59 |     }
  60 | }
  61 | 
  62 | pub type ARTSet<T> = RawART<ArtElement<T>, NullBuckets<ArtElement<T>>>; // set of T
  63 | pub type CachingARTSet<T> = RawART<ArtElement<T>, HashSetPrefixCache<ArtElement<T>>>; // set of T with a HashSetPrefixCache
  64 | pub type ARTMap<K, V> = RawART<ArtPair<K, V>, NullBuckets<ArtPair<K, V>>>; // map from K to V
  65 | pub type CachingARTMap<K, V> = RawART<ArtPair<K, V>, HashSetPrefixCache<ArtPair<K, V>>>; // map from K to V with a HashSetPrefixCache
  66 | 
  67 | impl<K: for<'a> Digital<'a> + PartialOrd, V, C: PrefixCache<ArtPair<K, V>>>
  68 |     RawART<ArtPair<K, V>, C>
  69 | {
  70 |     pub fn contains<Q>(&self, key: &Q) -> bool
  71 |     where
  72 |         Q: Borrow<K> + ?Sized,
  73 |     {
  74 |         unsafe { self.lookup_raw(key.borrow()) }.is_some()
  75 |     }
  76 | 
  77 |     pub fn contains_val(&self, key: K) -> bool {
  78 |         self.contains(&key)
  79 |     }
  80 | 
  81 |     /// Inserts through `replace`; `true` means `replace` handed a pair back.
  82 |     pub fn add(&mut self, k: K, v: V) -> bool {
  83 |         self.replace(k, v).is_some()
  84 |     }
  85 | 
  86 |     /// Inserts `(k, v)`; returns the pair that `insert_raw` gives back as its error, if any.
  87 |     pub fn replace(&mut self, k: K, v: V) -> Option<(K, V)> {
  88 |         let rejected = unsafe { self.insert_raw(ArtPair::new(k, v)) }.err();
  89 |         rejected.map(|ArtPair(k, v)| (k, v))
  90 |     }
  91 | 
  92 |     /// Deletes the entry for `key`, returning its key and value when `delete_raw` finds one.
  93 |     pub fn take<Q>(&mut self, key: &Q) -> Option<(K, V)>
  94 |     where
  95 |         Q: Borrow<K> + ?Sized,
  96 |     {
  97 |         let removed = unsafe { self.delete_raw(key.borrow()) };
  98 |         removed.map(|pair| (pair.0, pair.1))
  99 |     }
 100 | 
 101 |     pub fn remove_val(&mut self, key: K) -> bool {
 102 |         self.remove(&key)
 103 |     }
 104 | 
 105 |     pub fn remove<Q>(&mut self, key: &Q) -> bool
 106 |     where
 107 |         Q: Borrow<K> + ?Sized,
 108 |     {
 109 |         self.take(key).is_some()
 110 |     }
 111 | 
 112 |     pub fn for_each_range<F: FnMut(&K, &V)>(
 113 |         &self,
 114 |         f: F,
 115 |         lower_bound: Option<&K>,
 116 |         upper_bound: Option<&K>,
 117 |     ) {
 118 |         self.for_each_range_dir(f, lower_bound, upper_bound, Increasing);
 119 |     }
 120 | 
 121 |     pub fn for_each_range_rev<F: FnMut(&K, &V)>(
 122 |         &self,
 123 |         f: F,
 124 |         lower_bound: Option<&K>,
 125 |         upper_bound: Option<&K>,
 126 |     ) {
 127 |         self.for_each_range_dir(f, lower_bound, upper_bound, Decreasing);
 128 |     }
 129 | 
 130 |     /// Shared driver behind `for_each_range` and `for_each_range_rev`.
 131 |     fn for_each_range_dir<F: FnMut(&K, &V), D: Direction>(
 132 |         &self,
 133 |         mut f: F,
 134 |         lower_bound: Option<&K>,
 135 |         upper_bound: Option<&K>,
 136 |         _dir: D,
 137 |     ) {
 138 |         // The digit buffers have to outlive the slices handed to `visit_leaf`.
 139 |         let mut lower_digits = SmallVec::<[u8; 16]>::new();
 140 |         let mut upper_digits = SmallVec::<[u8; 16]>::new();
 141 |         if let Some(bound) = lower_bound {
 142 |             lower_digits.extend(bound.digits());
 143 |         }
 144 |         if let Some(bound) = upper_bound {
 145 |             upper_digits.extend(bound.digits());
 146 |         }
 147 |         let lower_slice = lower_bound.map(|_| &lower_digits[..]);
 148 |         let upper_slice = upper_bound.map(|_| &upper_digits[..]);
 149 |         let mut unpack = |pair: &ArtPair<K, V>| f(&pair.0, &pair.1);
 150 |         visit_leaf(
 151 |             &self.root, &mut unpack, lower_slice, upper_slice, lower_bound, upper_bound, _dir,
 152 |         );
 153 |     }
 154 | }
 155 | impl<T: for<'a> Digital<'a> + PartialOrd, C: PrefixCache<ArtElement<T>>> RawART<ArtElement<T>, C> {
 156 |     pub fn contains<Q>(&self, key: &Q) -> bool
 157 |     where
 158 |         Q: Borrow<T> + ?Sized,
 159 |     {
 160 |         unsafe { self.lookup_raw(key.borrow()).is_some() }
 161 |     }
 162 | 
 163 |     pub fn contains_val(&self, key: T) -> bool {
 164 |         self.contains(&key)
 165 |     }
 166 | 
 167 |     pub fn add(&mut self, k: T) -> bool {
 168 |         self.replace(k).is_some()
 169 |     }
 170 | 
 171 |     pub fn replace(&mut self, k: T) -> Option<T> {
 172 |         match unsafe { self.insert_raw(ArtElement::new(k)) } {
 173 |             Ok(()) => None,
 174 |             Err(ArtElement(t)) => Some(t),
 175 |         }
 176 |     }
 177 | 
 178 |     pub fn take<Q>(&mut self, key: &Q) -> Option<T>
 179 |     where
 180 |         Q: Borrow<T> + ?Sized,
 181 |     {
 182 |         unsafe { self.delete_raw(key.borrow()) }.map(|x| x.0)
 183 |     }
 184 | 
 185 |     pub fn remove_val(&mut self, key: T) -> bool {
 186 |         self.remove(&key)
 187 |     }
 188 | 
 189 |     pub fn remove<Q>(&mut self, key: &Q) -> bool
 190 |     where
 191 |         Q: Borrow<T> + ?Sized,
 192 |     {
 193 |         self.take(key).is_some()
 194 |     }
 195 | 
 196 |     pub fn for_each_range<F: FnMut(&T)>(
 197 |         &self,
 198 |         f: F,
 199 |         lower_bound: Option<&T>,
 200 |         upper_bound: Option<&T>,
 201 |     ) {
 202 |         self.for_each_range_dir(f, lower_bound, upper_bound, Increasing);
 203 |     }
 204 | 
 205 |     pub fn for_each_range_rev<F: FnMut(&T)>(
 206 |         &self,
 207 |         f: F,
 208 |         lower_bound: Option<&T>,
 209 |         upper_bound: Option<&T>,
 210 |     ) {
 211 |         self.for_each_range_dir(f, lower_bound, upper_bound, Decreasing);
 212 |     }
 213 | 
 214 |     fn for_each_range_dir<F: FnMut(&T), D: Direction>(
 215 |         &self,
 216 |         mut f: F,
 217 |         lower_bound: Option<&T>,
 218 |         upper_bound: Option<&T>,
 219 |         _dir: D,
 220 |     ) {
 221 |         let mut lower_digits = SmallVec::<[u8; 16]>::new();
 222 |         let mut upper_digits = SmallVec::<[u8; 16]>::new();
 223 |         let mut ff = |x: &ArtElement<T>| f(&x.0);
 224 |         visit_leaf(
 225 |             &self.root,
 226 |             &mut ff,
 227 |             lower_bound.map(|x| {
 228 |                 lower_digits.extend(x.digits());
 229 |                 &lower_digits[..]
 230 |             }),
 231 |             upper_bound.map(|x| {
 232 |                 upper_digits.extend(x.digits());
 233 |                 &upper_digits[..]
 234 |             }),
 235 |             lower_bound,
 236 |             upper_bound,
 237 |             _dir,
 238 |         );
 239 |     }
 240 | }
 241 | 
/// Three-way outcome type carrying an optional payload of type `T`.
// NOTE(review): the code that produces and consumes this enum lies outside this section;
// presumably it is the result of a recursive insertion step — confirm against `insert_raw`.
enum PartialResult<T> {
    /// The operation did not complete; carries a `T` back to the caller.
    /// (presumably the element that could not be placed — TODO confirm)
    Failure(T),
    /// A `T` was swapped out by the operation.
    /// (presumably the previously stored element — TODO confirm)
    Replaced(T),
    /// The operation completed with nothing to hand back.
    Success,
}
 247 | 
/// Outcome of one step of the recursive delete (`delete_raw_recursive`).
enum PartialDeleteResult<T> {
    /// The matching leaf was found, but its parent was handed down only as a `MarkedPtr` and
    /// holds exactly two children, so the delete was not performed at this level.
    // NOTE(review): presumably the caller, which has mutable access to the parent's slot,
    // finishes the removal and promotes the remaining child — confirm.
    Partial,
    /// The key is not present: the current pointer was null, the leaf did not match the key, or
    /// an interior node's prefix did not match the key's digits.
    Failure,
    /// The leaf was removed; carries the element moved out of it.
    Success(T),
}
 253 | 
/// The underlying tree type, generic over the stored element type `T` and a prefix cache `C`.
///
/// The public map and set types are aliases of this struct with particular element and cache
/// types.
pub struct RawART<T: Element, C: PrefixCache<T>> {
    /// Element count reported by `len()`; starts at 0.
    len: usize,
    /// Root of the tree; a null `ChildPtr` in a freshly constructed tree.
    root: ChildPtr<T>,
    /// Number of leading key digits used as the lookup key into `buckets`. Constructors assert
    /// that it lies in `1..=8`.
    prefix_target: usize,
    /// Prefix cache mapping `prefix_target`-digit prefixes to nodes in the tree.
    buckets: C,
}
 260 | 
 261 | impl<T: Element, C: PrefixCache<T>> RawART<T, C> {
 262 |     pub fn new() -> Self {
 263 |         RawART::with_prefix_buckets(8)
 264 |     }
 265 | 
 266 |     /// Construct a new ART that caches interior nodes corresponding to prefixes of length
 267 |     /// `prefix_len`. The prefix length must be positive, and it cannot exceed 8.
 268 |     pub fn with_prefix_buckets(prefix_len: usize) -> Self {
 269 |         assert!(prefix_len <= 8);
 270 |         assert!(prefix_len > 0);
 271 |         RawART {
 272 |             len: 0,
 273 |             root: ChildPtr::null(),
 274 |             buckets: C::new(),
 275 |             prefix_target: prefix_len,
 276 |         }
 277 |     }
 278 | 
    /// Returns the value of the `len` counter.
    // NOTE(review): presumably the number of stored elements; the code that updates the counter
    // is outside this section — confirm.
    pub fn len(&self) -> usize {
        self.len
    }
 282 | 
 283 |     fn hash_lookup(&self, digits: &[u8]) -> (bool, Option<Result<*mut T, MarkedPtr<T>>>) {
 284 |         if digits.len() <= self.prefix_target {
 285 |             (false, None)
 286 |         } else {
 287 |             let res = self.buckets.lookup(&digits[0..self.prefix_target]);
 288 |             (
 289 |                 true,
 290 |                 match res {
 291 |                     Some(ptr) => Some({
 292 |                         match unsafe { ptr.get_raw().unwrap() } {
 293 |                             Ok(leaf) => Ok(leaf),
 294 |                             Err(_) => Err(ptr),
 295 |                         }
 296 |                     }),
 297 |                     None => None,
 298 |                 },
 299 |             )
 300 |         }
 301 |     }
 302 | 
    /// Looks up the element stored under key `k` and returns a raw pointer to its leaf, or
    /// `None` when no such element is found.
    ///
    /// The key is first expanded into its digit sequence. When the prefix cache is enabled
    /// (`C::ENABLED`), the search may start at (or be answered directly by) a cached node;
    /// otherwise it starts at the root.
    ///
    /// # Safety
    ///
    /// NOTE(review): the caller-side contract is not spelled out in this section. The body
    /// dereferences raw node and leaf pointers taken from the tree and from the cache, so
    /// presumably both must be in a consistent state, and the returned pointer must not be used
    /// after the tree is mutated — confirm.
    // TODO: replace with NonNull
    pub unsafe fn lookup_raw(&self, k: &T::Key) -> Option<*mut T> {
        // Materialize the key's digits once; the recursion below indexes into this buffer.
        let mut digits = SmallVec::<[u8; 32]>::new();
        digits.extend(k.digits());
        // Flag handed to every `trace!` call in this function.
        let _check = false;
        trace!(_check, "lookup_raw");
        // Recursive descent from `curr`.
        //
        // * `digits` / `k`: the key being searched for, as digits and in its original form.
        // * `consumed`: number of digits accounted for so far. At an interior node it is
        //   overwritten with the node's own `consumed` field, so the value passed in only
        //   matters when `curr` is a leaf.
        // * `dont_check`: conjunction of the flags returned by `prefix_matches_optimistic` along
        //   the path. While it is true and every digit has been consumed, a leaf is accepted
        //   without calling `matches`.
        unsafe fn lookup_raw_recursive<T: Element>(
            curr: MarkedPtr<T>,
            k: &T::Key,
            digits: &[u8],
            mut consumed: usize,
            dont_check: bool,
        ) -> Option<*mut T> {
            let _check = false;
            match curr.get_raw() {
                // Null pointer: nothing stored here.
                None => None,
                Some(Ok(leaf_node)) => {
                    // Short-circuit: skip the full key comparison when the path already
                    // accounts for every digit and `dont_check` is still set.
                    if (dont_check && digits.len() == consumed) || (*leaf_node).matches(k) {
                        trace!(
                            _check,
                            "FOUND dont_check={}, consumed_check={}, matches={}",
                            dont_check,
                            digits.len() == consumed,
                            (*leaf_node).matches(k)
                        );
                        Some(leaf_node)
                    } else {
                        trace!(_check);
                        None
                    }
                }
                Some(Err(inner_node)) => {
                    // Resynchronize with the depth recorded in the node itself.
                    consumed = (*inner_node).consumed as usize;
                    // NOTE(review): the trace argument below indexes `digits[consumed]` before
                    // the bounds check that follows; if `trace!` evaluates its arguments this
                    // could panic for short keys — confirm against the macro definition.
                    trace!(
                        _check,
                        "[lookup, d={}] found an inner node {:?}@{:?}",
                        digits[consumed],
                        *inner_node,
                        inner_node
                    );
                    // The key has no digits left at this depth, so it cannot be below this node.
                    if consumed >= digits.len() {
                        trace!(_check, "consumed too big");
                        return None;
                    }
                    // handle prefixes now
                    // A `None` from `prefix_matches_optimistic` ends the lookup; otherwise it
                    // yields a flag (folded into `dont_check`) and a digit count to skip.
                    (*inner_node)
                        .prefix_matches_optimistic(&digits[consumed..])
                        .and_then(|(dont_check_new, con)| {
                            consumed += con;
                            // let new_digits = &digits[consumed..];
                            if digits.len() == consumed {
                                trace!(_check);
                                // Our digits were entirely consumed, but this is a non-leaf node.
                                // That means our node is not present.
                                return None;
                            }
                            with_node!(&*inner_node, nod, {
                                nod.find_raw(digits[consumed]).and_then(|next_node| {
                                    trace!(_check);
                                    lookup_raw_recursive(
                                        (&*next_node).to_marked(),
                                        k,
                                        digits,
                                        consumed + 1,
                                        dont_check && dont_check_new,
                                    )
                                })
                            })
                        })
                }
            }
        }
        if C::ENABLED {
            trace!(_check);
            // `elligible`: the key was long enough to be looked up in the cache.
            // `opt`: the cache hit, if any.
            let (elligible, opt) = self.hash_lookup(digits.as_slice());
            let node_ref = if let Some(ptr) = opt {
                match ptr {
                    // The cache points straight at a leaf: answer with one key comparison.
                    Ok(leaf) => {
                        return if (*leaf).matches(k) {
                            trace!(_check);
                            Some(leaf)
                        } else {
                            trace!(_check);
                            None
                        }
                    }
                    // The cache points at an interior node: resume the descent from there.
                    Err(node) => node,
                }
            } else if C::COMPLETE && elligible && self.len > 1 {
                // A cache flagged `COMPLETE` had no entry for an eligible key: report a miss
                // without walking the tree.
                // NOTE(review): the `self.len > 1` guard presumably covers small trees whose
                // nodes are not registered in the cache — confirm.
                trace!(_check);
                return None;
            } else {
                // No usable cache information: fall back to a full descent from the root.
                trace!(_check);
                self.root.to_marked()
            };
            trace!(_check);
            lookup_raw_recursive(node_ref, k, digits.as_slice(), 0, true)
        } else {
            lookup_raw_recursive(self.root.to_marked(), k, digits.as_slice(), 0, true)
        }
    }
 404 | 
 405 |     pub unsafe fn delete_raw(&mut self, k: &T::Key) -> Option<T> {
 406 |         // Also, consider hypothesis that promoting last doesn't work, and is leading to failed
 407 |         // lookups
 408 |         //
 409 |         // TODO: This method (particularly delete_raw_recursive) is way too long; should break it
 410 |         // out into more helpers.
 411 |         let mut digits = SmallVec::<[u8; 32]>::new();
 412 |         digits.extend(k.digits());
 413 |         use self::PartialDeleteResult::*;
 414 |         let _check = false;
 415 |         trace!(_check, "delete_raw {:?}", &digits[..]);
 416 |         unsafe fn delete_raw_recursive<T: Element, C: PrefixCache<T>>(
 417 |             k: &T::Key,
 418 |             mut curr: MarkedPtr<T>,
 419 |             curr_ptr: Option<&mut ChildPtr<T>>,
 420 |             parent: Option<(u8, Result<MarkedPtr<T>, &mut ChildPtr<T>>)>,
 421 |             digits: &[u8],
 422 |             mut consumed: usize,
 423 |             target: usize,
 424 |             buckets: &mut C,
 425 |             is_root: bool,
 426 |             // return the deleted node
 427 |         ) -> PartialDeleteResult<T> {
 428 |             let _check = false;
 429 |             use self::PartialDeleteResult::*;
 430 |             if curr.is_null() {
 431 |                 return Failure;
 432 |             }
            /// Consumes a leaf pointer and returns the element it held by value.
            ///
            /// The element is copied out bitwise with `ptr::read`, and the pointer is then
            /// dropped as a `ChildPtr<ManuallyDrop<T>>` so that releasing it does not also run
            /// `T`'s destructor on the value that was just moved out.
            ///
            /// Panics if `cptr` is null or does not refer to a leaf (the two `unwrap` calls).
            // NOTE(review): the transmute assumes `ChildPtr<T>` and
            // `ChildPtr<ManuallyDrop<T>>` have identical layout — confirm against the
            // definition of `ChildPtr`.
            unsafe fn move_val_out<T>(mut cptr: ChildPtr<T>) -> T {
                let res = {
                    // first we read the memory out
                    let r = cptr.get_mut().unwrap().unwrap();
                    ptr::read(r)
                };
                // Now we want to deallocate the memory that once held the element, but we don't
                // want to run its destructor if it has one.
                let cptr2 = mem::transmute::<ChildPtr<T>, ChildPtr<mem::ManuallyDrop<T>>>(cptr);
                mem::drop(cptr2);
                res
            }
 445 | 
 446 |             let rest_opts = match curr.get_mut().unwrap() {
 447 |                 Ok(leaf_node) => {
 448 |                     trace!(_check);
 449 |                     if leaf_node.matches(k) {
 450 |                         trace!(_check);
 451 |                         // we have a match! delete the leaf
 452 |                         if let Some((d, mut parent_ref)) = parent {
 453 |                             let (res, asgn) = with_node_mut!(
 454 |                                 match parent_ref {
 455 |                                     Ok(ref mut marked_parent) => {
 456 |                                         let p_ref = marked_parent.get_mut().unwrap().err().unwrap();
 457 |                                         trace!(_check, "{:?}", p_ref);
 458 |                                         if p_ref.children == 2 {
 459 |                                             trace!(_check, "[delete] returning partial");
 460 |                                             return Partial;
 461 |                                         }
 462 |                                         p_ref
 463 |                                     }
 464 |                                     Err(ref mut parent_ptr) => {
 465 |                                         trace!(_check);
 466 |                                         parent_ptr.get_mut().unwrap().err().unwrap()
 467 |                                     }
 468 |                                 },
 469 |                                 node,
 470 |                                 {
 471 |                                     trace!(_check, "digits={:?}, d={}", digits, d);
 472 |                                     match node.delete(d) {
 473 |                                         DeleteResult::Success(deleted) => {
 474 |                                             // we are deleteing an individual node. Time to check
 475 |                                             // if it is in buckets: if it is we should remove it.
 476 |                                             if C::ENABLED && digits.len() >= target
 477 |                                                 && consumed <= target
 478 |                                             {
 479 |                                                 trace!(_check);
 480 |                                                 if C::COMPLETE {
 481 |                                                     debug_assert!(
 482 |                                                         buckets
 483 |                                                             .lookup(&digits[0..target])
 484 |                                                             .is_some()
 485 |                                                     );
 486 |                                                 }
 487 |                                                 buckets
 488 |                                                     .insert(&digits[0..target], MarkedPtr::null());
 489 |                                             }
 490 |                                             trace!(_check);
 491 |                                             (Success(move_val_out(deleted)), None)
 492 |                                         }
 493 |                                         DeleteResult::Singleton {
 494 |                                             deleted,
 495 |                                             last,
 496 |                                             last_d,
 497 |                                         } => {
 498 |                                             trace!(_check);
 499 |                                             if C::ENABLED && digits.len() >= target
 500 |                                                 && consumed <= target
 501 |                                             {
 502 |                                                 trace!(_check);
 503 |                                                 if C::COMPLETE {
 504 |                                                     debug_assert!(
 505 |                                                         buckets
 506 |                                                             .lookup(&digits[0..target])
 507 |                                                             .is_some()
 508 |                                                     );
 509 |                                                 }
 510 |                                                 buckets
 511 |                                                     .insert(&digits[0..target], MarkedPtr::null());
 512 |                                             }
 513 |                                             if C::ENABLED {
 514 |                                                 trace!(_check);
 515 |                                                 if let Ok(_leaf) = last.get().unwrap() {
 516 |                                                     let mut leaf_digits =
 517 |                                                         SmallVec::<[u8; 8]>::new();
 518 |                                                     let leaf: &T = _leaf;
 519 |                                                     leaf_digits.extend(leaf.key().digits().take(8));
 520 |                                                     if leaf_digits.len() >= target
 521 |                                                         && consumed <= target
 522 |                                                     {
 523 |                                                         trace!(_check);
 524 |                                                         buckets.insert(
 525 |                                                             &leaf_digits[0..target],
 526 |                                                             last.to_marked(),
 527 |                                                         );
 528 |                                                         debug_assert_eq!(
 529 |                                                             buckets.lookup(&leaf_digits[0..target]),
 530 |                                                             Some(last.to_marked())
 531 |                                                         );
 532 |                                                         // N.B. when debugging deletes, consider
 533 |                                                         // this extra consistency check. This is
 534 |                                                         // off by default because it does an O(n)
 535 |                                                         // scan of `buckets` which slows things
 536 |                                                         // down considerably on debug builds.
 537 |                                                         //
 538 |                                                         // // this declaration needs to be moved up
 539 |                                                         // // a few blocks
 540 |                                                         // let marked_p = parent_ref.to_marked();
 541 |                                                         // eprintln!("Remapping digits {:?} while deleting {:?}",
 542 |                                                         //           &leaf_digits[..], &digits[..]);
 543 |                                                         // buckets.debug_assert_unreachable(marked_p);
 544 |                                                     }
 545 |                                                 }
 546 |                                             }
 547 |                                             debug_assert!(deleted.get().unwrap().is_ok());
 548 |                                             (Success(move_val_out(deleted)), Some((last, last_d)))
 549 |                                         }
 550 |                                         DeleteResult::Failure => unreachable!(),
 551 |                                     }
 552 |                                 }
 553 |                             );
 554 |                             if let Some((mut c_ptr, last_d)) = asgn {
 555 |                                 let _check_2 = true;
 556 |                                 trace!(_check);
 557 |                                 // we are promoting a "last" so we must increase its prefix
 558 |                                 // length
 559 |                                 let mut switch = false; // flag for inserting a new interior node
 560 | 
 561 |                                 // flag for invalidating the cache (as it may contain the node we are deleting)
 562 |                                 let mut replace = false;
 563 |                                 let mut ds = SmallVec::<[u8; 8]>::new();
 564 |                                 {
 565 |                                     let _p_marked = match parent_ref {
 566 |                                         Ok(ref m) => m.clone(),
 567 |                                         Err(ref ptr) => ptr.to_marked(),
 568 |                                     };
 569 |                                     let pp = match parent_ref {
 570 |                                         Ok(ref m) => m.get().unwrap().err().unwrap(),
 571 |                                         Err(ref ptr) => ptr.get().unwrap().err().unwrap(),
 572 |                                     };
 573 |                                     if C::ENABLED && pp.consumed as usize <= target
 574 |                                         && target <= pp.consumed as usize + pp.count as usize
 575 |                                     {
 576 |                                         trace!(_check);
 577 |                                         // We want to construct enough context to clear out the
 578 |                                         // cache below. Because digits[..] may be too short to fill
 579 |                                         // the hash prefix cache, we need to fill in additional
 580 |                                         // context from the interior nodes.
 581 |                                         //
 582 |                                         // In this case, we start the work by filling in the prefix
 583 |                                         // not present in 'pp'. Below we do the same for `inner` in
 584 |                                         // case it replaces 'pp'.
 585 |                                         replace = true;
 586 |                                         if digits.len() < target {
 587 |                                             for dd in &digits[0..pp.consumed as usize] {
 588 |                                                 ds.push(*dd)
 589 |                                             }
 590 |                                         }
 591 |                                     } else if C::ENABLED && digits.len() >= target {
 592 |                                         trace!(_check);
 593 |                                         debug_assert!(
 594 |                                             buckets.lookup(&digits[0..target]) != Some(_p_marked)
 595 |                                         );
 596 |                                     }
 597 |                                     if let Err(inner) = c_ptr.get_mut().unwrap() {
 598 |                                         debug_assert!(Some(last_d) != T::Key::STOP_CHARACTER);
 599 |                                         // The "last" node that we are promoting is an interior
 600 |                                         // node. As a result, we have to modify its prefix and
 601 |                                         // potentially insert it into the prefix cache.
 602 |                                         let parent_count = pp.count;
 603 |                                         let mut prefix_digits =
 604 |                                             SmallVec::<[u8; PREFIX_LEN + 1]>::new();
 605 |                                         for dd in &pp.prefix
 606 |                                             [0..cmp::min(parent_count as usize, PREFIX_LEN)]
 607 |                                         {
 608 |                                             prefix_digits.push(*dd);
 609 |                                         }
 610 |                                         prefix_digits.push(last_d);
 611 |                                         inner.append_prefix(
 612 |                                             prefix_digits.as_slice(),
 613 |                                             prefix_digits.len() as u32,
 614 |                                         );
 615 |                                         trace!(
 616 |                                             _check_2,
 617 |                                             "[last_d={}] updating inner node @{:?} {:?} (min={:?})",
 618 |                                             last_d,
 619 |                                             inner as *const _,
 620 |                                             inner,
 621 |                                             with_node!(
 622 |                                                 inner,
 623 |                                                 nod,
 624 |                                                 nod.get_min()
 625 |                                                     .unwrap()
 626 |                                                     .key()
 627 |                                                     .digits()
 628 |                                                     .collect::<Vec<u8>>(),
 629 |                                                 T
 630 |                                             )
 631 |                                         );
 632 |                                         debug_assert_eq!(inner.consumed, pp.consumed);
 633 |                                         if C::ENABLED && inner.consumed as usize <= target
 634 |                                             && target
 635 |                                                 <= inner.consumed as usize + inner.count as usize
 636 |                                         {
 637 |                                             trace!(_check);
 638 |                                             switch = true;
 639 |                                             if digits.len() < target {
 640 |                                                 if !replace {
 641 |                                                     trace!(_check);
 642 |                                                     for dd in &digits[0..pp.consumed as usize] {
 643 |                                                         ds.push(*dd);
 644 |                                                     }
 645 |                                                 }
 646 |                                                 for dd in &inner.prefix
 647 |                                                     [0..cmp::min(inner.count as usize, PREFIX_LEN)]
 648 |                                                 {
 649 |                                                     trace!(_check);
 650 |                                                     ds.push(*dd);
 651 |                                                 }
 652 |                                             }
 653 |                                         }
 654 |                                     }
 655 |                                     if C::ENABLED && replace && !switch && digits.len() < target {
 656 |                                         trace!(_check);
 657 |                                         for dd in
 658 |                                             &pp.prefix[0..cmp::min(pp.count as usize, PREFIX_LEN)]
 659 |                                         {
 660 |                                             ds.push(*dd);
 661 |                                         }
 662 |                                     }
 663 |                                 }
 664 |                                 let c_marked = c_ptr.to_marked();
 665 |                                 mem::swap(parent_ref.err().unwrap(), &mut c_ptr);
 666 |                                 if C::ENABLED {
 667 |                                     trace!(_check);
 668 |                                     if switch || replace {
 669 |                                         let mut dsn = SmallVec::<[u8; 8]>::new();
 670 |                                         let mut d_slice = &digits[..];
 671 |                                         if digits.len() < target {
 672 |                                             debug_assert!(target <= 8);
 673 |                                             // need to construct new digits
 674 |                                             d_slice = ds.as_slice();
 675 |                                         }
 676 |                                         if consumed <= target {
 677 |                                             // there's an edge case here. If consumed == target,
 678 |                                             // and digits is of lenght >= target, then the promoted
 679 |                                             // node will not have the same target-length prefix as
 680 |                                             // digits[..]. It will share all but the last element.
 681 |                                             for d in &digits[0..target - 1] {
 682 |                                                 dsn.push(*d)
 683 |                                             }
 684 |                                             dsn.push(last_d);
 685 |                                             d_slice = &dsn[..]
 686 |                                         }
 687 |                                         trace!(_check);
 688 |                                         buckets.insert(&d_slice[0..target], c_marked);
 689 |                                     }
 690 |                                 }
 691 |                             }
 692 |                             trace!(_check);
 693 |                             return res;
 694 |                         } else {
 695 |                             trace!(_check);
 696 |                             None
 697 |                         }
 698 |                     } else {
 699 |                         trace!(_check);
 700 |                         return Failure;
 701 |                     }
 702 |                 }
 703 |                 Err(inner_node) => {
 704 |                     #[cfg(debug_assertions)]
 705 |                     {
 706 |                         with_node!(
 707 |                             inner_node,
 708 |                             nod,
 709 |                             {
 710 |                                 let _leaf = nod.get_min().unwrap();
 711 |                                 let mut _leaf_ds = Vec::with_capacity(digits.len());
 712 |                                 _leaf_ds.extend(_leaf.key().digits());
 713 |                                 trace!(_check, "[delete, d={}] found an inner node {:?}@{:?}\n\t(leaf_ds={:?})",
 714 |                                    digits[nod.consumed as usize],
 715 |                                    nod,
 716 |                                    inner_node as *const RawNode<()>,
 717 |                                    _leaf_ds);
 718 |                             },
 719 |                             T
 720 |                         );
 721 |                     }
 722 |                     debug_assert!(
 723 |                         inner_node.consumed as usize <= digits.len(),
 724 |                         "inner_node.consumed={} too high, nod={:?}",
 725 |                         inner_node.consumed,
 726 |                         inner_node
 727 |                     );
 728 |                     consumed = inner_node.consumed as usize;
 729 |                     let (matched, _) = inner_node.get_matching_prefix(
 730 |                         digits,
 731 |                         consumed,
 732 |                         PhantomData as PhantomData<T>,
 733 |                     );
 734 |                     // if the prefix matches, recur, otherwise just bail out
 735 |                     if matched == inner_node.count as usize {
 736 |                         trace!(_check);
 737 |                         // the prefix matched! we recur below
 738 |                         debug_assert!(digits.len() > matched);
 739 |                         Some((inner_node as *mut RawNode<()>, matched))
 740 |                     } else {
 741 |                         trace!(_check, "delete failing consumed={}", consumed);
 742 |                         // prefix was not a match, the key is not here
 743 |                         return Failure;
 744 |                     }
 745 |                 }
 746 |             };
 747 |             if let Some((inner_node, matched)) = rest_opts {
 748 |                 trace!(_check);
 749 |                 let next_digit = digits[consumed + matched];
 750 |                 with_node_mut!(&mut *inner_node, node, {
 751 |                     if let Some(c_ptr) = node.find_mut(next_digit) {
 752 |                         trace!(_check);
 753 |                         consumed += matched + 1;
 754 |                         let marked = c_ptr.to_marked();
 755 |                         delete_raw_recursive(
 756 |                             k,
 757 |                             marked,
 758 |                             Some(c_ptr),
 759 |                             Some((
 760 |                                 next_digit,
 761 |                                 match curr_ptr {
 762 |                                     Some(x) => Err(x),
 763 |                                     None => Ok(curr),
 764 |                                 },
 765 |                             )),
 766 |                             digits,
 767 |                             consumed,
 768 |                             target,
 769 |                             buckets,
 770 |                             false,
 771 |                         )
 772 |                     } else {
 773 |                         trace!(_check);
 774 |                         Failure
 775 |                     }
 776 |                 })
 777 |             } else if let Some(cp) = curr_ptr {
 778 |                 if !is_root {
 779 |                     trace!(_check);
 780 |                     return Partial;
 781 |                 }
 782 |                 trace!(_check);
 783 |                 // we are in the root, set curr to null.
 784 |                 let c_ptr = cp.swap_null();
 785 |                 if C::ENABLED && digits.len() >= target {
 786 |                     buckets.insert(&digits[0..target], MarkedPtr::null());
 787 |                 }
 788 |                 Success(move_val_out(c_ptr))
 789 |             } else {
 790 |                 trace!(_check);
 791 |                 Partial
 792 |             }
 793 |         }
 794 |         let mut res = Partial;
 795 |         if C::ENABLED {
 796 |             let (elligible, opt) = self.hash_lookup(digits.as_slice());
 797 |             res = if let Some(ptr) = opt {
 798 |                 trace!(_check, "cache hit");
 799 |                 match ptr {
 800 |                     Ok(_leaf) => Partial,
 801 |                     Err(inner) => {
 802 |                         #[cfg(debug_assertions)]
 803 |                         with_node!(
 804 |                             inner.get().unwrap().err().unwrap(),
 805 |                             node,
 806 |                             {
 807 |                                 let min = node.get_min().unwrap();
 808 |                                 let mut min_ds = SmallVec::<[u8; 10]>::new();
 809 |                                 min_ds.extend(min.key().digits());
 810 |                                 if _check {
 811 |                                     assert_eq!(
 812 |                                         &min_ds[0..self.prefix_target - 1],
 813 |                                         &digits[0..self.prefix_target - 1]
 814 |                                     );
 815 |                                 }
 816 |                             },
 817 |                             T
 818 |                         );
 819 |                         delete_raw_recursive(
 820 |                             k,
 821 |                             inner,
 822 |                             None,
 823 |                             None,
 824 |                             &digits[..],
 825 |                             0,
 826 |                             self.prefix_target,
 827 |                             &mut self.buckets,
 828 |                             false,
 829 |                         )
 830 |                     }
 831 |                 }
 832 |             } else if C::COMPLETE && elligible && self.len > 1 {
 833 |                 return None;
 834 |             } else {
 835 |                 Partial
 836 |             };
 837 |         }
 838 |         if let Partial = res {
 839 |             let marked_root = self.root.to_marked();
 840 |             res = delete_raw_recursive(
 841 |                 k,
 842 |                 marked_root,
 843 |                 Some(&mut self.root),
 844 |                 None,
 845 |                 &digits[..],
 846 |                 0,
 847 |                 self.prefix_target,
 848 |                 &mut self.buckets,
 849 |                 true,
 850 |             );
 851 |         }
 852 |         match res {
 853 |             Success(x) => {
 854 |                 debug_assert!(self.len > 0);
 855 |                 self.len -= 1;
 856 |                 Some(x)
 857 |             }
 858 |             Failure => None,
 859 |             Partial => panic!("Got a partial!"),
 860 |         }
 861 |     }
 862 | 
    /// Inserts `elt` into the tree, keyed by the digit sequence `elt.key().digits()`.
    ///
    /// Returns `Ok(())` when a new leaf was created (in which case `self.len` is
    /// incremented). Returns `Err(t)` when a leaf with a matching key already existed:
    /// `replace_matching` is called on that leaf and the element it hands back is
    /// returned to the caller.
    ///
    /// When the prefix cache is enabled (`C::ENABLED`), the insert first tries to start
    /// from an inner node found via `hash_lookup`; if that attempt reports `Failure`, the
    /// insert is retried with a regular traversal from the root.
    ///
    /// # Safety
    ///
    /// This function dereferences and rewrites raw node pointers. The invariants callers
    /// must uphold are not visible in this block -- NOTE(review): confirm against the
    /// rest of the file.
    pub unsafe fn insert_raw(&mut self, elt: T) -> Result<(), T> {
        // Materialize the key's digits once; the recursive helper indexes into them.
        let mut digits = SmallVec::<[u8; 32]>::new();
        digits.extend(elt.key().digits());
        // Recursive worker.
        //
        // * `curr`     - marked pointer to the node currently being examined.
        // * `e`        - the element being inserted.
        // * `digits`   - all digits of `e`'s key.
        // * `consumed` - number of digits of the key already accounted for above `curr`.
        // * `pptr`     - the slot that holds `curr`; `None` when traversal was started
        //                from a prefix-cache hit rather than from the root.
        // * `buckets`  - the prefix cache; entries are keyed by `&digits[0..target]`.
        // * `target`   - the prefix length used for cache keys.
        //
        // Returns `Success` for a fresh insertion, `Replaced(old)` when a matching leaf
        // was found, and `Failure(e)` (handing the element back) when the operation needs
        // a parent slot but `pptr` is `None`.
        unsafe fn insert_raw_recursive<T: Element, C: PrefixCache<T>>(
            curr: MarkedPtr<T>,
            mut e: T,
            digits: &[u8],
            mut consumed: usize,
            pptr: Option<*mut ChildPtr<T>>,
            buckets: &mut C,
            target: usize,
        ) -> PartialResult<T> {
            use self::PartialResult::*;
            debug_assert!(consumed <= digits.len());
            if curr.is_null() {
                // Case 1: We found a null pointer, just replace it with a new leaf.
                // `pptr` is unwrapped unconditionally, so it must be `Some` here.
                let new_leaf = ChildPtr::<T>::from_leaf(Box::into_raw(Box::new(e)));
                (*pptr.unwrap()) = new_leaf;
                // Register the new leaf in the prefix cache when the key is long enough
                // and we have not yet descended past the target depth.
                if C::ENABLED && digits.len() >= target && consumed <= target {
                    debug_assert!(buckets.lookup(&digits[0..target]).is_none());
                    buckets.insert(&digits[0..target], (*pptr.unwrap()).to_marked());
                }

                return Success;
            }
            match curr.get_raw().unwrap() {
                Ok(ln) => {
                    debug_assert!(pptr.is_some());
                    // Case 2: We found a leaf node. We need to construct a new inner node with
                    // the prefix corresponding to the shared prefix of this leaf node and `e`,
                    // add this leaf and `e` as children of this new node, and replace the leaf
                    // with the new node in the parent slot.
                    //
                    // Of course, we have already borrowed curr mutably, so we cannot accomplish
                    // these last few steps while we have still borrowed leaf_node. We instead
                    // return the leaf's digits so we can do the rest of the loop outside of the
                    // match.
                    let leaf_node = &mut *ln;
                    if leaf_node.matches(e.key()) {
                        // Found a matching leaf node. We swap in our value and return the old one.
                        leaf_node.replace_matching(&mut e);

                        return Replaced(e);
                    }
                    // found a leaf node, need to split it to a Node4 with two leaves
                    let mut leaf_digits = SmallVec::<[u8; 8]>::new();
                    leaf_digits.extend(leaf_node.key().digits());
                    let pp = pptr.unwrap();
                    // The new node's prefix is built from the not-yet-consumed digits of
                    // both keys.
                    let n4: Box<RawNode<Node4<T>>> = make_node_from_common_prefix(
                        &leaf_digits[consumed..],
                        &digits[consumed..],
                        consumed as u32,
                    );
                    let prefix_len = n4.count as usize;
                    let mut n4_raw = Box::into_raw(n4);
                    let mut leaf_ptr = ChildPtr::from_node(n4_raw);
                    let new_leaf = ChildPtr::from_leaf(Box::into_raw(Box::new(e)));
                    // After this swap `*pp` holds the new Node4 and `leaf_ptr` holds the
                    // pointer to the existing leaf.
                    mem::swap(&mut *pp, &mut leaf_ptr);

                    // Cache maintenance for the new key: in both branches the cache entry
                    // for `digits[0..target]` is pointed at the new inner node.
                    if C::ENABLED && consumed <= target
                        && target <= consumed + (*n4_raw).count as usize
                    {
                        buckets.insert(&digits[0..target], (*pp).to_marked());
                        debug_assert!((*pp).get().unwrap().is_err());
                    } else if C::ENABLED && digits.len() >= target && consumed <= target {
                        debug_assert!(buckets.lookup(&digits[0..target]).is_none());
                        buckets.insert(&digits[0..target], (*pp).to_marked());

                        // buckets.insert(&digits[0..target], new_leaf.to_marked());
                    }

                    // The displaced leaf's cache entry is redirected to the new node too.
                    if C::ENABLED && leaf_digits.len() >= target && consumed <= target {
                        buckets.insert(&leaf_digits[0..target], (*pp).to_marked());
                    }
                    if C::ENABLED && C::COMPLETE && leaf_digits.len() >= target
                        && consumed <= target
                    {
                        debug_assert!(buckets.lookup(&leaf_digits[0..target]).is_some())
                    }
                    // n4_raw has now replaced the leaf, we need to reinsert the leaf, along with
                    // our child pointer.
                    debug_assert!(consumed + prefix_len < leaf_digits.len(),
                                  "leaf digits ({:?}) out of space due to prefix shared with d={:?} (consumed={:?})",
                                  &leaf_digits[..],
                                  digits,
                                  consumed);

                    // Each child is keyed by the first digit after the shared prefix.
                    (*n4_raw)
                        .insert(leaf_digits[consumed + prefix_len], leaf_ptr, None)
                        .unwrap();

                    (*n4_raw)
                        .insert(digits[consumed + prefix_len], new_leaf, None)
                        .unwrap()
                }
                Err(inn) => {
                    let inner_node = &mut *inn;
                    #[cfg(debug_assertions)]
                    {
                        if pptr.is_some() {
                            debug_assert_eq!(consumed, inner_node.consumed as usize);
                        }
                    }
                    // Trust the node's own record of how many digits precede it; this is
                    // what makes entry from a cache hit (with an approximate `consumed`)
                    // work.
                    consumed = inner_node.consumed as usize;
                    // found an interior node. need to continue the search!
                    let (matched, min_ref) = inner_node.get_matching_prefix(
                        &digits[..],
                        consumed,
                        PhantomData as PhantomData<T>,
                    );

                    if matched == inner_node.count as usize {
                        // Case 3: we found an inner node, with a matching prefix.
                        //
                        // In this case we recursively insert our node into this inner node, making
                        // sure to update the 'consumed' variable appropriately.
                        consumed += matched;
                        // N.B what if consumed == digits.len()? the structure of the keys must
                        // guarantee that we do not see this. For example, if we store u64s,
                        // then all keys are 8 bytes long so `consumed` cannot be more than 7.
                        //
                        // For variable-length keys, (like strings) we require a "stop"
                        // character to appear to avoid this problem. For us, the
                        // null-terminator is such a stop character.
                        debug_assert!(consumed < digits.len());
                        let d = digits[consumed];

                        with_node_mut!(inner_node, nod, {
                            // TODO validate the prefix logic here:
                            // if there's an optimistic prefix we may have to adjust its
                            // length...  for now it may be safer to just truncate the prefix
                            nod.count = cmp::min(nod.count, PREFIX_LEN as u32);
                            if let Some(next_ptr) = nod.find_mut(d) {
                                // A child already exists for digit `d`: descend into it,
                                // passing its slot as the new parent pointer.
                                let pp = Some(next_ptr as *mut _);

                                return insert_raw_recursive(
                                    next_ptr.to_marked(),
                                    e,
                                    digits,
                                    consumed + 1,
                                    pp,
                                    buckets,
                                    target,
                                );
                            }
                            // No child for `d`: the new leaf becomes a direct child of `nod`.
                            let full = nod.is_full();
                            // Without a parent slot we bail out on a full node and let the
                            // caller retry from the root.
                            // NOTE(review): presumably a full node must be replaced through
                            // the parent slot -- confirm against `insert`.
                            if C::ENABLED && full && pptr.is_none() {
                                return Failure(e);
                            }
                            let c_ptr = ChildPtr::<T>::from_leaf(Box::into_raw(Box::new(e)));
                            let _r = nod.insert(d, c_ptr, pptr);
                            debug_assert!(_r.is_ok());
                            if C::ENABLED {
                                if nod.consumed as usize <= target
                                    && target <= nod.consumed as usize + nod.count as usize
                                {
                                    // Only when the node was full is the cache refreshed
                                    // with whatever the parent slot now holds.
                                    if full {
                                        let marked_p = (*pptr.unwrap()).to_marked();
                                        buckets.insert(&digits[0..target], marked_p.clone());
                                    }
                                } else if digits.len() >= target && consumed <= target && !full {
                                    // Debug builds treat an existing cache entry for this
                                    // prefix as a fatal inconsistency.
                                    #[cfg(debug_assertions)]
                                    {
                                        if let Some(ptr) = buckets.lookup(&digits[0..target]) {
                                            match ptr.get().unwrap() {
                                                Ok(_leaf) => eprintln!("overwriting leaf node!"),
                                                Err(other_inner) =>
                                                    eprintln!("overwriting inner node: {:?} ptr={:?} pptr={:?} inner={:?}",
                                                              other_inner,
                                                              ptr,
                                                              pptr.map(|x| &*x),
                                                              inn),
                                            }
                                            panic!("Overwriting leaf insertion");
                                        }
                                    }

                                    buckets.insert(&digits[0..target], MarkedPtr::from_node(nod));
                                } else if full && consumed <= target {
                                    let marked_p = (*pptr.unwrap()).to_marked();
                                    // If we were full we have to remap all leaves that are
                                    // children of nod to the new value.
                                    let mut mp = marked_p.clone();
                                    let new_nod = mp.get_mut().unwrap().err().unwrap();
                                    with_node_mut!(
                                        new_nod,
                                        nod,
                                        {
                                            nod.local_foreach(|_, n| {
                                                if let Ok(leaf) = n.get().unwrap() {
                                                    let mut ds = SmallVec::<[u8; 8]>::new();
                                                    ds.extend(leaf.key().digits());
                                                    // Keys shorter than the target have no
                                                    // cache entry to update.
                                                    if ds.len() < target {
                                                        return;
                                                    }
                                                    buckets
                                                        .insert(&ds[0..target], marked_p.clone());
                                                }
                                            });
                                        },
                                        T
                                    );
                                }
                            }

                            return Success;
                        });
                    } else {
                        // The digit of the node's prefix at the first mismatching position;
                        // it becomes the key under which `inner_node` is re-inserted below.
                        let inner_d = inner_node.prefix[matched];
                        // Splitting requires rewriting the parent slot; without one, hand
                        // the element back so the caller can retry from the root.
                        if pptr.is_none() {
                            return Failure(e);
                        }
                        // Case 4: Our inner node shares a non-matching prefix with the current node.
                        //
                        // Here we have to figure out where the mismatch is and create a new parent
                        // node for the inner node and our current node.

                        // Drops the first `by` entries of `n`'s prefix: `count` is reduced by
                        // `by` and the remaining stored prefix bytes are shifted to the front.
                        // If the old count exceeded PREFIX_LEN, the tail of the prefix array
                        // is refilled from `leaf`'s key digits (skipping `consumed` digits).
                        unsafe fn adjust_prefix<R, T: Element>(
                            n: &mut RawNode<R>,
                            by: usize,
                            leaf: Option<*const T>,
                            consumed: usize,
                        ) {
                            debug_assert!(by > 0);
                            debug_assert!(
                                by <= n.count as usize,
                                "by={:?} > n.count={:?}",
                                by,
                                n.count
                            );
                            let old_count = n.count as usize;
                            n.count -= by as u32;
                            let start: *const _ = &n.prefix[by];
                            // `ptr::copy` permits overlapping source and destination.
                            ptr::copy(start, &mut n.prefix[0], n.count as usize);
                            if old_count > PREFIX_LEN {
                                // `leaf` is unwrapped here, so it must be `Some` whenever
                                // the prefix was longer than the inline storage.
                                let leaf_ref = &*leaf.unwrap();
                                for (p, d) in n.prefix[PREFIX_LEN - by..]
                                    .iter_mut()
                                    .zip(leaf_ref.key().digits().skip(consumed))
                                {
                                    *p = d;
                                }
                            }
                        }
                        debug_assert!(
                            inner_node.count > 0,
                            "Found 0 inner_node.count in split case, matched={:?}",
                            matched
                        );

                        // first make a new node that will be the parent to both `inner` and a leaf
                        // containing `e`.
                        let common_prefix_digits = &digits[consumed..consumed + matched];
                        debug_assert_eq!(common_prefix_digits.len(), matched);
                        let n4: Box<RawNode<Node4<T>>> =
                            make_node_with_prefix(&common_prefix_digits[..], consumed as u32);
                        // `inner_node` will sit below n4: it now has n4's prefix plus one
                        // branching digit in front of it.
                        inner_node.consumed += n4.count + 1;
                        debug_assert_eq!(n4.count as usize, common_prefix_digits.len());
                        // Computed before `consumed` is advanced past n4's prefix.
                        let update_cache_inner = C::ENABLED && consumed <= target
                            && target <= consumed + n4.count as usize;
                        consumed += n4.count as usize;
                        // Strip the matched digits plus the branching digit from the old
                        // node's prefix.
                        let by = matched + 1;
                        adjust_prefix(inner_node, by, min_ref, consumed);

                        // Now allocate a node to contain `e`, insert it into the prefix cache if
                        // necessary, and insert it into n4.
                        let c_ptr = ChildPtr::<T>::from_leaf(Box::into_raw(Box::new(e)));

                        let mut n4_raw = Box::into_raw(n4);
                        let _r = (*n4_raw).insert(digits[consumed], c_ptr, None);
                        debug_assert!(_r.is_ok());
                        let mut n4_cptr = ChildPtr::from_node(n4_raw);
                        // Now swap `inner` with n4 (thereby inserting it into the tree) and insert
                        // `inner` as a child of n4.
                        let pp = pptr.unwrap();
                        // After the swap `*pp` is n4 and `n4_cptr` holds the old inner node.
                        mem::swap(&mut *pp, &mut n4_cptr);
                        if update_cache_inner {
                            buckets.insert(&digits[0..target], (*pp).to_marked());
                            debug_assert!((*pp).get().unwrap().is_err());
                        } else if C::ENABLED && digits.len() >= target && consumed <= target {
                            buckets.insert(&digits[0..target], (*pp).to_marked());
                        }

                        (*n4_raw).insert(inner_d, n4_cptr, None).unwrap()
                    }
                }
            };
            Success
        }
        if C::ENABLED {
            // First attempt: start from the inner node the prefix cache points at (if
            // any). In that case there is no parent slot, so `pptr` is `None` and the
            // helper may report `Failure`. Otherwise start from the root.
            let e = {
                let (node_ref, consumed, pptr) = {
                    let (_, opt) = self.hash_lookup(digits.as_slice());
                    if let Some(Err(inner)) = opt {
                        (inner, self.prefix_target, None)
                    } else {
                        let root_alias = Some(&mut self.root as *mut _);
                        (self.root.to_marked(), 0, root_alias)
                    }
                };
                match insert_raw_recursive(
                    node_ref,
                    elt,
                    digits.as_slice(),
                    consumed,
                    pptr,
                    &mut self.buckets,
                    self.prefix_target,
                ) {
                    // The element is handed back so the insert can be retried below.
                    PartialResult::Failure(e) => e,
                    PartialResult::Success => {
                        self.len += 1;
                        return Ok(());
                    }
                    PartialResult::Replaced(t) => {
                        return Err(t);
                    }
                }
            };
            // Hash-indexed inserts can fail, retry a default root-based traversal.
            let root_alias = Some(&mut self.root as *mut _);
            match insert_raw_recursive(
                self.root.to_marked(),
                e,
                digits.as_slice(),
                0,
                root_alias,
                &mut self.buckets,
                self.prefix_target,
            ) {
                PartialResult::Success => {
                    self.len += 1;
                    Ok(())
                }
                PartialResult::Replaced(t) => Err(t),
                // Both `Failure` sites in the helper require `pptr` to be `None`, which
                // cannot happen on a traversal that starts from the root slot.
                PartialResult::Failure(_) => unreachable!(),
            }
        } else {
            // No prefix cache: a single traversal from the root.
            let root_alias = Some(&mut self.root as *mut _);
            match insert_raw_recursive(
                self.root.to_marked(),
                elt,
                digits.as_slice(),
                0,
                root_alias,
                &mut self.buckets,
                self.prefix_target,
            ) {
                PartialResult::Success => {
                    self.len += 1;
                    Ok(())
                }
                PartialResult::Replaced(t) => Err(t),
                PartialResult::Failure(_) => unreachable!(),
            }
        }
    }
1219 | }
1220 | 
1221 | #[cfg(test)]
1222 | mod tests {
1223 |     use super::*;
1224 |     use super::super::rand;
1225 |     use super::super::rand::Rng;
1226 |     // Use StdRng::from_seed to debug test failures with deterministic inputs
1227 |     // use super::super::rand::{Rng, SeedableRng, StdRng};
1228 |     use std::fmt::{Debug, Error, Formatter};
1229 | 
    // Runs the same test body once per set type.
    //
    // Arguments:
    //   * `$s`    - the identifier the body uses to refer to the set under test.
    //   * `$body` - the expression (normally a block) to evaluate for each set.
    //   * a comma-separated, non-empty list of `Base - Param` pairs; for each pair a fresh
    //     set is built with `Base::<Param>::new()` and bound mutably to `$s`.
    macro_rules! for_each_set {
        ($s:ident, $body:expr, $( $base:tt - $param:tt),+) => {
            // One scoped block per `Base - Param` pair, so each set is independent.
            $({
                // eprintln!("Testing {}", stringify!($base));
                let mut $s = $base::<$param>::new();
                $body
            };)+
        };
    }
1239 | 
1240 |     fn random_vec(max_val: u64, len: usize) -> Vec<u64> {
1241 |         let mut rng = rand::thread_rng();
1242 |         (0..len).map(|_| rng.gen_range::<u64>(0, max_val)).collect()
1243 |     }
1244 | 
1245 |     fn random_string_vec(max_len: usize, len: usize) -> Vec<String> {
1246 |         // For deterministic vecs:
1247 |         // const RAND_SEED: [usize; 32] = [1; 32];
1248 |         // let mut rng = StdRng::from_seed(&RAND_SEED[..]);
1249 |         let mut rng = rand::thread_rng();
1250 |         (0..len.next_power_of_two())
1251 |             .map(|_| {
1252 |                 let mlen = max_len as isize;
1253 |                 let s_len = mlen + rng.gen_range::<isize>(-mlen / 2, mlen / 2);
1254 |                 rng.gen_iter::<char>()
1255 |                     .take(s_len as usize)
1256 |                     .collect::<String>()
1257 |             })
1258 |             .collect()
1259 |     }
1260 | 
1261 |     struct DebugVal<V: Debug + for<'a> Digital<'a>>(V);
1262 |     impl<V: Debug + for<'a> Digital<'a>> Debug for DebugVal<V> {
1263 |         fn fmt(&self, f: &mut Formatter) -> Result<(), Error> {
1264 |             write!(
1265 |                 f,
1266 |                 "[{:?} : {:?}]",
1267 |                 self.0,
1268 |                 self.0.digits().collect::<Vec<_>>()
1269 |             )
1270 |         }
1271 |     }
1272 | 
1273 |     #[test]
1274 |     fn basic_set_behavior() {
1275 |         for_each_set!(
1276 |             s,
1277 |             {
1278 |                 let mut v1 = random_vec(!0, 1 << 18);
1279 |                 {
1280 |                     let mut i = 0;
1281 |                     for item in v1.iter() {
1282 |                         s.add(*item);
1283 |                         assert!(
1284 |                             s.contains(item),
1285 |                             "[{:?}] lookup failed immediately for {:?}",
1286 |                             i,
1287 |                             DebugVal(*item)
1288 |                         );
1289 |                         i += 1;
1290 |                     }
1291 |                 }
1292 |                 let mut missing = Vec::new();
1293 |                 for item in v1.iter() {
1294 |                     if !s.contains(item) {
1295 |                         missing.push(*item)
1296 |                     }
1297 |                 }
1298 |                 let v: Vec<_> = missing
1299 |                     .iter()
1300 |                     .map(|x| {
1301 |                         let v: Vec<_> = x.digits().collect();
1302 |                         (x, v)
1303 |                     })
1304 |                     .collect();
1305 |                 assert_eq!(missing.len(), 0, "missing={:?}", v);
1306 |                 v1.sort();
1307 |                 v1.dedup_by_key(|x| *x);
1308 |                 let mut v2 = Vec::new();
1309 |                 for _ in 0..(1 << 17) {
1310 |                     if let Some(x) = v1.pop() {
1311 |                         v2.push(x)
1312 |                     } else {
1313 |                         break;
1314 |                     }
1315 |                 }
1316 |                 let mut failures = 0;
1317 |                 {
1318 |                     let mut ix = 0;
1319 |                     for i in v2.iter() {
1320 |                         let mut fail = 0;
1321 |                         if !s.contains(i) {
1322 |                             eprintln!("[{}] {:?} no longer in the set!", ix, DebugVal(*i));
1323 |                             fail = 1;
1324 |                         }
1325 |                         let res = s.remove(i);
1326 |                         if !res {
1327 |                             eprintln!("[{}] Failed to remove {:?}!", ix, DebugVal(*i));
1328 |                             fail = 1;
1329 |                         }
1330 |                         if s.contains(i) {
1331 |                             eprintln!(
1332 |                                 "[{}] {:?} still in the set after removal!",
1333 |                                 ix,
1334 |                                 DebugVal(*i)
1335 |                             );
1336 |                             fail = 1;
1337 |                         }
1338 |                         failures += fail;
1339 |                         ix += 1;
1340 |                     }
1341 |                 }
1342 |                 assert_eq!(failures, 0);
1343 |                 let mut failed = false;
1344 |                 for i in v2.iter() {
1345 |                     if s.contains(i) {
1346 |                         eprintln!("Deleted {:?}, but it's still there!", DebugVal(*i));
1347 |                         failed = true;
1348 |                     };
1349 |                 }
1350 |                 assert!(!failed);
1351 |                 for i in v1.iter() {
1352 |                     assert!(
1353 |                         s.contains(i),
1354 |                         "Didn't delete {:?}, but it is gone!",
1355 |                         DebugVal(*i)
1356 |                     );
1357 |                 }
1358 |             },
1359 |             CachingARTSet - u64,
1360 |             ARTSet - u64
1361 |         );
1362 |     }
1363 | 
1364 |     #[test]
1365 |     fn string_set_insert_remove() {
1366 |         for_each_set!(
1367 |             s,
1368 |             {
1369 |                 let v1 = random_string_vec(30, 1 << 18);
1370 |                 {
1371 |                     let mut failed = false;
1372 |                     for (i, item) in v1.iter().enumerate() {
1373 |                         s.add(item.clone());
1374 |                         if !s.contains(item) {
1375 |                             failed = true;
1376 |                             eprintln!(
1377 |                                 "[{}] lookup failed immediately for {:?}",
1378 |                                 i,
1379 |                                 DebugVal(item.clone())
1380 |                             );
1381 |                         }
1382 |                     }
1383 |                     assert!(!failed);
1384 |                 }
1385 |                 let mut ix = 0;
1386 |                 for t in 0..(1 << 18) {
1387 |                     s.add(v1[ix].clone());
1388 |                     assert!(s.contains(&v1[ix]));
1389 |                     ix += 1;
1390 |                     ix %= 1 << 18;
1391 |                     let in_set = s.contains(&v1[ix]);
1392 |                     let deleted = s.remove(&v1[ix]);
1393 |                     assert!(!in_set || deleted, "in_set={}, deleted={}", in_set, deleted);
1394 |                     assert!(
1395 |                         !s.contains(&v1[ix]),
1396 |                         "failed assertion (deleted={}) at t={} str={:?}",
1397 |                         deleted,
1398 |                         t,
1399 |                         DebugVal(v1[ix].clone())
1400 |                     );
1401 |                     ix += 1;
1402 |                     ix %= 1 << 18;
1403 |                 }
1404 |             },
1405 |             CachingARTSet - String,
1406 |             ARTSet - String
1407 |         );
1408 |     }
1409 | 
1410 |     #[test]
1411 |     fn string_set_behavior() {
1412 |         for_each_set!(
1413 |             s,
1414 |             {
1415 |                 let mut v1 = random_string_vec(30, 1 << 18);
1416 |                 {
1417 |                     let mut failed = false;
1418 |                     for (i, item) in v1.iter().enumerate() {
1419 |                         s.add(item.clone());
1420 |                         if !s.contains(item) {
1421 |                             failed = true;
1422 |                             eprintln!(
1423 |                                 "[{}] lookup failed immediately for {:?}",
1424 |                                 i,
1425 |                                 DebugVal(item.clone())
1426 |                             );
1427 |                         }
1428 |                     }
1429 |                     assert!(!failed);
1430 |                 }
1431 |                 let mut missing = Vec::new();
1432 |                 for item in v1.iter() {
1433 |                     if !s.contains(item) {
1434 |                         missing.push(item.clone())
1435 |                     }
1436 |                 }
1437 |                 let v: Vec<_> = missing
1438 |                     .iter()
1439 |                     .map(|x| {
1440 |                         let v: Vec<_> = x.digits().collect();
1441 |                         (x, v)
1442 |                     })
1443 |                     .collect();
1444 |                 assert_eq!(missing.len(), 0, "missing={:?}", v);
1445 |                 v1.sort();
1446 |                 v1.dedup_by_key(|x| x.clone());
1447 |                 let mut v2 = Vec::new();
1448 |                 for _ in 0..(1 << 17) {
1449 |                     if let Some(x) = v1.pop() {
1450 |                         v2.push(x)
1451 |                     } else {
1452 |                         break;
1453 |                     }
1454 |                 }
1455 |                 for (t, i) in v2.iter().enumerate() {
1456 |                     s.remove(i);
1457 |                     assert!(
1458 |                         !s.contains(i),
1459 |                         "[{}] Deletion failed immediately for {:?}",
1460 |                         t,
1461 |                         DebugVal(i.clone())
1462 |                     );
1463 |                 }
1464 |                 let mut failed = false;
1465 |                 for i in v2.iter() {
1466 |                     if s.contains(i) {
1467 |                         eprintln!("Deleted {:?}, but it's still there!", DebugVal(i.clone()));
1468 |                         failed = true;
1469 |                     };
1470 |                 }
1471 |                 assert!(!failed);
1472 |                 for i in v1.iter() {
1473 |                     assert!(
1474 |                         s.contains(i),
1475 |                         "Didn't delete {:?}, but it is gone!",
1476 |                         i.clone()
1477 |                     );
1478 |                 }
1479 |             },
1480 |             CachingARTSet - String,
1481 |             ARTSet - String
1482 |         );
1483 |     }
1484 | 
1485 |     fn assert_lists_equal<T: Debug + Eq + for<'a> Digital<'a> + Clone>(v1: &[T], v2: &[T]) {
1486 |         if v1 == v2 {
1487 |             return;
1488 |         }
1489 |         eprintln!("v1.len()={:?} v2.len()={:?}", v1.len(), v2.len());
1490 |         let mut ix = 0;
1491 |         for (i, j) in v1.iter().zip(v2.iter()) {
1492 |             if *i != *j {
1493 |                 eprintln!(
1494 |                     "[{:4?}] {:20?} != {:20?}",
1495 |                     ix,
1496 |                     DebugVal(i.clone()),
1497 |                     DebugVal(j.clone())
1498 |                 );
1499 |             }
1500 |             ix += 1;
1501 |         }
1502 |         assert!(false, "See error logs");
1503 |     }
1504 | 
1505 |     #[test]
1506 |     fn iterator_behavior() {
1507 |         let mut s = ARTSet::<u64>::new();
1508 |         let mut v1 = random_vec(!0, 1 << 10);
1509 |         for item in v1.iter() {
1510 |             s.add(*item);
1511 |             assert!(s.contains(item));
1512 |         }
1513 | 
1514 |         v1.sort();
1515 |         v1.dedup_by_key(|x| *x);
1516 |         // Iterating over the entire set should give us back the elements in sorted order.
1517 |         let mut elts = Vec::new();
1518 |         s.for_each_range(|x| elts.push(*x), None, None);
1519 |         assert_lists_equal(&v1[..], &elts[..]);
1520 |         if v1.len() < 4 {
1521 |             // extremely unlikely but retry in this case!
1522 |             iterator_behavior();
1523 |             return;
1524 |         }
1525 | 
1526 |         let q1 = v1.len() / 4;
1527 |         let q3 = 3 * (v1.len() / 4);
1528 |         elts.clear();
1529 |         eprintln!("q1={:?} q3={:?}", DebugVal(v1[q1]), DebugVal(v1[q3]));
1530 |         s.for_each_range(|x| elts.push(*x), Some(&v1[q1]), Some(&v1[q3]));
1531 |         assert_lists_equal(&v1[q1..q3], &elts[..]);
1532 |         elts.clear();
1533 |         s.for_each_range(|x| elts.push(*x), Some(&v1[q3]), Some(&v1[q1]));
1534 |         assert_eq!(elts.len(), 0);
1535 |         elts.clear();
1536 |         s.for_each_range(|x| elts.push(*x), Some(&v1[q1]), None);
1537 |         assert_lists_equal(&v1[q1..], &elts[..]);
1538 |         elts.clear();
1539 |         s.for_each_range(|x| elts.push(*x), None, Some(&v1[q3]));
1540 |         assert_lists_equal(&v1[..q3], &elts[..]);
1541 |         elts.clear();
1542 |         s.for_each_range_rev(|x| elts.push(*x), Some(&v1[q1]), Some(&v1[q3]));
1543 |         let vs = (&v1[q1..q3]).iter().rev().map(|x| *x).collect::<Vec<_>>();
1544 |         assert_lists_equal(&vs[..], &elts[..]);
1545 |     }
1546 | }
1547 | 


--------------------------------------------------------------------------------