├── .github
    └── workflows
    │   └── ci.yml
├── .gitignore
├── CITATION.cff
├── LICENSE
├── README.md
├── bench.nim
├── docs
    ├── .nojekyll
    └── index.html
├── example.nim
├── lapper.nimble
├── nim.cfg
└── src
    └── lapper.nim


/.github/workflows/ci.yml:
--------------------------------------------------------------------------------
 1 | name: CI  # workflow name
 2 | 
 3 | on:
 4 |   push:
 5 |     branches: [ master ]  # run on pushes to master
 6 |   pull_request:
 7 |     branches: [ master ]  # and on pull requests targeting master
 8 | 
 9 | jobs:
10 |   test:
11 |     runs-on: ubuntu-latest
12 |     strategy:
13 |       matrix:
14 |         nim-version: ['1.6.20', '2.0.4', 'stable']  # one job per listed Nim version
15 |     
16 |     steps:
17 |     - uses: actions/checkout@v4
18 |     
19 |     - name: Setup Nim
20 |       uses: jiro4989/setup-nim-action@v2
21 |       with:
22 |         nim-version: ${{ matrix.nim-version }}  # version selected by the matrix above
23 |         repo-token: ${{ secrets.GITHUB_TOKEN }}
24 |     
25 |     - name: Run example
26 |       run: nim c -r example.nim  # compiles and runs example.nim; this is the only check (bench.nim is not built)


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
1 | nimcache
2 | src/lapper
3 | 


--------------------------------------------------------------------------------
/CITATION.cff:
--------------------------------------------------------------------------------
 1 | cff-version: 1.2.0
 2 | message: "If you use this software, please cite it as below."
 3 | authors:
 4 |   - 
 5 |     family-names: Pedersen
 6 |     given-names: Brent S.
 7 |     email: bpederse@gmail.com
 8 | 
 9 | title: "nim-lapper: fast, simple interval overlapping"
10 | version: 0.1.7
11 | date-released: 2021-01-01
12 | license: MIT
13 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2017 Brent S. Pedersen
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | simple, fast interval searches for nim
 2 | 
 3 | This uses a binary search in a sorted list of intervals along with knowledge of the longest interval.
 4 | It works best when the size of the largest interval is smaller than the average distance between intervals.
 5 | As the ratio of largest-size to mean-distance increases, the performance decreases.
 6 | On realistic (for my use-case) data, this is 1000 times faster to query results and >5000
 7 | times faster to check for presence than a brute-force method. 
 8 | 
 9 | Lapper also has a special case `seek` method when we know that the queries will be in order.
10 | This method uses a cursor to indicate the start of the last search and does a linear search
11 | from that cursor to find matching intervals. This gives an additional 2-fold speedup over
12 | the `find` method.
13 | 
14 | API docs and examples in `nim-doc` format are available [here](https://brentp.github.io/nim-lapper/index.html)
15 | 
16 | See the `Performance` section for how large the intervals can be and still get a performance
17 | benefit.
18 | 
19 | To use this, it's simply required that your type have a `start(m) int` and `stop(m) int` method to satisfy
20 | the [concept](https://nim-lang.org/docs/manual.html#generics-concepts) used by `Lapper`
21 | 
22 | You can install this with `nimble install lapper`.
23 | 
24 | ## Example
25 | 
26 | ```nim
27 | import lapper
28 | import strutils
29 | 
30 | # define an appropriate data-type. it must have a `start(m) int` and `stop(m) int` method.
31 | #type myinterval = tuple[start:int, stop:int, val:int]
32 | # if we want to modify the result, then we have to use a ref object type
33 | type myinterval = ref object
34 |   start: int
35 |   stop: int
36 |   val: int
37 | 
38 | proc start(m: myinterval): int {.inline.} = return m.start
39 | proc stop(m: myinterval): int {.inline.} = return m.stop
40 | proc `$`(m:myinterval): string = return "(start:$#, stop:$#, val:$#)" % [$m.start, $m.stop, $m.val]
41 | 
42 | # create some fake data
43 | var ivs = new_seq[myinterval]()
44 | for i in countup(0, 100, 10):
45 |   ivs.add(myinterval(start:i, stop:i + 15, val:0))
46 | 
47 | # make the Lapper "data-structure"
48 | var l = lapify(ivs)
49 | var empty:seq[myinterval]
50 | 
51 | assert l.find(10, 20, empty)
52 | var notfound = not l.find(200, 300, empty)
53 | assert notfound
54 | 
55 | var res = new_seq[myinterval]()
56 | 
57 | # find is the more general case, l.seek gives a speed benefit when consecutive queries are in order.
58 | echo l.find(50, 70, res)
59 | echo res
60 | # @[(start: 40, stop: 55, val:0), (start: 50, stop: 65, val: 0), (start: 60, stop: 75, val: 0), (start: 70, stop: 85, val: 0)]
61 | for r in res:
62 |   r.val += 1
63 | 
64 | # or we can do a function on each overlapping interval
65 | l.each_seek(50, 60, proc(a:myinterval) = inc(a.val))
66 | # or
67 | l.each_find(50, 60, proc(a:myinterval) = a.val += 10)
68 | 
69 | discard l.seek(50, 70, res)
70 | echo res
71 | #@[(start:40, stop:55, val:12), (start:50, stop:65, val:12), (start:60, stop:75, val:1)]
72 | 
73 | ```
74 | 
75 | 
76 | ## Performance
77 | 
78 | The output of running `bench.nim` (with -d:release) which generates *200K intervals*
79 | with positions ranging from 0 to 50 million and max lengths from 10 to 1M is:
80 | 
81 | | max interval size | lapper time | lapper seek time | brute-force time | speedup | seek speedup | each-seek speedup |
82 | | ----------------- | ----------- | ---------------- | ---------------  | ------- | ------------ | ----------------- |
83 | |10|0.06|0.04|387.44|6983.81|9873.11|9681.66|
84 | |100|0.05|0.04|384.92|7344.32|10412.97|15200.84|
85 | |1000|0.06|0.05|375.37|6250.23|7942.50|15703.24|
86 | |10000|0.15|0.14|377.29|2554.61|2702.13|15942.76|
87 | |100000|0.99|0.99|377.88|383.36|381.37|16241.61|
88 | |1000000|12.52|12.53|425.61|34.01|33.96|17762.58|
89 | 
90 | Note that this is a worst-case scenario: we could instead
91 | simulate a case where there are only a few long intervals rather than
92 | many long ones, as is done here. Even so, we get a 34X speedup with `lapper`.
93 | 
94 | Also note that testing for presence will be even faster than
95 | the above comparisons as it returns true as soon as an overlap is found.
96 | 


--------------------------------------------------------------------------------
/bench.nim:
--------------------------------------------------------------------------------
  1 | import lapper
  2 | import algorithm
  3 | import math
  4 | import strutils
  5 | import random
  6 | import times
  7 | 
  8 | #type myinterval = tuple[start:int, stop:int]
  9 | #proc start(m: myinterval): int {.inline.} = return m.start
 10 | #proc stop(m: myinterval): int {.inline.} = return m.stop
 11 | 
 12 | # define an appropriate data-type. it must have a `start(m) int` and `stop(m) int` method.
 13 | #type myinterval = tuple[start:int, stop:int, val:int]
 14 | # if we want to modify the result, then we have to use a ref object type
 15 | type myinterval = ref object  # ref object so that query results can be modified in place (see note above)
 16 |   start: int
 17 |   stop: int
 18 |   val: int
 19 | 
 20 | # accessor procs: the `start(m) int` / `stop(m) int` pair that the note above says the type must provide
 21 | proc start(m: myinterval): int {.inline.} = return m.start
 22 | proc stop(m: myinterval): int {.inline.} = return m.stop
 23 | proc `$`(m:myinterval): string = return "(start:$#, stop:$#, val:$#)" % [$m.start, $m.stop, $m.val]  # e.g. (start:1, stop:5, val:0)
 24 | 
 25 | proc randomi(imin:int, imax:int): int =  # uniform random int in the half-open range [imin, imax); needs imax > imin
 26 |   return rand(imin .. imax - 1)  # `rand` replaces the removed `random(n)`; slice bounds are inclusive, hence imax - 1
 27 | 
 28 | proc brute_force(ivs: seq[Interval], start:int, stop:int, res: var seq[Interval]) =
 29 |   res.set_len(0)  # always start from an empty result buffer
 30 |   for cand in ivs:  # linear scan; touching endpoints count as an overlap
 31 |     if not (cand.start > stop or cand.stop < start): res.add(cand)
 32 | 
 33 | proc make_random(n:int, range_max:int, size_min:int, size_max:int): seq[myinterval] =
 34 |   ## Build `n` intervals: start from randomi(0, range_max), length from randomi(size_min, size_max), val 0.
 35 |   result = new_seq[myinterval](n)
 36 |   for slot in result.mitems:
 37 |     let lo = randomi(0, range_max)
 38 |     let length = randomi(size_min, size_max)
 39 |     slot = myinterval(start: lo, stop: lo + length, val: 0)
 40 | 
 41 | 
 42 | var n_intervals = 200000  # number of random intervals generated per table row
 43 | var range_max = 50000000 # 50M
 44 | var res = new_seq[myinterval](100)  # result buffer passed to every find/seek/brute_force call below
 45 | # print the markdown table header; one data row is echoed per max interval size further down
 46 | echo "# generating and searching $#K random intervals in the domain of 0..$#M" % [$(n_intervals / 1000).int, $(range_max / 1000000).int]
 47 | echo "| max interval size | brute-force time | lapper time | lapper seek time | speedup | seek speedup | each_seek speedup |"
 48 | echo "| ----------------- | ---------------- | ----------- | ---------------  | ------- | ------------ | ----------------- |"
 49 | proc doit(m:myinterval) =  # no-op callback handed to each_seek in the benchmark loop
 50 |   discard m
 51 | 
 52 | for max_length_pow in @[1, 2, 3, 4, 5, 6, 7]:  # one table row per max interval size 10^1 .. 10^7
 53 |     var size_max = pow(10'f64, max_length_pow.float64)
 54 |     var size_min = size_max / 3
 55 | 
 56 |     var ivs = make_random(n_intervals, range_max, size_min.int, size_max.int)
 57 |     ivs.sort(proc(a, b: myinterval): int =
 58 |       if a.start == b.start:
 59 |         return a.stop - b.stop
 60 |       else:
 61 |         return a.start - b.start)
 62 |     var icopy = ivs
 63 |     # time `find`: each interval is used as a query; an empty result is treated as a fatal error
 64 |     var t = cpuTime()
 65 |     for itry in 0..<10:  # exactly 10 repetitions, matching the division by 10 below
 66 |       var l = lapify(ivs)
 67 |       for iv in icopy:
 68 |         discard l.find(iv.start, iv.stop, res)
 69 |         if len(res) == 0:
 70 |             stderr.write_line "WTF!!!"
 71 |             quit(2)
 72 |     var lap_time = (cpuTime() - t)/10
 73 |     # time `seek` with the queries issued in sorted order
 74 |     t = cpuTime()
 75 |     for itry in 0..<10:
 76 |       var l = lapify(ivs)
 77 |       for iv in ivs:
 78 |         discard l.seek(iv.start, iv.stop, res)
 79 |         if len(res) == 0:
 80 |             stderr.write_line "WTF!!!"
 81 |             quit(2)
 82 |     var lap_seek_time = (cpuTime() - t)/10
 83 |     # time `each_seek` with the no-op callback `doit`
 84 |     t = cpuTime()
 85 |     for itry in 0..<10:
 86 |       var l = lapify(ivs)
 87 |       for iv in ivs:
 88 |         l.each_seek(iv.start, iv.stop, doit)
 89 |     var lap_seek_do_time = (cpuTime() - t) / 10
 90 |     # time the brute-force baseline on a sample of the queries
 91 |     t = cpuTime()
 92 |     var brute_step = 10000
 93 |     # brute force is too slow, so query only every brute_step-th interval and scale the time back up
 94 |     for i in countup(0, icopy.high, brute_step):
 95 |       var iv = icopy[i]
 96 |       brute_force(icopy, iv.start, iv.stop, res)
 97 |       if len(res) == 0:
 98 |           stderr.write_line "brute WTF!!!"
 99 |           quit(2)
100 |     var brute_time = brute_step.float64 * (cpuTime() - t)
101 | 
102 |     var speed_up = brute_time / lap_time
103 |     var seek_speed_up = brute_time / lap_seek_time
104 |     var seek_do_speed_up = brute_time / lap_seek_do_time
105 | 
106 |     proc f(v:float64, precision:int=2): string =
107 |       return formatFloat(v, ffDecimal, precision=precision)
108 | 
109 |     echo "|", pow(10'f64, max_length_pow.float64).int, "|", f(brute_time), "|", f(lap_time, 3), "|", f(lap_seek_time, 3), "|", f(speed_up) , "|", f(seek_speed_up), "|", f(seek_do_speed_up), "|"
110 | 


--------------------------------------------------------------------------------
/docs/.nojekyll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/brentp/nim-lapper/bdd43a522d2bf1730794e3a68a45673f83a42cfe/docs/.nojekyll


--------------------------------------------------------------------------------
/docs/index.html:
--------------------------------------------------------------------------------
   1 | <?xml version="1.0" encoding="utf-8" ?>
   2 | <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
   3 |   "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
   4 | <!--  This file is generated by Nim. -->
   5 | <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
   6 | <head>
   7 | <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
   8 | 
   9 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  10 | 
  11 | <!-- Favicon -->
  12 | <link rel="shortcut icon" href="data:image/x-icon;base64,AAABAAEAEBAAAAEAIABoBAAAFgAAACgAAAAQAAAAIAAAAAEAIAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AAAAAAUAAAAF////AP///wD///8A////AP///wD///8A////AP///wD///8A////AAAAAAIAAABbAAAAlQAAAKIAAACbAAAAmwAAAKIAAACVAAAAWwAAAAL///8A////AP///wD///8A////AAAAABQAAADAAAAAYwAAAA3///8A////AP///wD///8AAAAADQAAAGMAAADAAAAAFP///wD///8A////AP///wAAAACdAAAAOv///wD///8A////AP///wD///8A////AP///wD///8AAAAAOgAAAJ3///8A////AP///wAAAAAnAAAAcP///wAAAAAoAAAASv///wD///8A////AP///wAAAABKAAAAKP///wAAAABwAAAAJ////wD///8AAAAAgQAAABwAAACIAAAAkAAAAJMAAACtAAAAFQAAABUAAACtAAAAkwAAAJAAAACIAAAAHAAAAIH///8A////AAAAAKQAAACrAAAAaP///wD///8AAAAARQAAANIAAADSAAAARf///wD///8AAAAAaAAAAKsAAACk////AAAAADMAAACcAAAAnQAAABj///8A////AP///wAAAAAYAAAAGP///wD///8A////AAAAABgAAACdAAAAnAAAADMAAAB1AAAAwwAAAP8AAADpAAAAsQAAAE4AAAAb////AP///wAAAAAbAAAATgAAALEAAADpAAAA/wAAAMMAAAB1AAAAtwAAAOkAAAD/AAAA/wAAAP8AAADvAAAA3gAAAN4AAADeAAAA3gAAAO8AAAD/AAAA/wAAAP8AAADpAAAAtwAAAGUAAAA/AAAA3wAAAP8AAAD/AAAA/wAAAP8AAAD/AAAA/wAAAP8AAAD/AAAA/wAAAP8AAADfAAAAPwAAAGX///8A////AAAAAEgAAADtAAAAvwAAAL0AAADGAAAA7wAAAO8AAADGAAAAvQAAAL8AAADtAAAASP///wD///8A////AP///wD///8AAAAAO////wD///8A////AAAAAIcAAACH////AP///wD///8AAAAAO////wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A//8AAP//AAD4HwAA7/cAAN/7AAD//wAAoYUAAJ55AACf+QAAh+EAAAAAAADAAwAA4AcAAP5/AAD//wAA//8AAA=="/>
  13 | 
  14 | <!-- Google fonts -->
  15 | <link href='https://fonts.googleapis.com/css?family=Raleway:400,600,900' rel='stylesheet' type='text/css'/>
  16 | <link href='https://fonts.googleapis.com/css?family=Source+Code+Pro:400,500,600' rel='stylesheet' type='text/css'/>
  17 | 
  18 | <!-- CSS -->
  19 | <title>Module lapper</title>
  20 | <style type="text/css" >
  21 | /*
  22 | Stylesheet for use with Docutils/rst2html.
  23 | 
  24 | See http://docutils.sf.net/docs/howto/html-stylesheets.html for how to
  25 | customize this style sheet.
  26 | 
  27 | Modified from Chad Skeeters' rst2html-style
  28 | https://bitbucket.org/cskeeters/rst2html-style/
  29 | 
  30 | Modified by Boyd Greenfield
  31 | */
  32 | /* SCSS variables */
  33 | /* Text weights */
  34 | /* Body colors */
  35 | /* Text colors */
  36 | /* Link colors */
  37 | /* Syntax highlighting colors */
  38 | /* Pct changes */
  39 | /* Mixins */
  40 | /* Body/layout */
  41 | html {
  42 |   font-size: 100%;
  43 |   -webkit-text-size-adjust: 100%;
  44 |   -ms-text-size-adjust: 100%; }
  45 | 
  46 | /* Where we want fancier font if available */
  47 | h1, h2, h3, h4, h5, h6, p.module-desc, table.docinfo + blockquote p, table.docinfo blockquote p, h1 + blockquote p {
  48 |   font-family: "Raleway", "Helvetica Neue", "HelveticaNeue", Helvetica, Arial, sans-serif !important; }
  49 | 
  50 | h1.title {
  51 |   font-weight: 900; }
  52 | 
  53 | body {
  54 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif;
  55 |   font-weight: 400;
  56 |   font-size: 14px;
  57 |   line-height: 20px;
  58 |   color: #666;
  59 |   background-color: rgba(252, 248, 244, 0.75); }
  60 | 
  61 | /* Skeleton grid */
  62 | .container {
  63 |   position: relative;
  64 |   width: 100%;
  65 |   max-width: 960px;
  66 |   margin: 0 auto;
  67 |   padding: 0 20px;
  68 |   box-sizing: border-box; }
  69 | 
  70 | .column,
  71 | .columns {
  72 |   width: 100%;
  73 |   float: left;
  74 |   box-sizing: border-box; }
  75 | 
  76 | /* For devices larger than 400px */
  77 | @media (min-width: 400px) {
  78 |   .container {
  79 |     width: 100%;
  80 |     padding: 0; } }
  81 | /* For devices larger than 650px */
  82 | @media (min-width: 650px) {
  83 |   .container {
  84 |     width: 100%; }
  85 | 
  86 |   .column,
  87 |   .columns {
  88 |     margin-left: 4%; }
  89 | 
  90 |   .column:first-child,
  91 |   .columns:first-child {
  92 |     margin-left: 0; }
  93 | 
  94 |   .one.column,
  95 |   .one.columns {
  96 |     width: 4.66666666667%; }
  97 | 
  98 |   .two.columns {
  99 |     width: 13.3333333333%; }
 100 | 
 101 |   .three.columns {
 102 |     width: 22%; }
 103 | 
 104 |   .four.columns {
 105 |     width: 30.6666666667%; }
 106 | 
 107 |   .five.columns {
 108 |     width: 39.3333333333%; }
 109 | 
 110 |   .six.columns {
 111 |     width: 48%; }
 112 | 
 113 |   .seven.columns {
 114 |     width: 56.6666666667%; }
 115 | 
 116 |   .eight.columns {
 117 |     width: 65.3333333333%; }
 118 | 
 119 |   .nine.columns {
 120 |     width: 74.0%; }
 121 | 
 122 |   .ten.columns {
 123 |     width: 82.6666666667%; }
 124 | 
 125 |   .eleven.columns {
 126 |     width: 91.3333333333%; }
 127 | 
 128 |   .twelve.columns {
 129 |     width: 100%;
 130 |     margin-left: 0; }
 131 | 
 132 |   .one-third.column {
 133 |     width: 30.6666666667%; }
 134 | 
 135 |   .two-thirds.column {
 136 |     width: 65.3333333333%; } }
 137 | /* Customer Overrides */
 138 | .footer {
 139 |   text-align: center;
 140 |   color: #969696;
 141 |   padding-top: 10%; }
 142 | 
 143 | p.module-desc {
 144 |   font-size: 1.1em;
 145 |   color: #666666; }
 146 | 
 147 | a.link-seesrc {
 148 |   color: #aec7d2;
 149 |   font-style: italic; }
 150 | 
 151 | a.link-seesrc:hover {
 152 |   color: #6c9aae; }
 153 | 
 154 | #toc-list {
 155 |   word-wrap: break-word; }
 156 | 
 157 | ul.simple-toc {
 158 |   list-style: none; }
 159 | 
 160 | ul.simple-toc a.reference-toplevel {
 161 |   font-weight: bold;
 162 |   color: #0077b3; }
 163 | 
 164 | ul.simple-toc-section {
 165 |   list-style-type: circle;
 166 |   color: #6c9aae; }
 167 | 
 168 | ul.simple-toc-section a.reference {
 169 |   color: #0077b3; }
 170 | 
 171 | cite {
 172 |   font-style: italic !important; }
 173 | 
 174 | dt > pre {
 175 |   border-color: rgba(0, 0, 0, 0.15);
 176 |   background-color: transparent;
 177 |   margin: 15px 0px 5px; }
 178 | 
 179 | dd > pre {
 180 |   border-color: rgba(0, 0, 0, 0.1);
 181 |   background-color: whitesmoke;
 182 |   margin-top: 8px; }
 183 | 
 184 | .item > dd {
 185 |   margin-left: 10px;
 186 |   margin-bottom: 30px; }
 187 | 
 188 | /* Nim line-numbered tables */
 189 | .line-nums-table {
 190 |   width: 100%;
 191 |   table-layout: fixed; }
 192 | 
 193 | table.line-nums-table {
 194 |   border-radius: 4px;
 195 |   border: 1px solid #cccccc;
 196 |   background-color: whitesmoke;
 197 |   border-collapse: separate;
 198 |   margin-top: 15px;
 199 |   margin-bottom: 25px; }
 200 | 
 201 | .line-nums-table tbody {
 202 |   border: none; }
 203 | 
 204 | .line-nums-table td pre {
 205 |   border: none;
 206 |   background-color: transparent; }
 207 | 
 208 | .line-nums-table td.blob-line-nums {
 209 |   width: 28px; }
 210 | 
 211 | .line-nums-table td.blob-line-nums pre {
 212 |   color: #b0b0b0;
 213 |   -webkit-filter: opacity(75%);
 214 |   text-align: right;
 215 |   border-color: transparent;
 216 |   background-color: transparent;
 217 |   padding-left: 0px;
 218 |   margin-left: 0px;
 219 |   padding-right: 0px;
 220 |   margin-right: 0px; }
 221 | 
 222 | /* Docgen styles */
 223 | /* Links */
 224 | a {
 225 |   color: #0077b3;
 226 |   text-decoration: none; }
 227 | 
 228 | a:hover,
 229 | a:focus {
 230 |   color: #00334d;
 231 |   text-decoration: underline; }
 232 | 
 233 | a:visited {
 234 |   color: #00334d; }
 235 | 
 236 | a:focus {
 237 |   outline: thin dotted #2d2d2d;
 238 |   outline: 5px auto -webkit-focus-ring-color;
 239 |   outline-offset: -2px; }
 240 | 
 241 | a:hover,
 242 | a:active {
 243 |   outline: 0; }
 244 | 
 245 | sub,
 246 | sup {
 247 |   position: relative;
 248 |   font-size: 75%;
 249 |   line-height: 0;
 250 |   vertical-align: baseline; }
 251 | 
 252 | sup {
 253 |   top: -0.5em; }
 254 | 
 255 | sub {
 256 |   bottom: -0.25em; }
 257 | 
 258 | img {
 259 |   width: auto;
 260 |   height: auto;
 261 |   max-width: 100%;
 262 |   vertical-align: middle;
 263 |   border: 0;
 264 |   -ms-interpolation-mode: bicubic; }
 265 | 
 266 | @media print {
 267 |   * {
 268 |     color: black !important;
 269 |     text-shadow: none !important;
 270 |     background: transparent !important;
 271 |     box-shadow: none !important; }
 272 | 
 273 |   a,
 274 |   a:visited {
 275 |     text-decoration: underline; }
 276 | 
 277 |   a[href]:after {
 278 |     content: " (" attr(href) ")"; }
 279 | 
 280 |   abbr[title]:after {
 281 |     content: " (" attr(title) ")"; }
 282 | 
 283 |   .ir a:after,
 284 |   a[href^="javascript:"]:after,
 285 |   a[href^="#"]:after {
 286 |     content: ""; }
 287 | 
 288 |   pre,
 289 |   blockquote {
 290 |     border: 1px solid #999;
 291 |     page-break-inside: avoid; }
 292 | 
 293 |   thead {
 294 |     display: table-header-group; }
 295 | 
 296 |   tr,
 297 |   img {
 298 |     page-break-inside: avoid; }
 299 | 
 300 |   img {
 301 |     max-width: 100% !important; }
 302 | 
 303 |   @page {
 304 |     margin: 0.5cm; }
 305 | 
 306 |   h1 {
 307 |     page-break-before: always; }
 308 | 
 309 |   h1.title {
 310 |     page-break-before: avoid; }
 311 | 
 312 |   p,
 313 |   h2,
 314 |   h3 {
 315 |     orphans: 3;
 316 |     widows: 3; }
 317 | 
 318 |   h2,
 319 |   h3 {
 320 |     page-break-after: avoid; } }
 321 | .img-rounded {
 322 |   -webkit-border-radius: 6px;
 323 |   -moz-border-radius: 6px;
 324 |   border-radius: 6px; }
 325 | 
 326 | .img-polaroid {
 327 |   padding: 4px;
 328 |   background-color: rgba(252, 248, 244, 0.75);
 329 |   border: 1px solid #ccc;
 330 |   border: 1px solid rgba(0, 0, 0, 0.2);
 331 |   -webkit-box-shadow: 0 1px 3px rgba(0, 0, 0, 0.1);
 332 |   -moz-box-shadow: 0 1px 3px rgba(0, 0, 0, 0.1);
 333 |   box-shadow: 0 1px 3px rgba(0, 0, 0, 0.1); }
 334 | 
 335 | p {
 336 |   margin: 0 0 12px; }
 337 | 
 338 | small {
 339 |   font-size: 85%; }
 340 | 
 341 | strong {
 342 |   font-weight: 600; }
 343 | 
 344 | em {
 345 |   font-style: italic; }
 346 | 
 347 | cite {
 348 |   font-style: normal; }
 349 | 
 350 | h1,
 351 | h2,
 352 | h3,
 353 | h4,
 354 | h5,
 355 | h6 {
 356 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif;
 357 |   font-weight: 600;
 358 |   line-height: 20px;
 359 |   color: inherit;
 360 |   text-rendering: optimizelegibility; }
 361 | 
 362 | h1 {
 363 |   font-size: 2em;
 364 |   padding-bottom: .15em;
 365 |   border-bottom: 1px solid #aaaaaa;
 366 |   margin-top: 1.0em;
 367 |   line-height: 1.2em; }
 368 | 
 369 | h1.title {
 370 |   padding-bottom: 1em;
 371 |   border-bottom: 0px;
 372 |   font-size: 2.75em; }
 373 | 
 374 | h2 {
 375 |   font-size: 1.5em;
 376 |   margin-top: 1.5em; }
 377 | 
 378 | h3 {
 379 |   font-size: 1.3em;
 380 |   font-style: italic;
 381 |   margin-top: 0.75em; }
 382 | 
 383 | h4 {
 384 |   font-size: 1.3em;
 385 |   margin-top: 0.5em; }
 386 | 
 387 | h5 {
 388 |   font-size: 1.2em;
 389 |   margin-top: 0.25em; }
 390 | 
 391 | h6 {
 392 |   font-size: 1.1em; }
 393 | 
 394 | ul,
 395 | ol {
 396 |   padding: 0;
 397 |   margin: 0 0 0px 15px; }
 398 | 
 399 | ul ul,
 400 | ul ol,
 401 | ol ol,
 402 | ol ul {
 403 |   margin-bottom: 0; }
 404 | 
 405 | li {
 406 |   line-height: 20px; }
 407 | 
 408 | dl {
 409 |   margin-bottom: 20px; }
 410 | 
 411 | dt,
 412 | dd {
 413 |   line-height: 20px; }
 414 | 
 415 | dt {
 416 |   font-weight: bold; }
 417 | 
 418 | dd {
 419 |   margin-left: 10px;
 420 |   margin-bottom: 26px; }
 421 | 
 422 | hr {
 423 |   margin: 20px 0;
 424 |   border: 0;
 425 |   border-top: 1px solid #eeeeee;
 426 |   border-bottom: 1px solid #ffffff; }
 427 | 
 428 | abbr[title],
 429 | abbr[data-original-title] {
 430 |   cursor: help;
 431 |   border-bottom: 1px dotted #999999; }
 432 | 
 433 | abbr.initialism {
 434 |   font-size: 90%;
 435 |   text-transform: uppercase; }
 436 | 
 437 | blockquote {
 438 |   padding: 0 0 0 15px;
 439 |   margin: 0 0 20px;
 440 |   border-left: 5px solid #EFEBE0; }
 441 | 
 442 | table.docinfo + blockquote, table.docinfo blockquote, h1 + blockquote {
 443 |   border-left: 5px solid #c9c9c9;
 444 | }
 445 | 
 446 | table.docinfo + blockquote p, table.docinfo blockquote p, h1 + blockquote p {
 447 |   margin-bottom: 0;
 448 |   font-size: 15px;
 449 |   font-weight: 200;
 450 |   line-height: 1.5;
 451 |   font-style: italic; }
 452 | 
 453 | q:before,
 454 | q:after,
 455 | blockquote:before,
 456 | blockquote:after {
 457 |   content: ""; }
 458 | 
 459 | address {
 460 |   display: block;
 461 |   margin-bottom: 20px;
 462 |   font-style: normal;
 463 |   line-height: 20px; }
 464 | 
 465 | code,
 466 | pre {
 467 |   font-family: "Source Code Pro", Monaco, Menlo, Consolas, "Courier New", monospace;
 468 |   padding: 0 3px 2px;
 469 |   font-weight: 500;
 470 |   font-size: 12px;
 471 |   color: #444444;
 472 |   -webkit-border-radius: 3px;
 473 |   -moz-border-radius: 3px;
 474 |   border-radius: 3px; }
 475 | 
 476 | .pre {
 477 |   font-family: "Source Code Pro", Monaco, Menlo, Consolas, "Courier New", monospace;
 478 |   font-weight: 600;
 479 |   /*color: #504da6;*/
 480 | }
 481 | 
 482 | code {
 483 |   padding: 2px 4px;
 484 |   color: #444444;
 485 |   white-space: nowrap;
 486 |   background-color: white;
 487 |   border: 1px solid #777777; }
 488 | 
 489 | pre {
 490 |   display: inline-block;
 491 |   box-sizing: border-box;
 492 |   min-width: calc(100% - 19.5px);
 493 |   padding: 9.5px;
 494 |   margin: 0.25em 10px 0.25em 10px;
 495 |   font-size: 14px;
 496 |   line-height: 20px;
 497 |   white-space: pre !important;
 498 |   overflow-y: hidden;
 499 |   overflow-x: visible;
 500 |   background-color: whitesmoke;
 501 |   border: 1px solid #cccccc;
 502 |   -webkit-border-radius: 4px;
 503 |   -moz-border-radius: 4px;
 504 |   border-radius: 4px; }
 505 | 
 506 | pre.prettyprint {
 507 |   margin-bottom: 20px; }
 508 | 
 509 | pre code {
 510 |   padding: 0;
 511 |   color: inherit;
 512 |   white-space: pre;
 513 |   overflow-x: visible;
 514 |   background-color: transparent;
 515 |   border: 0; }
 516 | 
 517 | .pre-scrollable {
 518 |   max-height: 340px;
 519 |   overflow-y: scroll; }
 520 | 
 521 | table {
 522 |   max-width: 100%;
 523 |   background-color: transparent;
 524 |   border-collapse: collapse;
 525 |   border-spacing: 0; }
 526 | 
 527 | table th, table td {
 528 |   padding: 0px 8px 0px;
 529 | }
 530 | 
 531 | .table {
 532 |   width: 100%;
 533 |   margin-bottom: 20px; }
 534 | 
 535 | .table th,
 536 | .table td {
 537 |   padding: 8px;
 538 |   line-height: 20px;
 539 |   text-align: left;
 540 |   vertical-align: top;
 541 |   border-top: 1px solid #444444; }
 542 | 
 543 | .table th {
 544 |   font-weight: bold; }
 545 | 
 546 | .table thead th {
 547 |   vertical-align: bottom; }
 548 | 
 549 | .table caption + thead tr:first-child th,
 550 | .table caption + thead tr:first-child td,
 551 | .table colgroup + thead tr:first-child th,
 552 | .table colgroup + thead tr:first-child td,
 553 | .table thead:first-child tr:first-child th,
 554 | .table thead:first-child tr:first-child td {
 555 |   border-top: 0; }
 556 | 
 557 | .table tbody + tbody {
 558 |   border-top: 2px solid #444444; }
 559 | 
 560 | .table .table {
 561 |   background-color: rgba(252, 248, 244, 0.75); }
 562 | 
 563 | .table-condensed th,
 564 | .table-condensed td {
 565 |   padding: 4px 5px; }
 566 | 
 567 | .table-bordered {
 568 |   border: 1px solid #444444;
 569 |   border-collapse: separate;
 570 |   *border-collapse: collapse;
 571 |   border-left: 0;
 572 |   -webkit-border-radius: 4px;
 573 |   -moz-border-radius: 4px;
 574 |   border-radius: 4px; }
 575 | 
 576 | .table-bordered th,
 577 | .table-bordered td {
 578 |   border-left: 1px solid #444444; }
 579 | 
 580 | .table-bordered caption + thead tr:first-child th,
 581 | .table-bordered caption + tbody tr:first-child th,
 582 | .table-bordered caption + tbody tr:first-child td,
 583 | .table-bordered colgroup + thead tr:first-child th,
 584 | .table-bordered colgroup + tbody tr:first-child th,
 585 | .table-bordered colgroup + tbody tr:first-child td,
 586 | .table-bordered thead:first-child tr:first-child th,
 587 | .table-bordered tbody:first-child tr:first-child th,
 588 | .table-bordered tbody:first-child tr:first-child td {
 589 |   border-top: 0; }
 590 | 
 591 | .table-bordered thead:first-child tr:first-child > th:first-child,
 592 | .table-bordered tbody:first-child tr:first-child > td:first-child,
 593 | .table-bordered tbody:first-child tr:first-child > th:first-child {
 594 |   -webkit-border-top-left-radius: 4px;
 595 |   border-top-left-radius: 4px;
 596 |   -moz-border-radius-topleft: 4px; }
 597 | 
 598 | .table-bordered thead:first-child tr:first-child > th:last-child,
 599 | .table-bordered tbody:first-child tr:first-child > td:last-child,
 600 | .table-bordered tbody:first-child tr:first-child > th:last-child {
 601 |   -webkit-border-top-right-radius: 4px;
 602 |   border-top-right-radius: 4px;
 603 |   -moz-border-radius-topright: 4px; }
 604 | 
 605 | .table-bordered thead:last-child tr:last-child > th:first-child,
 606 | .table-bordered tbody:last-child tr:last-child > td:first-child,
 607 | .table-bordered tbody:last-child tr:last-child > th:first-child,
 608 | .table-bordered tfoot:last-child tr:last-child > td:first-child,
 609 | .table-bordered tfoot:last-child tr:last-child > th:first-child {
 610 |   -webkit-border-bottom-left-radius: 4px;
 611 |   border-bottom-left-radius: 4px;
 612 |   -moz-border-radius-bottomleft: 4px; }
 613 | 
 614 | .table-bordered thead:last-child tr:last-child > th:last-child,
 615 | .table-bordered tbody:last-child tr:last-child > td:last-child,
 616 | .table-bordered tbody:last-child tr:last-child > th:last-child,
 617 | .table-bordered tfoot:last-child tr:last-child > td:last-child,
 618 | .table-bordered tfoot:last-child tr:last-child > th:last-child {
 619 |   -webkit-border-bottom-right-radius: 4px;
 620 |   border-bottom-right-radius: 4px;
 621 |   -moz-border-radius-bottomright: 4px; }
 622 | 
 623 | .table-bordered tfoot + tbody:last-child tr:last-child td:first-child {
 624 |   -webkit-border-bottom-left-radius: 0;
 625 |   border-bottom-left-radius: 0;
 626 |   -moz-border-radius-bottomleft: 0; }
 627 | 
 628 | .table-bordered tfoot + tbody:last-child tr:last-child td:last-child {
 629 |   -webkit-border-bottom-right-radius: 0;
 630 |   border-bottom-right-radius: 0;
 631 |   -moz-border-radius-bottomright: 0; }
 632 | 
 633 | .table-bordered caption + thead tr:first-child th:first-child,
 634 | .table-bordered caption + tbody tr:first-child td:first-child,
 635 | .table-bordered colgroup + thead tr:first-child th:first-child,
 636 | .table-bordered colgroup + tbody tr:first-child td:first-child {
 637 |   -webkit-border-top-left-radius: 4px;
 638 |   border-top-left-radius: 4px;
 639 |   -moz-border-radius-topleft: 4px; }
 640 | 
 641 | .table-bordered caption + thead tr:first-child th:last-child,
 642 | .table-bordered caption + tbody tr:first-child td:last-child,
 643 | .table-bordered colgroup + thead tr:first-child th:last-child,
 644 | .table-bordered colgroup + tbody tr:first-child td:last-child {
 645 |   -webkit-border-top-right-radius: 4px;
 646 |   border-top-right-radius: 4px;
 647 |   -moz-border-radius-topright: 4px; }
 648 | 
 649 | table.docutils th {
 650 |   background-color: #e8e8e8; }
 651 | 
 652 | table.docutils tr:hover {
 653 |   background-color: whitesmoke; }
 654 | 
 655 | .table-striped tbody > tr:nth-child(odd) > td,
 656 | .table-striped tbody > tr:nth-child(odd) > th {
 657 |   background-color: rgba(252, 248, 244, 0.75); }
 658 | 
 659 | .table-hover tbody tr:hover > td,
 660 | .table-hover tbody tr:hover > th {
 661 |   background-color: rgba(241, 222, 204, 0.75); }
 662 | 
 663 | table td[class*="span"],
 664 | table th[class*="span"],
 665 | .row-fluid table td[class*="span"],
 666 | .row-fluid table th[class*="span"] {
 667 |   display: table-cell;
 668 |   float: none;
 669 |   margin-left: 0; }
 670 | 
 671 | .hero-unit {
 672 |   padding: 60px;
 673 |   margin-bottom: 30px;
 674 |   font-size: 18px;
 675 |   font-weight: 200;
 676 |   line-height: 30px;
 677 |   color: inherit;
 678 |   background-color: rgba(230, 197, 164, 0.75);
 679 |   -webkit-border-radius: 6px;
 680 |   -moz-border-radius: 6px;
 681 |   border-radius: 6px; }
 682 | 
 683 | .hero-unit h1 {
 684 |   margin-bottom: 0;
 685 |   font-size: 60px;
 686 |   line-height: 1;
 687 |   letter-spacing: -1px;
 688 |   color: inherit; }
 689 | 
 690 | .hero-unit li {
 691 |   line-height: 30px; }
 692 | 
 693 | /* rst2html default used to remove borders from tables and images */
 694 | .borderless, table.borderless td, table.borderless th {
 695 |   border: 0; }
 696 | 
 697 | table.borderless td, table.borderless th {
 698 |   /* Override padding for "table.docutils td" with "! important".
 699 |      The right padding separates the table cells. */
 700 |   padding: 0 0.5em 0 0 !important; }
 701 | 
 702 | .first {
 703 |   /* Override more specific margin styles with "! important". */
 704 |   margin-top: 0 !important; }
 705 | 
 706 | .last, .with-subtitle {
 707 |   margin-bottom: 0 !important; }
 708 | 
 709 | .hidden {
 710 |   display: none; }
 711 | 
 712 | a.toc-backref {
 713 |   text-decoration: none;
 714 |   color: #444444; }
 715 | 
 716 | blockquote.epigraph {
 717 |   margin: 2em 5em; }
 718 | 
 719 | dl.docutils dd {
 720 |   margin-bottom: 0.5em; }
 721 | 
 722 | object[type="image/svg+xml"], object[type="application/x-shockwave-flash"] {
 723 |   overflow: hidden; }
 724 | 
 725 | /* Uncomment (and remove this text!) to get bold-faced definition list terms
 726 | dl.docutils dt {
 727 |   font-weight: bold }
 728 | */
 729 | div.abstract {
 730 |   margin: 2em 5em; }
 731 | 
 732 | div.abstract p.topic-title {
 733 |   font-weight: bold;
 734 |   text-align: center; }
 735 | 
 736 | div.admonition, div.attention, div.caution, div.danger, div.error,
 737 | div.hint, div.important, div.note, div.tip, div.warning {
 738 |   margin: 2em;
 739 |   border: medium outset;
 740 |   padding: 1em; }
 741 | 
 742 | div.note, div.warning {
 743 |   margin: 1.5em 0px;
 744 |   border: none; }
 745 | 
 746 | div.note p.admonition-title,
 747 | div.warning p.admonition-title {
 748 |   display: none; }
 749 | 
 750 | /* Clearfix
 751 |  * http://css-tricks.com/snippets/css/clear-fix/
 752 |  */
 753 | div.note:after,
 754 | div.warning:after {
 755 |   content: "";
 756 |   display: table;
 757 |   clear: both; }
 758 | 
 759 | div.note p:before,
 760 | div.warning p:before {
 761 |   display: block;
 762 |   float: left;
 763 |   font-size: 4em;
 764 |   line-height: 1em;
 765 |   margin-right: 20px;
 766 |   margin-left: 0em;
 767 |   margin-top: -10px;
 768 |   content: '\0270D';
 769 |   /*handwriting*/ }
 770 | 
 771 | div.warning p:before {
 772 |   content: '\026A0';
 773 |   /*warning*/ }
 774 | 
 775 | div.admonition p.admonition-title, div.hint p.admonition-title,
 776 | div.important p.admonition-title, div.note p.admonition-title,
 777 | div.tip p.admonition-title {
 778 |   font-weight: bold;
 779 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif; }
 780 | 
 781 | div.attention p.admonition-title, div.caution p.admonition-title,
 782 | div.danger p.admonition-title, div.error p.admonition-title,
 783 | div.warning p.admonition-title, .code .error {
 784 |   color: #b30000;
 785 |   font-weight: bold;
 786 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif; }
 787 | 
 788 | /* Uncomment (and remove this text!) to get reduced vertical space in
 789 |    compound paragraphs.
 790 | div.compound .compound-first, div.compound .compound-middle {
 791 |   margin-bottom: 0.5em }
 792 | 
 793 | div.compound .compound-last, div.compound .compound-middle {
 794 |   margin-top: 0.5em }
 795 | */
 796 | div.dedication {
 797 |   margin: 2em 5em;
 798 |   text-align: center;
 799 |   font-style: italic; }
 800 | 
 801 | div.dedication p.topic-title {
 802 |   font-weight: bold;
 803 |   font-style: normal; }
 804 | 
 805 | div.figure {
 806 |   margin-left: 2em;
 807 |   margin-right: 2em; }
 808 | 
 809 | div.footer, div.header {
 810 |   clear: both;
 811 |   font-size: smaller; }
 812 | 
 813 | div.line-block {
 814 |   display: block;
 815 |   margin-top: 1em;
 816 |   margin-bottom: 1em; }
 817 | 
 818 | div.line-block div.line-block {
 819 |   margin-top: 0;
 820 |   margin-bottom: 0;
 821 |   margin-left: 1.5em; }
 822 | 
 823 | div.sidebar {
 824 |   margin: 0 0 0.5em 1em;
 825 |   border: medium outset;
 826 |   padding: 1em;
 827 |   background-color: rgba(252, 248, 244, 0.75);
 828 |   width: 40%;
 829 |   float: right;
 830 |   clear: right; }
 831 | 
 832 | div.sidebar p.rubric {
 833 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif;
 834 |   font-size: medium; }
 835 | 
 836 | div.system-messages {
 837 |   margin: 5em; }
 838 | 
 839 | div.system-messages h1 {
 840 |   color: #b30000; }
 841 | 
 842 | div.system-message {
 843 |   border: medium outset;
 844 |   padding: 1em; }
 845 | 
 846 | div.system-message p.system-message-title {
 847 |   color: #b30000;
 848 |   font-weight: bold; }
 849 | 
 850 | div.topic {
 851 |   margin: 2em; }
 852 | 
 853 | h1.section-subtitle, h2.section-subtitle, h3.section-subtitle,
 854 | h4.section-subtitle, h5.section-subtitle, h6.section-subtitle {
 855 |   margin-top: 0.4em; }
 856 | 
 857 | h1.title {
 858 |   text-align: center; }
 859 | 
 860 | h2.subtitle {
 861 |   text-align: center; }
 862 | 
 863 | hr.docutils {
 864 |   width: 75%; }
 865 | 
 866 | img.align-left, .figure.align-left, object.align-left {
 867 |   clear: left;
 868 |   float: left;
 869 |   margin-right: 1em; }
 870 | 
 871 | img.align-right, .figure.align-right, object.align-right {
 872 |   clear: right;
 873 |   float: right;
 874 |   margin-left: 1em; }
 875 | 
 876 | img.align-center, .figure.align-center, object.align-center {
 877 |   display: block;
 878 |   margin-left: auto;
 879 |   margin-right: auto; }
 880 | 
 881 | .align-left {
 882 |   text-align: left; }
 883 | 
 884 | .align-center {
 885 |   clear: both;
 886 |   text-align: center; }
 887 | 
 888 | .align-right {
 889 |   text-align: right; }
 890 | 
 891 | /* reset inner alignment in figures */
 892 | div.align-right {
 893 |   text-align: inherit; }
 894 | 
 895 | /* div.align-center * { */
 896 | /*   text-align: left } */
 897 | 
 898 | ul.simple > li {
 899 |   margin-bottom: 0.5em }
 900 | 
 901 | ol.simple, ul.simple {
 902 |   margin-bottom: 1em; }
 903 | 
 904 | ol.arabic {
 905 |   list-style: decimal; }
 906 | 
 907 | ol.loweralpha {
 908 |   list-style: lower-alpha; }
 909 | 
 910 | ol.upperalpha {
 911 |   list-style: upper-alpha; }
 912 | 
 913 | ol.lowerroman {
 914 |   list-style: lower-roman; }
 915 | 
 916 | ol.upperroman {
 917 |   list-style: upper-roman; }
 918 | 
 919 | p.attribution {
 920 |   text-align: right;
 921 |   margin-left: 50%; }
 922 | 
 923 | p.caption {
 924 |   font-style: italic; }
 925 | 
 926 | p.credits {
 927 |   font-style: italic;
 928 |   font-size: smaller; }
 929 | 
 930 | p.label {
 931 |   white-space: nowrap; }
 932 | 
 933 | p.rubric {
 934 |   font-weight: bold;
 935 |   font-size: larger;
 936 |   color: maroon;
 937 |   text-align: center; }
 938 | 
 939 | p.sidebar-title {
 940 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif;
 941 |   font-weight: bold;
 942 |   font-size: larger; }
 943 | 
 944 | p.sidebar-subtitle {
 945 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif;
 946 |   font-weight: bold; }
 947 | 
 948 | p.topic-title {
 949 |   font-weight: bold; }
 950 | 
 951 | pre.address {
 952 |   margin-bottom: 0;
 953 |   margin-top: 0;
 954 |   font: inherit; }
 955 | 
 956 | pre.literal-block, pre.doctest-block, pre.math, pre.code {
 957 |   margin-left: 2em;
 958 |   margin-right: 2em; }
 959 | 
 960 | pre.code .ln {
 961 |   color: grey; }
 962 | 
 963 | /* line numbers */
 964 | pre.code, code {
 965 |   background-color: #eeeeee; }
 966 | 
 967 | pre.code .comment, code .comment {
 968 |   color: #5c6576; }
 969 | 
 970 | pre.code .keyword, code .keyword {
 971 |   color: #3B0D06;
 972 |   font-weight: bold; }
 973 | 
 974 | pre.code .literal.string, code .literal.string {
 975 |   color: #0c5404; }
 976 | 
 977 | pre.code .name.builtin, code .name.builtin {
 978 |   color: #352b84; }
 979 | 
 980 | pre.code .deleted, code .deleted {
 981 |   background-color: #DEB0A1; }
 982 | 
 983 | pre.code .inserted, code .inserted {
 984 |   background-color: #A3D289; }
 985 | 
 986 | span.classifier {
 987 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif;
 988 |   font-style: oblique; }
 989 | 
 990 | span.classifier-delimiter {
 991 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif;
 992 |   font-weight: bold; }
 993 | 
 994 | span.interpreted {
 995 |   font-family: "Helvetica Neue", "HelveticaNeue", "Raleway", Helvetica, Arial, sans-serif; }
 996 | 
 997 | span.option {
 998 |   white-space: nowrap; }
 999 | 
1000 | span.pre {
1001 |   white-space: pre; }
1002 | 
1003 | span.problematic {
1004 |   color: #b30000; }
1005 | 
1006 | span.section-subtitle {
1007 |   /* font-size relative to parent (h1..h6 element) */
1008 |   font-size: 80%; }
1009 | 
1010 | table.citation {
1011 |   border-left: solid 1px #666666;
1012 |   margin-left: 1px; }
1013 | 
1014 | table.docinfo {
1015 |   margin: 0em;
1016 |   margin-top: 2em;
1017 |   margin-bottom: 2em;
1018 |   font-family: "Raleway", "Helvetica Neue", "HelveticaNeue", Helvetica, Arial, sans-serif !important;
1019 |   color: #444444; }
1020 | 
1021 | table.docutils {
1022 |   margin-top: 0.5em;
1023 |   margin-bottom: 0.5em; }
1024 | 
1025 | table.footnote {
1026 |   border-left: solid 1px #2d2d2d;
1027 |   margin-left: 1px; }
1028 | 
1029 | table.docutils td, table.docutils th,
1030 | table.docinfo td, table.docinfo th {
1031 |   padding-left: 0.5em;
1032 |   padding-right: 0.5em;
1033 |   vertical-align: top; }
1034 | 
1035 | table.docutils th.field-name, table.docinfo th.docinfo-name {
1036 |   font-weight: 700;
1037 |   text-align: left;
1038 |   white-space: nowrap;
1039 |   padding-left: 0; }
1040 | 
1041 | h1 tt.docutils, h2 tt.docutils, h3 tt.docutils,
1042 | h4 tt.docutils, h5 tt.docutils, h6 tt.docutils {
1043 |   font-size: 100%; }
1044 | 
1045 | ul.auto-toc {
1046 |   list-style-type: none; }
1047 | 
1048 | span.DecNumber {
1049 |   color: #252dbe; }
1050 | 
1051 | span.BinNumber {
1052 |   color: #252dbe; }
1053 | 
1054 | span.HexNumber {
1055 |   color: #252dbe; }
1056 | 
1057 | span.OctNumber {
1058 |   color: #252dbe; }
1059 | 
1060 | span.FloatNumber {
1061 |   color: #252dbe; }
1062 | 
1063 | span.Identifier {
1064 |   color: #3b3b3b; }
1065 | 
1066 | span.Keyword {
1067 |   font-weight: 600;
1068 |   color: #5e8f60; }
1069 | 
1070 | span.StringLit {
1071 |   color: #a4255b; }
1072 | 
1073 | span.LongStringLit {
1074 |   color: #a4255b; }
1075 | 
1076 | span.CharLit {
1077 |   color: #a4255b; }
1078 | 
1079 | span.EscapeSequence {
1080 |   color: black; }
1081 | 
1082 | span.Operator {
1083 |   color: black; }
1084 | 
1085 | span.Punctuation {
1086 |   color: black; }
1087 | 
1088 | span.Comment, span.LongComment {
1089 |   font-style: italic;
1090 |   font-weight: 400;
1091 |   color: #484a86; }
1092 | 
1093 | span.RegularExpression {
1094 |   color: darkviolet; }
1095 | 
1096 | span.TagStart {
1097 |   color: darkviolet; }
1098 | 
1099 | span.TagEnd {
1100 |   color: darkviolet; }
1101 | 
1102 | span.Key {
1103 |   color: #252dbe; }
1104 | 
1105 | span.Value {
1106 |   color: #252dbe; }
1107 | 
1108 | span.RawData {
1109 |   color: #a4255b; }
1110 | 
1111 | span.Assembler {
1112 |   color: #252dbe; }
1113 | 
1114 | span.Preprocessor {
1115 |   color: #252dbe; }
1116 | 
1117 | span.Directive {
1118 |   color: #252dbe; }
1119 | 
1120 | span.Command, span.Rule, span.Hyperlink, span.Label, span.Reference,
1121 | span.Other {
1122 |   color: black; }
1123 | 
1124 | /* Pop type, const, proc, and iterator defs in nim def blocks */
1125 | dt pre > span.Identifier, dt pre > span.Operator {
1126 |   color: #155da4;
1127 |   font-weight: 700; }
1128 | 
1129 | dt pre > span.Identifier ~ span.Identifier, dt pre > span.Operator ~ span.Identifier {
1130 |   color: inherit;
1131 |   font-weight: inherit; }
1132 | 
1133 | dt pre > span.Operator ~ span.Identifier, dt pre > span.Operator ~ span.Operator {
1134 |   color: inherit;
1135 |   font-weight: inherit; }
1136 | 
1137 | /* Nim sprite for the footer (taken from main page favicon) */
1138 | .nim-sprite {
1139 |   display: inline-block;
1140 |   height: 12px;
1141 |   width: 12px;
1142 |   background-position: 0 0;
1143 |   background-size: 12px 12px;
1144 |   -webkit-filter: opacity(50%);
1145 |   background-repeat: no-repeat;
1146 |   background-image: url("data:image/x-icon;base64,AAABAAEAEBAAAAEAIABoBAAAFgAAACgAAAAQAAAAIAAAAAEAIAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AAAAAAUAAAAF////AP///wD///8A////AP///wD///8A////AP///wD///8A////AAAAAAIAAABbAAAAlQAAAKIAAACbAAAAmwAAAKIAAACVAAAAWwAAAAL///8A////AP///wD///8A////AAAAABQAAADAAAAAYwAAAA3///8A////AP///wD///8AAAAADQAAAGMAAADAAAAAFP///wD///8A////AP///wAAAACdAAAAOv///wD///8A////AP///wD///8A////AP///wD///8AAAAAOgAAAJ3///8A////AP///wAAAAAnAAAAcP///wAAAAAoAAAASv///wD///8A////AP///wAAAABKAAAAKP///wAAAABwAAAAJ////wD///8AAAAAgQAAABwAAACIAAAAkAAAAJMAAACtAAAAFQAAABUAAACtAAAAkwAAAJAAAACIAAAAHAAAAIH///8A////AAAAAKQAAACrAAAAaP///wD///8AAAAARQAAANIAAADSAAAARf///wD///8AAAAAaAAAAKsAAACk////AAAAADMAAACcAAAAnQAAABj///8A////AP///wAAAAAYAAAAGP///wD///8A////AAAAABgAAACdAAAAnAAAADMAAAB1AAAAwwAAAP8AAADpAAAAsQAAAE4AAAAb////AP///wAAAAAbAAAATgAAALEAAADpAAAA/wAAAMMAAAB1AAAAtwAAAOkAAAD/AAAA/wAAAP8AAADvAAAA3gAAAN4AAADeAAAA3gAAAO8AAAD/AAAA/wAAAP8AAADpAAAAtwAAAGUAAAA/AAAA3wAAAP8AAAD/AAAA/wAAAP8AAAD/AAAA/wAAAP8AAAD/AAAA/wAAAP8AAADfAAAAPwAAAGX///8A////AAAAAEgAAADtAAAAvwAAAL0AAADGAAAA7wAAAO8AAADGAAAAvQAAAL8AAADtAAAASP///wD///8A////AP///wD///8AAAAAO////wD///8A////AAAAAIcAAACH////AP///wD///8AAAAAO////wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A////AP///wD///8A//8AAP//AAD4HwAA7/cAAN/7AAD//wAAoYUAAJ55AACf+QAAh+EAAAAAAADAAwAA4AcAAP5/AAD//wAA//8AAA==");
1147 |   margin-bottom: -5px; }
1148 |   div.pragma {
1149 |     display: none;
1150 |   }
1151 |   span.pragmabegin {
1152 |     cursor: pointer;
1153 |   }
1154 |   span.pragmaend {
1155 |     cursor: pointer;
1156 |   }
1157 | 
1158 | div.search_results {
1159 |   background-color: antiquewhite;
1160 |   margin: 3em;
1161 |   padding: 1em;
1162 |   border: 1px solid #4d4d4d;
1163 | }
1164 | </style>
1165 | 
1166 | <script type="text/javascript" src="../dochack.js"></script>
1167 | 
1168 | <script type="text/javascript">
/**
 * Toggle a pragma block between shown (`inline`) and hidden (`none`).
 *
 * Any display value other than `inline` (including the empty string) is
 * treated as hidden, so the first call always reveals the element.
 *
 * @param {?Element} d  Element to toggle. Ignored when it is missing or has
 *                      no `style` property (for example a text node).
 */
function togglepragma(d) {
  // A missing sibling or a text node has no `style`; return quietly instead
  // of throwing from inside a click handler.
  if (!d || !d.style) {
    return;
  }
  d.style.display = (d.style.display != 'inline') ? 'inline' : 'none';
}
1175 | 
/**
 * Wire up the click handlers for collapsible pragma blocks.
 *
 * Clicking an element of class `pragmabegin` toggles the element that follows
 * it; clicking an element of class `pragmaend` toggles the element that
 * precedes it. Toggling is delegated to `togglepragma`.
 */
function main() {
  // Give every element of class `className` a click handler that toggles the
  // neighbouring element named by `siblingProp`.
  function bind(className, siblingProp) {
    var markers = document.getElementsByClassName(className);
    for (var i = 0; i < markers.length; ++i) {
      markers[i].onclick = function(event) {
        // Use element siblings: plain nextSibling/previousSibling may return
        // a whitespace text node, which has no `style` to toggle.
        var marker = event.currentTarget || event.target;
        var neighbour = marker[siblingProp];
        if (neighbour) {
          togglepragma(neighbour);
        }
      };
    }
  }

  bind("pragmabegin", "nextElementSibling");
  bind("pragmaend", "previousElementSibling");
}
1192 | </script>
1193 | 
1194 | </head>
1195 | <body onload="main()">
1196 | <div class="document" id="documentId">
1197 |   <div class="container">
1198 |     <h1 class="title">Module lapper</h1>
1199 |     <div class="row">
1200 |   <div class="three columns">
1201 |   <div>
1202 |     Search: <input type="text" id="searchInput"
1203 |       onkeyup="search()" />
1204 |   </div>
1205 |   <div>
1206 |     Group by:
1207 |     <select onchange="groupBy(this.value)">
1208 |       <option value="section">Section</option>
1209 |       <option value="type">Type</option>
1210 |     </select>
1211 |   </div>
1212 |   <ul class="simple simple-toc" id="toc-list">
1213 | <li>
1214 |   <a class="reference reference-toplevel" href="#6" id="56">Imports</a>
1215 |   <ul class="simple simple-toc-section">
1216 |     
1217 |   </ul>
1218 | </li>
1219 | <li>
1220 |   <a class="reference reference-toplevel" href="#7" id="57">Types</a>
1221 |   <ul class="simple simple-toc-section">
1222 |       <li><a class="reference" href="#Interval"
1223 |     title="Interval = concept i
1224 |     start(i) is int
1225 |     stop(i) is int"><wbr />Interval<span class="attachedType" style="visibility:hidden"></span></a></li>
1226 |   <li><a class="reference" href="#Lapper"
1227 |     title="Lapper[T] = object
1228 |   intervals: seq[T]
1229 |   max_len: int
1230 |   cursor: int                  ## `cursor` is used internally by ordered find"><wbr />Lapper<span class="attachedType" style="visibility:hidden"></span></a></li>
1231 | 
1232 |   </ul>
1233 | </li>
1234 | <li>
1235 |   <a class="reference reference-toplevel" href="#12" id="62">Procs</a>
1236 |   <ul class="simple simple-toc-section">
1237 |       <li><a class="reference" href="#overlap,T,int,int"
1238 |     title="overlap[T: Interval](a: T; start: int; stop: int): bool"><wbr />overlap<span class="attachedType" style="visibility:hidden"></span></a></li>
1239 |   <li><a class="reference" href="#lapify,seq[T]"
1240 |     title="lapify[T: Interval](ivs: var seq[T]): Lapper[T]"><wbr />lapify<span class="attachedType" style="visibility:hidden">Lapper</span></a></li>
1241 |   <li><a class="reference" href="#len,Lapper[T: Interval]"
1242 |     title="len[T: Interval](L: Lapper[T]): int"><wbr />len<span class="attachedType" style="visibility:hidden">Lapper</span></a></li>
1243 |   <li><a class="reference" href="#find,Lapper[T: Interval],int,int,seq[T]"
1244 |     title="find[T: Interval](L: Lapper[T]; start: int; stop: int; ivs: var seq[T]): bool"><wbr />find<span class="attachedType" style="visibility:hidden">Lapper</span></a></li>
1245 |   <li><a class="reference" href="#each_find,Lapper[T: Interval],int,int,proc(T)"
1246 |     title="each_find[T: Interval](L: Lapper[T]; start: int; stop: int; fn: proc (v: T))"><wbr />each_<wbr />find<span class="attachedType" style="visibility:hidden">Lapper</span></a></li>
1247 |   <li><a class="reference" href="#seek,Lapper[T: Interval],int,int,seq[T]"
1248 |     title="seek[T: Interval](L: var Lapper[T]; start: int; stop: int; ivs: var seq[T]): bool"><wbr />seek<span class="attachedType" style="visibility:hidden">Lapper</span></a></li>
1249 |   <li><a class="reference" href="#each_seek,Lapper[T: Interval],int,int,proc(T)"
1250 |     title="each_seek[T: Interval](L: var Lapper[T]; start: int; stop: int; fn: proc (v: T))"><wbr />each_<wbr />seek<span class="attachedType" style="visibility:hidden">Lapper</span></a></li>
1251 | 
1252 |   </ul>
1253 | </li>
1254 | 
1255 | </ul>
1256 | 
1257 |   </div>
1258 |   <div class="nine columns" id="content">
1259 |   <div id="tocRoot"></div>
1260 |   <p class="module-desc"><p>This module provides a simple data-structure for fast interval searches. It does not use an interval tree, instead, it operates on the assumption that most intervals are of similar length; or, more exactly, that the longest interval in the set is not long compared to the average distance between intervals. On any dataset where that is not the case, this method will not perform well. For cases where this holds true (as it often does with genomic data), we can sort by start and use binary search on the starts, accounting for the length of the longest interval. The advantage of this approach is simplicity of implementation and speed. In realistic tests queries returning the overlapping intervals are 1000 times faster than brute force and queries that merely check for the overlaps are &gt; 5000 times faster.</p>
 1261 | <p>The main methods are <cite>find</cite> and <cite>seek</cite> where the latter uses a cursor and is very fast for cases when the queries are sorted. This is another innovation in this library that allows an additional ~50% speed improvement when consecutive queries are known to be in sorted order.</p>
1262 | <p>For both find and seek, if the given intervals parameter is nil, the function will return a boolean indicating if any intervals in the set overlap the query. This is much faster than modifying the intervals.</p>
1263 | <p>The example below shows off most of the API of <cite>Lapper</cite>.</p>
1264 | <pre class="listing"><span class="Keyword">import</span> <span class="Identifier">lapper</span>
1265 | <span class="Keyword">type</span> <span class="Identifier">myinterval</span> <span class="Operator">=</span> <span class="Keyword">ref</span> <span class="Keyword">object</span>
1266 |    <span class="Identifier">start</span><span class="Punctuation">:</span> <span class="Identifier">int</span>
1267 |    <span class="Identifier">stop</span><span class="Punctuation">:</span> <span class="Identifier">int</span>
1268 |    <span class="Identifier">val</span><span class="Punctuation">:</span> <span class="Identifier">int</span>
1269 |  
1270 |  <span class="Keyword">proc</span> <span class="Identifier">start</span><span class="Punctuation">(</span><span class="Identifier">m</span><span class="Punctuation">:</span> <span class="Identifier">myinterval</span><span class="Punctuation">)</span><span class="Punctuation">:</span> <span class="Identifier">int</span> <span class="Punctuation">{</span><span class="Operator">.</span><span class="Identifier">inline</span><span class="Operator">.</span><span class="Punctuation">}</span> <span class="Operator">=</span> <span class="Keyword">return</span> <span class="Identifier">m</span><span class="Operator">.</span><span class="Identifier">start</span>
1271 |  <span class="Keyword">proc</span> <span class="Identifier">stop</span><span class="Punctuation">(</span><span class="Identifier">m</span><span class="Punctuation">:</span> <span class="Identifier">myinterval</span><span class="Punctuation">)</span><span class="Punctuation">:</span> <span class="Identifier">int</span> <span class="Punctuation">{</span><span class="Operator">.</span><span class="Identifier">inline</span><span class="Operator">.</span><span class="Punctuation">}</span> <span class="Operator">=</span> <span class="Keyword">return</span> <span class="Identifier">m</span><span class="Operator">.</span><span class="Identifier">stop</span>
1272 |  <span class="Keyword">proc</span> <span class="Punctuation">`</span><span class="Operator">$</span><span class="Punctuation">`</span><span class="Punctuation">(</span><span class="Identifier">m</span><span class="Punctuation">:</span><span class="Identifier">myinterval</span><span class="Punctuation">)</span><span class="Punctuation">:</span> <span class="Identifier">string</span> <span class="Operator">=</span> <span class="Keyword">return</span> <span class="StringLit">&quot;(start:$#, stop:$#, val:$#)&quot;</span> <span class="Operator">%</span> <span class="Punctuation">[</span><span class="Operator">$</span><span class="Identifier">m</span><span class="Operator">.</span><span class="Identifier">start</span><span class="Punctuation">,</span> <span class="Operator">$</span><span class="Identifier">m</span><span class="Operator">.</span><span class="Identifier">stop</span><span class="Punctuation">,</span> <span class="Operator">$</span><span class="Identifier">m</span><span class="Operator">.</span><span class="Identifier">val</span><span class="Punctuation">]</span></pre><blockquote><p>create some fake data</p></blockquote>
1273 | <pre class="listing"><span class="Keyword">var</span> <span class="Identifier">ivs</span> <span class="Operator">=</span> <span class="Identifier">new_seq</span><span class="Punctuation">[</span><span class="Identifier">myinterval</span><span class="Punctuation">]</span><span class="Punctuation">(</span><span class="Punctuation">)</span>
1274 | <span class="Keyword">for</span> <span class="Identifier">i</span> <span class="Keyword">in</span> <span class="Identifier">countup</span><span class="Punctuation">(</span><span class="DecNumber">0</span><span class="Punctuation">,</span> <span class="DecNumber">100</span><span class="Punctuation">,</span> <span class="DecNumber">10</span><span class="Punctuation">)</span><span class="Punctuation">:</span>
1275 |   <span class="Identifier">ivs</span><span class="Operator">.</span><span class="Identifier">add</span><span class="Punctuation">(</span><span class="Identifier">myinterval</span><span class="Punctuation">(</span><span class="Identifier">start</span><span class="Punctuation">:</span><span class="Identifier">i</span><span class="Punctuation">,</span> <span class="Identifier">stop</span><span class="Punctuation">:</span><span class="Identifier">i</span> <span class="Operator">+</span> <span class="DecNumber">15</span><span class="Punctuation">,</span> <span class="Identifier">val</span><span class="Punctuation">:</span><span class="DecNumber">0</span><span class="Punctuation">)</span><span class="Punctuation">)</span></pre>make the Lapper &quot;data-structure&quot;<pre class="listing"><span class="Identifier">l</span> <span class="Operator">=</span> <span class="Identifier">lapify</span><span class="Punctuation">(</span><span class="Identifier">ivs</span><span class="Punctuation">)</span>
1276 | <span class="Identifier">empty</span><span class="Punctuation">:</span><span class="Identifier">seq</span><span class="Punctuation">[</span><span class="Identifier">myinterval</span><span class="Punctuation">]</span></pre><pre class="listing"><span class="Identifier">l</span><span class="Operator">.</span><span class="Identifier">find</span><span class="Punctuation">(</span><span class="DecNumber">10</span><span class="Punctuation">,</span> <span class="DecNumber">20</span><span class="Punctuation">,</span> <span class="Identifier">empty</span><span class="Punctuation">)</span>
1277 | <span class="Identifier">notfound</span> <span class="Operator">=</span> <span class="Keyword">not</span> <span class="Identifier">l</span><span class="Operator">.</span><span class="Identifier">find</span><span class="Punctuation">(</span><span class="DecNumber">200</span><span class="Punctuation">,</span> <span class="DecNumber">300</span><span class="Punctuation">,</span> <span class="Identifier">empty</span><span class="Punctuation">)</span>
1278 | <span class="Identifier">assert</span> <span class="Identifier">notfound</span></pre><pre class="listing"><span class="Identifier">res</span> <span class="Operator">=</span> <span class="Identifier">new_seq</span><span class="Punctuation">[</span><span class="Identifier">myinterval</span><span class="Punctuation">]</span><span class="Punctuation">(</span><span class="Punctuation">)</span></pre>find is the more general case, l.seek gives a speed benefit when consecutive queries are in order.<pre class="listing"><span class="Identifier">echo</span> <span class="Identifier">l</span><span class="Operator">.</span><span class="Identifier">find</span><span class="Punctuation">(</span><span class="DecNumber">50</span><span class="Punctuation">,</span> <span class="DecNumber">70</span><span class="Punctuation">,</span> <span class="Identifier">res</span><span class="Punctuation">)</span>
1279 | <span class="Identifier">echo</span> <span class="Identifier">res</span>
1280 | <span class="Comment"># @[(start: 40, stop: 55, val:0), (start: 50, stop: 65, val: 0), (start: 60, stop: 75, val: 0), (start: 70, stop: 85, val: 0)]</span>
1281 | <span class="Keyword">for</span> <span class="Identifier">r</span> <span class="Keyword">in</span> <span class="Identifier">res</span><span class="Punctuation">:</span>
1282 |    <span class="Identifier">r</span><span class="Operator">.</span><span class="Identifier">val</span> <span class="Operator">+=</span> <span class="DecNumber">1</span></pre>or we can do a function on each overlapping interval<pre class="listing"><span class="Identifier">l</span><span class="Operator">.</span><span class="Identifier">each_seek</span><span class="Punctuation">(</span><span class="DecNumber">50</span><span class="Punctuation">,</span> <span class="DecNumber">60</span><span class="Punctuation">,</span> <span class="Keyword">proc</span><span class="Punctuation">(</span><span class="Identifier">a</span><span class="Punctuation">:</span><span class="Identifier">myinterval</span><span class="Punctuation">)</span> <span class="Operator">=</span> <span class="Identifier">inc</span><span class="Punctuation">(</span><span class="Identifier">a</span><span class="Operator">.</span><span class="Identifier">val</span><span class="Punctuation">)</span><span class="Punctuation">)</span></pre>or<pre class="listing"><span class="Identifier">l</span><span class="Operator">.</span><span class="Identifier">each_find</span><span class="Punctuation">(</span><span class="DecNumber">50</span><span class="Punctuation">,</span> <span class="DecNumber">60</span><span class="Punctuation">,</span> <span class="Keyword">proc</span><span class="Punctuation">(</span><span class="Identifier">a</span><span class="Punctuation">:</span><span class="Identifier">myinterval</span><span class="Punctuation">)</span> <span class="Operator">=</span> <span class="Identifier">a</span><span class="Operator">.</span><span class="Identifier">val</span> <span class="Operator">+=</span> <span class="DecNumber">10</span><span class="Punctuation">)</span></pre><pre class="listing"><span class="Keyword">discard</span> <span class="Identifier">l</span><span class="Operator">.</span><span class="Identifier">seek</span><span class="Punctuation">(</span><span class="DecNumber">50</span><span 
class="Punctuation">,</span> <span class="DecNumber">70</span><span class="Punctuation">,</span> <span class="Identifier">res</span><span class="Punctuation">)</span>
1283 | <span class="Identifier">echo</span> <span class="Identifier">res</span>
1284 | <span class="Comment"># @[(start:40, stop:55, val:12), (start:50, stop:65, val:12), (start:60, stop:75, val:1)]</span></pre></p>
1285 |   <div class="section" id="6">
1286 | <h1><a class="toc-backref" href="#6">Imports</a></h1>
1287 | <dl class="item">
1288 | <a class="reference external" href="algorithm.html">algorithm</a>, <a class="reference external" href="random.html">random</a>, <a class="reference external" href="times.html">times</a>, <a class="reference external" href="strutils.html">strutils</a>
1289 | </dl></div>
1290 | <div class="section" id="7">
1291 | <h1><a class="toc-backref" href="#7">Types</a></h1>
1292 | <dl class="item">
1293 | <dt id="Interval"><a name="Interval"></a><pre><span class="Identifier">Interval</span> <span class="Other">=</span> <span class="Keyword">concept</span> <span class="Identifier">i</span>
1294 |     <span class="Identifier">start</span><span class="Other">(</span><span class="Identifier">i</span><span class="Other">)</span> <span class="Identifier">is</span> <span class="Identifier">int</span>
1295 |     <span class="Identifier">stop</span><span class="Other">(</span><span class="Identifier">i</span><span class="Other">)</span> <span class="Identifier">is</span> <span class="Identifier">int</span></pre></dt>
1296 | <dd>
1297 | An object/tuple must implement these 2 methods to use this module
1298 | 
1299 | </dd>
1300 | <dt id="Lapper"><a name="Lapper"></a><pre><span class="Identifier">Lapper</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span> <span class="Other">=</span> <span class="Keyword">object</span>
1301 |   <span class="Identifier">intervals</span><span class="Other">:</span> <span class="Identifier">seq</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span>
1302 |   <span class="Identifier">max_len</span><span class="Other">:</span> <span class="Identifier">int</span>
1303 |   <span class="Identifier">cursor</span><span class="Other">:</span> <span class="Identifier">int</span>                  <span class="Comment">## `cursor` is used internally by ordered find</span>
1304 |   </pre></dt>
1305 | <dd>
1306 | Lapper enables fast interval searches
1307 | 
1308 | </dd>
1309 | 
1310 | </dl></div>
1311 | <div class="section" id="12">
1312 | <h1><a class="toc-backref" href="#12">Procs</a></h1>
1313 | <dl class="item">
1314 | <dt id="overlap"><a name="overlap,T,int,int"></a><pre><span class="Keyword">proc</span> <span class="Identifier">overlap</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">:</span> <span class="Identifier">Interval</span><span class="Other">]</span><span class="Other">(</span><span class="Identifier">a</span><span class="Other">:</span> <span class="Identifier">T</span><span class="Other">;</span> <span class="Identifier">start</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">stop</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">)</span><span class="Other">:</span> <span class="Identifier">bool</span> <span class="Other pragmabegin">{.</span><div class="pragma"><span class="Identifier">inline</span></div><span class="Other pragmaend">.}</span></pre></dt>
1315 | <dd>
1316 | overlap returns true if half-open intervals overlap
1317 | 
1318 | </dd>
1319 | <dt id="lapify"><a name="lapify,seq[T]"></a><pre><span class="Keyword">proc</span> <span class="Identifier">lapify</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">:</span> <span class="Identifier">Interval</span><span class="Other">]</span><span class="Other">(</span><span class="Identifier">ivs</span><span class="Other">:</span> <span class="Keyword">var</span> <span class="Identifier">seq</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span><span class="Other">)</span><span class="Other">:</span> <span class="Identifier">Lapper</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span></pre></dt>
1320 | <dd>
1321 | create a new Lapper object; ivs will be sorted.
1322 | 
1323 | </dd>
1324 | <dt id="len"><a name="len,Lapper[T: Interval]"></a><pre><span class="Keyword">proc</span> <span class="Identifier">len</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">:</span> <span class="Identifier">Interval</span><span class="Other">]</span><span class="Other">(</span><span class="Identifier">L</span><span class="Other">:</span> <span class="Identifier">Lapper</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span><span class="Other">)</span><span class="Other">:</span> <span class="Identifier">int</span></pre></dt>
1325 | <dd>
1326 | len returns the number of intervals in the Lapper
1327 | 
1328 | </dd>
1329 | <dt id="find"><a name="find,Lapper[T: Interval],int,int,seq[T]"></a><pre><span class="Keyword">proc</span> <span class="Identifier">find</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">:</span> <span class="Identifier">Interval</span><span class="Other">]</span><span class="Other">(</span><span class="Identifier">L</span><span class="Other">:</span> <span class="Identifier">Lapper</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span><span class="Other">;</span> <span class="Identifier">start</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">stop</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">ivs</span><span class="Other">:</span> <span class="Keyword">var</span> <span class="Identifier">seq</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span><span class="Other">)</span><span class="Other">:</span> <span class="Identifier">bool</span></pre></dt>
1330 | <dd>
1331 | fill ivs with all intervals in L that overlap start .. stop. if ivs is nil, then this will just return true if it finds an interval and false otherwise
1332 | 
1333 | </dd>
1334 | <dt id="each_find"><a name="each_find,Lapper[T: Interval],int,int,proc(T)"></a><pre><span class="Keyword">proc</span> <span class="Identifier">each_find</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">:</span> <span class="Identifier">Interval</span><span class="Other">]</span><span class="Other">(</span><span class="Identifier">L</span><span class="Other">:</span> <span class="Identifier">Lapper</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span><span class="Other">;</span> <span class="Identifier">start</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">stop</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">fn</span><span class="Other">:</span> <span class="Keyword">proc</span> <span class="Other">(</span><span class="Identifier">v</span><span class="Other">:</span> <span class="Identifier">T</span><span class="Other">)</span><span class="Other">)</span></pre></dt>
1335 | <dd>
1336 | call fn(x) for each interval x in L that overlaps start..stop
1337 | 
1338 | </dd>
1339 | <dt id="seek"><a name="seek,Lapper[T: Interval],int,int,seq[T]"></a><pre><span class="Keyword">proc</span> <span class="Identifier">seek</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">:</span> <span class="Identifier">Interval</span><span class="Other">]</span><span class="Other">(</span><span class="Identifier">L</span><span class="Other">:</span> <span class="Keyword">var</span> <span class="Identifier">Lapper</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span><span class="Other">;</span> <span class="Identifier">start</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">stop</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">ivs</span><span class="Other">:</span> <span class="Keyword">var</span> <span class="Identifier">seq</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span><span class="Other">)</span><span class="Other">:</span> <span class="Identifier">bool</span></pre></dt>
1340 | <dd>
1341 | fill ivs with all intervals in L that overlap start .. stop inclusive. this method will work when queries to this lapper are in sorted (start) order; it uses a linear search from the last query instead of a binary search. if ivs is nil, then this will just return true if it finds an interval and false otherwise
1342 | 
1343 | </dd>
1344 | <dt id="each_seek"><a name="each_seek,Lapper[T: Interval],int,int,proc(T)"></a><pre><span class="Keyword">proc</span> <span class="Identifier">each_seek</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">:</span> <span class="Identifier">Interval</span><span class="Other">]</span><span class="Other">(</span><span class="Identifier">L</span><span class="Other">:</span> <span class="Keyword">var</span> <span class="Identifier">Lapper</span><span class="Other">[</span><span class="Identifier">T</span><span class="Other">]</span><span class="Other">;</span> <span class="Identifier">start</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">stop</span><span class="Other">:</span> <span class="Identifier">int</span><span class="Other">;</span> <span class="Identifier">fn</span><span class="Other">:</span> <span class="Keyword">proc</span> <span class="Other">(</span><span class="Identifier">v</span><span class="Other">:</span> <span class="Identifier">T</span><span class="Other">)</span><span class="Other">)</span> <span class="Other pragmabegin">{.</span><div class="pragma">
1345 |     <span class="Identifier">inline</span></div><span class="Other pragmaend">.}</span></pre></dt>
1346 | <dd>
1347 | call fn(x) for each interval x in L that overlaps start..stop. this assumes that subsequent calls to this function will be in sorted order
1348 | 
1349 | </dd>
1350 | 
1351 | </dl></div>
1352 | 
1353 |   </div>
1354 | </div>
1355 | 
1356 |     <div class="row">
1357 |       <div class="twelve-columns footer">
1358 |         <span class="nim-sprite"></span>
1359 |         <br/>
1360 |         <small>Made with Nim. Generated: 2017-11-25 08:56:21 UTC</small>
1361 |       </div>
1362 |     </div>
1363 |   </div>
1364 | </div>
1365 | 
1366 | </body>
1367 | </html>
1368 | 


--------------------------------------------------------------------------------
/example.nim:
--------------------------------------------------------------------------------
 1 | import lapper
 2 | import strutils
 3 | 
 4 | # define an appropriate data-type. it must have a `start(m) int` and `stop(m) int` method.
 5 | #type myinterval = tuple[start:int, stop:int, val:int]
 6 | # if we want to modify the result, then we have to use a ref object type
 7 | type myinterval = ref object
 8 |   start: int
 9 |   stop: int
10 |   val: int
11 | 
12 | proc start(m: myinterval): int {.inline.} = return m.start
13 | proc stop(m: myinterval): int {.inline.} = return m.stop
14 | proc `$`(m:myinterval): string = return "(start:$#, stop:$#, val:$#)" % [$m.start, $m.stop, $m.val]
15 | 
16 | # create some fake data
17 | var ivs = new_seq[myinterval]()
18 | for i in countup(0, 100, 10):
19 |   ivs.add(myinterval(start:i, stop:i + 15, val:0))
20 | 
21 | # make the Lapper "data-structure"
22 | var l = lapify(ivs)
23 | var empty:seq[myinterval]
24 | 
25 | assert l.find(10, 20, empty)
26 | var notfound = not l.find(200, 300, empty)
27 | assert notfound
28 | 
29 | var res = new_seq[myinterval]()
30 | 
31 | # find is the more general case, l.seek gives a speed benefit when consecutive queries are in order.
32 | echo l.find(50, 70, res)
33 | echo res
34 | # @[(start: 40, stop: 55, val:0), (start: 50, stop: 65, val: 0), (start: 60, stop: 75, val: 0), (start: 70, stop: 85, val: 0)]
35 | for r in res:
36 |   r.val += 1
37 | 
38 | # or we can do a function on each overlapping interval
39 | l.each_seek(50, 60, proc(a:myinterval) = inc(a.val))
40 | # or
41 | l.each_find(50, 60, proc(a:myinterval) = a.val += 10)
42 | 
43 | discard l.seek(50, 70, res)
44 | echo res
45 | #@[(start:40, stop:55, val:12), (start:50, stop:65, val:12), (start:60, stop:75, val:1)]
46 | 


--------------------------------------------------------------------------------
/lapper.nimble:
--------------------------------------------------------------------------------
 1 | # Package
 2 | 
 3 | version       = "0.1.8"
 4 | author        = "Brent Pedersen"
 5 | description   = "fast, simple interval overlaps with binary search"
 6 | license       = "MIT"
 7 | 
 8 | # Dependencies
 9 | requires "nim >= 0.19.2" #, "nim-lang/c2nim>=0.9.13"
10 | srcDir = "src"
11 | 
12 | skipFiles = @["bench.nim", "example.nim"]
13 | 
14 | skipDirs = @["tests"]
15 | 
16 | task test, "run the tests":
17 |   exec "nim c -d:release --lineDir:on -r src/lapper"
18 | 
19 | task docs, "make docs":
20 |   exec "nim doc2 src/lapper; mkdir -p docs; mv lapper.html docs/index.html"
21 | 


--------------------------------------------------------------------------------
/nim.cfg:
--------------------------------------------------------------------------------
1 | path = "$projectPath/src"
2 | 


--------------------------------------------------------------------------------
/src/lapper.nim:
--------------------------------------------------------------------------------
  1 | ## This module provides a simple data-structure for fast interval searches. It does not use an interval tree,
  2 | ## instead, it operates on the assumption that most intervals are of similar length; or, more exactly, that the
  3 | ## longest interval in the set is not long compared to the average distance between intervals. On any dataset
  4 | ## where that is not the case, this method will not perform well. For cases where this holds true (as it often
  5 | ## does with genomic data), we can sort by start and use binary search on the starts, accounting for the length
  6 | ## of the longest interval. The advantage of this approach is simplicity of implementation and speed. In realistic
  7 | ## tests queries returning the overlapping intervals are 1000 times faster than brute force and queries that merely
  8 | ## check for the overlaps are > 5000 times faster.
  9 | ##
 10 | ## The main methods are `find` and `seek` where the latter uses a cursor and is very fast for cases when the queries
 11 | ## are sorted. This is another innovation in this library that allows an additional ~50% speed improvement when
 12 | ## consecutive queries are known to be in sort order.
 13 | ##
 14 | ## For both find and seek, if the given intervals parameter is nil, the function will return a boolean indicating if
 15 | ## any intervals in the set overlap the query. This is much faster than modifying the
 16 | ## intervals.
 17 | ##
 18 | ## The example below shows off most of the API of `Lapper`.
 19 | ##
 20 | ## .. code-block:: nim
 21 | ##   import lapper
 22 | ##   type myinterval = ref object
 23 | ##      start: int
 24 | ##      stop: int
 25 | ##      val: int
 26 | ##    
 27 | ##    proc start(m: myinterval): int {.inline.} = return m.start
 28 | ##    proc stop(m: myinterval): int {.inline.} = return m.stop
 29 | ##    proc `$`(m:myinterval): string = return "(start:$#, stop:$#, val:$#)" % [$m.start, $m.stop, $m.val]
 30 | ##    
 31 | ##  create some fake data
 32 | ## .. code-block:: nim
 33 | ##  var ivs = new_seq[myinterval]()
 34 | ##  for i in countup(0, 100, 10):
 35 | ##    ivs.add(myinterval(start:i, stop:i + 15, val:0))
 36 | 
 37 | ##  make the Lapper "data-structure"
 38 | 
 39 | ## .. code-block:: nim
 40 | ##  l = lapify(ivs)
 41 | ##  empty:seq[myinterval]
 42 |     
 43 | ## .. code-block:: nim
 44 | ##  l.find(10, 20, empty)
 45 | ##  notfound = not l.find(200, 300, empty)
 46 | ##  assert notfound
 47 |     
 48 | ## .. code-block:: nim
 49 | ##  res = new_seq[myinterval]()
 50 |  
 51 | ##  find is the more general case, l.seek gives a speed benefit when consecutive queries are in order.
 52 | 
 53 | ## .. code-block:: nim
 54 | ##  echo l.find(50, 70, res)
 55 | ##  echo res
 56 | ##  # @[(start: 40, stop: 55, val:0), (start: 50, stop: 65, val: 0), (start: 60, stop: 75, val: 0)]
 57 | ##  for r in res:
 58 | ##     r.val += 1
 59 |  
 60 | ## or we can do a function on each overlapping interval
 61 | 
 62 | ## .. code-block:: nim
 63 | ##   l.each_seek(50, 60, proc(a:myinterval) = inc(a.val))
 64 | 
 65 | ## or
 66 | 
 67 | ## .. code-block:: nim
 68 | ##   l.each_find(50, 60, proc(a:myinterval) = a.val += 10)
 69 |  
 70 | ## .. code-block:: nim
 71 | ##   discard l.seek(50, 70, res)
 72 | ##   echo res
 73 | ##   # @[(start:40, stop:55, val:12), (start:50, stop:65, val:12), (start:60, stop:75, val:1)]
 74 | import algorithm
 75 | 
 76 | type
 77 | 
 78 |   Interval* = concept i
 79 |     ## An object/tuple must implement these 2 methods to use this module
 80 |     start(i) is int
 81 |     stop(i) is int
 82 | 
 83 |   Lapper*[T] = object
 84 |     ## Lapper enables fast interval searches
 85 |     intervals: seq[T]
 86 |     max_len*: int
 87 |     cursor: int ## `cursor` is used internally by ordered find
 88 | 
 89 | template overlap*[T:Interval](a: T, start:int, stop:int): bool =
 90 |   ## overlap returns true if half-open intervals overlap
 91 |   #return a.start < stop and a.stop > start
 92 |   a.stop > start and a.start < stop
 93 | 
 94 | 
 95 | proc iv_cmp[T:Interval](a, b: T): int =
 96 |     if a.start < b.start: return -1
 97 |     if b.start < a.start: return 1
 98 |     return cmp(a.stop, b.stop)
 99 | 
100 | 
proc lapify*[T:Interval](ivs:var seq[T]): Lapper[T] =
  ## build a Lapper from `ivs`. note that `ivs` itself is sorted in place
  ## (by start, then stop) as a side effect.
  ivs.sort(iv_cmp)
  # the longest interval bounds how far back a query has to look
  var longest = 0
  for iv in ivs:
    longest = max(longest, iv.stop - iv.start)
  result = Lapper[T](intervals: ivs, max_len: longest)
108 | 
proc lowerBound[T:Interval](a: var seq[T], start: int): int =
  ## binary search over `a` (expected to be sorted by start): returns the index
  ## of the first element whose start is not less than `start`, or `a.len`
  ## when every element starts earlier.
  var lo = a.low
  var remaining = a.len
  while remaining != 0:
    let half = remaining div 2
    let mid = lo + half
    if a[mid].start < start:
      # answer lies strictly to the right of mid
      lo = mid + 1
      remaining -= half + 1
    else:
      # mid is still a candidate; keep searching the left half
      remaining = half
  result = lo
121 | 
proc len*[T:Interval](L:Lapper[T]): int {.inline.} =
  ## number of intervals stored in the Lapper
  result = len(L.intervals)
125 | 
proc empty*[T:Interval](L:Lapper[T]): bool {.inline.} =
  ## true when the Lapper holds no intervals
  L.intervals.len == 0
128 | 
iterator find*[T:Interval](L:var Lapper[T], start:int, stop:int): T =
  ## yield every interval in L that overlaps start .. stop.
  # begin at the first interval that starts late enough to possibly reach `start`
  let first = lowerBound(L.intervals, start - L.max_len)
  for idx in countup(first, L.intervals.high):
    let iv = L.intervals[idx]
    if likely(iv.stop > start and iv.start < stop):
      yield iv
    elif iv.start >= stop:
      # sorted by start: nothing further can overlap
      break
138 | 
proc find*[T:Interval](L:var Lapper[T], start:int, stop:int, ivs:var seq[T]): bool =
  ## replace the contents of `ivs` with all intervals in L that overlap
  ## start .. stop; returns true when at least one was found.
  ## existing slots of `ivs` are overwritten before the seq is grown.
  var kept = 0
  var idx = lowerBound(L.intervals, start - L.max_len)
  while idx < L.intervals.len:
    let iv = L.intervals[idx]
    if iv.start >= stop:
      # sorted by start: nothing further can overlap
      break
    if iv.stop > start:
      if kept == ivs.len:
        ivs.add(iv)
      else:
        ivs[kept] = iv
      inc kept
    inc idx
  # drop leftovers from a previous, larger result
  if kept < ivs.len:
    ivs.setLen(kept)
  result = ivs.len > 0
156 | 
proc count*[T:Interval](L:var Lapper[T], start:int, stop:int): int =
  ## return the number of intervals in L that overlap start .. stop.
  var idx = lowerBound(L.intervals, start - L.max_len)
  while idx < L.intervals.len:
    let iv = L.intervals[idx]
    if iv.start >= stop:
      # sorted by start: nothing further can overlap
      break
    if iv.stop > start:
      inc result
    inc idx
165 | 
proc each_find*[T:Interval](L:var Lapper[T], start:int, stop:int, fn: proc (v:T)) =
  ## invoke fn(x) on every interval x in L that overlaps start..stop
  let first = lowerBound(L.intervals, start - L.max_len)
  for idx in countup(first, L.intervals.high):
    let iv = L.intervals[idx]
    if iv.start >= stop:
      # sorted by start: nothing further can overlap
      break
    if iv.stop > start:
      fn(iv)
174 | 
iterator seek*[T:Interval](L:var Lapper[T], start:int, stop:int): T =
  ## yield every interval in L that overlaps the half-open query start .. stop.
  ## intended for queries issued in sorted (start) order: the search resumes
  ## from the cursor left by the previous query instead of doing a binary search.
  # fall back to binary search when the cursor is unset, sits at/past the last
  # interval (a previous query beyond the data leaves it at intervals.len, which
  # must not be used as an index), or is already ahead of this query.
  if L.cursor == 0 or L.cursor >= L.intervals.high or L.intervals[L.cursor].start > start:
    L.cursor = lowerBound(L.intervals, start - L.max_len)
  # skip intervals that start too early to reach `start`
  while (L.cursor + 1) < L.intervals.high and L.intervals[L.cursor + 1].start < (start - L.max_len):
    L.cursor += 1
  let old_cursor = L.cursor
  for i in L.cursor..L.intervals.high:
    let x = L.intervals[i]
    if x.overlap(start, stop):
      yield x
    elif x.start >= stop: break
  L.cursor = old_cursor
187 | 
proc seek*[T:Interval](L:var Lapper[T], start:int, stop:int, ivs:var seq[T]): bool =
  ## clear `ivs`, then fill it with all intervals in L that overlap the
  ## half-open query start .. stop; returns true when at least one was found.
  ## this method will work when queries to this lapper are in sorted (start) order;
  ## it uses a linear search from the last query instead of a binary search.
  if ivs.len != 0: ivs.set_len(0)
  # fall back to binary search when the cursor is unset, sits at/past the last
  # interval (a previous query beyond the data leaves it at intervals.len, which
  # must not be used as an index), or is already ahead of this query.
  if L.cursor == 0 or L.cursor >= L.intervals.high or L.intervals[L.cursor].start > start:
    L.cursor = lowerBound(L.intervals, start - L.max_len)
  # skip intervals that start too early to reach `start`. the advanced cursor is
  # kept for the next call, so ordered queries do not rescan the same prefix.
  while (L.cursor + 1) < L.intervals.high and L.intervals[L.cursor + 1].start < (start - L.max_len):
    L.cursor += 1
  for i in L.cursor..L.intervals.high:
    let x = L.intervals[i]
    if x.overlap(start, stop):
      ivs.add(x)
    elif x.start >= stop: break
  return ivs.len != 0
206 | 
proc each_seek*[T:Interval](L:var Lapper[T], start:int, stop:int, fn:proc (v:T)) {.inline.} =
  ## invoke fn(x) on every interval x in L that overlaps start..stop.
  ## callers are expected to issue successive queries in sorted order.
  let last = L.intervals.high
  let earliest = start - L.max_len
  # binary search only when the cursor is unset, at/past the end, or ahead of the query
  let stale = L.cursor == 0 or L.cursor >= last or L.intervals[L.cursor].start > start
  if stale:
    L.cursor = lowerBound(L.intervals, earliest)
  # step over intervals that start too early to reach `start`
  while L.cursor + 1 < last and L.intervals[L.cursor + 1].start < earliest:
    inc L.cursor
  let resume = L.cursor
  for idx in countup(resume, last):
    let iv = L.intervals[idx]
    if iv.start >= stop:
      break
    if iv.stop > start:
      fn(iv)
  L.cursor = resume
221 | 
iterator items*[T:Interval](L: Lapper[T]): T =
  ## iterate over the stored intervals in their stored order
  for idx in 0 ..< L.intervals.len:
    yield L.intervals[idx]
224 | 
when isMainModule:
  # Self-test and benchmark, compiled only when this module is the main program.
  # It times brute force against find / seek / count / each_seek, then checks every
  # query method against brute force and exits with a non-zero status on mismatch.

  import random
  import times
  import strutils

  proc randomi(imin:int, imax:int): int =
      ## random integer offset from imin by at most (imax - imin)
      return imin + rand(imax - imin)

  proc brute_force(ivs: seq[Interval], start:int, stop:int, res: var seq[Interval]) =
    ## reference implementation: test every interval against the query
    if res.len != 0: res.set_len(0)
    for i in ivs:
      if i.overlap(start, stop): res.add(i)

  # example implementation
  type myinterval = tuple[start:int, stop:int, val:int]
  proc start(m: myinterval): int {.inline.} = return m.start
  proc stop(m: myinterval): int {.inline.} = return m.stop

  proc make_random(n:int, range_max:int, size_min:int, size_max:int): seq[myinterval] =
    ## n intervals with random starts in 0..range_max and lengths in size_min..size_max
    result = new_seq[myinterval](n)
    for i in 0..<n:
      var s = randomi(0, range_max)
      var e = s + randomi(size_min, size_max)
      var m:myinterval = (s, e, 0)
      result[i] = m

  var
    N = 100000
    ntimes = 40
    brute_step = 10

  var intervals = make_random(N, 50000000, 500, 20000)
  echo "running tests and comparisons on $# random intervals" % [$N]
  # keep an unsorted copy: lapify sorts `intervals` in place
  var icopy = intervals

  var t = cpuTime()
  var res = new_seq[myinterval]()

  # brute force is slow, so only every brute_step-th interval is used as a query
  for i in countup(0, intervals.len - brute_step, brute_step):
    var iv = intervals[i]
    brute_force(intervals, iv.start, iv.stop, res)

  var brute_time = cpuTime() - t
  echo "time for brute force search on 1/$#th of the data:" % [$brute_step], brute_time

  t = cpuTime()

  var lap = lapify(intervals)
  echo "time to create Lapper:", cpuTime() - t

  # every interval overlaps itself, so an empty result is always an error below
  t = cpuTime()
  for k in 0..<ntimes:
    for iv in icopy:
      discard lap.find(iv.start, iv.stop, res)
      if len(res) == 0:
        echo "0 bad!!!"
  var lap_time = cpuTime() - t
  echo "time to do $# searches ($# reps) in Lapper:" % [$(N * ntimes), $ntimes], lap_time, " speedup:", (brute_time * float64(brute_step)) / (lap_time / float64(ntimes))

  # seek is queried with the sorted `intervals`, as it requires ordered queries
  t = cpuTime()
  for k in 0..<ntimes:
    for iv in intervals:
      discard lap.seek(iv.start, iv.stop, res)
      if len(res) == 0:
        echo "1 bad!!!"
  lap_time = cpuTime() - t
  echo "time to do $# seek-searches ($# reps) in Lapper:" % [$(N * ntimes), $ntimes], lap_time, " speedup:", (brute_time * float64(brute_step)) / (lap_time / float64(ntimes))

  var iempty: seq[myinterval]
  t = cpuTime()
  for k in 0..<ntimes:
    for iv in icopy:
      if 0 == lap.count(iv.start, iv.stop):
        echo "2 bad!!!"
  lap_time = cpuTime() - t
  echo "time to do $# presence tests ($# reps) in Lapper:" % [$(N * ntimes), $ntimes], lap_time, " speedup:", (brute_time * float64(brute_step)) / (lap_time / float64(ntimes))

  t = cpuTime()
  for k in 0..<ntimes:
    for iv in intervals:
      if not lap.seek(iv.start, iv.stop, iempty):
        echo "3 bad!!!"
  lap_time = cpuTime() - t
  echo "time to do $# seek-presence tests ($# reps) in Lapper:" % [$(N * ntimes), $ntimes], lap_time, " speedup:", (brute_time * float64(brute_step)) / (lap_time / float64(ntimes))

  t = cpuTime()
  for k in 0..<ntimes:
    for iv in intervals:
      var n = 0
      lap.each_seek(iv.start, iv.stop, (proc(f:myinterval) = (if iv.start == f.start: n.inc)))
      if n == 0:
        echo "4 bad!!!"
  lap_time = cpuTime() - t
  echo "time to do $# each-seek-presence tests ($# reps) in Lapper:" % [$(N * ntimes), $ntimes], lap_time, " speedup:", (brute_time * float64(brute_step)) / (lap_time / float64(ntimes))


  var brute_res = new_seq[myinterval]()
  var error = 0

  t = cpuTime()
  var res2 = new_seq[myinterval](10)
  var res3 = new_seq_of_cap[myinterval](10)
  var res4 = new_seq_of_cap[myinterval](10)
  proc do_each_find(m:myinterval) = res3.add(m)
  proc do_each_seek(m:myinterval) = res4.add(m)
  # sort the queries so that the seek variants see them in order
  icopy.sort(iv_cmp)

  # correctness check: all four query methods must agree with brute force
  for iv in icopy:
    brute_force(icopy, iv.start, iv.stop, brute_res)
    discard lap.find(iv.start, iv.stop, res)
    discard lap.seek(iv.start, iv.stop, res2)

    res3.set_len(0)
    lap.each_find(iv.start, iv.stop, do_each_find)

    res4.set_len(0)
    lap.each_seek(iv.start, iv.stop, do_each_seek)

    if not lap.seek(iv.start, iv.stop, iempty):
      echo "4 bad!! should have found it"
    sort(brute_res, iv_cmp)
    sort(res, iv_cmp)
    sort(res2, iv_cmp)
    sort(res3, iv_cmp)
    sort(res4, iv_cmp)

    # compare sizes first: indexing a shorter result below would raise an index
    # error instead of reporting the failure, and a longer one would go unnoticed
    if res.len != brute_res.len or res2.len != brute_res.len or
       res3.len != brute_res.len or res4.len != brute_res.len:
      echo "result count mismatch: brute=", len(brute_res), " find=", len(res), " seek=", len(res2), " each_find=", len(res3), " each_seek=", len(res4)
      error = 1
      continue

    for i, b in brute_res:
        if b.start != res[i].start or b.start != res2[i].start or b.start != res3[i].start or b.start != res4[i].start:
          echo "5 bad!!! ", len(res), " ", len(res2)
          error = 1
        if b.stop != res[i].stop or b.stop != res2[i].stop or res3[i].stop != b.stop or res4[i].stop != b.stop:
          echo "6 bad!!! ", len(res), " ", len(res2)
          error = 1
  echo "time to check each result:", cpuTime() - t
  quit(error)
361 | 


--------------------------------------------------------------------------------