├── .Rbuildignore
├── .gitignore
├── DESCRIPTION
├── NAMESPACE
├── NEWS.md
├── R
    ├── RcppExports.R
    ├── cluster.R
    ├── complement.R
    ├── intersect.R
    ├── join_closest.R
    └── subtract.R
├── README.md
├── _pkgdown.yml
├── cran-comments.md
├── docs
    ├── articles
    │   ├── index.html
    │   ├── intro.html
    │   └── resources
    │   │   ├── genome_cluster_docu.png
    │   │   ├── genome_complement_docu.png
    │   │   ├── genome_intersect_docu.png
    │   │   ├── genome_join_closest_docu.png
    │   │   ├── genome_join_docu.png
    │   │   └── genome_subtract_docu.png
    ├── authors.html
    ├── docsearch.css
    ├── docsearch.js
    ├── index.html
    ├── link.svg
    ├── news
    │   └── index.html
    ├── pkgdown.css
    ├── pkgdown.js
    ├── pkgdown.yml
    └── reference
    │   ├── cluster_interval.html
    │   ├── genome_cluster.html
    │   ├── genome_complement.html
    │   ├── genome_intersect.html
    │   ├── genome_join_closest.html
    │   ├── genome_subtract.html
    │   └── index.html
├── man
    ├── cluster_interval.Rd
    ├── genome_cluster.Rd
    ├── genome_complement.Rd
    ├── genome_intersect.Rd
    ├── genome_join_closest.Rd
    └── genome_subtract.Rd
├── src
    ├── .gitignore
    ├── RcppExports.cpp
    ├── cluster_interval.cpp
    └── tidygenomics_init.c
├── tests
    ├── testthat.R
    └── testthat
    │   ├── test_cluster.R
    │   ├── test_complement.R
    │   ├── test_intersect.R
    │   ├── test_issue.R
    │   ├── test_join_closest.R
    │   └── test_subtract.R
├── tidygenomics.Rproj
└── vignettes
    ├── intro.Rmd
    └── resources
        ├── genome_cluster_docu.png
        ├── genome_complement_docu.png
        ├── genome_intersect_docu.png
        ├── genome_join_closest_docu.png
        ├── genome_join_docu.png
        └── genome_subtract_docu.png


/.Rbuildignore:
--------------------------------------------------------------------------------
1 | ^.*\.Rproj$
2 | ^\.Rproj\.user$
3 | cran-comments.md
4 | ^_pkgdown\.yml$
5 | ^docs$
6 | ^pkgdown$
7 | ^CRAN-RELEASE$
8 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
1 | .Rproj.user
2 | .Rhistory
3 | .RData
4 | .Ruserdata
5 | inst/doc
6 | 


--------------------------------------------------------------------------------
/DESCRIPTION:
--------------------------------------------------------------------------------
 1 | Package: tidygenomics
 2 | Type: Package
 3 | Title: Tidy Verbs for Dealing with Genomic Data Frames
 4 | Version: 0.1.2
 5 | Authors@R: c(person("Constantin", "Ahlmann-Eltze", email = "artjom31415@googlemail.com", role = c("aut", "cre"), 
 6 |                     comment = c(ORCID = "0000-0002-3762-068X")),
 7 |     person("Stan Developers", role="cph", 
 8 |            comment="Code from the Stan Math library is reused in 'cluster_interval.cpp'"),
 9 |     person("David", "Robinson", role="cph", 
10 |            comment="Code from the fuzzyjoin package is reused"))
11 | Description: Handle genomic data within data frames just as you would with 'GRanges'.
12 |     This package provides methods to deal with genomic intervals the "tidy-way", which makes
13 |     them simpler to integrate into the general data munging process. The API is inspired by the
14 |     popular 'bedtools' and the genome_join() method from the 'fuzzyjoin' package.
15 | URL: https://github.com/const-ae/tidygenomics
16 | License: GPL-3
17 | Encoding: UTF-8
18 | LazyData: true
19 | Imports:
20 |     dplyr,
21 |     rlang,
22 |     purrr,
23 |     tidyr,
24 |     fuzzyjoin (>= 0.1.3),
25 |     IRanges,
26 |     Rcpp
27 | Suggests: testthat,
28 |     knitr,
29 |     rmarkdown
30 | RoxygenNote: 6.1.1
31 | LinkingTo:
32 |     Rcpp
33 | VignetteBuilder: knitr
34 | 


--------------------------------------------------------------------------------
/NAMESPACE:
--------------------------------------------------------------------------------
 1 | # Generated by roxygen2: do not edit by hand
 2 | 
 3 | export(cluster_interval)
 4 | export(genome_anti_join_closest)
 5 | export(genome_cluster)
 6 | export(genome_complement)
 7 | export(genome_full_join_closest)
 8 | export(genome_inner_join_closest)
 9 | export(genome_intersect)
10 | export(genome_join_closest)
11 | export(genome_left_join_closest)
12 | export(genome_right_join_closest)
13 | export(genome_semi_join_closest)
14 | export(genome_subtract)
15 | importFrom(Rcpp,sourceCpp)
16 | importFrom(dplyr,"%>%")
17 | importFrom(dplyr,"n")
18 | importFrom(rlang,":=")
19 | importFrom(rlang,"sym")
20 | useDynLib(tidygenomics, .registration = TRUE)
21 | 


--------------------------------------------------------------------------------
/NEWS.md:
--------------------------------------------------------------------------------
 1 | 
 2 | # v0.1.2
 3 | 
 4 | * Remove remaining calls to deprecated tidyr functions to become compatible with tidyr v1.0.0.
 5 |   Thanks to @jennybc for the pull request (#6)
 6 | 
 7 | # v0.1.1
 8 | 
 9 | * Fix issue #5
10 |   - the genome_cluster method assigned all chunks to cluster zero if their end was smaller 
11 |     than the end of the first entry
12 | 
13 | * Port dplyr calls to new tidyeval API
14 |   - This avoids plenty of deprecation warnings
15 | 
16 | * Add pkgdown webpage: https://const-ae.github.io/tidygenomics/
17 | 
18 | # Initial Release (v0.1.0)
19 | 
20 | First acceptance on CRAN
21 | 


--------------------------------------------------------------------------------
/R/RcppExports.R:
--------------------------------------------------------------------------------
 1 | # Generated by using Rcpp::compileAttributes() -> do not edit by hand
 2 | # Generator token: 10BE3573-1514-4C36-9D1C-5A225CD40393
 3 | # Internal helper (not exported): passes `x` to the compiled routine `_tidygenomics_sort_indices` via .Call().
 4 | sort_indices <- function(x) {
 5 |     .Call(`_tidygenomics_sort_indices`, x)
 6 | }
 7 | 
 8 | #' Cluster ranges which are implemented as 2 equal-length numeric vectors.
 9 | #' @param starts A numeric vector that defines the starts of each interval
10 | #' @param ends A numeric vector that defines the ends of each interval
11 | #' @param max_distance The maximum distance up to which intervals are still considered to be
12 | #'  the same cluster. Default: 0.
13 | #' @return One cluster id per interval; the ids start at 0 (see the example below).
14 | #' @examples
15 | #' starts <- c(50, 100, 120)
16 | #' ends <- c(75, 130, 150)
17 | #' j <- cluster_interval(starts, ends)
18 | #' j == c(0,1,1)
19 | #' @export
20 | cluster_interval <- function(starts, ends, max_distance = 0L) {
21 |     .Call(`_tidygenomics_cluster_interval`, starts, ends, max_distance)
22 | }
23 | 


--------------------------------------------------------------------------------
/R/cluster.R:
--------------------------------------------------------------------------------
 1 | 
 2 | #' @useDynLib tidygenomics, .registration = TRUE
 3 | #' @importFrom Rcpp sourceCpp
 4 | NULL
 5 | # Unload the compiled 'tidygenomics' library when the package namespace is unloaded.
 6 | .onUnload <- function (libpath) {
 7 |   library.dynam.unload("tidygenomics", libpath)
 8 | }
 9 | 
10 | #' Cluster the intervals of a data frame based on chromosome, start and end.
11 | #'
12 | #' @param x A dataframe.
13 | #' @param by A character vector with 3 entries which are the chromosome, start and end column.
14 | #'   For example: \code{by=c("chr", "start", "end")}
15 | #' @param max_distance The maximum distance up to which intervals are still considered to be
16 | #'  the same cluster. Default: 0.
17 | #' @param cluster_column_name A string that is used as the new column name
18 | #' @return The dataframe with the additional column of the cluster. If \code{x} was grouped,
19 | #'   the grouping is restored on the result.
20 | #' @examples
21 | #'
22 | #' library(dplyr)
23 | #'
24 | #' x1 <- data.frame(id = 1:4, bla=letters[1:4],
25 | #'                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
26 | #'                  start = c(100, 120, 300, 260),
27 | #'                  end = c(150, 250, 350, 450))
28 | #' genome_cluster(x1, by=c("chromosome", "start", "end"))
29 | #' genome_cluster(x1, by=c("chromosome", "start", "end"), max_distance=10)
30 | #' @export
31 | genome_cluster <- function(x, by=NULL, max_distance=0, cluster_column_name="cluster_id"){
32 |   # Remember the grouping of x so that it can be restored on the result
33 |   x_groups <- dplyr::groups(x)
34 |   x <- dplyr::ungroup(x)
35 |   regroup <- function(d) {
36 |     if (is.null(x_groups)) {
37 |       return(d)
38 |     }
39 |     g <- purrr::map_chr(x_groups, as.character)
40 |     missing <- !(g %in% colnames(d))
41 |     g[missing] <- paste0(g[missing], ".x")
42 |     # group_by_() is deprecated in dplyr; splice the column names in as symbols instead
43 |     dplyr::group_by(d, !!! rlang::syms(g))
44 |   }
45 | 
46 |   if (is.null(by) || length(by) != 3) {
47 |     stop("genome_cluster must join on exactly three columns")
48 |   }
49 | 
50 |   ret <- x %>%
51 |     dplyr::group_by(!!sym(by[1])) %>%
52 |     dplyr::mutate(!! cluster_column_name := cluster_interval(!!sym(by[2]), !!sym(by[3]), max_distance = max_distance)) %>%
53 |     dplyr::ungroup() %>%
54 |     # the ids above are only unique per chromosome; make them unique over all chromosomes
55 |     dplyr::mutate(!! cluster_column_name := as.numeric(as.factor(paste0(!!sym(by[1]), "-", !!sym(cluster_column_name))))-1)
56 |   regroup(ret)
57 | }
58 | 


--------------------------------------------------------------------------------
/R/complement.R:
--------------------------------------------------------------------------------
 1 | 
 2 | #' Calculate the complement of the intervals in a data frame.
 3 | #'
 4 | #' Calculates the regions of each chromosome that are not covered by any
 5 | #' interval in \code{x}. It can optionally take a \code{chromosome_size} data
 6 | #' frame with 2 or 3 columns: the name of the chromosome followed by either
 7 | #' the size of the chromosome (2 columns) or the start index and the end index
 8 | #' on the chromosome (3 columns).
 9 | #' @param x A data frame for which the complement is calculated
10 | #' @param chromosome_size A dataframe with at least 2 columns that contains
11 | #'  first the chromosome name and then the size of that chromosome. Can be NULL
12 | #'  in which case the largest value per chromosome from \code{x} is used.
13 | #' @param by A character vector with 3 entries which are the chromosome, start and end column.
14 | #'   For example: \code{by=c("chr", "start", "end")}
15 | #' @return A data frame, with its first three columns named as in \code{by}, that contains the uncovered regions.
16 | #' @examples
17 | #'
18 | #' library(dplyr)
19 | #'
20 | #' x1 <- data.frame(id = 1:4, bla=letters[1:4],
21 | #'                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
22 | #'                  start = c(100, 200, 300, 400),
23 | #'                  end = c(150, 250, 350, 450))
24 | #'
25 | #' genome_complement(x1, by=c("chromosome", "start", "end"))
26 | #' @export
27 | genome_complement <- function(x, chromosome_size=NULL, by=NULL){
28 | 
29 |   if (is.null(by) || length(by) != 3) {
30 |     stop("genome_complement must work on exactly three columns")
31 |   }
32 | 
33 |   # Without explicit sizes every chromosome spans from 1 to the largest end found in x
34 |   if(is.null(chromosome_size)){
35 |     chromosome_size <- x %>%
36 |       dplyr::group_by(!! sym(by[1])) %>%
37 |       dplyr::summarize(start = 1,
38 |                        end = max(!! sym(by[3])))
39 |   }else if(ncol(chromosome_size) == 2){
40 |     chromosome_size <- cbind(chromosome_size[, 1, drop=FALSE], data.frame(start=1), chromosome_size[, -1, drop=FALSE])
41 |   }
42 |   # The first three columns must be named like the columns of x so that x can be subtracted
43 |   colnames(chromosome_size)[1:3] <- by
44 | 
45 |   chromosome_size %>%
46 |     genome_subtract(x, by=by)
47 | }
48 | 


--------------------------------------------------------------------------------
/R/intersect.R:
--------------------------------------------------------------------------------
  1 | 
  2 | #' @importFrom dplyr "%>%" "n"
  3 | #' @importFrom rlang "sym" ":="
  4 | NULL
  5 | 
  6 | 
  7 | ## quiets concerns of R CMD check re: the .'s that appear in pipelines
  8 | if(getRversion() >= "2.15.1")  utils::globalVariables(c("..start", "..end", "..id", "..distance"))
  9 | 
 10 | 
 11 | 
 12 | #' Intersect data frames based on chromosome, start and end.
 13 | #'
 14 | #' @param x A dataframe.
 15 | #' @param y A dataframe.
 16 | #' @param by A character vector with 3 entries which are used to match the chromosome, start and end column.
 17 | #'   For example: \code{by=c("Chromosome"="chr", "Start"="start", "End"="end")}
 18 | #' @param mode One of "both", "left", "right" or "anti". "both" returns the columns of \code{x}
 19 | #'   and \code{y} for each overlap, "left" and "right" only the columns of \code{x} or \code{y}
 20 | #'   respectively, and "anti" returns the rows of \code{x} that do not overlap with \code{y}.
 21 | #' @return The intersected dataframe of \code{x} and \code{y} with the new boundaries.
 22 | #' @examples
 23 | #'
 24 | #' library(dplyr)
 25 | #'
 26 | #' x1 <- data.frame(id = 1:4, bla=letters[1:4],
 27 | #'                  chromosome = c("chr1", "chr1", "chr2", "chr2"),
 28 | #'                  start = c(100, 200, 300, 400),
 29 | #'                  end = c(150, 250, 350, 450))
 30 | #'
 31 | #' x2 <- data.frame(id = 1:4, BLA=LETTERS[1:4],
 32 | #'                  chromosome = c("chr1", "chr2", "chr2", "chr1"),
 33 | #'                  start = c(140, 210, 400, 300),
 34 | #'                  end = c(160, 240, 415, 320))
 35 | #' j <- genome_intersect(x1, x2, by=c("chromosome", "start", "end"), mode="both")
 36 | #' print(j)
 37 | #' @export
 38 | genome_intersect <- function(x, y, by=NULL, mode= "both"){
 39 |   # Much of this code is copied from https://github.com/dgrtwo/fuzzyjoin
 40 | 
 41 |   # Remember the grouping of x so that it can be restored on the result
 42 |   x_groups <- dplyr::groups(x)
 43 |   x <- dplyr::ungroup(x)
 44 |   regroup <- function(d) {
 45 |     if (is.null(x_groups)) {
 46 |       return(d)
 47 |     }
 48 |     g <- purrr::map_chr(x_groups, as.character)
 49 |     missing <- !(g %in% colnames(d))
 50 |     g[missing] <- paste0(g[missing], ".x")
 51 |     # group_by_() is deprecated in dplyr; splice the column names in as symbols instead
 52 |     dplyr::group_by(d, !!! rlang::syms(g))
 53 |   }
 54 | 
 55 |   mode <- match.arg(mode, c("both", "left", "right", "anti"))
 56 | 
 57 |   by <- dplyr::common_by(by, x, y)
 58 |   if (length(by$x) != 3) {
 59 |     stop("genome_intersect must join on exactly three columns")
 60 |   }
 61 | 
 62 |   # Finds all overlapping pairs: row indices in x and y plus the boundaries of each overlap
 63 |   index_match_fun <- function(x,y){
 64 |     # nest around the chromosome column
 65 |     x$..index <- seq_len(nrow(x))
 66 |     y$..index <- seq_len(nrow(y))
 67 |     nested_x <- dplyr::group_by_at(x, 1) %>% tidyr::nest()
 68 |     nested_y <- dplyr::group_by_at(y, 1) %>% tidyr::nest()
 69 |     by <- c(colnames(nested_y)[1])
 70 |     names(by) <- colnames(nested_x)[1]
 71 | 
 72 |     joined <- dplyr::inner_join(nested_x, nested_y, by = by)
 73 | 
 74 |     # find matching ranges in each
 75 |     find_overlaps <- function(xd, yd) {
 76 |       r1 <- IRanges::IRanges(xd[[1]], xd[[2]])
 77 |       r2 <- IRanges::IRanges(yd[[1]], yd[[2]])
 78 |       o <- as.data.frame(IRanges::findOverlaps(r1, r2))
 79 |       intersection <- IRanges::pintersect(r1[o$queryHits], r2[o$subjectHits])
 80 |       data.frame(x = xd$..index[o$queryHits], y = yd$..index[o$subjectHits],
 81 |                  ..start=IRanges::start(intersection), ..end=IRanges::end(intersection))
 82 |     }
 83 | 
 84 |     ret <- purrr::map2_df(joined$data.x, joined$data.y, find_overlaps)
 85 |     if (ncol(ret) == 0) {
 86 |       # x and y share no chromosome: return an empty table that still has the expected columns
 87 |       ret <- data.frame(x = integer(0), y = integer(0), ..start = integer(0), ..end = integer(0))
 88 |     }
 89 |     ret
 90 |   }
 91 | 
 92 |   d1 <- x[, by$x, drop = FALSE]
 93 |   d2 <- y[, by$y, drop = FALSE]
 94 |   matches <- index_match_fun(d1, d2)
 95 | 
 96 |   if (mode == "anti") {
 97 |     if (nrow(matches) == 0) {
 98 |       return(regroup(x))
 99 |     }
100 |     return(regroup(x[-sort(unique(matches$x)), , drop = FALSE]))
101 |   }
102 |   if (mode == "left") {
103 |     ret <- x %>%
104 |       dplyr::select(- dplyr::one_of(by$x[-1])) %>%
105 |       dplyr::mutate(..id=seq_len(n())) %>%
106 |       dplyr::inner_join(matches[, c("x", "..start", "..end")], by=c("..id"="x")) %>%
107 |       dplyr::rename(!! by$x[2] := `..start`, !! by$x[3] := `..end`) %>%
108 |       dplyr::select(- `..id`) %>%
109 |       regroup()
110 |     return(ret)
111 |   }
112 |   else if (mode == "right") {
113 |     ret <- y %>%
114 |       dplyr::select(- dplyr::one_of(by$y[-1])) %>%
115 |       dplyr::mutate(..id=seq_len(n())) %>%
116 |       dplyr::inner_join(matches[,c("y", "..start", "..end")], by=c("..id"="y")) %>%
117 |       dplyr::rename(!! by$y[2] := `..start`, !! by$y[3] := `..end`) %>%
118 |       dplyr::select(- `..id`) %>%
119 |       regroup()
120 |     return(ret)
121 |   }
122 | 
123 |   matches <- dplyr::arrange(matches, x, y)
124 |   for (nm in intersect(colnames(x), colnames(y))) {
125 |     if(! nm %in% by$x){
126 |       x <- dplyr::rename(x, !! paste0(nm, ".x") := !! sym(nm))
127 |     }
128 |     if(! nm %in% by$y){
129 |       y <- dplyr::rename(y, !! paste0(nm, ".y") := !! sym(nm))
130 |     }
131 |   }
132 | 
133 |   ret <- dplyr::bind_cols(x[matches$x, , drop = FALSE] %>% dplyr::select(- dplyr::one_of(by$x[-1])),
134 |                           y[matches$y, , drop = FALSE] %>% dplyr::select(- dplyr::one_of(by$y)))
135 |   if (ncol(matches) > 2) {
136 |     extra_cols <- matches[, -(1:2), drop = FALSE]
137 |     ret <- dplyr::bind_cols(ret, extra_cols) %>%
138 |       dplyr::rename(!! by$x[2] := `..start`, !! by$x[3] := `..end`)
139 |   }
140 |   regroup(ret)
141 | }
142 | 


--------------------------------------------------------------------------------
/R/join_closest.R:
--------------------------------------------------------------------------------
  1 | 
  2 | 
  3 | #' Join intervals on chromosomes in data frames, to the closest partner
  4 | #'
  5 | #' @param x A dataframe.
  6 | #' @param y A dataframe.
  7 | #' @param by A character vector with 3 entries which are used to match the chromosome, start and end column.
  8 | #'   For example: \code{by=c("Chromosome"="chr", "Start"="start", "End"="end")}
  9 | #' @param mode One of "inner", "full", "left", "right", "semi" or "anti".
 10 | #' @param distance_column_name A string that is used as the new column name with the distance.
 11 | #' If \code{NULL} no new column is added.
 12 | #' @param max_distance The maximum distance that is allowed to join 2 entries. Only pairs with a
 13 | #'  distance strictly smaller than \code{max_distance} are joined.
 14 | #' @param select A string that is passed on to \code{IRanges::distanceToNearest}, can either be
 15 | #'  "all" which means that in case that multiple intervals have the same distance all are reported, or
 16 | #'  "arbitrary" which means in that case one would be chosen at random.
 17 | #' @param ... Additional arguments passed on to genome_join_closest.
 18 | #' @return The joined dataframe of \code{x} and \code{y}.
 19 | #' @examples
 20 | #' library(dplyr)
 21 | #'
 22 | #' x1 <- data.frame(id = 1:4, bla=letters[1:4],
 23 | #'                  chromosome = c("chr1", "chr1", "chr2", "chr2"),
 24 | #'                  start = c(100, 200, 300, 400),
 25 | #'                  end = c(150, 250, 350, 450))
 26 | #'
 27 | #' x2 <- data.frame(id = 1:4, BLA=LETTERS[1:4],
 28 | #'                  chromosome = c("chr1", "chr2", "chr2", "chr1"),
 29 | #'                  start = c(140, 210, 400, 300),
 30 | #'                  end = c(160, 240, 415, 320))
 31 | #' j <- genome_join_closest(x1, x2, by=c("chromosome", "start", "end"), distance_column_name="distance", mode="left")
 32 | #' print(j)
 33 | #' @export
 34 | genome_join_closest <- function(x, y, by=NULL,  mode = "inner",
 35 |                                 distance_column_name=NULL, max_distance=Inf, select="all"){
 36 | 
 37 |   # Nearly all of this code is copied from https://github.com/dgrtwo/fuzzyjoin
 38 | 
 39 |   if (!requireNamespace("IRanges", quietly = TRUE)) {
 40 |     stop("genome_join_closest requires the IRanges package: ",
 41 |          "https://bioconductor.org/packages/release/bioc/html/IRanges.html")
 42 |   }
 43 | 
 44 |   select <- match.arg(select, c("all", "arbitrary"))
 45 | 
 46 |   by <- dplyr::common_by(by, x, y)
 47 |   if (length(by$x) != 3) {
 48 |     stop("genome_join_closest must join on exactly three columns")
 49 |   }
 50 |   # Index match function for fuzzy_join: pairs the rows of x with their nearest rows of y
 51 |   f <- function(x, y) {
 52 |     # nest around the chromosome column
 53 |     x$..index <- seq_len(nrow(x))
 54 |     y$..index <- seq_len(nrow(y))
 55 | 
 56 |     nested_x <- dplyr::group_by_at(x, 1) %>% tidyr::nest()
 57 |     nested_y <- dplyr::group_by_at(y, 1) %>% tidyr::nest()
 58 |     by <- c(colnames(nested_y)[1])
 59 |     names(by) <- colnames(nested_x)[1]
 60 | 
 61 |     joined <- dplyr::inner_join(nested_x, nested_y, by = by)
 62 | 
 63 |     # find matching ranges in each
 64 |     find_closest <- function(xd, yd) {
 65 |       r1 <- IRanges::IRanges(xd[[1]], xd[[2]])
 66 |       r2 <- IRanges::IRanges(yd[[1]], yd[[2]])
 67 |       o <- as.data.frame(IRanges::distanceToNearest(r1, r2, select=select))
 68 |       # keep only the pairs that are closer than max_distance (strict comparison)
 69 |       data.frame(x = xd$..index[o$queryHits], y = yd$..index[o$subjectHits], ..distance=o$distance) %>%
 70 |         dplyr::filter(`..distance` < max_distance)
 71 |     }
 72 | 
 73 |     ret <- purrr::map2_df(joined$data.x, joined$data.y, find_closest)
 74 |     # expose the distance under the requested name; the helper column ..distance is always dropped
 75 |     if(! is.null(distance_column_name)){
 76 |       ret[[distance_column_name]] <- ret$..distance
 77 |     }
 78 |     ret$..distance <- NULL
 79 | 
 80 |     ret
 81 |   }
 82 |   # delegate the join itself to fuzzyjoin, using f to determine the matching rows
 83 |   fuzzyjoin::fuzzy_join(x, y, mode = mode, index_match_fun = f, multi_by = by)
 84 | 
 85 | }
 86 | 
 87 | 
 88 | #' @rdname genome_join_closest
 89 | #' @export
 90 | genome_inner_join_closest <- function(x, y, by = NULL, ...) {
 91 |   genome_join_closest(x = x, y = y, by = by, mode = "inner", ...)
 92 | }
 93 | 
 94 | 
 95 | #' @rdname genome_join_closest
 96 | #' @export
 97 | genome_left_join_closest <- function(x, y, by = NULL, ...) {
 98 |   genome_join_closest(x = x, y = y, by = by, mode = "left", ...)
 99 | }
100 | 
101 | 
102 | #' @rdname genome_join_closest
103 | #' @export
104 | genome_right_join_closest <- function(x, y, by = NULL, ...) {
105 |   genome_join_closest(x = x, y = y, by = by, mode = "right", ...)
106 | }
107 | 
108 | 
109 | #' @rdname genome_join_closest
110 | #' @export
111 | genome_full_join_closest <- function(x, y, by = NULL, ...) {
112 |   genome_join_closest(x = x, y = y, by = by, mode = "full", ...)
113 | }
114 | 
115 | 
116 | #' @rdname genome_join_closest
117 | #' @export
118 | genome_semi_join_closest <- function(x, y, by = NULL, ...) {
119 |   genome_join_closest(x = x, y = y, by = by, mode = "semi", ...)
120 | }
121 | 
122 | 
123 | #' @rdname genome_join_closest
124 | #' @export
125 | genome_anti_join_closest <- function(x, y, by = NULL, ...) {
126 |   genome_join_closest(x = x, y = y, by = by, mode = "anti", ...)
127 | }
128 | 
129 | 
130 | 


--------------------------------------------------------------------------------
/R/subtract.R:
--------------------------------------------------------------------------------
 1 | 
 2 | 
 3 | #' Subtract one data frame from another based on chromosome, start and end.
 4 | #'
 5 | #' @param x A dataframe.
 6 | #' @param y A dataframe.
 7 | #' @param by A character vector with 3 entries which are used to match the chromosome, start and end column.
 8 | #'   For example: \code{by=c("Chromosome"="chr", "Start"="start", "End"="end")}
 9 | #' @return The subtracted dataframe of \code{x} and \code{y} with the new boundaries.
10 | #'   Intervals of \code{x} that are completely covered by \code{y} are dropped, intervals on
11 | #'   chromosomes that do not occur in \code{y} are kept with their original boundaries.
12 | #' @examples
13 | #'
14 | #' library(dplyr)
15 | #'
16 | #' x1 <- data.frame(id = 1:4, bla=letters[1:4],
17 | #'                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
18 | #'                  start = c(100, 200, 300, 400),
19 | #'                  end = c(150, 250, 350, 450))
20 | #'
21 | #' x2 <- data.frame(id = 1:4, BLA=LETTERS[1:4],
22 | #'                  chromosome = c("chr1", "chr2", "chr1", "chr1"),
23 | #'                  start = c(120, 210, 300, 400),
24 | #'                  end = c(125, 240, 320, 415))
25 | #'
26 | #' j <- genome_subtract(x1, x2, by=c("chromosome", "start", "end"))
27 | #' print(j)
28 | #' @export
29 | genome_subtract <- function(x, y, by=NULL){
30 |   # Much of this code is copied from https://github.com/dgrtwo/fuzzyjoin
31 | 
32 |   # Remember the grouping of x so that it can be restored on the result
33 |   x_groups <- dplyr::groups(x)
34 |   x <- dplyr::ungroup(x)
35 |   regroup <- function(d) {
36 |     if (is.null(x_groups)) {
37 |       return(d)
38 |     }
39 |     g <- purrr::map_chr(x_groups, as.character)
40 |     missing <- !(g %in% colnames(d))
41 |     g[missing] <- paste0(g[missing], ".x")
42 |     # group_by_() is deprecated in dplyr; splice the column names in as symbols instead
43 |     dplyr::group_by(d, !!! rlang::syms(g))
44 |   }
45 | 
46 |   by <- dplyr::common_by(by, x, y)
47 |   if (length(by$x) != 3) {
48 |     stop("genome_subtract must join on exactly three columns")
49 |   }
50 | 
51 |   # Finds for every row of x the pieces that remain after the intervals of y are removed
52 |   f <- function(x,y){
53 |     # nest around the chromosome column
54 |     x$..index <- seq_len(nrow(x))
55 |     y$..index <- seq_len(nrow(y))
56 |     nested_x <- dplyr::group_by_at(x, 1) %>% tidyr::nest()
57 |     nested_y <- dplyr::group_by_at(y, 1) %>% tidyr::nest()
58 |     by <- c(colnames(nested_y)[1])
59 |     names(by) <- colnames(nested_x)[1]
60 |     # left join: intervals of x on chromosomes that are missing from y must not be lost
61 |     joined <- dplyr::left_join(nested_x, nested_y, by = by)
62 | 
63 |     # find the remaining ranges in each chromosome
64 |     find_subtractions <- function(xd, yd) {
65 |       r1 <- IRanges::IRanges(xd[[1]], xd[[2]])
66 |       # yd is not a data frame if the chromosome has no intervals in y: subtract nothing
67 |       r2 <- if (is.data.frame(yd)) IRanges::IRanges(yd[[1]], yd[[2]]) else IRanges::IRanges()
68 |       subtraction <- IRanges::setdiff(r1, r2)
69 |       # assign every remaining piece to the rows of x it overlaps and clip it to that row
70 |       o <- as.data.frame(IRanges::findOverlaps(subtraction, r1))
71 |       data.frame(x = xd$..index[o$subjectHits],
72 |                  ..start=pmax(IRanges::start(subtraction)[o$queryHits], IRanges::start(r1)[o$subjectHits]),
73 |                  ..end=pmin(IRanges::end(subtraction)[o$queryHits], IRanges::end(r1)[o$subjectHits]))
74 |     }
75 | 
76 |     ret <- purrr::map2_df(joined$data.x, joined$data.y, find_subtractions)
77 |     if (ncol(ret) == 0) {
78 |       # nothing was processed (x has no rows): keep the expected columns for the join below
79 |       ret <- data.frame(x = integer(0), ..start = integer(0), ..end = integer(0))
80 |     }
81 |     ret
82 |   }
83 | 
84 |   d1 <- x[, by$x, drop = FALSE]
85 |   d2 <- y[, by$y, drop = FALSE]
86 |   matches <- f(d1, d2)
87 |   x %>%
88 |     dplyr::select(- dplyr::one_of(by$x[-1])) %>%
89 |     dplyr::mutate(..id=seq_len(n())) %>%
90 |     dplyr::inner_join(matches[, c("x", "..start", "..end")], by=c("..id"="x")) %>%
91 |     dplyr::rename(!! by$x[2] := `..start`, !! by$x[3] := `..end`) %>%
92 |     dplyr::select(- `..id`) %>%
93 |     regroup()
94 | }
95 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
  1 | # tidygenomics
  2 | 
  3 | [![CRAN_Status_Badge](https://www.r-pkg.org/badges/version/tidygenomics)](https://cran.r-project.org/package=tidygenomics)
  4 | 
  5 | Tidy Verbs for Dealing with Genomic Data Frames
  6 | 
  7 | ## Description
  8 | 
  9 | Handle genomic data within data frames just as you would with `GRanges`.
 10 | This package provides methods to deal with genomic intervals the "tidy-way", which makes
 11 | them simpler to integrate into the general data munging process. The API is inspired by the
 12 | popular bedtools and the genome_join() method from the fuzzyjoin package.
 13 | 
 14 | ## Installation
 15 | 
 16 | ```
 17 | install.packages("tidygenomics")
 18 | ```
 19 | 
 20 | Or to get the latest development version
 21 | ```
 22 | devtools::install_github("const-ae/tidygenomics")
 23 | ```
 24 | 
 25 | ## Documentation
 26 | 
 27 | 
 28 | #### genome_intersect
 29 | 
 30 | Joins 2 data frames based on their genomic overlap. Unlike the `genome_join` function it updates the boundaries to reflect
 31 | the overlap of the regions.
 32 | 
 33 | <img src="vignettes/resources/genome_intersect_docu.png" alt="genome_intersect" style="width: 100%;"/>
 34 | 
 35 | 
 36 | ```{r}
 37 | x1 <- data.frame(id = 1:4, 
 38 |                 chromosome = c("chr1", "chr1", "chr2", "chr2"),
 39 |                 start = c(100, 200, 300, 400),
 40 |                 end = c(150, 250, 350, 450))
 41 | 
 42 | x2 <- data.frame(id = 1:4,
 43 |                  chromosome = c("chr1", "chr2", "chr2", "chr1"),
 44 |                  start = c(140, 210, 400, 300),
 45 |                  end = c(160, 240, 415, 320))
 46 | 
 47 | genome_intersect(x1, x2, by=c("chromosome", "start", "end"), mode="both")
 48 | ```
 49 | 
 50 | | id.x|chromosome | id.y| start| end|
 51 | |----:|:----------|----:|-----:|---:|
 52 | |    1|chr1       |    1|   140| 150|
 53 | |    4|chr2       |    3|   400| 415|
 54 | 
 55 | #### genome_subtract
 56 | 
 57 | Subtracts one data frame from the other. This can be used to split the x data frame into smaller areas.
 58 | 
 59 | <img src="vignettes/resources/genome_subtract_docu.png" alt="genome_subtract" style="width: 100%;"/>
 60 | 
 61 | ```{r}
 62 | x1 <- data.frame(id = 1:4,
 63 |                 chromosome = c("chr1", "chr1", "chr2", "chr1"),
 64 |                 start = c(100, 200, 300, 400),
 65 |                 end = c(150, 250, 350, 450))
 66 | 
 67 | x2 <- data.frame(id = 1:4,
 68 |                 chromosome = c("chr1", "chr2", "chr1", "chr1"),
 69 |                 start = c(120, 210, 300, 400),
 70 |                 end = c(125, 240, 320, 415))
 71 | 
 72 | genome_subtract(x1, x2, by=c("chromosome", "start", "end"))
 73 | ```
 74 | 
 75 | | id|chromosome | start| end|
 76 | |--:|:----------|-----:|---:|
 77 | |  1|chr1       |   100| 119|
 78 | |  1|chr1       |   126| 150|
 79 | |  2|chr1       |   200| 250|
 80 | |  3|chr2       |   300| 350|
 81 | |  4|chr1       |   416| 450|
 82 | 
 83 | 
 84 | #### genome_join_closest
 85 | 
 86 | Joins 2 data frames based on their genomic location. If no exact overlap is found the next closest interval is used.
 87 | 
 88 | <img src="vignettes/resources/genome_join_closest_docu.png" alt="genome_join_closest" style="width: 100%;"/>
 89 | 
 90 | ```{r}
 91 | x1 <- data_frame(id = 1:4, 
 92 |                  chr = c("chr1", "chr1", "chr2", "chr3"),
 93 |                  start = c(100, 200, 300, 400),
 94 |                  end = c(150, 250, 350, 450))
 95 | 
 96 | x2 <- data_frame(id = 1:4,
 97 |                  chr = c("chr1", "chr1", "chr1", "chr2"),
 98 |                  start = c(220, 210, 300, 400),
 99 |                  end = c(225, 240, 320, 415))
100 | genome_join_closest(x1, x2, by=c("chr", "start", "end"), distance_column_name="distance", mode="left")
101 | ```
102 | 
103 | | id.x|chr.x | start.x| end.x| id.y|chr.y | start.y| end.y| distance|
104 | |----:|:-----|-------:|-----:|----:|:-----|-------:|-----:|--------:|
105 | |    1|chr1  |     100|   150|    2|chr1  |     210|   240|       59|
106 | |    2|chr1  |     200|   250|    1|chr1  |     220|   225|        0|
107 | |    2|chr1  |     200|   250|    2|chr1  |     210|   240|        0|
108 | |    3|chr2  |     300|   350|    4|chr2  |     400|   415|       49|
109 | |    4|chr3  |     400|   450|   NA|NA    |      NA|    NA|       NA|
110 | 
111 | #### genome_cluster
112 | 
113 | Add a new column with the cluster if 2 intervals are overlapping or are within the `max_distance`.
114 | 
115 | <img src="vignettes/resources/genome_cluster_docu.png" alt="genome_cluster" style="width: 100%;"/>
116 | 
117 | ```{r}
118 | x1 <- data.frame(id = 1:4, bla=letters[1:4],
119 |                 chromosome = c("chr1", "chr1", "chr2", "chr1"),
120 |                 start = c(100, 120, 300, 260),
121 |                 end = c(150, 250, 350, 450))
122 | genome_cluster(x1, by=c("chromosome", "start", "end"))
123 | ```
124 | 
125 | | id|bla |chromosome | start| end| cluster_id|
126 | |--:|:---|:----------|-----:|---:|----------:|
127 | |  1|a   |chr1       |   100| 150|          0|
128 | |  2|b   |chr1       |   120| 250|          0|
129 | |  3|c   |chr2       |   300| 350|          2|
130 | |  4|d   |chr1       |   260| 450|          1|
131 | 
132 | ```{r}
133 | genome_cluster(x1, by=c("chromosome", "start", "end"), max_distance=10)
134 | ```
135 | 
136 | | id|bla |chromosome | start| end| cluster_id|
137 | |--:|:---|:----------|-----:|---:|----------:|
138 | |  1|a   |chr1       |   100| 150|          0|
139 | |  2|b   |chr1       |   120| 250|          0|
140 | |  3|c   |chr2       |   300| 350|          1|
141 | |  4|d   |chr1       |   260| 450|          0|
142 | 
143 | #### genome_complement
144 | 
145 | Calculates the complement of a genomic region.
146 | 
147 | <img src="vignettes/resources/genome_complement_docu.png" alt="genome_complement" style="width: 100%;"/>
148 | 
149 | ```{r}
150 | x1 <- data.frame(id = 1:4,
151 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
152 |                  start = c(100, 200, 300, 400),
153 |                  end = c(150, 250, 350, 450))
154 | 
155 | genome_complement(x1, by=c("chromosome", "start", "end"))
156 | ```
157 | 
158 | |chromosome | start| end|
159 | |:----------|-----:|---:|
160 | |chr1       |     1|  99|
161 | |chr1       |   151| 199|
162 | |chr1       |   251| 399|
163 | |chr2       |     1| 299|
164 | 
165 | 
166 | #### genome_join
167 | 
168 | Classical join function based on the overlap of intervals. It is implemented and maintained in the
169 | [fuzzyjoin](https://github.com/dgrtwo/fuzzyjoin) package and is documented here only for completeness.
170 | 
171 | <img src="vignettes/resources/genome_join_docu.png" alt="genome_join" style="width: 100%;"/>
172 | 
173 | ```{r}
174 | # tibble() replaces the deprecated data_frame() constructor.
175 | x1 <- tibble::tibble(id = 1:4, chr = c("chr1", "chr1", "chr2", "chr3"),
176 |                      start = c(100, 200, 300, 400),
177 |                      end = c(150, 250, 350, 450))
178 | 
179 | x2 <- tibble::tibble(id = 1:4,
180 |                      chr = c("chr1", "chr1", "chr1", "chr2"),
181 |                      start = c(220, 210, 300, 400),
182 |                      end = c(225, 240, 320, 415))
183 | fuzzyjoin::genome_join(x1, x2, by = c("chr", "start", "end"), mode = "inner")
184 | ```
185 | 
186 | | id.x|chr.x | start.x| end.x| id.y|chr.y | start.y| end.y|
187 | |----:|:-----|-------:|-----:|----:|:-----|-------:|-----:|
188 | |    2|chr1  |     200|   250|    1|chr1  |     220|   225|
189 | |    2|chr1  |     200|   250|    2|chr1  |     210|   240|
190 | 
191 | ```{r}
192 | fuzzyjoin::genome_join(x1, x2, by = c("chr", "start", "end"), mode = "left")
193 | ```
194 | 
195 | | id.x|chr.x | start.x| end.x| id.y|chr.y | start.y| end.y|
196 | |----:|:-----|-------:|-----:|----:|:-----|-------:|-----:|
197 | |    1|chr1  |     100|   150|   NA|NA    |      NA|    NA|
198 | |    2|chr1  |     200|   250|    1|chr1  |     220|   225|
199 | |    2|chr1  |     200|   250|    2|chr1  |     210|   240|
200 | |    3|chr2  |     300|   350|   NA|NA    |      NA|    NA|
201 | |    4|chr3  |     400|   450|   NA|NA    |      NA|    NA|
202 | 
203 | ```{r}
204 | fuzzyjoin::genome_join(x1, x2, by = c("chr", "start", "end"), mode = "anti")
205 | ```
206 | 
207 | | id|chr  | start| end|
208 | |--:|:----|-----:|---:|
209 | |  1|chr1 |   100| 150|
210 | |  3|chr2 |   300| 350|
211 | |  4|chr3 |   400| 450|
212 | 
213 | 
214 | 
215 | ## Inspiration
216 | 
217 | - [tidyverse](http://tidyverse.org/)
218 | - [fuzzyjoin](https://github.com/dgrtwo/fuzzyjoin)
219 | - [GenomicRanges](http://bioconductor.org/packages/release/bioc/html/GenomicRanges.html)
220 | - [bedtools](http://bedtools.readthedocs.io)
221 | 
222 | If you have any additional questions or encounter issues, please raise them on the [GitHub page](https://github.com/const-ae/tidygenomics).
223 | 
224 | 
225 | 
226 | 
227 | 
228 | 
229 | 
230 | 
231 | 
232 | 


--------------------------------------------------------------------------------
/_pkgdown.yml:
--------------------------------------------------------------------------------
1 | destination: docs
2 | 


--------------------------------------------------------------------------------
/cran-comments.md:
--------------------------------------------------------------------------------
 1 | # Bug fix
 2 | 
 3 | In this release I have fixed a bug and ported the code to the new dplyr API.
 4 | 
 5 | ## Test environments
 6 | * macOS Mojave: R 3.6.1
 7 | * R-Hub (Fedora R-devel, Ubuntu R-release)
 8 | * winbuilder (R-devel, R-release)
 9 | 
10 | ## R CMD check results
11 | There were no ERRORs or WARNINGs.
12 | 
13 | ## Downstream dependencies
14 | 
15 | There are no downstream dependencies yet.
16 |   
17 | 


--------------------------------------------------------------------------------
/docs/articles/index.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Articles • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="../pkgdown.css" rel="stylesheet">
 29 | <script src="../pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
 33 | <meta property="og:title" content="Articles" />
 34 | 
 35 | 
 36 | 
 37 | <!-- mathjax -->
 38 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 39 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 40 | 
 41 | <!--[if lt IE 9]>
 42 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 43 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 44 | <![endif]-->
 45 | 
 46 | 
 47 |   </head>
 48 | 
 49 |   <body>
 50 |     <div class="container template-article-index">
 51 |       <header>
 52 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 53 |   <div class="container">
 54 |     <div class="navbar-header">
 55 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 56 |         <span class="sr-only">Toggle navigation</span>
 57 |         <span class="icon-bar"></span>
 58 |         <span class="icon-bar"></span>
 59 |         <span class="icon-bar"></span>
 60 |       </button>
 61 |       <span class="navbar-brand">
 62 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 63 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 64 |       </span>
 65 |     </div>
 66 | 
 67 |     <div id="navbar" class="navbar-collapse collapse">
 68 |       <ul class="nav navbar-nav">
 69 |         <li>
 70 |   <a href="../index.html">
 71 |     <span class="fa fa-home fa-lg"></span>
 72 |      
 73 |   </a>
 74 | </li>
 75 | <li>
 76 |   <a href="../reference/index.html">Reference</a>
 77 | </li>
 78 | <li class="dropdown">
 79 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 80 |     Articles
 81 |      
 82 |     <span class="caret"></span>
 83 |   </a>
 84 |   <ul class="dropdown-menu" role="menu">
 85 |     <li>
 86 |       <a href="../articles/intro.html">Tidy Genomics</a>
 87 |     </li>
 88 |   </ul>
 89 | </li>
 90 | <li>
 91 |   <a href="../news/index.html">Changelog</a>
 92 | </li>
 93 |       </ul>
 94 |       
 95 |       <ul class="nav navbar-nav navbar-right">
 96 |         <li>
 97 |   <a href="https://github.com/const-ae/tidygenomics">
 98 |     <span class="fa fa-github fa-lg"></span>
 99 |      
100 |   </a>
101 | </li>
102 |       </ul>
103 |       
104 |     </div><!--/.nav-collapse -->
105 |   </div><!--/.container -->
106 | </div><!--/.navbar -->
107 | 
108 |       
109 |       </header>
110 | 
111 | <div class="row">
112 |   <div class="col-md-9 contents">
113 |     <div class="page-header">
114 |       <h1>Articles</h1>
115 |     </div>
116 | 
117 |     <div class="section ">
118 |       <h3>All vignettes</h3>
119 |       <p class="section-desc"></p>
120 | 
121 |       <ul>
122 |         <li><a href="intro.html">Tidy Genomics</a></li>
123 |       </ul>
124 |     </div>
125 |   </div>
126 | </div>
127 | 
128 |       <footer>
129 |       <div class="copyright">
130 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
131 | </div>
132 | 
133 | <div class="pkgdown">
134 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
135 | </div>
136 |       </footer>
137 |    </div>
138 | 
139 |   
140 | 
141 |   </body>
142 | </html>
143 | 
144 | 


--------------------------------------------------------------------------------
/docs/articles/resources/genome_cluster_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/docs/articles/resources/genome_cluster_docu.png


--------------------------------------------------------------------------------
/docs/articles/resources/genome_complement_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/docs/articles/resources/genome_complement_docu.png


--------------------------------------------------------------------------------
/docs/articles/resources/genome_intersect_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/docs/articles/resources/genome_intersect_docu.png


--------------------------------------------------------------------------------
/docs/articles/resources/genome_join_closest_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/docs/articles/resources/genome_join_closest_docu.png


--------------------------------------------------------------------------------
/docs/articles/resources/genome_join_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/docs/articles/resources/genome_join_docu.png


--------------------------------------------------------------------------------
/docs/articles/resources/genome_subtract_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/docs/articles/resources/genome_subtract_docu.png


--------------------------------------------------------------------------------
/docs/authors.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Authors • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="pkgdown.css" rel="stylesheet">
 29 | <script src="pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
 33 | <meta property="og:title" content="Authors" />
 34 | 
 35 | 
 36 | 
 37 | <!-- mathjax -->
 38 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 39 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 40 | 
 41 | <!--[if lt IE 9]>
 42 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 43 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 44 | <![endif]-->
 45 | 
 46 | 
 47 |   </head>
 48 | 
 49 |   <body>
 50 |     <div class="container template-authors">
 51 |       <header>
 52 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 53 |   <div class="container">
 54 |     <div class="navbar-header">
 55 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 56 |         <span class="sr-only">Toggle navigation</span>
 57 |         <span class="icon-bar"></span>
 58 |         <span class="icon-bar"></span>
 59 |         <span class="icon-bar"></span>
 60 |       </button>
 61 |       <span class="navbar-brand">
 62 |         <a class="navbar-link" href="index.html">tidygenomics</a>
 63 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 64 |       </span>
 65 |     </div>
 66 | 
 67 |     <div id="navbar" class="navbar-collapse collapse">
 68 |       <ul class="nav navbar-nav">
 69 |         <li>
 70 |   <a href="index.html">
 71 |     <span class="fa fa-home fa-lg"></span>
 72 |      
 73 |   </a>
 74 | </li>
 75 | <li>
 76 |   <a href="reference/index.html">Reference</a>
 77 | </li>
 78 | <li class="dropdown">
 79 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 80 |     Articles
 81 |      
 82 |     <span class="caret"></span>
 83 |   </a>
 84 |   <ul class="dropdown-menu" role="menu">
 85 |     <li>
 86 |       <a href="articles/intro.html">Tidy Genomics</a>
 87 |     </li>
 88 |   </ul>
 89 | </li>
 90 | <li>
 91 |   <a href="news/index.html">Changelog</a>
 92 | </li>
 93 |       </ul>
 94 |       
 95 |       <ul class="nav navbar-nav navbar-right">
 96 |         <li>
 97 |   <a href="https://github.com/const-ae/tidygenomics">
 98 |     <span class="fa fa-github fa-lg"></span>
 99 |      
100 |   </a>
101 | </li>
102 |       </ul>
103 |       
104 |     </div><!--/.nav-collapse -->
105 |   </div><!--/.container -->
106 | </div><!--/.navbar -->
107 | 
108 |       
109 |       </header>
110 | 
111 | <div class="row">
112 |   <div class="contents col-md-9">
113 |     <div class="page-header">
114 |       <h1>Authors</h1>
115 |     </div>
116 | 
117 |     <ul class="list-unstyled">
118 |       <li>
119 |         <p><strong>Constantin Ahlmann-Eltze</strong>. Author, maintainer. <a href='https://orcid.org/0000-0002-3762-068X' target='orcid.widget'><img src='https://members.orcid.org/sites/default/files/vector_iD_icon.svg' class='orcid' alt='ORCID' height='16'></a>
120 |         </p>
121 |       </li>
122 |       <li>
123 |         <p><strong>Stan Developers</strong>. Copyright holder. 
124 |         <br /><small>Code from the Stan Math library is reused in 'cluster_interval.cpp'</small></p>
125 |       </li>
126 |       <li>
127 |         <p><strong>David Robinson</strong>. Copyright holder. 
128 |         <br /><small>Code from the fuzzyjoin package is reused</small></p>
129 |       </li>
130 |     </ul>
131 | 
132 |   </div>
133 | 
134 | </div>
135 | 
136 | 
137 |       <footer>
138 |       <div class="copyright">
139 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
140 | </div>
141 | 
142 | <div class="pkgdown">
143 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
144 | </div>
145 |       </footer>
146 |    </div>
147 | 
148 |   
149 | 
150 |   </body>
151 | </html>
152 | 
153 | 


--------------------------------------------------------------------------------
/docs/docsearch.css:
--------------------------------------------------------------------------------
  1 | /* Docsearch -------------------------------------------------------------- */
  2 | /*
  3 |   Source: https://github.com/algolia/docsearch/
  4 |   License: MIT
  5 | */
  6 | 
  7 | .algolia-autocomplete {
  8 |   display: block;
  9 |   -webkit-box-flex: 1;
 10 |   -ms-flex: 1;
 11 |   flex: 1
 12 | }
 13 | 
 14 | .algolia-autocomplete .ds-dropdown-menu {
 15 |   width: 100%;
 16 |   min-width: none;
 17 |   max-width: none;
 18 |   padding: .75rem 0;
 19 |   background-color: #fff;
 20 |   background-clip: padding-box;
 21 |   border: 1px solid rgba(0, 0, 0, .1);
 22 |   box-shadow: 0 .5rem 1rem rgba(0, 0, 0, .175);
 23 | }
 24 | 
 25 | @media (min-width:768px) {
 26 |   .algolia-autocomplete .ds-dropdown-menu {
 27 |       width: 175%
 28 |   }
 29 | }
 30 | 
 31 | .algolia-autocomplete .ds-dropdown-menu::before {
 32 |   display: none
 33 | }
 34 | 
 35 | .algolia-autocomplete .ds-dropdown-menu [class^=ds-dataset-] {
 36 |   padding: 0;
 37 |   background-color: rgb(255,255,255);
 38 |   border: 0;
 39 |   max-height: 80vh;
 40 | }
 41 | 
 42 | .algolia-autocomplete .ds-dropdown-menu .ds-suggestions {
 43 |   margin-top: 0
 44 | }
 45 | 
 46 | .algolia-autocomplete .algolia-docsearch-suggestion {
 47 |   padding: 0;
 48 |   overflow: visible
 49 | }
 50 | 
 51 | .algolia-autocomplete .algolia-docsearch-suggestion--category-header {
 52 |   padding: .125rem 1rem;
 53 |   margin-top: 0;
 54 |   font-size: 1.3em;
 55 |   font-weight: 500;
 56 |   color: #00008B;
 57 |   border-bottom: 0
 58 | }
 59 | 
 60 | .algolia-autocomplete .algolia-docsearch-suggestion--wrapper {
 61 |     float: none;
 62 |     padding-top: 0
 63 | }
 64 | 
 65 | .algolia-autocomplete .algolia-docsearch-suggestion--subcategory-column {
 66 |   float: none;
 67 |   width: auto;
 68 |   padding: 0;
 69 |   text-align: left
 70 | }
 71 | 
 72 | .algolia-autocomplete .algolia-docsearch-suggestion--content {
 73 |   float: none;
 74 |   width: auto;
 75 |   padding: 0
 76 | }
 77 | 
 78 | .algolia-autocomplete .algolia-docsearch-suggestion--content::before {
 79 |   display: none
 80 | }
 81 | 
 82 | .algolia-autocomplete .ds-suggestion:not(:first-child) .algolia-docsearch-suggestion--category-header {
 83 |   padding-top: .75rem;
 84 |   margin-top: .75rem;
 85 |   border-top: 1px solid rgba(0, 0, 0, .1)
 86 | }
 87 | 
 88 | .algolia-autocomplete .ds-suggestion .algolia-docsearch-suggestion--subcategory-column {
 89 |   display: block;
 90 |   padding: .1rem 1rem;
 91 |   margin-bottom: 0.1;
 92 |   font-size: 1.0em;
 93 |   font-weight: 400
 94 |   /* display: none */
 95 | }
 96 | 
 97 | .algolia-autocomplete .algolia-docsearch-suggestion--title {
 98 |   display: block;
 99 |   padding: .25rem 1rem;
100 |   margin-bottom: 0;
101 |   font-size: 0.9em;
102 |   font-weight: 400
103 | }
104 | 
105 | .algolia-autocomplete .algolia-docsearch-suggestion--text {
106 |   padding: 0 1rem .5rem;
107 |   margin-top: -.25rem;
108 |   font-size: 0.8em;
109 |   font-weight: 400;
110 |   line-height: 1.25
111 | }
112 | 
113 | .algolia-autocomplete .algolia-docsearch-footer {
114 |   width: 110px;
115 |   height: 20px;
116 |   z-index: 3;
117 |   margin-top: 10.66667px;
118 |   float: right;
119 |   font-size: 0;
120 |   line-height: 0;
121 | }
122 | 
123 | .algolia-autocomplete .algolia-docsearch-footer--logo {
124 |   background-image: url("data:image/svg+xml;utf8,<svg viewBox='0 0 130 18' xmlns='http://www.w3.org/2000/svg'><defs><linearGradient x1='-36.868%' y1='134.936%' x2='129.432%' y2='-27.7%' id='a'><stop stop-color='%2300AEFF' offset='0%'/><stop stop-color='%233369E7' offset='100%'/></linearGradient></defs><g fill='none' fill-rule='evenodd'><path d='M59.399.022h13.299a2.372 2.372 0 0 1 2.377 2.364V15.62a2.372 2.372 0 0 1-2.377 2.364H59.399a2.372 2.372 0 0 1-2.377-2.364V2.381A2.368 2.368 0 0 1 59.399.022z' fill='url(%23a)'/><path d='M66.257 4.56c-2.815 0-5.1 2.272-5.1 5.078 0 2.806 2.284 5.072 5.1 5.072 2.815 0 5.1-2.272 5.1-5.078 0-2.806-2.279-5.072-5.1-5.072zm0 8.652c-1.983 0-3.593-1.602-3.593-3.574 0-1.972 1.61-3.574 3.593-3.574 1.983 0 3.593 1.602 3.593 3.574a3.582 3.582 0 0 1-3.593 3.574zm0-6.418v2.664c0 .076.082.131.153.093l2.377-1.226c.055-.027.071-.093.044-.147a2.96 2.96 0 0 0-2.465-1.487c-.055 0-.11.044-.11.104l.001-.001zm-3.33-1.956l-.312-.311a.783.783 0 0 0-1.106 0l-.372.37a.773.773 0 0 0 0 1.101l.307.305c.049.049.121.038.164-.011.181-.245.378-.479.597-.697.225-.223.455-.42.707-.599.055-.033.06-.109.016-.158h-.001zm5.001-.806v-.616a.781.781 0 0 0-.783-.779h-1.824a.78.78 0 0 0-.783.779v.632c0 .071.066.12.137.104a5.736 5.736 0 0 1 1.588-.223c.52 0 1.035.071 1.534.207a.106.106 0 0 0 .131-.104z' fill='%23FFF'/><path d='M102.162 13.762c0 1.455-.372 2.517-1.123 3.193-.75.676-1.895 1.013-3.44 1.013-.564 0-1.736-.109-2.673-.316l.345-1.689c.783.163 1.819.207 2.361.207.86 0 1.473-.174 1.84-.523.367-.349.548-.866.548-1.553v-.349a6.374 6.374 0 0 1-.838.316 4.151 4.151 0 0 1-1.194.158 4.515 4.515 0 0 1-1.616-.278 3.385 3.385 0 0 1-1.254-.817 3.744 3.744 0 0 1-.811-1.351c-.192-.539-.29-1.504-.29-2.212 0-.665.104-1.498.307-2.054a3.925 3.925 0 0 1 .904-1.433 4.124 4.124 0 0 1 1.441-.926 5.31 5.31 0 0 1 1.945-.365c.696 0 1.337.087 1.961.191a15.86 15.86 0 0 1 1.588.332v8.456h-.001zm-5.954-4.206c0 .893.197 1.885.592 2.299.394.414.904.621 1.528.621.34 0 
.663-.049.964-.142a2.75 2.75 0 0 0 .734-.332v-5.29a8.531 8.531 0 0 0-1.413-.18c-.778-.022-1.369.294-1.786.801-.411.507-.619 1.395-.619 2.223zm16.12 0c0 .719-.104 1.264-.318 1.858a4.389 4.389 0 0 1-.904 1.52c-.389.42-.854.746-1.402.975-.548.229-1.391.36-1.813.36-.422-.005-1.26-.125-1.802-.36a4.088 4.088 0 0 1-1.397-.975 4.486 4.486 0 0 1-.909-1.52 5.037 5.037 0 0 1-.329-1.858c0-.719.099-1.411.318-1.999.219-.588.526-1.09.92-1.509.394-.42.865-.741 1.402-.97a4.547 4.547 0 0 1 1.786-.338 4.69 4.69 0 0 1 1.791.338c.548.229 1.019.55 1.402.97.389.42.69.921.909 1.509.23.588.345 1.28.345 1.999h.001zm-2.191.005c0-.921-.203-1.689-.597-2.223-.394-.539-.948-.806-1.654-.806-.707 0-1.26.267-1.654.806-.394.539-.586 1.302-.586 2.223 0 .932.197 1.558.592 2.098.394.545.948.812 1.654.812.707 0 1.26-.272 1.654-.812.394-.545.592-1.166.592-2.098h-.001zm6.962 4.707c-3.511.016-3.511-2.822-3.511-3.274L113.583.926l2.142-.338v10.003c0 .256 0 1.88 1.375 1.885v1.792h-.001zm3.774 0h-2.153V5.072l2.153-.338v9.534zm-1.079-10.542c.718 0 1.304-.578 1.304-1.291 0-.714-.581-1.291-1.304-1.291-.723 0-1.304.578-1.304 1.291 0 .714.586 1.291 1.304 1.291zm6.431 1.013c.707 0 1.304.087 1.786.262.482.174.871.42 1.156.73.285.311.488.735.608 1.182.126.447.186.937.186 1.476v5.481a25.24 25.24 0 0 1-1.495.251c-.668.098-1.419.147-2.251.147a6.829 6.829 0 0 1-1.517-.158 3.213 3.213 0 0 1-1.178-.507 2.455 2.455 0 0 1-.761-.904c-.181-.37-.274-.893-.274-1.438 0-.523.104-.855.307-1.215.208-.36.487-.654.838-.883a3.609 3.609 0 0 1 1.227-.49 7.073 7.073 0 0 1 2.202-.103c.263.027.537.076.833.147v-.349c0-.245-.027-.479-.088-.697a1.486 1.486 0 0 0-.307-.583c-.148-.169-.34-.3-.581-.392a2.536 2.536 0 0 0-.915-.163c-.493 0-.942.06-1.353.131-.411.071-.75.153-1.008.245l-.257-1.749c.268-.093.668-.185 1.183-.278a9.335 9.335 0 0 1 1.66-.142l-.001-.001zm.181 7.731c.657 0 1.145-.038 1.484-.104v-2.168a5.097 5.097 0 0 0-1.978-.104c-.241.033-.46.098-.652.191a1.167 1.167 0 0 0-.466.392c-.121.169-.175.267-.175.523 0 
.501.175.79.493.981.323.196.75.289 1.293.289h.001zM84.109 4.794c.707 0 1.304.087 1.786.262.482.174.871.42 1.156.73.29.316.487.735.608 1.182.126.447.186.937.186 1.476v5.481a25.24 25.24 0 0 1-1.495.251c-.668.098-1.419.147-2.251.147a6.829 6.829 0 0 1-1.517-.158 3.213 3.213 0 0 1-1.178-.507 2.455 2.455 0 0 1-.761-.904c-.181-.37-.274-.893-.274-1.438 0-.523.104-.855.307-1.215.208-.36.487-.654.838-.883a3.609 3.609 0 0 1 1.227-.49 7.073 7.073 0 0 1 2.202-.103c.257.027.537.076.833.147v-.349c0-.245-.027-.479-.088-.697a1.486 1.486 0 0 0-.307-.583c-.148-.169-.34-.3-.581-.392a2.536 2.536 0 0 0-.915-.163c-.493 0-.942.06-1.353.131-.411.071-.75.153-1.008.245l-.257-1.749c.268-.093.668-.185 1.183-.278a8.89 8.89 0 0 1 1.66-.142l-.001-.001zm.186 7.736c.657 0 1.145-.038 1.484-.104v-2.168a5.097 5.097 0 0 0-1.978-.104c-.241.033-.46.098-.652.191a1.167 1.167 0 0 0-.466.392c-.121.169-.175.267-.175.523 0 .501.175.79.493.981.318.191.75.289 1.293.289h.001zm8.682 1.738c-3.511.016-3.511-2.822-3.511-3.274L89.461.926l2.142-.338v10.003c0 .256 0 1.88 1.375 1.885v1.792h-.001z' fill='%23182359'/><path d='M5.027 11.025c0 .698-.252 1.246-.757 1.644-.505.397-1.201.596-2.089.596-.888 0-1.615-.138-2.181-.414v-1.214c.358.168.739.301 1.141.397.403.097.778.145 1.125.145.508 0 .884-.097 1.125-.29a.945.945 0 0 0 .363-.779.978.978 0 0 0-.333-.747c-.222-.204-.68-.446-1.375-.725-.716-.29-1.221-.621-1.515-.994-.294-.372-.44-.82-.44-1.343 0-.655.233-1.171.698-1.547.466-.376 1.09-.564 1.875-.564.752 0 1.5.165 2.245.494l-.408 1.047c-.698-.294-1.321-.44-1.869-.44-.415 0-.73.09-.945.271a.89.89 0 0 0-.322.717c0 .204.043.379.129.524.086.145.227.282.424.411.197.129.551.299 1.063.51.577.24.999.464 1.268.671.269.208.466.442.591.704.125.261.188.569.188.924l-.001.002zm3.98 2.24c-.924 0-1.646-.269-2.167-.808-.521-.539-.782-1.281-.782-2.226 0-.97.242-1.733.725-2.288.483-.555 1.148-.833 1.993-.833.784 0 1.404.238 1.858.714.455.476.682 1.132.682 1.966v.682H7.357c.018.577.174 1.02.467 1.329.294.31.707.465 1.241.465.351 0 
.678-.033.98-.099a5.1 5.1 0 0 0 .975-.33v1.026a3.865 3.865 0 0 1-.935.312 5.723 5.723 0 0 1-1.08.091l.002-.001zm-.231-5.199c-.401 0-.722.127-.964.381s-.386.625-.432 1.112h2.696c-.007-.491-.125-.862-.354-1.115-.229-.252-.544-.379-.945-.379l-.001.001zm7.692 5.092l-.252-.827h-.043c-.286.362-.575.608-.865.739-.29.131-.662.196-1.117.196-.584 0-1.039-.158-1.367-.473-.328-.315-.491-.761-.491-1.337 0-.612.227-1.074.682-1.386.455-.312 1.148-.482 2.079-.51l1.026-.032v-.317c0-.38-.089-.663-.266-.851-.177-.188-.452-.282-.824-.282-.304 0-.596.045-.876.134a6.68 6.68 0 0 0-.806.317l-.408-.902a4.414 4.414 0 0 1 1.058-.384 4.856 4.856 0 0 1 1.085-.132c.756 0 1.326.165 1.711.494.385.329.577.847.577 1.552v4.002h-.902l-.001-.001zm-1.88-.859c.458 0 .826-.128 1.104-.384.278-.256.416-.615.416-1.077v-.516l-.763.032c-.594.021-1.027.121-1.297.298s-.406.448-.406.814c0 .265.079.47.236.615.158.145.394.218.709.218h.001zm7.557-5.189c.254 0 .464.018.628.054l-.124 1.176a2.383 2.383 0 0 0-.559-.064c-.505 0-.914.165-1.227.494-.313.329-.47.757-.47 1.284v3.105h-1.262V7.218h.988l.167 1.047h.064c.197-.354.454-.636.771-.843a1.83 1.83 0 0 1 1.023-.312h.001zm4.125 6.155c-.899 0-1.582-.262-2.049-.787-.467-.525-.701-1.277-.701-2.259 0-.999.244-1.767.733-2.304.489-.537 1.195-.806 2.119-.806.627 0 1.191.116 1.692.349l-.381 1.015c-.534-.208-.974-.312-1.321-.312-1.028 0-1.542.682-1.542 2.046 0 .666.128 1.166.384 1.501.256.335.631.502 1.125.502a3.23 3.23 0 0 0 1.595-.419v1.101a2.53 2.53 0 0 1-.722.285 4.356 4.356 0 0 1-.932.086v.002zm8.277-.107h-1.268V9.506c0-.458-.092-.8-.277-1.026-.184-.226-.477-.338-.878-.338-.53 0-.919.158-1.168.475-.249.317-.373.848-.373 1.593v2.949h-1.262V4.801h1.262v2.122c0 .34-.021.704-.064 1.09h.081a1.76 1.76 0 0 1 .717-.666c.306-.158.663-.236 1.072-.236 1.439 0 2.159.725 2.159 2.175v3.873l-.001-.001zm7.649-6.048c.741 0 1.319.269 1.732.806.414.537.62 1.291.62 2.261 0 .974-.209 1.732-.628 2.275-.419.542-1.001.814-1.746.814-.752 
0-1.336-.27-1.751-.811h-.086l-.231.704h-.945V4.801h1.262v1.987l-.021.655-.032.553h.054c.401-.591.992-.886 1.772-.886zm-.328 1.031c-.508 0-.875.149-1.098.448-.224.299-.339.799-.346 1.501v.086c0 .723.115 1.247.344 1.571.229.324.603.486 1.123.486.448 0 .787-.177 1.018-.532.231-.354.346-.867.346-1.536 0-1.35-.462-2.025-1.386-2.025l-.001.001zm3.244-.924h1.375l1.209 3.368c.183.48.304.931.365 1.354h.043c.032-.197.091-.436.177-.717.086-.281.541-1.616 1.364-4.004h1.364l-2.541 6.73c-.462 1.235-1.232 1.853-2.31 1.853-.279 0-.551-.03-.816-.091v-.999c.19.043.406.064.65.064.609 0 1.037-.353 1.284-1.058l.22-.559-2.385-5.941h.001z' fill='%231D3657'/></g></svg>");
125 |   background-repeat: no-repeat;
126 |   background-position: 50%;
127 |   background-size: 100%;
128 |   overflow: hidden;
129 |   text-indent: -9000px;
130 |   width: 100%;
131 |   height: 100%;
132 |   display: block;
133 |   transform: translate(-8px);
134 | }
135 | 
136 | .algolia-autocomplete .algolia-docsearch-suggestion--highlight {
137 |   color: #FF8C00;
138 |   background: rgba(232, 189, 54, 0.1)
139 | }
140 | 
141 | 
142 | .algolia-autocomplete .algolia-docsearch-suggestion--text .algolia-docsearch-suggestion--highlight {
143 |   box-shadow: inset 0 -2px 0 0 rgba(105, 105, 105, .5)
144 | }
145 | 
146 | .algolia-autocomplete .ds-suggestion.ds-cursor .algolia-docsearch-suggestion--content {
147 |   background-color: rgba(192, 192, 192, .15)
148 | }
149 | 


--------------------------------------------------------------------------------
/docs/docsearch.js:
--------------------------------------------------------------------------------
 1 | $(function() {
 2 |   // Wires up the search shortcut and highlights the searched keyword on load.
 3 |   // register a handler to move the focus to the search bar
 4 |   // upon pressing shift + "/" (i.e. "?")
 5 |   $(document).on('keydown', function(e) {
 6 |     if (e.shiftKey && e.keyCode == 191) {
 7 |       e.preventDefault();
 8 |       $("#search-input").focus();
 9 |     }
10 |   });
11 | 
12 |   $(document).ready(function() {
13 |     // do keyword highlighting
14 |     /* modified from https://jsfiddle.net/julmot/bL6bb5oo/ */
15 |     var mark = function() {
16 |       // Reads the "q" query parameter of the current URL and marks it in .contents.
17 |       var referrer = document.URL ;
18 |       var paramKey = "q" ;
19 | 
20 |       if (referrer.indexOf("?") !== -1) {
21 |         var qs = referrer.substr(referrer.indexOf('?') + 1);
22 |         var qs_noanchor = qs.split('#')[0];
23 |         var qsa = qs_noanchor.split('&');
24 |         var keyword = "";
25 |         // Scan every key=value pair; a later "q" pair overrides an earlier one.
26 |         for (var i = 0; i < qsa.length; i++) {
27 |           var currentParam = qsa[i].split('=');
28 |           // Ignore pairs that do not split into exactly a key and a value.
29 |           if (currentParam.length !== 2) {
30 |             continue;
31 |           }
32 |           // "+" is rewritten to "%20" so that it decodes to a space.
33 |           if (currentParam[0] == paramKey) {
34 |             keyword = decodeURIComponent(currentParam[1].replace(/\+/g, "%20"));
35 |           }
36 |         }
37 |         // Clear earlier marks, then mark the keyword from unmark's "done" callback.
38 |         if (keyword !== "") {
39 |           $(".contents").unmark({
40 |             done: function() {
41 |               $(".contents").mark(keyword);
42 |             }
43 |           });
44 |         }
45 |       }
46 |     };
47 | 
48 |     mark();
49 |   });
50 | });
51 | 
52 | /* Search term highlighting ------------------------------*/
53 | 
54 | function matchedWords(hit) {
55 |   var words = [];
56 | 
57 |   var hierarchy = hit._highlightResult.hierarchy;
58 |   // loop to fetch from lvl0, lvl1, etc.
59 |   for (var idx in hierarchy) {
60 |     words = words.concat(hierarchy[idx].matchedWords);
61 |   }
62 | 
63 |   var content = hit._highlightResult.content;
64 |   if (content) {
65 |     words = words.concat(content.matchedWords);
66 |   }
67 | 
68 |   // return unique words
69 |   var words_uniq = [...new Set(words)];
70 |   return words_uniq;
71 | }
72 | 
73 | function updateHitURL(hit) {
74 | 
75 |   var words = matchedWords(hit);
76 |   var url = "";
77 | 
78 |   if (hit.anchor) {
79 |     url = hit.url_without_anchor + '?q=' + escape(words.join(" ")) + '#' + hit.anchor;
80 |   } else {
81 |     url = hit.url + '?q=' + escape(words.join(" "));
82 |   }
83 | 
84 |   return url;
85 | }
86 | 


--------------------------------------------------------------------------------
/docs/index.html:
--------------------------------------------------------------------------------
  1 | <!DOCTYPE html>
  2 | <!-- Generated by pkgdown: do not edit by hand --><html lang="en">
  3 | <head>
  4 | <meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
  5 | <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | <title>Tidy Verbs for Dealing with Genomic Data Frames • tidygenomics</title>
  9 | <!-- jquery --><script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script><!-- Bootstrap --><link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous">
 10 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script><!-- Font Awesome icons --><link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous">
 11 | <!-- clipboard.js --><script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script><!-- sticky kit --><script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script><!-- pkgdown --><link href="pkgdown.css" rel="stylesheet">
 12 | <script src="pkgdown.js"></script><meta property="og:title" content="Tidy Verbs for Dealing with Genomic Data Frames">
 13 | <meta property="og:description" content="Handle genomic data within data frames just as you would with 'GRanges'.
 14 |     This package provides methods to deal with genomic intervals the &quot;tidy-way&quot;, which makes
 15 |     it simpler to integrate them into the general data munging process. The API is inspired by the
 16 |     popular 'bedtools' and the genome_join() method from the 'fuzzyjoin' package.">
 17 | <meta name="twitter:card" content="summary">
 18 | <!-- mathjax --><script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script><script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script><!--[if lt IE 9]>
 19 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 20 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 21 | <![endif]-->
 22 | </head>
 23 | <body>
 24 |     <div class="container template-home">
 25 |       <header><div class="navbar navbar-default navbar-fixed-top" role="navigation">
 26 |   <div class="container">
 27 |     <div class="navbar-header">
 28 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 29 |         <span class="sr-only">Toggle navigation</span>
 30 |         <span class="icon-bar"></span>
 31 |         <span class="icon-bar"></span>
 32 |         <span class="icon-bar"></span>
 33 |       </button>
 34 |       <span class="navbar-brand">
 35 |         <a class="navbar-link" href="index.html">tidygenomics</a>
 36 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 37 |       </span>
 38 |     </div>
 39 | 
 40 |     <div id="navbar" class="navbar-collapse collapse">
 41 |       <ul class="nav navbar-nav">
 42 | <li>
 43 |   <a href="index.html">
 44 |     <span class="fa fa-home fa-lg"></span>
 45 |      
 46 |   </a>
 47 | </li>
 48 | <li>
 49 |   <a href="reference/index.html">Reference</a>
 50 | </li>
 51 | <li class="dropdown">
 52 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 53 |     Articles
 54 |      
 55 |     <span class="caret"></span>
 56 |   </a>
 57 |   <ul class="dropdown-menu" role="menu">
 58 | <li>
 59 |       <a href="articles/intro.html">Tidy Genomics</a>
 60 |     </li>
 61 |   </ul>
 62 | </li>
 63 | <li>
 64 |   <a href="news/index.html">Changelog</a>
 65 | </li>
 66 |       </ul>
 67 | <ul class="nav navbar-nav navbar-right">
 68 | <li>
 69 |   <a href="https://github.com/const-ae/tidygenomics">
 70 |     <span class="fa fa-github fa-lg"></span>
 71 |      
 72 |   </a>
 73 | </li>
 74 |       </ul>
 75 | </div>
 76 | <!--/.nav-collapse -->
 77 |   </div>
 78 | <!--/.container -->
 79 | </div>
 80 | <!--/.navbar -->
 81 | 
 82 |       
 83 |       </header><div class="row">
 84 |   <div class="contents col-md-9">
 85 | <div id="tidygenomics" class="section level1">
 86 | <div class="page-header"><h1 class="hasAnchor">
 87 | <a href="#tidygenomics" class="anchor"></a>tidygenomics</h1></div>
 88 | 
 89 | <p>Tidy Verbs for Dealing with Genomic Data Frames</p>
 90 | <div id="description" class="section level2">
 91 | <h2 class="hasAnchor">
 92 | <a href="#description" class="anchor"></a>Description</h2>
 93 | <p>Handle genomic data within data frames just as you would with <code>GRanges</code>. This package provides methods to deal with genomic intervals the “tidy-way”, which makes it simpler to integrate them into the general data munging process. The API is inspired by the popular bedtools and the genome_join() method from the fuzzyjoin package.</p>
 94 | </div>
 95 | <div id="installation" class="section level2">
 96 | <h2 class="hasAnchor">
 97 | <a href="#installation" class="anchor"></a>Installation</h2>
 98 | <pre><code><a href="https://www.rdocumentation.org/packages/utils/topics/install.packages">install.packages("tidygenomics")
 99 | 
100 | # Or to get the latest development version
101 | devtools::install_github("const-ae/tidygenomics")</a></code></pre>
102 | </div>
103 | <div id="documentation" class="section level2">
104 | <h2 class="hasAnchor">
105 | <a href="#documentation" class="anchor"></a>Documentation</h2>
106 | <div id="genome_intersect" class="section level4">
107 | <h4 class="hasAnchor">
108 | <a href="#genome_intersect" class="anchor"></a>genome_intersect</h4>
109 | <p>Joins 2 data frames based on their genomic overlap. Unlike the <code>genome_join</code> function it updates the boundaries to reflect the overlap of the regions.</p>
110 | <p><img src="articles/resources/genome_intersect_docu.png" alt="genome_intersect" style="width: 100%;"></p>
111 | <pre class="{r}"><code>x1 &lt;- data.frame(id = 1:4, 
112 |                 chromosome = c("chr1", "chr1", "chr2", "chr2"),
113 |                 start = c(100, 200, 300, 400),
114 |                 end = c(150, 250, 350, 450))
115 | 
116 | x2 &lt;- data.frame(id = 1:4,
117 |                  chromosome = c("chr1", "chr2", "chr2", "chr1"),
118 |                  start = c(140, 210, 400, 300),
119 |                  end = c(160, 240, 415, 320))
120 | 
121 | genome_intersect(x1, x2, by=c("chromosome", "start", "end"), mode="both")</code></pre>
122 | <table class="table">
123 | <thead><tr class="header">
124 | <th align="right">id.x</th>
125 | <th align="left">chromosome</th>
126 | <th align="right">id.y</th>
127 | <th align="right">start</th>
128 | <th align="right">end</th>
129 | </tr></thead>
130 | <tbody>
131 | <tr class="odd">
132 | <td align="right">1</td>
133 | <td align="left">chr1</td>
134 | <td align="right">1</td>
135 | <td align="right">140</td>
136 | <td align="right">150</td>
137 | </tr>
138 | <tr class="even">
139 | <td align="right">4</td>
140 | <td align="left">chr2</td>
141 | <td align="right">3</td>
142 | <td align="right">400</td>
143 | <td align="right">415</td>
144 | </tr>
145 | </tbody>
146 | </table>
147 | </div>
148 | <div id="genome_subtract" class="section level4">
149 | <h4 class="hasAnchor">
150 | <a href="#genome_subtract" class="anchor"></a>genome_subtract</h4>
151 | <p>Subtracts one data frame from the other. This can be used to split the x data frame into smaller areas.</p>
152 | <p><img src="articles/resources/genome_subtract_docu.png" alt="genome_subtract" style="width: 100%;"></p>
153 | <pre class="{r}"><code>x1 &lt;- data.frame(id = 1:4,
154 |                 chromosome = c("chr1", "chr1", "chr2", "chr1"),
155 |                 start = c(100, 200, 300, 400),
156 |                 end = c(150, 250, 350, 450))
157 | 
158 | x2 &lt;- data.frame(id = 1:4,
159 |                 chromosome = c("chr1", "chr2", "chr1", "chr1"),
160 |                 start = c(120, 210, 300, 400),
161 |                 end = c(125, 240, 320, 415))
162 | 
163 | genome_subtract(x1, x2, by=c("chromosome", "start", "end"))</code></pre>
164 | <table class="table">
165 | <thead><tr class="header">
166 | <th align="right">id</th>
167 | <th align="left">chromosome</th>
168 | <th align="right">start</th>
169 | <th align="right">end</th>
170 | </tr></thead>
171 | <tbody>
172 | <tr class="odd">
173 | <td align="right">1</td>
174 | <td align="left">chr1</td>
175 | <td align="right">100</td>
176 | <td align="right">119</td>
177 | </tr>
178 | <tr class="even">
179 | <td align="right">1</td>
180 | <td align="left">chr1</td>
181 | <td align="right">126</td>
182 | <td align="right">150</td>
183 | </tr>
184 | <tr class="odd">
185 | <td align="right">2</td>
186 | <td align="left">chr1</td>
187 | <td align="right">200</td>
188 | <td align="right">250</td>
189 | </tr>
190 | <tr class="even">
191 | <td align="right">3</td>
192 | <td align="left">chr2</td>
193 | <td align="right">300</td>
194 | <td align="right">350</td>
195 | </tr>
196 | <tr class="odd">
197 | <td align="right">4</td>
198 | <td align="left">chr1</td>
199 | <td align="right">416</td>
200 | <td align="right">450</td>
201 | </tr>
202 | </tbody>
203 | </table>
204 | </div>
205 | <div id="genome_join_closest" class="section level4">
206 | <h4 class="hasAnchor">
207 | <a href="#genome_join_closest" class="anchor"></a>genome_join_closest</h4>
208 | <p>Joins 2 data frames based on their genomic location. If no exact overlap is found the next closest interval is used.</p>
209 | <p><img src="articles/resources/genome_join_closest_docu.png" alt="genome_join_closest" style="width: 100%;"></p>
210 | <pre class="{r}"><code>x1 &lt;- data_frame(id = 1:4, 
211 |                  chr = c("chr1", "chr1", "chr2", "chr3"),
212 |                  start = c(100, 200, 300, 400),
213 |                  end = c(150, 250, 350, 450))
214 | 
215 | x2 &lt;- data_frame(id = 1:4,
216 |                  chr = c("chr1", "chr1", "chr1", "chr2"),
217 |                  start = c(220, 210, 300, 400),
218 |                  end = c(225, 240, 320, 415))
219 | genome_join_closest(x1, x2, by=c("chr", "start", "end"), distance_column_name="distance", mode="left")</code></pre>
220 | <table class="table">
221 | <thead><tr class="header">
222 | <th align="right">id.x</th>
223 | <th align="left">chr.x</th>
224 | <th align="right">start.x</th>
225 | <th align="right">end.x</th>
226 | <th align="right">id.y</th>
227 | <th align="left">chr.y</th>
228 | <th align="right">start.y</th>
229 | <th align="right">end.y</th>
230 | <th align="right">distance</th>
231 | </tr></thead>
232 | <tbody>
233 | <tr class="odd">
234 | <td align="right">1</td>
235 | <td align="left">chr1</td>
236 | <td align="right">100</td>
237 | <td align="right">150</td>
238 | <td align="right">2</td>
239 | <td align="left">chr1</td>
240 | <td align="right">210</td>
241 | <td align="right">240</td>
242 | <td align="right">59</td>
243 | </tr>
244 | <tr class="even">
245 | <td align="right">2</td>
246 | <td align="left">chr1</td>
247 | <td align="right">200</td>
248 | <td align="right">250</td>
249 | <td align="right">1</td>
250 | <td align="left">chr1</td>
251 | <td align="right">220</td>
252 | <td align="right">225</td>
253 | <td align="right">0</td>
254 | </tr>
255 | <tr class="odd">
256 | <td align="right">2</td>
257 | <td align="left">chr1</td>
258 | <td align="right">200</td>
259 | <td align="right">250</td>
260 | <td align="right">2</td>
261 | <td align="left">chr1</td>
262 | <td align="right">210</td>
263 | <td align="right">240</td>
264 | <td align="right">0</td>
265 | </tr>
266 | <tr class="even">
267 | <td align="right">3</td>
268 | <td align="left">chr2</td>
269 | <td align="right">300</td>
270 | <td align="right">350</td>
271 | <td align="right">4</td>
272 | <td align="left">chr2</td>
273 | <td align="right">400</td>
274 | <td align="right">415</td>
275 | <td align="right">49</td>
276 | </tr>
277 | <tr class="odd">
278 | <td align="right">4</td>
279 | <td align="left">chr3</td>
280 | <td align="right">400</td>
281 | <td align="right">450</td>
282 | <td align="right">NA</td>
283 | <td align="left">NA</td>
284 | <td align="right">NA</td>
285 | <td align="right">NA</td>
286 | <td align="right">NA</td>
287 | </tr>
288 | </tbody>
289 | </table>
290 | </div>
291 | <div id="genome_cluster" class="section level4">
292 | <h4 class="hasAnchor">
293 | <a href="#genome_cluster" class="anchor"></a>genome_cluster</h4>
294 | <p>Add a new column with the cluster if 2 intervals are overlapping or are within the <code>max_distance</code>.</p>
295 | <p><img src="articles/resources/genome_cluster_docu.png" alt="genome_cluster" style="width: 100%;"></p>
296 | <pre class="{r}"><code>x1 &lt;- data.frame(id = 1:4, bla=letters[1:4],
297 |                 chromosome = c("chr1", "chr1", "chr2", "chr1"),
298 |                 start = c(100, 120, 300, 260),
299 |                 end = c(150, 250, 350, 450))
300 | genome_cluster(x1, by=c("chromosome", "start", "end"))</code></pre>
301 | <table class="table">
302 | <thead><tr class="header">
303 | <th align="right">id</th>
304 | <th align="left">bla</th>
305 | <th align="left">chromosome</th>
306 | <th align="right">start</th>
307 | <th align="right">end</th>
308 | <th align="right">cluster_id</th>
309 | </tr></thead>
310 | <tbody>
311 | <tr class="odd">
312 | <td align="right">1</td>
313 | <td align="left">a</td>
314 | <td align="left">chr1</td>
315 | <td align="right">100</td>
316 | <td align="right">150</td>
317 | <td align="right">0</td>
318 | </tr>
319 | <tr class="even">
320 | <td align="right">2</td>
321 | <td align="left">b</td>
322 | <td align="left">chr1</td>
323 | <td align="right">120</td>
324 | <td align="right">250</td>
325 | <td align="right">0</td>
326 | </tr>
327 | <tr class="odd">
328 | <td align="right">3</td>
329 | <td align="left">c</td>
330 | <td align="left">chr2</td>
331 | <td align="right">300</td>
332 | <td align="right">350</td>
333 | <td align="right">2</td>
334 | </tr>
335 | <tr class="even">
336 | <td align="right">4</td>
337 | <td align="left">d</td>
338 | <td align="left">chr1</td>
339 | <td align="right">260</td>
340 | <td align="right">450</td>
341 | <td align="right">1</td>
342 | </tr>
343 | </tbody>
344 | </table>
345 | <pre class="{r}"><code><a href="reference/genome_cluster.html">genome_cluster(x1, by=c("chromosome", "start", "end"), max_distance=10)</a></code></pre>
346 | <table class="table">
347 | <thead><tr class="header">
348 | <th align="right">id</th>
349 | <th align="left">bla</th>
350 | <th align="left">chromosome</th>
351 | <th align="right">start</th>
352 | <th align="right">end</th>
353 | <th align="right">cluster_id</th>
354 | </tr></thead>
355 | <tbody>
356 | <tr class="odd">
357 | <td align="right">1</td>
358 | <td align="left">a</td>
359 | <td align="left">chr1</td>
360 | <td align="right">100</td>
361 | <td align="right">150</td>
362 | <td align="right">0</td>
363 | </tr>
364 | <tr class="even">
365 | <td align="right">2</td>
366 | <td align="left">b</td>
367 | <td align="left">chr1</td>
368 | <td align="right">120</td>
369 | <td align="right">250</td>
370 | <td align="right">0</td>
371 | </tr>
372 | <tr class="odd">
373 | <td align="right">3</td>
374 | <td align="left">c</td>
375 | <td align="left">chr2</td>
376 | <td align="right">300</td>
377 | <td align="right">350</td>
378 | <td align="right">1</td>
379 | </tr>
380 | <tr class="even">
381 | <td align="right">4</td>
382 | <td align="left">d</td>
383 | <td align="left">chr1</td>
384 | <td align="right">260</td>
385 | <td align="right">450</td>
386 | <td align="right">0</td>
387 | </tr>
388 | </tbody>
389 | </table>
390 | </div>
391 | <div id="genome_complement" class="section level4">
392 | <h4 class="hasAnchor">
393 | <a href="#genome_complement" class="anchor"></a>genome_complement</h4>
394 | <p>Calculates the complement of a genomic region.</p>
395 | <p><img src="articles/resources/genome_complement_docu.png" alt="genome_complement" style="width: 100%;"></p>
396 | <pre class="{r}"><code>x1 &lt;- data.frame(id = 1:4,
397 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
398 |                  start = c(100, 200, 300, 400),
399 |                  end = c(150, 250, 350, 450))
400 | 
401 | genome_complement(x1, by=c("chromosome", "start", "end"))</code></pre>
402 | <table class="table">
403 | <thead><tr class="header">
404 | <th align="left">chromosome</th>
405 | <th align="right">start</th>
406 | <th align="right">end</th>
407 | </tr></thead>
408 | <tbody>
409 | <tr class="odd">
410 | <td align="left">chr1</td>
411 | <td align="right">1</td>
412 | <td align="right">99</td>
413 | </tr>
414 | <tr class="even">
415 | <td align="left">chr1</td>
416 | <td align="right">151</td>
417 | <td align="right">199</td>
418 | </tr>
419 | <tr class="odd">
420 | <td align="left">chr1</td>
421 | <td align="right">251</td>
422 | <td align="right">399</td>
423 | </tr>
424 | <tr class="even">
425 | <td align="left">chr2</td>
426 | <td align="right">1</td>
427 | <td align="right">299</td>
428 | </tr>
429 | </tbody>
430 | </table>
431 | </div>
432 | <div id="genome_join" class="section level4">
433 | <h4 class="hasAnchor">
434 | <a href="#genome_join" class="anchor"></a>genome_join</h4>
435 | <p>Classical join function based on the overlap of the interval. Implemented and maintained in the <a href="https://github.com/dgrtwo/fuzzyjoin">fuzzyjoin</a> package and documented here only for completeness.</p>
436 | <p><img src="articles/resources/genome_join_docu.png" alt="genome_join" style="width: 100%;"></p>
437 | <pre class="{r}"><code>x1 &lt;- data_frame(id = 1:4, 
438 |                  chr = c("chr1", "chr1", "chr2", "chr3"),
439 |                  start = c(100, 200, 300, 400),
440 |                  end = c(150, 250, 350, 450))
441 | 
442 | x2 &lt;- data_frame(id = 1:4,
443 |                  chr = c("chr1", "chr1", "chr1", "chr2"),
444 |                  start = c(220, 210, 300, 400),
445 |                  end = c(225, 240, 320, 415))
446 | fuzzyjoin::genome_join(x1, x2, by=c("chr", "start", "end"), mode="inner")</code></pre>
447 | <table class="table">
448 | <thead><tr class="header">
449 | <th align="right">id.x</th>
450 | <th align="left">chr.x</th>
451 | <th align="right">start.x</th>
452 | <th align="right">end.x</th>
453 | <th align="right">id.y</th>
454 | <th align="left">chr.y</th>
455 | <th align="right">start.y</th>
456 | <th align="right">end.y</th>
457 | </tr></thead>
458 | <tbody>
459 | <tr class="odd">
460 | <td align="right">2</td>
461 | <td align="left">chr1</td>
462 | <td align="right">200</td>
463 | <td align="right">250</td>
464 | <td align="right">1</td>
465 | <td align="left">chr1</td>
466 | <td align="right">220</td>
467 | <td align="right">225</td>
468 | </tr>
469 | <tr class="even">
470 | <td align="right">2</td>
471 | <td align="left">chr1</td>
472 | <td align="right">200</td>
473 | <td align="right">250</td>
474 | <td align="right">2</td>
475 | <td align="left">chr1</td>
476 | <td align="right">210</td>
477 | <td align="right">240</td>
478 | </tr>
479 | </tbody>
480 | </table>
481 | <pre class="{r}"><code><a href="https://www.rdocumentation.org/packages/fuzzyjoin/topics/genome_join">fuzzyjoin::genome_join(x1, x2, by=c("chr", "start", "end"), mode="left")</a></code></pre>
482 | <table class="table">
483 | <thead><tr class="header">
484 | <th align="right">id.x</th>
485 | <th align="left">chr.x</th>
486 | <th align="right">start.x</th>
487 | <th align="right">end.x</th>
488 | <th align="right">id.y</th>
489 | <th align="left">chr.y</th>
490 | <th align="right">start.y</th>
491 | <th align="right">end.y</th>
492 | </tr></thead>
493 | <tbody>
494 | <tr class="odd">
495 | <td align="right">1</td>
496 | <td align="left">chr1</td>
497 | <td align="right">100</td>
498 | <td align="right">150</td>
499 | <td align="right">NA</td>
500 | <td align="left">NA</td>
501 | <td align="right">NA</td>
502 | <td align="right">NA</td>
503 | </tr>
504 | <tr class="even">
505 | <td align="right">2</td>
506 | <td align="left">chr1</td>
507 | <td align="right">200</td>
508 | <td align="right">250</td>
509 | <td align="right">1</td>
510 | <td align="left">chr1</td>
511 | <td align="right">220</td>
512 | <td align="right">225</td>
513 | </tr>
514 | <tr class="odd">
515 | <td align="right">2</td>
516 | <td align="left">chr1</td>
517 | <td align="right">200</td>
518 | <td align="right">250</td>
519 | <td align="right">2</td>
520 | <td align="left">chr1</td>
521 | <td align="right">210</td>
522 | <td align="right">240</td>
523 | </tr>
524 | <tr class="even">
525 | <td align="right">3</td>
526 | <td align="left">chr2</td>
527 | <td align="right">300</td>
528 | <td align="right">350</td>
529 | <td align="right">NA</td>
530 | <td align="left">NA</td>
531 | <td align="right">NA</td>
532 | <td align="right">NA</td>
533 | </tr>
534 | <tr class="odd">
535 | <td align="right">4</td>
536 | <td align="left">chr3</td>
537 | <td align="right">400</td>
538 | <td align="right">450</td>
539 | <td align="right">NA</td>
540 | <td align="left">NA</td>
541 | <td align="right">NA</td>
542 | <td align="right">NA</td>
543 | </tr>
544 | </tbody>
545 | </table>
546 | <pre class="{r}"><code><a href="https://www.rdocumentation.org/packages/fuzzyjoin/topics/genome_join">fuzzyjoin::genome_join(x1, x2, by=c("chr", "start", "end"), mode="anti")</a></code></pre>
547 | <table class="table">
548 | <thead><tr class="header">
549 | <th align="right">id</th>
550 | <th align="left">chr</th>
551 | <th align="right">start</th>
552 | <th align="right">end</th>
553 | </tr></thead>
554 | <tbody>
555 | <tr class="odd">
556 | <td align="right">1</td>
557 | <td align="left">chr1</td>
558 | <td align="right">100</td>
559 | <td align="right">150</td>
560 | </tr>
561 | <tr class="even">
562 | <td align="right">3</td>
563 | <td align="left">chr2</td>
564 | <td align="right">300</td>
565 | <td align="right">350</td>
566 | </tr>
567 | <tr class="odd">
568 | <td align="right">4</td>
569 | <td align="left">chr3</td>
570 | <td align="right">400</td>
571 | <td align="right">450</td>
572 | </tr>
573 | </tbody>
574 | </table>
575 | </div>
576 | </div>
577 | <div id="inspiration" class="section level2">
578 | <h2 class="hasAnchor">
579 | <a href="#inspiration" class="anchor"></a>Inspiration</h2>
580 | <ul>
581 | <li><a href="http://tidyverse.org/">tidyverse</a></li>
582 | <li><a href="https://github.com/dgrtwo/fuzzyjoin">fuzzyjoin</a></li>
583 | <li><a href="http://bioconductor.org/packages/release/bioc/html/GenomicRanges.html">GenomicRanges</a></li>
584 | <li><a href="http://bedtools.readthedocs.io">bedtools</a></li>
585 | </ul>
586 | <p>If you have any additional questions or encounter issues, please raise them on the <a href="https://github.com/const-ae/tidygenomics">GitHub page</a>.</p>
587 | </div>
588 | </div>
589 |   </div>
590 | 
591 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
592 |     <div class="links">
593 | <h2>Links</h2>
594 | <ul class="list-unstyled">
595 | <li>Download from CRAN at <br><a href="https://cloud.r-project.org/package=tidygenomics">https://​cloud.r-project.org/​package=tidygenomics</a>
596 | </li>
597 | <li>Browse source code at <br><a href="https://github.com/const-ae/tidygenomics">https://​github.com/​const-ae/​tidygenomics</a>
598 | </li>
599 | </ul>
600 | </div>
601 | <div class="license">
602 | <h2>License</h2>
603 | <ul class="list-unstyled">
604 | <li><a href="https://www.r-project.org/Licenses/GPL-3">GPL-3</a></li>
605 | </ul>
606 | </div>
607 | <div class="developers">
608 | <h2>Developers</h2>
609 | <ul class="list-unstyled">
610 | <li>Constantin Ahlmann-Eltze <br><small class="roles"> Author, maintainer </small> <a href="https://orcid.org/0000-0002-3762-068X" target="orcid.widget"><img src="https://members.orcid.org/sites/default/files/vector_iD_icon.svg" class="orcid" alt="ORCID" height="16"></a> </li>
611 | <li><a href="authors.html">All authors...</a></li>
612 | </ul>
613 | </div>
614 | 
615 |   <div class="dev-status">
616 | <h2>Dev status</h2>
617 | <ul class="list-unstyled">
618 | <li><a href="https://cran.r-project.org/package=tidygenomics"><img src="https://www.r-pkg.org/badges/version/tidygenomics" alt="CRAN_Status_Badge"></a></li>
619 | </ul>
620 | </div>
621 | </div>
622 | </div>
623 | 
624 |       <footer><div class="copyright">
625 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
626 | </div>
627 | 
628 | <div class="pkgdown">
629 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
630 | </div>
631 |       </footer>
632 | </div>
633 | 
634 |   
635 | 
636 |   </body>
637 | </html>
638 | 


--------------------------------------------------------------------------------
/docs/link.svg:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <!-- Generator: Adobe Illustrator 19.2.1, SVG Export Plug-In . SVG Version: 6.00 Build 0)  -->
 3 | <svg version="1.1" id="Layer_1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" x="0px" y="0px"
 4 | 	 viewBox="0 0 20 20" style="enable-background:new 0 0 20 20;" xml:space="preserve">
 5 | <style type="text/css">
 6 | 	.st0{fill:#75AADB;}
 7 | </style>
 8 | <path class="st0" d="M4,11.3h1.3v1.3H4c-2,0-4-2.3-4-4.7s2.1-4.7,4-4.7h5.3c1.9,0,4,2.3,4,4.7c0,1.9-1.2,3.6-2.7,4.3v-1.5
 9 | 	C11.4,10.2,12,9.1,12,8c0-1.7-1.4-3.3-2.7-3.3H4C2.7,4.7,1.3,6.3,1.3,8S2.7,11.3,4,11.3z M16,7.3h-1.3v1.3H16c1.3,0,2.7,1.6,2.7,3.3
10 | 	s-1.4,3.3-2.7,3.3h-5.3C9.4,15.3,8,13.7,8,12c0-1.1,0.6-2.2,1.3-2.8V7.7C7.9,8.4,6.7,10.1,6.7,12c0,2.4,2.1,4.7,4,4.7H16
11 | 	c1.9,0,4-2.3,4-4.7S18,7.3,16,7.3z"/>
12 | </svg>
13 | 


--------------------------------------------------------------------------------
/docs/news/index.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Changelog • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="../pkgdown.css" rel="stylesheet">
 29 | <script src="../pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
 33 | <meta property="og:title" content="Changelog" />
 34 | 
 35 | 
 36 | 
 37 | <!-- mathjax -->
 38 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 39 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 40 | 
 41 | <!--[if lt IE 9]>
 42 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 43 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 44 | <![endif]-->
 45 | 
 46 | 
 47 |   </head>
 48 | 
 49 |   <body>
 50 |     <div class="container template-news">
 51 |       <header>
 52 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 53 |   <div class="container">
 54 |     <div class="navbar-header">
 55 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 56 |         <span class="sr-only">Toggle navigation</span>
 57 |         <span class="icon-bar"></span>
 58 |         <span class="icon-bar"></span>
 59 |         <span class="icon-bar"></span>
 60 |       </button>
 61 |       <span class="navbar-brand">
 62 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 63 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 64 |       </span>
 65 |     </div>
 66 | 
 67 |     <div id="navbar" class="navbar-collapse collapse">
 68 |       <ul class="nav navbar-nav">
 69 |         <li>
 70 |   <a href="../index.html">
 71 |     <span class="fa fa-home fa-lg"></span>
 72 |      
 73 |   </a>
 74 | </li>
 75 | <li>
 76 |   <a href="../reference/index.html">Reference</a>
 77 | </li>
 78 | <li class="dropdown">
 79 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 80 |     Articles
 81 |      
 82 |     <span class="caret"></span>
 83 |   </a>
 84 |   <ul class="dropdown-menu" role="menu">
 85 |     <li>
 86 |       <a href="../articles/intro.html">Tidy Genomics</a>
 87 |     </li>
 88 |   </ul>
 89 | </li>
 90 | <li>
 91 |   <a href="../news/index.html">Changelog</a>
 92 | </li>
 93 |       </ul>
 94 |       
 95 |       <ul class="nav navbar-nav navbar-right">
 96 |         <li>
 97 |   <a href="https://github.com/const-ae/tidygenomics">
 98 |     <span class="fa fa-github fa-lg"></span>
 99 |      
100 |   </a>
101 | </li>
102 |       </ul>
103 |       
104 |     </div><!--/.nav-collapse -->
105 |   </div><!--/.container -->
106 | </div><!--/.navbar -->
107 | 
108 |       
109 |       </header>
110 | 
111 | <div class="row">
112 |   <div class="col-md-9 contents">
113 |     <div class="page-header">
114 |       <h1>Changelog <small></small></h1>
115 |       <small>Source: <a href='https://github.com/const-ae/tidygenomics/blob/master/NEWS.md'><code>NEWS.md</code></a></small>
116 |     </div>
117 | 
118 |   </div>
119 | 
120 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
121 |     <div id="tocnav">
122 |       <h2>Contents</h2>
123 |       <ul class="nav nav-pills nav-stacked">
124 |       </ul>
125 |     </div>
126 |   </div>
127 | 
128 | </div>
129 | 
130 |       <footer>
131 |       <div class="copyright">
132 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
133 | </div>
134 | 
135 | <div class="pkgdown">
136 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
137 | </div>
138 |       </footer>
139 |    </div>
140 | 
141 |   
142 | 
143 |   </body>
144 | </html>
145 | 
146 | 


--------------------------------------------------------------------------------
/docs/pkgdown.css:
--------------------------------------------------------------------------------
  1 | /* Sticky footer */
  2 | 
  3 | /**
  4 |  * Basic idea: https://philipwalton.github.io/solved-by-flexbox/demos/sticky-footer/
  5 |  * Details: https://github.com/philipwalton/solved-by-flexbox/blob/master/assets/css/components/site.css
  6 |  *
  7 |  * .Site -> body > .container
  8 |  * .Site-content -> body > .container .row
  9 |  * .footer -> footer
 10 |  *
 11 |  * Key idea seems to be to ensure that .container and __all its parents__
 12 |  * have height set to 100%
 13 |  *
 14 |  */
 15 | 
 16 | html, body {
 17 |   height: 100%;
 18 | }
 19 | 
 20 | body > .container {
 21 |   display: flex;
 22 |   height: 100%;
 23 |   flex-direction: column;
 24 | 
 25 |   padding-top: 60px;
 26 | }
 27 | 
 28 | body > .container .row {
 29 |   flex: 1 0 auto;
 30 | }
 31 | 
 32 | footer {
 33 |   margin-top: 45px;
 34 |   padding: 35px 0 36px;
 35 |   border-top: 1px solid #e5e5e5;
 36 |   color: #666;
 37 |   display: flex;
 38 |   flex-shrink: 0;
 39 | }
 40 | footer p {
 41 |   margin-bottom: 0;
 42 | }
 43 | footer div {
 44 |   flex: 1;
 45 | }
 46 | footer .pkgdown {
 47 |   text-align: right;
 48 | }
 49 | footer p {
 50 |   margin-bottom: 0;
 51 | }
 52 | 
 53 | img.icon {
 54 |   float: right;
 55 | }
 56 | 
 57 | img {
 58 |   max-width: 100%;
 59 | }
 60 | 
 61 | /* Fix bug in bootstrap (only seen in firefox) */
 62 | summary {
 63 |   display: list-item;
 64 | }
 65 | 
 66 | /* Typographic tweaking ---------------------------------*/
 67 | 
 68 | .contents .page-header {
 69 |   margin-top: calc(-60px + 1em);
 70 | }
 71 | 
 72 | /* Section anchors ---------------------------------*/
 73 | 
 74 | a.anchor {
 75 |   margin-left: -30px;
 76 |   display:inline-block;
 77 |   width: 30px;
 78 |   height: 30px;
 79 |   visibility: hidden;
 80 | 
 81 |   background-image: url(./link.svg);
 82 |   background-repeat: no-repeat;
 83 |   background-size: 20px 20px;
 84 |   background-position: center center;
 85 | }
 86 | 
 87 | .hasAnchor:hover a.anchor {
 88 |   visibility: visible;
 89 | }
 90 | 
 91 | @media (max-width: 767px) {
 92 |   .hasAnchor:hover a.anchor {
 93 |     visibility: hidden;
 94 |   }
 95 | }
 96 | 
 97 | 
 98 | /* Fixes for fixed navbar --------------------------*/
 99 | 
100 | .contents h1, .contents h2, .contents h3, .contents h4 {
101 |   padding-top: 60px;
102 |   margin-top: -40px;
103 | }
104 | 
105 | /* Static header placement on mobile devices */
106 | @media (max-width: 767px) {
107 |   .navbar-fixed-top {
108 |     position: absolute;
109 |   }
110 |   .navbar {
111 |     padding: 0;
112 |   }
113 | }
114 | 
115 | 
116 | /* Sidebar --------------------------*/
117 | 
118 | #sidebar {
119 |   margin-top: 30px;
120 | }
121 | #sidebar h2 {
122 |   font-size: 1.5em;
123 |   margin-top: 1em;
124 | }
125 | 
126 | #sidebar h2:first-child {
127 |   margin-top: 0;
128 | }
129 | 
130 | #sidebar .list-unstyled li {
131 |   margin-bottom: 0.5em;
132 | }
133 | 
134 | .orcid {
135 |   height: 16px;
136 |   vertical-align: middle;
137 | }
138 | 
139 | /* Reference index & topics ----------------------------------------------- */
140 | 
141 | .ref-index th {font-weight: normal;}
142 | 
143 | .ref-index td {vertical-align: top;}
144 | .ref-index .icon {width: 40px;}
145 | .ref-index .alias {width: 40%;}
146 | .ref-index-icons .alias {width: calc(40% - 40px);}
147 | .ref-index .title {width: 60%;}
148 | 
149 | .ref-arguments th {text-align: right; padding-right: 10px;}
150 | .ref-arguments th, .ref-arguments td {vertical-align: top;}
151 | .ref-arguments .name {width: 20%;}
152 | .ref-arguments .desc {width: 80%;}
153 | 
154 | /* Nice scrolling for wide elements --------------------------------------- */
155 | 
156 | table {
157 |   display: block;
158 |   overflow: auto;
159 | }
160 | 
161 | /* Syntax highlighting ---------------------------------------------------- */
162 | 
163 | pre {
164 |   word-wrap: normal;
165 |   word-break: normal;
166 |   border: 1px solid #eee;
167 | }
168 | 
169 | pre, code {
170 |   background-color: #f8f8f8;
171 |   color: #333;
172 | }
173 | 
174 | pre code {
175 |   overflow: auto;
176 |   word-wrap: normal;
177 |   white-space: pre;
178 | }
179 | 
180 | pre .img {
181 |   margin: 5px 0;
182 | }
183 | 
184 | pre .img img {
185 |   background-color: #fff;
186 |   display: block;
187 |   height: auto;
188 | }
189 | 
190 | code a, pre a {
191 |   color: #375f84;
192 | }
193 | 
194 | a.sourceLine:hover {
195 |   text-decoration: none;
196 | }
197 | 
198 | .fl      {color: #1514b5;}
199 | .fu      {color: #000000;} /* function */
200 | .ch,.st  {color: #036a07;} /* string */
201 | .kw      {color: #264D66;} /* keyword */
202 | .co      {color: #888888;} /* comment */
203 | 
204 | .message { color: black;   font-weight: bolder;}
205 | .error   { color: orange;  font-weight: bolder;}
206 | .warning { color: #6A0366; font-weight: bolder;}
207 | 
208 | /* Clipboard --------------------------*/
209 | 
210 | .hasCopyButton {
211 |   position: relative;
212 | }
213 | 
214 | .btn-copy-ex {
215 |   position: absolute;
216 |   right: 0;
217 |   top: 0;
218 |   visibility: hidden;
219 | }
220 | 
221 | .hasCopyButton:hover button.btn-copy-ex {
222 |   visibility: visible;
223 | }
224 | 
225 | /* mark.js ----------------------------*/
226 | 
227 | mark {
228 |   background-color: rgba(255, 255, 51, 0.5);
229 |   border-bottom: 2px solid rgba(255, 153, 51, 0.3);
230 |   padding: 1px;
231 | }
232 | 
233 | /* vertical spacing after htmlwidgets */
234 | .html-widget {
235 |   margin-bottom: 10px;
236 | }
237 | 


--------------------------------------------------------------------------------
/docs/pkgdown.js:
--------------------------------------------------------------------------------
  1 | /* http://gregfranko.com/blog/jquery-best-practices/ */
  2 | (function($) {
  // On DOM ready: set up the sticky sidebar, scrollspy and tooltips, then mark
  // the navbar entry that best matches the current page as active.
  $(function() {

    // Switch the positioning of the sidebar's parent on sticky-kit's
    // bottom / unbottom events.
    var sidebar = $("#sidebar").stick_in_parent({offset_top: 40});
    sidebar
      .on('sticky_kit:bottom', function(e) {
        $(this).parent().css('position', 'static');
      })
      .on('sticky_kit:unbottom', function(e) {
        $(this).parent().css('position', 'relative');
      });

    $('body').scrollspy({target: '#sidebar', offset: 60});

    $('[data-toggle="tooltip"]').tooltip();

    // Look for the navbar link whose path shares the longest leading run of
    // pieces with the current location; on ties the earliest link is kept.
    var here = paths(location.pathname);
    var nav_links = $("#navbar ul li a");
    var best_len = -1;
    var best_idx = -1;
    for (var k = 0; k < nav_links.length; k++) {
      var link = nav_links[k];

      // Skip "#" placeholder links and external links
      if (link.getAttribute("href") === "#" || link.host !== location.host)
        continue;

      var shared = prefix_length(paths(link.pathname), here);
      if (shared > best_len) {
        best_len = shared;
        best_idx = k;
      }
    }

    // Add class to parent <li>, and enclosing <li> if in dropdown
    if (best_idx >= 0) {
      var winner = $(nav_links[best_idx]);
      winner.parent().addClass("active");
      winner.closest("li.dropdown").addClass("active");
    }
  });
 48 | 
 49 |   function paths(pathname) {
 50 |     var pieces = pathname.split("/");
 51 |     pieces.shift(); // always starts with /
 52 | 
 53 |     var end = pieces[pieces.length - 1];
 54 |     if (end === "index.html" || end === "")
 55 |       pieces.pop();
 56 |     return(pieces);
 57 |   }
 58 | 
 59 |   // Returns -1 if not found
 60 |   function prefix_length(needle, haystack) {
 61 |     if (needle.length > haystack.length)
 62 |       return(-1);
 63 | 
 64 |     // Special case for length-0 haystack, since for loop won't run
 65 |     if (haystack.length === 0) {
 66 |       return(needle.length === 0 ? 0 : -1);
 67 |     }
 68 | 
 69 |     for (var i = 0; i < haystack.length; i++) {
 70 |       if (needle[i] != haystack[i])
 71 |         return(i);
 72 |     }
 73 | 
 74 |     return(haystack.length);
 75 |   }
 76 | 
 77 |   /* Clipboard --------------------------*/
 78 | 
 79 |   function changeTooltipMessage(element, msg) {
 80 |     var tooltipOriginalTitle=element.getAttribute('data-original-title');
 81 |     element.setAttribute('data-original-title', msg);
 82 |     $(element).tooltip('show');
 83 |     element.setAttribute('data-original-title', tooltipOriginalTitle);
 84 |   }
 85 | 
 86 |   if(ClipboardJS.isSupported()) {
 87 |     $(document).ready(function() {
 88 |       var copyButton = "<button type='button' class='btn btn-primary btn-copy-ex' type = 'submit' title='Copy to clipboard' aria-label='Copy to clipboard' data-toggle='tooltip' data-placement='left auto' data-trigger='hover' data-clipboard-copy><i class='fa fa-copy'></i></button>";
 89 | 
 90 |       $(".examples, div.sourceCode").addClass("hasCopyButton");
 91 | 
 92 |       // Insert copy buttons:
 93 |       $(copyButton).prependTo(".hasCopyButton");
 94 | 
 95 |       // Initialize tooltips:
 96 |       $('.btn-copy-ex').tooltip({container: 'body'});
 97 | 
 98 |       // Initialize clipboard:
 99 |       var clipboardBtnCopies = new ClipboardJS('[data-clipboard-copy]', {
100 |         text: function(trigger) {
101 |           return trigger.parentNode.textContent;
102 |         }
103 |       });
104 | 
105 |       clipboardBtnCopies.on('success', function(e) {
106 |         changeTooltipMessage(e.trigger, 'Copied!');
107 |         e.clearSelection();
108 |       });
109 | 
110 |       clipboardBtnCopies.on('error', function() {
111 |         changeTooltipMessage(e.trigger,'Press Ctrl+C or Command+C to copy');
112 |       });
113 |     });
114 |   }
115 | })(window.jQuery || window.$)
116 | 


--------------------------------------------------------------------------------
/docs/pkgdown.yml:
--------------------------------------------------------------------------------
1 | pandoc: 2.3.1
2 | pkgdown: 1.3.0
3 | pkgdown_sha: ~
4 | articles:
5 |   intro: intro.html
6 | 
7 | 


--------------------------------------------------------------------------------
/docs/reference/cluster_interval.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Cluster ranges which are implemented as 2 equal-length numeric vectors. — cluster_interval • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="../pkgdown.css" rel="stylesheet">
 29 | <script src="../pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
 33 | <meta property="og:title" content="Cluster ranges which are implemented as 2 equal-length numeric vectors. — cluster_interval" />
 34 | 
 35 | <meta property="og:description" content="Cluster ranges which are implemented as 2 equal-length numeric vectors." />
 36 | <meta name="twitter:card" content="summary" />
 37 | 
 38 | 
 39 | 
 40 | <!-- mathjax -->
 41 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 42 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 43 | 
 44 | <!--[if lt IE 9]>
 45 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 46 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 47 | <![endif]-->
 48 | 
 49 | 
 50 |   </head>
 51 | 
 52 |   <body>
 53 |     <div class="container template-reference-topic">
 54 |       <header>
 55 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 56 |   <div class="container">
 57 |     <div class="navbar-header">
 58 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 59 |         <span class="sr-only">Toggle navigation</span>
 60 |         <span class="icon-bar"></span>
 61 |         <span class="icon-bar"></span>
 62 |         <span class="icon-bar"></span>
 63 |       </button>
 64 |       <span class="navbar-brand">
 65 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 66 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 67 |       </span>
 68 |     </div>
 69 | 
 70 |     <div id="navbar" class="navbar-collapse collapse">
 71 |       <ul class="nav navbar-nav">
 72 |         <li>
 73 |   <a href="../index.html">
 74 |     <span class="fa fa-home fa-lg"></span>
 75 |      
 76 |   </a>
 77 | </li>
 78 | <li>
 79 |   <a href="../reference/index.html">Reference</a>
 80 | </li>
 81 | <li class="dropdown">
 82 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 83 |     Articles
 84 |      
 85 |     <span class="caret"></span>
 86 |   </a>
 87 |   <ul class="dropdown-menu" role="menu">
 88 |     <li>
 89 |       <a href="../articles/intro.html">Tidy Genomics</a>
 90 |     </li>
 91 |   </ul>
 92 | </li>
 93 | <li>
 94 |   <a href="../news/index.html">Changelog</a>
 95 | </li>
 96 |       </ul>
 97 |       
 98 |       <ul class="nav navbar-nav navbar-right">
 99 |         <li>
100 |   <a href="https://github.com/const-ae/tidygenomics">
101 |     <span class="fa fa-github fa-lg"></span>
102 |      
103 |   </a>
104 | </li>
105 |       </ul>
106 |       
107 |     </div><!--/.nav-collapse -->
108 |   </div><!--/.container -->
109 | </div><!--/.navbar -->
110 | 
111 |       
112 |       </header>
113 | 
114 | <div class="row">
115 |   <div class="col-md-9 contents">
116 |     <div class="page-header">
117 |     <h1>Cluster ranges which are implemented as 2 equal-length numeric vectors.</h1>
118 |     <small class="dont-index">Source: <a href='https://github.com/const-ae/tidygenomics/blob/master/R/RcppExports.R'><code>R/RcppExports.R</code></a></small>
119 |     <div class="hidden name"><code>cluster_interval.Rd</code></div>
120 |     </div>
121 | 
122 |     <div class="ref-description">
123 |     
124 |     <p>Cluster ranges which are implemented as 2 equal-length numeric vectors.</p>
125 |     
126 |     </div>
127 | 
128 |     <pre class="usage"><span class='fu'>cluster_interval</span>(<span class='no'>starts</span>, <span class='no'>ends</span>, <span class='kw'>max_distance</span> <span class='kw'>=</span> <span class='fl'>0L</span>)</pre>
129 |     
130 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a>Arguments</h2>
131 |     <table class="ref-arguments">
132 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
133 |     <tr>
134 |       <th>starts</th>
135 |       <td><p>A numeric vector that defines the starts of each interval</p></td>
136 |     </tr>
137 |     <tr>
138 |       <th>ends</th>
139 |       <td><p>A numeric vector that defines the ends of each interval</p></td>
140 |     </tr>
141 |     <tr>
142 |       <th>max_distance</th>
143 |       <td><p>The maximum distance up to which intervals are still considered to be
144 | the same cluster. Default: 0.</p></td>
145 |     </tr>
146 |     </table>
147 |     
148 | 
149 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
150 |     <pre class="examples"><div class='input'><span class='no'>starts</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>50</span>, <span class='fl'>100</span>, <span class='fl'>120</span>)
151 | <span class='no'>ends</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>75</span>, <span class='fl'>130</span>, <span class='fl'>150</span>)
152 | <span class='no'>j</span> <span class='kw'>&lt;-</span> <span class='fu'>cluster_interval</span>(<span class='no'>starts</span>, <span class='no'>ends</span>)
153 | <span class='no'>j</span> <span class='kw'>==</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>0</span>,<span class='fl'>1</span>,<span class='fl'>1</span>)</div><div class='output co'>#&gt; [1] TRUE TRUE TRUE</div></pre>
154 |   </div>
155 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
156 |     <h2>Contents</h2>
157 |     <ul class="nav nav-pills nav-stacked">
158 |       <li><a href="#arguments">Arguments</a></li>
159 |             
160 |       <li><a href="#examples">Examples</a></li>
161 |     </ul>
162 | 
163 |   </div>
164 | </div>
165 | 
166 |       <footer>
167 |       <div class="copyright">
168 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
169 | </div>
170 | 
171 | <div class="pkgdown">
172 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
173 | </div>
174 |       </footer>
175 |    </div>
176 | 
177 |   
178 | 
179 |   </body>
180 | </html>
181 | 
182 | 


--------------------------------------------------------------------------------
/docs/reference/genome_cluster.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
<title>Cluster intervals in a data frame based on chromosome, start and end. — genome_cluster • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="../pkgdown.css" rel="stylesheet">
 29 | <script src="../pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
<meta property="og:title" content="Cluster intervals in a data frame based on chromosome, start and end. — genome_cluster" />

<meta property="og:description" content="Cluster intervals in a data frame based on chromosome, start and end." />
 36 | <meta name="twitter:card" content="summary" />
 37 | 
 38 | 
 39 | 
 40 | <!-- mathjax -->
 41 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 42 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 43 | 
 44 | <!--[if lt IE 9]>
 45 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 46 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 47 | <![endif]-->
 48 | 
 49 | 
 50 |   </head>
 51 | 
 52 |   <body>
 53 |     <div class="container template-reference-topic">
 54 |       <header>
 55 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 56 |   <div class="container">
 57 |     <div class="navbar-header">
 58 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 59 |         <span class="sr-only">Toggle navigation</span>
 60 |         <span class="icon-bar"></span>
 61 |         <span class="icon-bar"></span>
 62 |         <span class="icon-bar"></span>
 63 |       </button>
 64 |       <span class="navbar-brand">
 65 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 66 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 67 |       </span>
 68 |     </div>
 69 | 
 70 |     <div id="navbar" class="navbar-collapse collapse">
 71 |       <ul class="nav navbar-nav">
 72 |         <li>
 73 |   <a href="../index.html">
 74 |     <span class="fa fa-home fa-lg"></span>
 75 |      
 76 |   </a>
 77 | </li>
 78 | <li>
 79 |   <a href="../reference/index.html">Reference</a>
 80 | </li>
 81 | <li class="dropdown">
 82 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 83 |     Articles
 84 |      
 85 |     <span class="caret"></span>
 86 |   </a>
 87 |   <ul class="dropdown-menu" role="menu">
 88 |     <li>
 89 |       <a href="../articles/intro.html">Tidy Genomics</a>
 90 |     </li>
 91 |   </ul>
 92 | </li>
 93 | <li>
 94 |   <a href="../news/index.html">Changelog</a>
 95 | </li>
 96 |       </ul>
 97 |       
 98 |       <ul class="nav navbar-nav navbar-right">
 99 |         <li>
100 |   <a href="https://github.com/const-ae/tidygenomics">
101 |     <span class="fa fa-github fa-lg"></span>
102 |      
103 |   </a>
104 | </li>
105 |       </ul>
106 |       
107 |     </div><!--/.nav-collapse -->
108 |   </div><!--/.container -->
109 | </div><!--/.navbar -->
110 | 
111 |       
112 |       </header>
113 | 
114 | <div class="row">
115 |   <div class="col-md-9 contents">
116 |     <div class="page-header">
    <h1>Cluster intervals in a data frame based on chromosome, start and end.</h1>
118 |     <small class="dont-index">Source: <a href='https://github.com/const-ae/tidygenomics/blob/master/R/cluster.R'><code>R/cluster.R</code></a></small>
119 |     <div class="hidden name"><code>genome_cluster.Rd</code></div>
120 |     </div>
121 | 
122 |     <div class="ref-description">
123 |     
    <p>Cluster intervals in a data frame based on chromosome, start and end.</p>
125 |     
126 |     </div>
127 | 
128 |     <pre class="usage"><span class='fu'>genome_cluster</span>(<span class='no'>x</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='kw'>max_distance</span> <span class='kw'>=</span> <span class='fl'>0</span>,
129 |   <span class='kw'>cluster_column_name</span> <span class='kw'>=</span> <span class='st'>"cluster_id"</span>)</pre>
130 |     
131 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a>Arguments</h2>
132 |     <table class="ref-arguments">
133 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
134 |     <tr>
135 |       <th>x</th>
136 |       <td><p>A dataframe.</p></td>
137 |     </tr>
138 |     <tr>
139 |       <th>by</th>
140 |       <td><p>A character vector with 3 entries which are the chromosome, start and end column.
141 | For example: <code>by=c("chr", "start", "end")</code></p></td>
142 |     </tr>
143 |     <tr>
144 |       <th>max_distance</th>
145 |       <td><p>The maximum distance up to which intervals are still considered to be
146 | the same cluster. Default: 0.</p></td>
147 |     </tr>
148 |     <tr>
149 |       <th>cluster_column_name</th>
150 |       <td><p>A string that is used as the new column name</p></td>
151 |     </tr>
152 |     </table>
153 |     
154 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
155 | 
156 |     <p>The dataframe with the additional column of the cluster</p>
157 |     
158 | 
159 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
160 |     <pre class="examples"><div class='input'>
161 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='no'>dplyr</span>)</div><div class='output co'>#&gt; <span class='message'></span>
162 | #&gt; <span class='message'>Attaching package: ‘dplyr’</span></div><div class='output co'>#&gt; <span class='message'>The following object is masked from ‘package:testthat’:</span>
163 | #&gt; <span class='message'></span>
164 | #&gt; <span class='message'>    matches</span></div><div class='output co'>#&gt; <span class='message'>The following objects are masked from ‘package:stats’:</span>
165 | #&gt; <span class='message'></span>
166 | #&gt; <span class='message'>    filter, lag</span></div><div class='output co'>#&gt; <span class='message'>The following objects are masked from ‘package:base’:</span>
167 | #&gt; <span class='message'></span>
168 | #&gt; <span class='message'>    intersect, setdiff, setequal, union</span></div><div class='input'>
169 | <span class='no'>x1</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/data.frame'>data.frame</a></span>(<span class='kw'>id</span> <span class='kw'>=</span> <span class='fl'>1</span>:<span class='fl'>4</span>, <span class='kw'>bla</span><span class='kw'>=</span><span class='no'>letters</span>[<span class='fl'>1</span>:<span class='fl'>4</span>],
170 |                  <span class='kw'>chromosome</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chr1"</span>, <span class='st'>"chr1"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr1"</span>),
171 |                  <span class='kw'>start</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>100</span>, <span class='fl'>120</span>, <span class='fl'>300</span>, <span class='fl'>260</span>),
172 |                  <span class='kw'>end</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>150</span>, <span class='fl'>250</span>, <span class='fl'>350</span>, <span class='fl'>450</span>))
173 | <span class='fu'>genome_cluster</span>(<span class='no'>x1</span>, <span class='kw'>by</span><span class='kw'>=</span><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chromosome"</span>, <span class='st'>"start"</span>, <span class='st'>"end"</span>))</div><div class='output co'>#&gt; <span style='color: #555555;'># A tibble: 4 x 6</span><span>
174 | #&gt;      id bla   chromosome start   end cluster_id
175 | #&gt;   </span><span style='color: #555555;font-style: italic;'>&lt;int&gt;</span><span> </span><span style='color: #555555;font-style: italic;'>&lt;fct&gt;</span><span> </span><span style='color: #555555;font-style: italic;'>&lt;fct&gt;</span><span>      </span><span style='color: #555555;font-style: italic;'>&lt;dbl&gt;</span><span> </span><span style='color: #555555;font-style: italic;'>&lt;dbl&gt;</span><span>      </span><span style='color: #555555;font-style: italic;'>&lt;dbl&gt;</span><span>
176 | #&gt; </span><span style='color: #555555;'>1</span><span>     1 a     chr1         100   150          0
177 | #&gt; </span><span style='color: #555555;'>2</span><span>     2 b     chr1         120   250          0
178 | #&gt; </span><span style='color: #555555;'>3</span><span>     3 c     chr2         300   350          2
179 | #&gt; </span><span style='color: #555555;'>4</span><span>     4 d     chr1         260   450          1</div><div class='input'><span class='fu'>genome_cluster</span>(<span class='no'>x1</span>, <span class='kw'>by</span><span class='kw'>=</span><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chromosome"</span>, <span class='st'>"start"</span>, <span class='st'>"end"</span>), <span class='kw'>max_distance</span><span class='kw'>=</span><span class='fl'>10</span>)</div><div class='output co'>#&gt; </span><span style='color: #555555;'># A tibble: 4 x 6</span><span>
180 | #&gt;      id bla   chromosome start   end cluster_id
181 | #&gt;   </span><span style='color: #555555;font-style: italic;'>&lt;int&gt;</span><span> </span><span style='color: #555555;font-style: italic;'>&lt;fct&gt;</span><span> </span><span style='color: #555555;font-style: italic;'>&lt;fct&gt;</span><span>      </span><span style='color: #555555;font-style: italic;'>&lt;dbl&gt;</span><span> </span><span style='color: #555555;font-style: italic;'>&lt;dbl&gt;</span><span>      </span><span style='color: #555555;font-style: italic;'>&lt;dbl&gt;</span><span>
182 | #&gt; </span><span style='color: #555555;'>1</span><span>     1 a     chr1         100   150          0
183 | #&gt; </span><span style='color: #555555;'>2</span><span>     2 b     chr1         120   250          0
184 | #&gt; </span><span style='color: #555555;'>3</span><span>     3 c     chr2         300   350          1
185 | #&gt; </span><span style='color: #555555;'>4</span><span>     4 d     chr1         260   450          0</div></span></pre>
186 |   </div>
187 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
188 |     <h2>Contents</h2>
189 |     <ul class="nav nav-pills nav-stacked">
190 |       <li><a href="#arguments">Arguments</a></li>
191 |       
192 |       <li><a href="#value">Value</a></li>
193 |       
194 |       <li><a href="#examples">Examples</a></li>
195 |     </ul>
196 | 
197 |   </div>
198 | </div>
199 | 
200 |       <footer>
201 |       <div class="copyright">
202 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
203 | </div>
204 | 
205 | <div class="pkgdown">
206 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
207 | </div>
208 |       </footer>
209 |    </div>
210 | 
211 |   
212 | 
213 |   </body>
214 | </html>
215 | 
216 | 


--------------------------------------------------------------------------------
/docs/reference/genome_complement.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Calculates the complement to the intervals covered by the intervals in
 10 | a data frame. It can optionally take a chromosome_size data frame
 11 | that contains 2 or 3 columns, the first the names of chromosome and in case
 12 | there are 2 columns the size or first the start index and lastly the end index
 13 | on the chromosome. — genome_complement • tidygenomics</title>
 14 | 
 15 | <!-- jquery -->
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 17 | <!-- Bootstrap -->
 18 | 
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 20 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 21 | 
 22 | <!-- Font Awesome icons -->
 23 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 24 | 
 25 | <!-- clipboard.js -->
 26 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 27 | 
 28 | <!-- sticky kit -->
 29 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 30 | 
 31 | <!-- pkgdown -->
 32 | <link href="../pkgdown.css" rel="stylesheet">
 33 | <script src="../pkgdown.js"></script>
 34 | 
 35 | 
 36 | 
 37 | <meta property="og:title" content="Calculates the complement to the intervals covered by the intervals in
 38 | a data frame. It can optionally take a chromosome_size data frame
 39 | that contains 2 or 3 columns, the first the names of chromosome and in case
 40 | there are 2 columns the size or first the start index and lastly the end index
 41 | on the chromosome. — genome_complement" />
 42 | 
 43 | <meta property="og:description" content="Calculates the complement to the intervals covered by the intervals in
 44 | a data frame. It can optionally take a chromosome_size data frame
 45 | that contains 2 or 3 columns, the first the names of chromosome and in case
 46 | there are 2 columns the size or first the start index and lastly the end index
 47 | on the chromosome." />
 48 | <meta name="twitter:card" content="summary" />
 49 | 
 50 | 
 51 | 
 52 | <!-- mathjax -->
 53 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 54 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 55 | 
 56 | <!--[if lt IE 9]>
 57 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 58 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 59 | <![endif]-->
 60 | 
 61 | 
 62 |   </head>
 63 | 
 64 |   <body>
 65 |     <div class="container template-reference-topic">
 66 |       <header>
 67 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 68 |   <div class="container">
 69 |     <div class="navbar-header">
 70 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 71 |         <span class="sr-only">Toggle navigation</span>
 72 |         <span class="icon-bar"></span>
 73 |         <span class="icon-bar"></span>
 74 |         <span class="icon-bar"></span>
 75 |       </button>
 76 |       <span class="navbar-brand">
 77 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 78 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 79 |       </span>
 80 |     </div>
 81 | 
 82 |     <div id="navbar" class="navbar-collapse collapse">
 83 |       <ul class="nav navbar-nav">
 84 |         <li>
 85 |   <a href="../index.html">
 86 |     <span class="fa fa-home fa-lg"></span>
 87 |      
 88 |   </a>
 89 | </li>
 90 | <li>
 91 |   <a href="../reference/index.html">Reference</a>
 92 | </li>
 93 | <li class="dropdown">
 94 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 95 |     Articles
 96 |      
 97 |     <span class="caret"></span>
 98 |   </a>
 99 |   <ul class="dropdown-menu" role="menu">
100 |     <li>
101 |       <a href="../articles/intro.html">Tidy Genomics</a>
102 |     </li>
103 |   </ul>
104 | </li>
105 | <li>
106 |   <a href="../news/index.html">Changelog</a>
107 | </li>
108 |       </ul>
109 |       
110 |       <ul class="nav navbar-nav navbar-right">
111 |         <li>
112 |   <a href="https://github.com/const-ae/tidygenomics">
113 |     <span class="fa fa-github fa-lg"></span>
114 |      
115 |   </a>
116 | </li>
117 |       </ul>
118 |       
119 |     </div><!--/.nav-collapse -->
120 |   </div><!--/.container -->
121 | </div><!--/.navbar -->
122 | 
123 |       
124 |       </header>
125 | 
126 | <div class="row">
127 |   <div class="col-md-9 contents">
128 |     <div class="page-header">
129 |     <h1>Calculates the complement to the intervals covered by the intervals in
130 | a data frame. It can optionally take a <code>chromosome_size</code> data frame
131 | that contains 2 or 3 columns, the first the names of chromosome and in case
132 | there are 2 columns the size or first the start index and lastly the end index
133 | on the chromosome.</h1>
134 |     <small class="dont-index">Source: <a href='https://github.com/const-ae/tidygenomics/blob/master/R/complement.R'><code>R/complement.R</code></a></small>
135 |     <div class="hidden name"><code>genome_complement.Rd</code></div>
136 |     </div>
137 | 
138 |     <div class="ref-description">
139 |     
140 |     <p>Calculates the complement of the intervals covered by the intervals in
141 | a data frame. It can optionally take a <code>chromosome_size</code> data frame
142 | that contains 2 or 3 columns: the first column holds the chromosome names; with
143 | 2 columns the second holds the chromosome size, and with 3 columns the second
144 | and third hold the start and end index on the chromosome.</p>
145 |     
146 |     </div>
147 | 
148 |     <pre class="usage"><span class='fu'>genome_complement</span>(<span class='no'>x</span>, <span class='kw'>chromosome_size</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>)</pre>
149 |     
150 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a>Arguments</h2>
151 |     <table class="ref-arguments">
152 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
153 |     <tr>
154 |       <th>x</th>
155 |       <td><p>A data frame for which the complement is calculated</p></td>
156 |     </tr>
157 |     <tr>
158 |       <th>chromosome_size</th>
159 |       <td><p>A dataframe with at least 2 columns that contains
160 | first the chromosome name and then the size of that chromosome. Can be NULL
161 | in which case the largest value per chromosome from <code>x</code> is used.</p></td>
162 |     </tr>
163 |     <tr>
164 |       <th>by</th>
165 |       <td><p>A character vector with 3 entries which are the chromosome, start and end columns.
166 | For example: <code>by=c("chr", "start", "end")</code></p></td>
167 |     </tr>
168 |     </table>
169 |     
170 | 
171 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
172 |     <pre class="examples"><div class='input'>
173 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='no'>dplyr</span>)
174 | 
175 | <span class='no'>x1</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/data.frame'>data.frame</a></span>(<span class='kw'>id</span> <span class='kw'>=</span> <span class='fl'>1</span>:<span class='fl'>4</span>, <span class='kw'>bla</span><span class='kw'>=</span><span class='no'>letters</span>[<span class='fl'>1</span>:<span class='fl'>4</span>],
176 |                  <span class='kw'>chromosome</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chr1"</span>, <span class='st'>"chr1"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr1"</span>),
177 |                  <span class='kw'>start</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>100</span>, <span class='fl'>200</span>, <span class='fl'>300</span>, <span class='fl'>400</span>),
178 |                  <span class='kw'>end</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>150</span>, <span class='fl'>250</span>, <span class='fl'>350</span>, <span class='fl'>450</span>))
179 | 
180 | <span class='fu'>genome_complement</span>(<span class='no'>x1</span>, <span class='kw'>by</span><span class='kw'>=</span><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chromosome"</span>, <span class='st'>"start"</span>, <span class='st'>"end"</span>))</div><div class='output co'>#&gt; <span style='color: #555555;'># A tibble: 4 x 3</span><span>
181 | #&gt;   chromosome start   end
182 | #&gt;   </span><span style='color: #555555;font-style: italic;'>&lt;fct&gt;</span><span>      </span><span style='color: #555555;font-style: italic;'>&lt;int&gt;</span><span> </span><span style='color: #555555;font-style: italic;'>&lt;int&gt;</span><span>
183 | #&gt; </span><span style='color: #555555;'>1</span><span> chr1           1    99
184 | #&gt; </span><span style='color: #555555;'>2</span><span> chr1         151   199
185 | #&gt; </span><span style='color: #555555;'>3</span><span> chr1         251   399
186 | #&gt; </span><span style='color: #555555;'>4</span><span> chr2           1   299</div></span></pre>
187 |   </div>
188 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
189 |     <h2>Contents</h2>
190 |     <ul class="nav nav-pills nav-stacked">
191 |       <li><a href="#arguments">Arguments</a></li>
192 |             
193 |       <li><a href="#examples">Examples</a></li>
194 |     </ul>
195 | 
196 |   </div>
197 | </div>
198 | 
199 |       <footer>
200 |       <div class="copyright">
201 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
202 | </div>
203 | 
204 | <div class="pkgdown">
205 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
206 | </div>
207 |       </footer>
208 |    </div>
209 | 
210 |   
211 | 
212 |   </body>
213 | </html>
214 | 
215 | 


--------------------------------------------------------------------------------
/docs/reference/genome_intersect.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Intersect data frames based on chromosome, start and end. — genome_intersect • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="../pkgdown.css" rel="stylesheet">
 29 | <script src="../pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
 33 | <meta property="og:title" content="Intersect data frames based on chromosome, start and end. — genome_intersect" />
 34 | 
 35 | <meta property="og:description" content="Intersect data frames based on chromosome, start and end." />
 36 | <meta name="twitter:card" content="summary" />
 37 | 
 38 | 
 39 | 
 40 | <!-- mathjax -->
 41 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 42 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 43 | 
 44 | <!--[if lt IE 9]>
 45 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 46 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 47 | <![endif]-->
 48 | 
 49 | 
 50 |   </head>
 51 | 
 52 |   <body>
 53 |     <div class="container template-reference-topic">
 54 |       <header>
 55 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 56 |   <div class="container">
 57 |     <div class="navbar-header">
 58 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 59 |         <span class="sr-only">Toggle navigation</span>
 60 |         <span class="icon-bar"></span>
 61 |         <span class="icon-bar"></span>
 62 |         <span class="icon-bar"></span>
 63 |       </button>
 64 |       <span class="navbar-brand">
 65 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 66 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 67 |       </span>
 68 |     </div>
 69 | 
 70 |     <div id="navbar" class="navbar-collapse collapse">
 71 |       <ul class="nav navbar-nav">
 72 |         <li>
 73 |   <a href="../index.html">
 74 |     <span class="fa fa-home fa-lg"></span>
 75 |      
 76 |   </a>
 77 | </li>
 78 | <li>
 79 |   <a href="../reference/index.html">Reference</a>
 80 | </li>
 81 | <li class="dropdown">
 82 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 83 |     Articles
 84 |      
 85 |     <span class="caret"></span>
 86 |   </a>
 87 |   <ul class="dropdown-menu" role="menu">
 88 |     <li>
 89 |       <a href="../articles/intro.html">Tidy Genomics</a>
 90 |     </li>
 91 |   </ul>
 92 | </li>
 93 | <li>
 94 |   <a href="../news/index.html">Changelog</a>
 95 | </li>
 96 |       </ul>
 97 |       
 98 |       <ul class="nav navbar-nav navbar-right">
 99 |         <li>
100 |   <a href="https://github.com/const-ae/tidygenomics">
101 |     <span class="fa fa-github fa-lg"></span>
102 |      
103 |   </a>
104 | </li>
105 |       </ul>
106 |       
107 |     </div><!--/.nav-collapse -->
108 |   </div><!--/.container -->
109 | </div><!--/.navbar -->
110 | 
111 |       
112 |       </header>
113 | 
114 | <div class="row">
115 |   <div class="col-md-9 contents">
116 |     <div class="page-header">
117 |     <h1>Intersect data frames based on chromosome, start and end.</h1>
118 |     <small class="dont-index">Source: <a href='https://github.com/const-ae/tidygenomics/blob/master/R/intersect.R'><code>R/intersect.R</code></a></small>
119 |     <div class="hidden name"><code>genome_intersect.Rd</code></div>
120 |     </div>
121 | 
122 |     <div class="ref-description">
123 |     
124 |     <p>Intersect data frames based on chromosome, start and end.</p>
125 |     
126 |     </div>
127 | 
128 |     <pre class="usage"><span class='fu'>genome_intersect</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='kw'>mode</span> <span class='kw'>=</span> <span class='st'>"both"</span>)</pre>
129 |     
130 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a>Arguments</h2>
131 |     <table class="ref-arguments">
132 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
133 |     <tr>
134 |       <th>x</th>
135 |       <td><p>A dataframe.</p></td>
136 |     </tr>
137 |     <tr>
138 |       <th>y</th>
139 |       <td><p>A dataframe.</p></td>
140 |     </tr>
141 |     <tr>
142 |       <th>by</th>
143 |       <td><p>A character vector with 3 entries which are used to match the chromosome, start and end columns.
144 | For example: <code>by=c("Chromosome"="chr", "Start"="start", "End"="end")</code></p></td>
145 |     </tr>
146 |     <tr>
147 |       <th>mode</th>
148 |       <td><p>One of "both", "left", "right" or "anti".</p></td>
149 |     </tr>
150 |     </table>
151 |     
152 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
153 | 
154 |     <p>The intersected dataframe of <code>x</code> and <code>y</code> with the new boundaries.</p>
155 |     
156 | 
157 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
158 |     <pre class="examples"><div class='input'>
159 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='no'>dplyr</span>)
160 | 
161 | <span class='no'>x1</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/data.frame'>data.frame</a></span>(<span class='kw'>id</span> <span class='kw'>=</span> <span class='fl'>1</span>:<span class='fl'>4</span>, <span class='kw'>bla</span><span class='kw'>=</span><span class='no'>letters</span>[<span class='fl'>1</span>:<span class='fl'>4</span>],
162 |                  <span class='kw'>chromosome</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chr1"</span>, <span class='st'>"chr1"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr2"</span>),
163 |                  <span class='kw'>start</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>100</span>, <span class='fl'>200</span>, <span class='fl'>300</span>, <span class='fl'>400</span>),
164 |                  <span class='kw'>end</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>150</span>, <span class='fl'>250</span>, <span class='fl'>350</span>, <span class='fl'>450</span>))
165 | 
166 | <span class='no'>x2</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/data.frame'>data.frame</a></span>(<span class='kw'>id</span> <span class='kw'>=</span> <span class='fl'>1</span>:<span class='fl'>4</span>, <span class='kw'>BLA</span><span class='kw'>=</span><span class='no'>LETTERS</span>[<span class='fl'>1</span>:<span class='fl'>4</span>],
167 |                  <span class='kw'>chromosome</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chr1"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr1"</span>),
168 |                  <span class='kw'>start</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>140</span>, <span class='fl'>210</span>, <span class='fl'>400</span>, <span class='fl'>300</span>),
169 |                  <span class='kw'>end</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>160</span>, <span class='fl'>240</span>, <span class='fl'>415</span>, <span class='fl'>320</span>))
170 | <span class='no'>j</span> <span class='kw'>&lt;-</span> <span class='fu'>genome_intersect</span>(<span class='no'>x1</span>, <span class='no'>x2</span>, <span class='kw'>by</span><span class='kw'>=</span><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chromosome"</span>, <span class='st'>"start"</span>, <span class='st'>"end"</span>), <span class='kw'>mode</span><span class='kw'>=</span><span class='st'>"both"</span>)
171 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/print'>print</a></span>(<span class='no'>j</span>)</div><div class='output co'>#&gt;   id.x bla chromosome id.y BLA start end
172 | #&gt; 1    1   a       chr1    1   A   140 150
173 | #&gt; 2    4   d       chr2    3   C   400 415</div><div class='input'>
174 | 
175 | 
176 | </div></pre>
177 |   </div>
178 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
179 |     <h2>Contents</h2>
180 |     <ul class="nav nav-pills nav-stacked">
181 |       <li><a href="#arguments">Arguments</a></li>
182 |       
183 |       <li><a href="#value">Value</a></li>
184 |       
185 |       <li><a href="#examples">Examples</a></li>
186 |     </ul>
187 | 
188 |   </div>
189 | </div>
190 | 
191 |       <footer>
192 |       <div class="copyright">
193 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
194 | </div>
195 | 
196 | <div class="pkgdown">
197 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
198 | </div>
199 |       </footer>
200 |    </div>
201 | 
202 |   
203 | 
204 |   </body>
205 | </html>
206 | 
207 | 


--------------------------------------------------------------------------------
/docs/reference/genome_join_closest.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Join intervals on chromosomes in data frames, to the closest partner — genome_join_closest • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="../pkgdown.css" rel="stylesheet">
 29 | <script src="../pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
 33 | <meta property="og:title" content="Join intervals on chromosomes in data frames, to the closest partner — genome_join_closest" />
 34 | 
 35 | <meta property="og:description" content="Join intervals on chromosomes in data frames, to the closest partner" />
 36 | <meta name="twitter:card" content="summary" />
 37 | 
 38 | 
 39 | 
 40 | <!-- mathjax -->
 41 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 42 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 43 | 
 44 | <!--[if lt IE 9]>
 45 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 46 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 47 | <![endif]-->
 48 | 
 49 | 
 50 |   </head>
 51 | 
 52 |   <body>
 53 |     <div class="container template-reference-topic">
 54 |       <header>
 55 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 56 |   <div class="container">
 57 |     <div class="navbar-header">
 58 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 59 |         <span class="sr-only">Toggle navigation</span>
 60 |         <span class="icon-bar"></span>
 61 |         <span class="icon-bar"></span>
 62 |         <span class="icon-bar"></span>
 63 |       </button>
 64 |       <span class="navbar-brand">
 65 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 66 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 67 |       </span>
 68 |     </div>
 69 | 
 70 |     <div id="navbar" class="navbar-collapse collapse">
 71 |       <ul class="nav navbar-nav">
 72 |         <li>
 73 |   <a href="../index.html">
 74 |     <span class="fa fa-home fa-lg"></span>
 75 |      
 76 |   </a>
 77 | </li>
 78 | <li>
 79 |   <a href="../reference/index.html">Reference</a>
 80 | </li>
 81 | <li class="dropdown">
 82 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 83 |     Articles
 84 |      
 85 |     <span class="caret"></span>
 86 |   </a>
 87 |   <ul class="dropdown-menu" role="menu">
 88 |     <li>
 89 |       <a href="../articles/intro.html">Tidy Genomics</a>
 90 |     </li>
 91 |   </ul>
 92 | </li>
 93 | <li>
 94 |   <a href="../news/index.html">Changelog</a>
 95 | </li>
 96 |       </ul>
 97 |       
 98 |       <ul class="nav navbar-nav navbar-right">
 99 |         <li>
100 |   <a href="https://github.com/const-ae/tidygenomics">
101 |     <span class="fa fa-github fa-lg"></span>
102 |      
103 |   </a>
104 | </li>
105 |       </ul>
106 |       
107 |     </div><!--/.nav-collapse -->
108 |   </div><!--/.container -->
109 | </div><!--/.navbar -->
110 | 
111 |       
112 |       </header>
113 | 
114 | <div class="row">
115 |   <div class="col-md-9 contents">
116 |     <div class="page-header">
117 |     <h1>Join intervals on chromosomes in data frames, to the closest partner</h1>
118 |     <small class="dont-index">Source: <a href='https://github.com/const-ae/tidygenomics/blob/master/R/join_closest.R'><code>R/join_closest.R</code></a></small>
119 |     <div class="hidden name"><code>genome_join_closest.Rd</code></div>
120 |     </div>
121 | 
122 |     <div class="ref-description">
123 |     
124 |     <p>Join intervals on chromosomes in data frames, to the closest partner</p>
125 |     
126 |     </div>
127 | 
128 |     <pre class="usage"><span class='fu'>genome_join_closest</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='kw'>mode</span> <span class='kw'>=</span> <span class='st'>"inner"</span>,
129 |   <span class='kw'>distance_column_name</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='kw'>max_distance</span> <span class='kw'>=</span> <span class='fl'>Inf</span>, <span class='kw'>select</span> <span class='kw'>=</span> <span class='st'>"all"</span>)
130 | 
131 | <span class='fu'>genome_inner_join_closest</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='no'>...</span>)
132 | 
133 | <span class='fu'>genome_left_join_closest</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='no'>...</span>)
134 | 
135 | <span class='fu'>genome_right_join_closest</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='no'>...</span>)
136 | 
137 | <span class='fu'>genome_full_join_closest</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='no'>...</span>)
138 | 
139 | <span class='fu'>genome_semi_join_closest</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='no'>...</span>)
140 | 
141 | <span class='fu'>genome_anti_join_closest</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>, <span class='no'>...</span>)</pre>
142 |     
143 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a>Arguments</h2>
144 |     <table class="ref-arguments">
145 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
146 |     <tr>
147 |       <th>x</th>
148 |       <td><p>A dataframe.</p></td>
149 |     </tr>
150 |     <tr>
151 |       <th>y</th>
152 |       <td><p>A dataframe.</p></td>
153 |     </tr>
154 |     <tr>
155 |       <th>by</th>
156 |       <td><p>A character vector with 3 entries which are used to match the chromosome, start and end column.
157 | For example: <code>by=c("Chromosome"="chr", "Start"="start", "End"="end")</code></p></td>
158 |     </tr>
159 |     <tr>
160 |       <th>mode</th>
161 |       <td><p>One of "inner", "full", "left", "right", "semi" or "anti".</p></td>
162 |     </tr>
163 |     <tr>
164 |       <th>distance_column_name</th>
165 |       <td><p>A string that is used as the new column name with the distance.
166 | If <code>NULL</code> no new column is added.</p></td>
167 |     </tr>
168 |     <tr>
169 |       <th>max_distance</th>
170 |       <td><p>The maximum distance that is allowed to join 2 entries.</p></td>
171 |     </tr>
172 |     <tr>
173 |       <th>select</th>
174 |       <td><p>A string that is passed on to <code><a href='https://www.rdocumentation.org/packages/IRanges/topics/nearest-methods'>IRanges::distanceToNearest</a></code>. It can be either
175 | "all", which means that if multiple intervals have the same distance all of them are reported, or
176 | "arbitrary", which means that in that case one of them is chosen at random.</p></td>
177 |     </tr>
178 |     <tr>
179 |       <th>...</th>
180 |       <td><p>Additional arguments passed on to genome_join_closest.</p></td>
181 |     </tr>
182 |     </table>
183 |     
184 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
185 | 
186 |     <p>The joined dataframe of <code>x</code> and <code>y</code>.</p>
187 |     
188 | 
189 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
190 |     <pre class="examples"><div class='input'>
191 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='no'>dplyr</span>)
192 | 
193 | <span class='no'>x1</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/data.frame'>data.frame</a></span>(<span class='kw'>id</span> <span class='kw'>=</span> <span class='fl'>1</span>:<span class='fl'>4</span>, <span class='kw'>bla</span><span class='kw'>=</span><span class='no'>letters</span>[<span class='fl'>1</span>:<span class='fl'>4</span>],
194 |                  <span class='kw'>chromosome</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chr1"</span>, <span class='st'>"chr1"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr2"</span>),
195 |                  <span class='kw'>start</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>100</span>, <span class='fl'>200</span>, <span class='fl'>300</span>, <span class='fl'>400</span>),
196 |                  <span class='kw'>end</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>150</span>, <span class='fl'>250</span>, <span class='fl'>350</span>, <span class='fl'>450</span>))
197 | 
198 | <span class='no'>x2</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/data.frame'>data.frame</a></span>(<span class='kw'>id</span> <span class='kw'>=</span> <span class='fl'>1</span>:<span class='fl'>4</span>, <span class='kw'>BLA</span><span class='kw'>=</span><span class='no'>LETTERS</span>[<span class='fl'>1</span>:<span class='fl'>4</span>],
199 |                  <span class='kw'>chromosome</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chr1"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr1"</span>),
200 |                  <span class='kw'>start</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>140</span>, <span class='fl'>210</span>, <span class='fl'>400</span>, <span class='fl'>300</span>),
201 |                  <span class='kw'>end</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>160</span>, <span class='fl'>240</span>, <span class='fl'>415</span>, <span class='fl'>320</span>))
202 | <span class='no'>j</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='genome_intersect.html'>genome_intersect</a></span>(<span class='no'>x1</span>, <span class='no'>x2</span>, <span class='kw'>by</span><span class='kw'>=</span><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chromosome"</span>, <span class='st'>"start"</span>, <span class='st'>"end"</span>), <span class='kw'>mode</span><span class='kw'>=</span><span class='st'>"both"</span>)
203 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/print'>print</a></span>(<span class='no'>j</span>)</div><div class='output co'>#&gt;   id.x bla chromosome id.y BLA start end
204 | #&gt; 1    1   a       chr1    1   A   140 150
205 | #&gt; 2    4   d       chr2    3   C   400 415</div></pre>
206 |   </div>
207 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
208 |     <h2>Contents</h2>
209 |     <ul class="nav nav-pills nav-stacked">
210 |       <li><a href="#arguments">Arguments</a></li>
211 |       
212 |       <li><a href="#value">Value</a></li>
213 |       
214 |       <li><a href="#examples">Examples</a></li>
215 |     </ul>
216 | 
217 |   </div>
218 | </div>
219 | 
220 |       <footer>
221 |       <div class="copyright">
222 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
223 | </div>
224 | 
225 | <div class="pkgdown">
226 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
227 | </div>
228 |       </footer>
229 |    </div>
230 | 
231 |   
232 | 
233 |   </body>
234 | </html>
235 | 
236 | 


--------------------------------------------------------------------------------
/docs/reference/genome_subtract.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Subtract one data frame from another based on chromosome, start and end. — genome_subtract • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="../pkgdown.css" rel="stylesheet">
 29 | <script src="../pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
 33 | <meta property="og:title" content="Subtract one data frame from another based on chromosome, start and end. — genome_subtract" />
 34 | 
 35 | <meta property="og:description" content="Subtract one data frame from another based on chromosome, start and end." />
 36 | <meta name="twitter:card" content="summary" />
 37 | 
 38 | 
 39 | 
 40 | <!-- mathjax -->
 41 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 42 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 43 | 
 44 | <!--[if lt IE 9]>
 45 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 46 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 47 | <![endif]-->
 48 | 
 49 | 
 50 |   </head>
 51 | 
 52 |   <body>
 53 |     <div class="container template-reference-topic">
 54 |       <header>
 55 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 56 |   <div class="container">
 57 |     <div class="navbar-header">
 58 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 59 |         <span class="sr-only">Toggle navigation</span>
 60 |         <span class="icon-bar"></span>
 61 |         <span class="icon-bar"></span>
 62 |         <span class="icon-bar"></span>
 63 |       </button>
 64 |       <span class="navbar-brand">
 65 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 66 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 67 |       </span>
 68 |     </div>
 69 | 
 70 |     <div id="navbar" class="navbar-collapse collapse">
 71 |       <ul class="nav navbar-nav">
 72 |         <li>
 73 |   <a href="../index.html">
 74 |     <span class="fa fa-home fa-lg"></span>
 75 |      
 76 |   </a>
 77 | </li>
 78 | <li>
 79 |   <a href="../reference/index.html">Reference</a>
 80 | </li>
 81 | <li class="dropdown">
 82 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 83 |     Articles
 84 |      
 85 |     <span class="caret"></span>
 86 |   </a>
 87 |   <ul class="dropdown-menu" role="menu">
 88 |     <li>
 89 |       <a href="../articles/intro.html">Tidy Genomics</a>
 90 |     </li>
 91 |   </ul>
 92 | </li>
 93 | <li>
 94 |   <a href="../news/index.html">Changelog</a>
 95 | </li>
 96 |       </ul>
 97 |       
 98 |       <ul class="nav navbar-nav navbar-right">
 99 |         <li>
100 |   <a href="https://github.com/const-ae/tidygenomics">
101 |     <span class="fa fa-github fa-lg"></span>
102 |      
103 |   </a>
104 | </li>
105 |       </ul>
106 |       
107 |     </div><!--/.nav-collapse -->
108 |   </div><!--/.container -->
109 | </div><!--/.navbar -->
110 | 
111 |       
112 |       </header>
113 | 
114 | <div class="row">
115 |   <div class="col-md-9 contents">
116 |     <div class="page-header">
117 |     <h1>Subtract one data frame from another based on chromosome, start and end.</h1>
118 |     <small class="dont-index">Source: <a href='https://github.com/const-ae/tidygenomics/blob/master/R/subtract.R'><code>R/subtract.R</code></a></small>
119 |     <div class="hidden name"><code>genome_subtract.Rd</code></div>
120 |     </div>
121 | 
122 |     <div class="ref-description">
123 |     
124 |     <p>Subtract one data frame from another based on chromosome, start and end.</p>
125 |     
126 |     </div>
127 | 
128 |     <pre class="usage"><span class='fu'>genome_subtract</span>(<span class='no'>x</span>, <span class='no'>y</span>, <span class='kw'>by</span> <span class='kw'>=</span> <span class='kw'>NULL</span>)</pre>
129 |     
130 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a>Arguments</h2>
131 |     <table class="ref-arguments">
132 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
133 |     <tr>
134 |       <th>x</th>
135 |       <td><p>A dataframe.</p></td>
136 |     </tr>
137 |     <tr>
138 |       <th>y</th>
139 |       <td><p>A dataframe.</p></td>
140 |     </tr>
141 |     <tr>
142 |       <th>by</th>
143 |       <td><p>A character vector with 3 entries which are used to match the chromosome, start and end column.
144 | For example: <code>by=c("Chromosome"="chr", "Start"="start", "End"="end")</code></p></td>
145 |     </tr>
146 |     </table>
147 |     
148 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
149 | 
150 |     <p>The subtracted dataframe of <code>x</code> and <code>y</code> with the new boundaries.</p>
151 |     
152 | 
153 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
154 |     <pre class="examples"><div class='input'>
155 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='no'>dplyr</span>)
156 | 
157 | <span class='no'>x1</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/data.frame'>data.frame</a></span>(<span class='kw'>id</span> <span class='kw'>=</span> <span class='fl'>1</span>:<span class='fl'>4</span>, <span class='kw'>bla</span><span class='kw'>=</span><span class='no'>letters</span>[<span class='fl'>1</span>:<span class='fl'>4</span>],
158 |                  <span class='kw'>chromosome</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chr1"</span>, <span class='st'>"chr1"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr1"</span>),
159 |                  <span class='kw'>start</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>100</span>, <span class='fl'>200</span>, <span class='fl'>300</span>, <span class='fl'>400</span>),
160 |                  <span class='kw'>end</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>150</span>, <span class='fl'>250</span>, <span class='fl'>350</span>, <span class='fl'>450</span>))
161 | 
162 | <span class='no'>x2</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/data.frame'>data.frame</a></span>(<span class='kw'>id</span> <span class='kw'>=</span> <span class='fl'>1</span>:<span class='fl'>4</span>, <span class='kw'>BLA</span><span class='kw'>=</span><span class='no'>LETTERS</span>[<span class='fl'>1</span>:<span class='fl'>4</span>],
163 |                  <span class='kw'>chromosome</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chr1"</span>, <span class='st'>"chr2"</span>, <span class='st'>"chr1"</span>, <span class='st'>"chr1"</span>),
164 |                  <span class='kw'>start</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>120</span>, <span class='fl'>210</span>, <span class='fl'>300</span>, <span class='fl'>400</span>),
165 |                  <span class='kw'>end</span> <span class='kw'>=</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='fl'>125</span>, <span class='fl'>240</span>, <span class='fl'>320</span>, <span class='fl'>415</span>))
166 | 
167 | <span class='no'>j</span> <span class='kw'>&lt;-</span> <span class='fu'>genome_subtract</span>(<span class='no'>x1</span>, <span class='no'>x2</span>, <span class='kw'>by</span><span class='kw'>=</span><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/c'>c</a></span>(<span class='st'>"chromosome"</span>, <span class='st'>"start"</span>, <span class='st'>"end"</span>))
168 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/print'>print</a></span>(<span class='no'>j</span>)</div><div class='output co'>#&gt;   id bla chromosome start end
169 | #&gt; 1  1   a       chr1   100 119
170 | #&gt; 2  1   a       chr1   126 150
171 | #&gt; 3  2   b       chr1   200 250
172 | #&gt; 4  3   c       chr2   300 350
173 | #&gt; 5  4   d       chr1   416 450</div><div class='input'>
174 | 
175 | </div></pre>
176 |   </div>
177 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
178 |     <h2>Contents</h2>
179 |     <ul class="nav nav-pills nav-stacked">
180 |       <li><a href="#arguments">Arguments</a></li>
181 |       
182 |       <li><a href="#value">Value</a></li>
183 |       
184 |       <li><a href="#examples">Examples</a></li>
185 |     </ul>
186 | 
187 |   </div>
188 | </div>
189 | 
190 |       <footer>
191 |       <div class="copyright">
192 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
193 | </div>
194 | 
195 | <div class="pkgdown">
196 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
197 | </div>
198 |       </footer>
199 |    </div>
200 | 
201 |   
202 | 
203 |   </body>
204 | </html>
205 | 
206 | 


--------------------------------------------------------------------------------
/docs/reference/index.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Function reference • tidygenomics</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 16 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 20 | 
 21 | <!-- clipboard.js -->
 22 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 23 | 
 24 | <!-- sticky kit -->
 25 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 26 | 
 27 | <!-- pkgdown -->
 28 | <link href="../pkgdown.css" rel="stylesheet">
 29 | <script src="../pkgdown.js"></script>
 30 | 
 31 | 
 32 | 
 33 | <meta property="og:title" content="Function reference" />
 34 | 
 35 | 
 36 | 
 37 | <!-- mathjax -->
 38 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 39 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 40 | 
 41 | <!--[if lt IE 9]>
 42 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 43 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 44 | <![endif]-->
 45 | 
 46 | 
 47 |   </head>
 48 | 
 49 |   <body>
 50 |     <div class="container template-reference-index">
 51 |       <header>
 52 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 53 |   <div class="container">
 54 |     <div class="navbar-header">
 55 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 56 |         <span class="sr-only">Toggle navigation</span>
 57 |         <span class="icon-bar"></span>
 58 |         <span class="icon-bar"></span>
 59 |         <span class="icon-bar"></span>
 60 |       </button>
 61 |       <span class="navbar-brand">
 62 |         <a class="navbar-link" href="../index.html">tidygenomics</a>
 63 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.1.2</span>
 64 |       </span>
 65 |     </div>
 66 | 
 67 |     <div id="navbar" class="navbar-collapse collapse">
 68 |       <ul class="nav navbar-nav">
 69 |         <li>
 70 |   <a href="../index.html">
 71 |     <span class="fa fa-home fa-lg"></span>
 72 |      
 73 |   </a>
 74 | </li>
 75 | <li>
 76 |   <a href="../reference/index.html">Reference</a>
 77 | </li>
 78 | <li class="dropdown">
 79 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 80 |     Articles
 81 |      
 82 |     <span class="caret"></span>
 83 |   </a>
 84 |   <ul class="dropdown-menu" role="menu">
 85 |     <li>
 86 |       <a href="../articles/intro.html">Tidy Genomics</a>
 87 |     </li>
 88 |   </ul>
 89 | </li>
 90 | <li>
 91 |   <a href="../news/index.html">Changelog</a>
 92 | </li>
 93 |       </ul>
 94 |       
 95 |       <ul class="nav navbar-nav navbar-right">
 96 |         <li>
 97 |   <a href="https://github.com/const-ae/tidygenomics">
 98 |     <span class="fa fa-github fa-lg"></span>
 99 |      
100 |   </a>
101 | </li>
102 |       </ul>
103 |       
104 |     </div><!--/.nav-collapse -->
105 |   </div><!--/.container -->
106 | </div><!--/.navbar -->
107 | 
108 |       
109 |       </header>
110 | 
111 | <div class="row">
112 |   <div class="contents col-md-9">
113 |     <div class="page-header">
114 |       <h1>Reference</h1>
115 |     </div>
116 | 
117 |     <table class="ref-index">
118 | 
119 |     <colgroup>
120 |       
121 |       <col class="alias" />
122 |       <col class="title" />
123 |     </colgroup>
124 | 
125 |     <tbody>
126 |       <tr>
127 |         <th colspan="2">
128 |           <h2 id="section-all-functions" class="hasAnchor"><a href="#section-all-functions" class="anchor"></a>All functions</h2>
129 |           <p class="section-desc"></p>
130 |         </th>
131 |       </tr>
132 |       <tr>
133 |         
134 |         <td>
135 |           <p><code><a href="cluster_interval.html">cluster_interval()</a></code> </p>
136 |         </td>
137 |         <td><p>Cluster ranges which are implemented as 2 equal-length numeric vectors.</p></td>
138 |       </tr><tr>
139 |         
140 |         <td>
141 |           <p><code><a href="genome_cluster.html">genome_cluster()</a></code> </p>
142 |         </td>
143 |         <td><p>Cluster intervals in a data frame based on chromosome, start and end.</p></td>
144 |       </tr><tr>
145 |         
146 |         <td>
147 |           <p><code><a href="genome_complement.html">genome_complement()</a></code> </p>
148 |         </td>
149 |         <td><p>Calculates the complement to the intervals covered by the intervals in
150 | a data frame. It can optionally take a <code>chromosome_size</code> data frame
151 | that contains 2 or 3 columns, the first the names of chromosome and in case
152 | there are 2 columns the size or first the start index and lastly the end index
153 | on the chromosome.</p></td>
154 |       </tr><tr>
155 |         
156 |         <td>
157 |           <p><code><a href="genome_intersect.html">genome_intersect()</a></code> </p>
158 |         </td>
159 |         <td><p>Intersect data frames based on chromosome, start and end.</p></td>
160 |       </tr><tr>
161 |         
162 |         <td>
163 |           <p><code><a href="genome_join_closest.html">genome_join_closest()</a></code> <code><a href="genome_join_closest.html">genome_inner_join_closest()</a></code> <code><a href="genome_join_closest.html">genome_left_join_closest()</a></code> <code><a href="genome_join_closest.html">genome_right_join_closest()</a></code> <code><a href="genome_join_closest.html">genome_full_join_closest()</a></code> <code><a href="genome_join_closest.html">genome_semi_join_closest()</a></code> <code><a href="genome_join_closest.html">genome_anti_join_closest()</a></code> </p>
164 |         </td>
165 |         <td><p>Join intervals on chromosomes in data frames, to the closest partner</p></td>
166 |       </tr><tr>
167 |         
168 |         <td>
169 |           <p><code><a href="genome_subtract.html">genome_subtract()</a></code> </p>
170 |         </td>
171 |         <td><p>Subtract one data frame from another based on chromosome, start and end.</p></td>
172 |       </tr>
173 |     </tbody>
174 |     </table>
175 |   </div>
176 | 
177 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
178 |     <h2>Contents</h2>
179 |     <ul class="nav nav-pills nav-stacked">
180 |       <li><a href="#section-all-functions">All functions</a></li>
181 |     </ul>
182 |   </div>
183 | </div>
184 | 
185 |       <footer>
186 |       <div class="copyright">
187 |   <p>Developed by Constantin Ahlmann-Eltze.</p>
188 | </div>
189 | 
190 | <div class="pkgdown">
191 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
192 | </div>
193 |       </footer>
194 |    </div>
195 | 
196 |   
197 | 
198 |   </body>
199 | </html>
200 | 
201 | 


--------------------------------------------------------------------------------
/man/cluster_interval.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/RcppExports.R
 3 | \name{cluster_interval}
 4 | \alias{cluster_interval}
 5 | \title{Cluster ranges which are implemented as 2 equal-length numeric vectors.}
 6 | \usage{
 7 | cluster_interval(starts, ends, max_distance = 0L)
 8 | }
 9 | \arguments{
10 | \item{starts}{A numeric vector that defines the starts of each interval}
11 | 
12 | \item{ends}{A numeric vector that defines the ends of each interval}
13 | 
14 | \item{max_distance}{The maximum distance up to which intervals are still considered to be
15 | the same cluster. Default: 0.}
16 | }
17 | \description{
18 | Cluster ranges which are implemented as 2 equal-length numeric vectors.
19 | }
20 | \examples{
21 | starts <- c(50, 100, 120)
22 | ends <- c(75, 130, 150)
23 | j <- cluster_interval(starts, ends)
24 | j == c(0,1,1)
25 | }
26 | 


--------------------------------------------------------------------------------
/man/genome_cluster.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/cluster.R
 3 | \name{genome_cluster}
 4 | \alias{genome_cluster}
 5 | \title{Cluster intervals in a data frame based on chromosome, start and end.}
 6 | \usage{
 7 | genome_cluster(x, by = NULL, max_distance = 0,
 8 |   cluster_column_name = "cluster_id")
 9 | }
10 | \arguments{
11 | \item{x}{A dataframe.}
12 | 
13 | \item{by}{A character vector with 3 entries which are the chromosome, start and end column.
14 | For example: \code{by=c("chr", "start", "end")}}
15 | 
16 | \item{max_distance}{The maximum distance up to which intervals are still considered to be
17 | the same cluster. Default: 0.}
18 | 
19 | \item{cluster_column_name}{A string that is used as the new column name}
20 | }
21 | \value{
22 | The dataframe with the additional column of the cluster
23 | }
24 | \description{
25 | Cluster intervals in a data frame based on chromosome, start and end.
26 | }
27 | \examples{
28 | 
29 | library(dplyr)
30 | 
31 | x1 <- data.frame(id = 1:4, bla=letters[1:4],
32 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
33 |                  start = c(100, 120, 300, 260),
34 |                  end = c(150, 250, 350, 450))
35 | genome_cluster(x1, by=c("chromosome", "start", "end"))
36 | genome_cluster(x1, by=c("chromosome", "start", "end"), max_distance=10)
37 | }
38 | 


--------------------------------------------------------------------------------
/man/genome_complement.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/complement.R
 3 | \name{genome_complement}
 4 | \alias{genome_complement}
 5 | \title{Calculates the complement to the intervals covered by the intervals in
 6 | a data frame. It can optionally take a \code{chromosome_size} data frame
 7 | that contains 2 or 3 columns, the first the names of chromosome and in case
 8 | there are 2 columns the size or first the start index and lastly the end index
 9 | on the chromosome.}
10 | \usage{
11 | genome_complement(x, chromosome_size = NULL, by = NULL)
12 | }
13 | \arguments{
14 | \item{x}{A data frame for which the complement is calculated}
15 | 
16 | \item{chromosome_size}{A dataframe with at least 2 columns that contains
17 | first the chromosome name and then the size of that chromosome. Can be NULL
18 | in which case the largest value per chromosome from \code{x} is used.}
19 | 
20 | \item{by}{A character vector with 3 entries which are the chromosome, start and end column.
21 | For example: \code{by=c("chr", "start", "end")}}
22 | }
23 | \description{
24 | Calculates the complement to the intervals covered by the intervals in
25 | a data frame. It can optionally take a \code{chromosome_size} data frame
26 | that contains 2 or 3 columns: the first column holds the chromosome names;
27 | with 2 columns the second holds the chromosome size, with 3 columns the
28 | second and third hold the start and end index on the chromosome.
29 | }
30 | \examples{
31 | 
32 | library(dplyr)
33 | 
34 | x1 <- data.frame(id = 1:4, bla=letters[1:4],
35 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
36 |                  start = c(100, 200, 300, 400),
37 |                  end = c(150, 250, 350, 450))
38 | 
39 | genome_complement(x1, by=c("chromosome", "start", "end"))
40 | }
41 | 


--------------------------------------------------------------------------------
/man/genome_intersect.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/intersect.R
 3 | \name{genome_intersect}
 4 | \alias{genome_intersect}
 5 | \title{Intersect data frames based on chromosome, start and end.}
 6 | \usage{
 7 | genome_intersect(x, y, by = NULL, mode = "both")
 8 | }
 9 | \arguments{
10 | \item{x}{A dataframe.}
11 | 
12 | \item{y}{A dataframe.}
13 | 
14 | \item{by}{A character vector with 3 entries which are used to match the chromosome, start and end column.
15 | For example: \code{by=c("Chromosome"="chr", "Start"="start", "End"="end")}}
16 | 
17 | \item{mode}{One of "both", "left", "right" or "anti".}
18 | }
19 | \value{
20 | The intersected dataframe of \code{x} and \code{y} with the new boundaries.
21 | }
22 | \description{
23 | Intersect data frames based on chromosome, start and end.
24 | }
25 | \examples{
26 | 
27 | library(dplyr)
28 | 
29 | x1 <- data.frame(id = 1:4, bla=letters[1:4],
30 |                  chromosome = c("chr1", "chr1", "chr2", "chr2"),
31 |                  start = c(100, 200, 300, 400),
32 |                  end = c(150, 250, 350, 450))
33 | 
34 | x2 <- data.frame(id = 1:4, BLA=LETTERS[1:4],
35 |                  chromosome = c("chr1", "chr2", "chr2", "chr1"),
36 |                  start = c(140, 210, 400, 300),
37 |                  end = c(160, 240, 415, 320))
38 | j <- genome_intersect(x1, x2, by=c("chromosome", "start", "end"), mode="both")
39 | print(j)
40 | 
41 | 
42 | 
43 | }
44 | 


--------------------------------------------------------------------------------
/man/genome_join_closest.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/join_closest.R
 3 | \name{genome_join_closest}
 4 | \alias{genome_join_closest}
 5 | \alias{genome_inner_join_closest}
 6 | \alias{genome_left_join_closest}
 7 | \alias{genome_right_join_closest}
 8 | \alias{genome_full_join_closest}
 9 | \alias{genome_semi_join_closest}
10 | \alias{genome_anti_join_closest}
11 | \title{Join intervals on chromosomes in data frames, to the closest partner}
12 | \usage{
13 | genome_join_closest(x, y, by = NULL, mode = "inner",
14 |   distance_column_name = NULL, max_distance = Inf, select = "all")
15 | 
16 | genome_inner_join_closest(x, y, by = NULL, ...)
17 | 
18 | genome_left_join_closest(x, y, by = NULL, ...)
19 | 
20 | genome_right_join_closest(x, y, by = NULL, ...)
21 | 
22 | genome_full_join_closest(x, y, by = NULL, ...)
23 | 
24 | genome_semi_join_closest(x, y, by = NULL, ...)
25 | 
26 | genome_anti_join_closest(x, y, by = NULL, ...)
27 | }
28 | \arguments{
29 | \item{x}{A dataframe.}
30 | 
31 | \item{y}{A dataframe.}
32 | 
33 | \item{by}{A character vector with 3 entries which are used to match the chromosome, start and end column.
34 | For example: \code{by=c("Chromosome"="chr", "Start"="start", "End"="end")}}
35 | 
36 | \item{mode}{One of "inner", "full", "left", "right", "semi" or "anti".}
37 | 
38 | \item{distance_column_name}{A string that is used as the new column name with the distance.
39 | If \code{NULL} no new column is added.}
40 | 
41 | \item{max_distance}{The maximum distance that is allowed to join 2 entries.}
42 | 
43 | \item{select}{A string that is passed on to \code{IRanges::distanceToNearest}. It can either be
44 | \code{"all"}, which means that if multiple intervals have the same distance all of them are reported, or
45 | \code{"arbitrary"}, which means that in that case only one of them is reported, chosen at random.}
46 | 
47 | \item{...}{Additional arguments passed on to genome_join_closest.}
48 | }
49 | \value{
50 | The joined dataframe of \code{x} and \code{y}.
51 | }
52 | \description{
53 | Join intervals on chromosomes in data frames, to the closest partner
54 | }
55 | \examples{
56 | 
57 | library(dplyr)
58 | 
59 | x1 <- data.frame(id = 1:4, bla=letters[1:4],
60 |                  chromosome = c("chr1", "chr1", "chr2", "chr2"),
61 |                  start = c(100, 200, 300, 400),
62 |                  end = c(150, 250, 350, 450))
63 | 
64 | x2 <- data.frame(id = 1:4, BLA=LETTERS[1:4],
65 |                  chromosome = c("chr1", "chr2", "chr2", "chr1"),
66 |                  start = c(140, 210, 400, 300),
67 |                  end = c(160, 240, 415, 320))
68 | j <- genome_join_closest(x1, x2, by=c("chromosome", "start", "end"), distance_column_name="distance", mode="left")
69 | print(j)
70 | }
71 | 


--------------------------------------------------------------------------------
/man/genome_subtract.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/subtract.R
 3 | \name{genome_subtract}
 4 | \alias{genome_subtract}
 5 | \title{Subtract one data frame from another based on chromosome, start and end.}
 6 | \usage{
 7 | genome_subtract(x, y, by = NULL)
 8 | }
 9 | \arguments{
10 | \item{x}{A dataframe.}
11 | 
12 | \item{y}{A dataframe.}
13 | 
14 | \item{by}{A character vector with 3 entries which are used to match the chromosome, start and end column.
15 | For example: \code{by=c("Chromosome"="chr", "Start"="start", "End"="end")}}
16 | }
17 | \value{
18 | The subtracted dataframe of \code{x} and \code{y} with the new boundaries.
19 | }
20 | \description{
21 | Subtract one data frame from another based on chromosome, start and end.
22 | }
23 | \examples{
24 | 
25 | library(dplyr)
26 | 
27 | x1 <- data.frame(id = 1:4, bla=letters[1:4],
28 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
29 |                  start = c(100, 200, 300, 400),
30 |                  end = c(150, 250, 350, 450))
31 | 
32 | x2 <- data.frame(id = 1:4, BLA=LETTERS[1:4],
33 |                  chromosome = c("chr1", "chr2", "chr1", "chr1"),
34 |                  start = c(120, 210, 300, 400),
35 |                  end = c(125, 240, 320, 415))
36 | 
37 | j <- genome_subtract(x1, x2, by=c("chromosome", "start", "end"))
38 | print(j)
39 | 
40 | 
41 | }
42 | 


--------------------------------------------------------------------------------
/src/.gitignore:
--------------------------------------------------------------------------------
1 | *.o
2 | *.so
3 | *.dll
4 | 


--------------------------------------------------------------------------------
/src/RcppExports.cpp:
--------------------------------------------------------------------------------
 1 | // Generated by using Rcpp::compileAttributes() -> do not edit by hand
 2 | // Generator token: 10BE3573-1514-4C36-9D1C-5A225CD40393
 3 | 
 4 | #include <Rcpp.h>
 5 | 
 6 | using namespace Rcpp;
 7 | 
// sort_indices
// Glue between R's .Call interface and the C++ function `sort_indices`.
// Forward declaration of the wrapped C++ function; its definition is not in
// this translation unit.
IntegerVector sort_indices(NumericVector x);
// .Call entry point: receives its single argument as a raw SEXP and returns
// the result as a SEXP.
RcppExport SEXP _tidygenomics_sort_indices(SEXP xSEXP) {
BEGIN_RCPP
    Rcpp::RObject rcpp_result_gen;
    // NOTE(review): scope object emitted by the generator; presumably keeps
    // R's RNG state in sync around the call — confirm against the Rcpp docs.
    Rcpp::RNGScope rcpp_rngScope_gen;
    // Convert the incoming SEXP to the NumericVector the C++ function expects.
    Rcpp::traits::input_parameter< NumericVector >::type x(xSEXP);
    // Call the C++ implementation and wrap its result as an R object.
    rcpp_result_gen = Rcpp::wrap(sort_indices(x));
    return rcpp_result_gen;
END_RCPP
}
// cluster_interval
// Glue between R's .Call interface and the C++ function `cluster_interval`.
// Forward declaration of the wrapped C++ function; its definition is not in
// this translation unit.
IntegerVector cluster_interval(NumericVector starts, NumericVector ends, int max_distance);
// .Call entry point: receives its three arguments as raw SEXPs and returns
// the result as a SEXP.
RcppExport SEXP _tidygenomics_cluster_interval(SEXP startsSEXP, SEXP endsSEXP, SEXP max_distanceSEXP) {
BEGIN_RCPP
    Rcpp::RObject rcpp_result_gen;
    // NOTE(review): scope object emitted by the generator; presumably keeps
    // R's RNG state in sync around the call — confirm against the Rcpp docs.
    Rcpp::RNGScope rcpp_rngScope_gen;
    // Convert each incoming SEXP to the C++ type of the matching parameter:
    // two NumericVectors and one int.
    Rcpp::traits::input_parameter< NumericVector >::type starts(startsSEXP);
    Rcpp::traits::input_parameter< NumericVector >::type ends(endsSEXP);
    Rcpp::traits::input_parameter< int >::type max_distance(max_distanceSEXP);
    // Call the C++ implementation and wrap its result as an R object.
    rcpp_result_gen = Rcpp::wrap(cluster_interval(starts, ends, max_distance));
    return rcpp_result_gen;
END_RCPP
}
32 | 


--------------------------------------------------------------------------------
/src/cluster_interval.cpp:
--------------------------------------------------------------------------------
  1 | #include <Rcpp.h>
  2 | 
  3 | 
  4 | using namespace Rcpp;
  5 | using namespace std;
  6 | 
  7 | 
  8 | // The following code was copied from the stan math library
  9 | // https://github.com/stan-dev/stan/blob/e118db2b78ed33c40f7b5c774f3ce5b85aa5dfdf/src/stan/math/matrix/sort_indices.hpp
 10 | 
 11 | /*
 12 |  * Copyright (c) 2011--2015, Stan Developers and their Assignees
 13 |  All rights reserved.
 14 | 
 15 |  Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met:
 16 | 
 17 |  * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.
 18 |  * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution.
 19 |  * Neither the name of Columbia University nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission.
 20 | 
 21 |  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 22 |  */
 23 | 
 24 | template <bool ascending, typename C>
 25 | class index_comparator {
 26 |   const C& xs_;
 27 | public:
 28 |   /**
 29 |   * Construct an index comparator holding a reference
 30 |   * to the specified container.
 31 |   *
 32 |   * @patam xs Container
 33 |   */
 34 |   index_comparator(const C& xs) : xs_(xs) { }
 35 | 
 36 |   /**
 37 |   * Return true if the value at the first index is sorted in
 38 |   * front of the value at the second index;  this will depend
 39 |   * on the template parameter <code>ascending</code>.
 40 |   *
 41 |   * @param i Index of first value for comparison
 42 |   * @param j Index of second value for comparison
 43 |   */
 44 |   bool operator()(int i, int j) const {
 45 |     if (ascending)
 46 |       return xs_[i] < xs_[j];
 47 |     else
 48 |       return xs_[i] > xs_[j];
 49 |   }
 50 | };
 51 | 
 52 | 
 53 | /**
 54 |  * Return an integer array of indices of the specified container
 55 |  * sorting the values in ascending or descending order based on
 56 |  * the value of the first template prameter.
 57 |  *
 58 |  * @tparam ascending true if sort is in ascending order
 59 |  * @tparam C type of container
 60 |  * @param xs Container to sort
 61 |  * @return sorted version of container
 62 |  */
 63 | template <bool ascending, typename C>
 64 | std::vector<int> sort_indices(const C& xs) {
 65 |   typename C::size_type size = xs.size();
 66 |   std::vector<int> idxs;
 67 |   idxs.resize(size);
 68 |   for (typename C::size_type i = 0; i < size; ++i)
 69 |     idxs[i] = i;
 70 |   index_comparator<ascending,C> comparator(xs);
 71 |   std::sort(idxs.begin(), idxs.end(), comparator);
 72 |   return idxs;
 73 | }
 74 | 
 75 | 
 76 | // [[Rcpp::export]]
 77 | IntegerVector sort_indices(NumericVector x){
 78 |   return wrap(sort_indices<true>(as<std::vector<double> >(x)));
 79 | }
 80 | 
 81 | 
 82 | //' Cluster ranges which are implemented as 2 equal-length numeric vectors.
 83 | //' @param starts A numeric vector that defines the starts of each interval
 84 | //' @param ends A numeric vector that defines the ends of each interval
 85 | //' @param max_distance The maximum distance up to which intervals are still considered to be
 86 | //'  the same cluster. Default: 0.
 87 | //' @examples
 88 | //' starts <- c(50, 100, 120)
 89 | //' ends <- c(75, 130, 150)
 90 | //' j <- cluster_interval(starts, ends)
 91 | //' j == c(0,1,1)
 92 | //' @export
 93 | // [[Rcpp::export]]
 94 | IntegerVector cluster_interval(NumericVector starts, NumericVector ends, int max_distance=0) {
 95 | 
 96 |   // Require that starts and ends are the same length
 97 | 
 98 |   // The implementation is inspired by the bedtools implementation:
 99 |   // https://github.com/arq5x/bedtools2/blob/14fbbb8aed5c6a04685da2cee3f11b98d70304a7/src/clusterBed/clusterBed.cpp
100 |   IntegerVector result(starts.size());
101 |   int cluster_id = -1;
102 |   int prev_end = std::numeric_limits<int>::min();
103 |   vector<int> indices = sort_indices<true>(as<std::vector<double> >(starts));
104 |   for (int j = 0; j < indices.size(); j++) {
105 |     int i = indices[j];
106 |     Rcpp::checkUserInterrupt();
107 |     if(starts[i] - prev_end > max_distance){
108 |       cluster_id++;
109 |       prev_end = ends[i];
110 |     }else{
111 |       if(ends[i] > prev_end){
112 |         prev_end = ends[i];
113 |       }
114 |     }
115 |     result[i] = cluster_id;
116 |   }
117 | 
118 |   return result;
119 | }
120 | 
121 | 
122 | 
123 | 


--------------------------------------------------------------------------------
/src/tidygenomics_init.c:
--------------------------------------------------------------------------------
 1 | #include <R.h>
 2 | #include <Rinternals.h>
 3 | #include <stdlib.h> // for NULL
 4 | #include <R_ext/Rdynload.h>
 5 | 
/* Native routine registration table for the tidygenomics shared library.
   The declarations below were checked against the wrappers in
   src/RcppExports.cpp: _tidygenomics_cluster_interval takes three SEXP
   arguments and _tidygenomics_sort_indices takes one, which matches the
   argument counts listed in CallEntries.
*/

/* .Call calls */
extern SEXP _tidygenomics_cluster_interval(SEXP, SEXP, SEXP);
extern SEXP _tidygenomics_sort_indices(SEXP);

/* One row per .Call entry point: {name, function pointer, argument count}.
   The all-NULL row marks the end of the table. */
static const R_CallMethodDef CallEntries[] = {
    {"_tidygenomics_cluster_interval", (DL_FUNC) &_tidygenomics_cluster_interval, 3},
    {"_tidygenomics_sort_indices",     (DL_FUNC) &_tidygenomics_sort_indices,     1},
    {NULL, NULL, 0}
};
19 | 
/* Library initialisation hook (presumably invoked by R when the shared
   library is loaded — the name follows the R_init_<package> convention).
   dll: handle of the library being initialised. */
void R_init_tidygenomics(DllInfo *dll)
{
    /* Register the .Call table; the other routine tables are passed as NULL. */
    R_registerRoutines(dll, NULL, CallEntries, NULL, NULL);
    /* NOTE(review): FALSE presumably restricts symbol lookup to the routines
       registered above — confirm against "Writing R Extensions". */
    R_useDynamicSymbols(dll, FALSE);
}
25 | 


--------------------------------------------------------------------------------
/tests/testthat.R:
--------------------------------------------------------------------------------
# Test runner script: loads testthat and the package under test, then hands
# control to testthat for the "tidygenomics" package. The individual test
# files live under tests/testthat/.
library(testthat)
library(tidygenomics)

test_check("tidygenomics")
5 | 


--------------------------------------------------------------------------------
/tests/testthat/test_cluster.R:
--------------------------------------------------------------------------------
 1 | 
 2 | context("genome_cluster")
 3 | 
 4 | library(dplyr)
 5 | 
 6 | x1 <- tibble(id = 1:4, bla=letters[1:4],
 7 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
 8 |                  start = c(100, 120, 300, 260),
 9 |                  end = c(150, 250, 350, 450))
10 | 
11 | 
12 | test_that("genome_clustering assings that correct clusters", {
13 |   j <- genome_cluster(x1, by=c("chromosome", "start", "end"), max_distance=5)
14 | 
15 |   print(j)
16 | 
17 |   expect_equal(j$cluster_id, c(0,0,2,1))
18 | })
19 | 
20 | 
21 | test_that("cluster_interval works", {
22 |   starts <- c(50, 100, 120)
23 |   ends <- c(75, 130, 150)
24 |   j <- cluster_interval(starts, ends)
25 |   expect_equal(j, c(0,1,1))
26 |   expect_equal(cluster_interval(starts, ends, max_distance = 24), c(0,1,1))
27 |   expect_equal(cluster_interval(starts, ends, max_distance = 25), c(0,0,0))
28 | 
29 |   starts <- c(50, 100, 120, 180, 350)
30 |   ends <- c(75, 200, 150, 210, 400)
31 |   expect_equal(cluster_interval(starts, ends), c(0,1,1,1,2))
32 | 
33 |   starts <- c(500, 300, 150)
34 |   ends <- c(510, 310, 160)
35 |   expect_equal(cluster_interval(starts, ends), c(2,1,0))
36 | 
37 |   expect_equal(cluster_interval(numeric(0), numeric(0)), numeric(0))
38 | })
39 | 


--------------------------------------------------------------------------------
/tests/testthat/test_complement.R:
--------------------------------------------------------------------------------
 1 | 
 2 | context("genome_complement")
 3 | 
 4 | library(dplyr)
 5 | 
 6 | x1 <- tibble(id = 1:4, bla=letters[1:4],
 7 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
 8 |                  start = c(100, 200, 300, 400),
 9 |                  end = c(150, 250, 350, 450))
10 | 
11 | test_that("Calculating the complement of a sequence works", {
12 |   j <- genome_complement(x1, by=c("chromosome", "start", "end"))
13 |   print(j)
14 |   expect_equal(j$chromosome, c("chr1", "chr1", "chr1", "chr2"))
15 |   expect_equal(j$start, c(1,151, 251,1))
16 |   expect_equal(j$end, c(99,199, 399, 299))
17 | })
18 | 


--------------------------------------------------------------------------------
/tests/testthat/test_intersect.R:
--------------------------------------------------------------------------------
 1 | 
 2 | context("genome_intersect")
 3 | 
 4 | suppressPackageStartupMessages(library(dplyr))
 5 | 
 6 | x1 <- tibble(id = 1:4, bla=letters[1:4],
 7 |                  chromosome = c("chr1", "chr1", "chr2", "chr2"),
 8 |                  start = c(100, 200, 300, 400),
 9 |                  end = c(150, 250, 350, 450))
10 | 
11 | x2 <- tibble(id = 1:4, BLA=LETTERS[1:4],
12 |                  chromosome = c("chr1", "chr2", "chr2", "chr1"),
13 |                  start = c(140, 210, 400, 300),
14 |                  end = c(160, 240, 415, 320))
15 | 
16 | test_that("Intersection (both) of 2 data frames works as expected", {
17 |   j <- genome_intersect(x1, x2, by=c("chromosome", "start", "end"), mode="both")
18 |   # print(j)
19 |   expect_equal(colnames(j), c("id.x", "bla", "chromosome", "id.y", "BLA", "start", "end"))
20 |   expect_equal(j$start, c(140, 400))
21 |   expect_equal(j$end, c(150, 415))
22 | })
23 | 
24 | test_that("Intersection of 2 data frames works for multi-overlap ranges", {
25 |   x2 <- tibble(id = 1, BLA=LETTERS[1],
26 |                    chromosome = c("chr1"),
27 |                    start = c(140),
28 |                    end = c(220))
29 |   j <- genome_intersect(x1, x2, by=c("chromosome", "start", "end"), mode="both")
30 |   # print(j)
31 |   expect_equal(colnames(j), c("id.x", "bla", "chromosome", "id.y", "BLA", "start", "end"))
32 |   expect_equal(j$start, c(140, 200))
33 |   expect_equal(j$end, c(150, 220))
34 |   expect_equal(j$id.x, c(1,2))
35 |   expect_equal(j$id.y, c(1,1))
36 | 
37 | })
38 | 
39 | 
40 | 
41 | test_that("Intersection of 2 data frames works for multi-overlap ranges the other way around", {
42 |   x1 <- tibble(id = 1, bla=letters[1],
43 |                    chromosome = c("chr1"),
44 |                    start = c(100),
45 |                    end = c(420))
46 |   j <- genome_intersect(x1, x2, by=c("chromosome", "start", "end"), mode="both")
47 |   # print(j)
48 |   expect_equal(colnames(j), c("id.x", "bla", "chromosome", "id.y", "BLA", "start", "end"))
49 |   expect_equal(j$start, c(140, 300))
50 |   expect_equal(j$end, c(160, 320))
51 |   expect_equal(j$id.x, c(1,1))
52 |   expect_equal(j$id.y, c(1,4))
53 | 
54 | })
55 | 
56 | 
57 | test_that("Intersect and findOverlap always match", {
58 |   r1 <- IRanges::IRanges(start=c(1,3,24), end=c(1,130,24))
59 |   r2 <- IRanges::IRanges(start=c(1,20,100), end=c(10,30,110))
60 |   o <- as.data.frame(IRanges::findOverlaps(r1, r2))
61 |   intersection <- IRanges::pintersect(r1[o$queryHits], r2[o$subjectHits])
62 |   expect_equal(length(o$queryHits), length(intersection))
63 |   expect_true(all(IRanges::poverlaps(intersection, r1[o$queryHits])))
64 | })
65 | 
66 | 
67 | 


--------------------------------------------------------------------------------
/tests/testthat/test_issue.R:
--------------------------------------------------------------------------------
 1 | 
context("genome_issue")


suppressPackageStartupMessages(library(dplyr))


# NOTE(review): the body of this test is empty, so it asserts nothing.
# Presumably a scratch slot for reproducing the most recently reported
# issue — confirm with the maintainer.
test_that("Latest issue", {

})
11 | 


--------------------------------------------------------------------------------
/tests/testthat/test_join_closest.R:
--------------------------------------------------------------------------------
 1 | 
 2 | context("genome_join_closest")
 3 | 
 4 | library(dplyr)
 5 | 
 6 | x1 <- tibble(id = 1:4, bla=letters[1:4],
 7 |                  chromosome = c("chr1", "chr1", "chr2", "chr3"),
 8 |                  start = c(100, 200, 300, 400),
 9 |                  end = c(150, 250, 350, 450))
10 | 
11 | x2 <- tibble(id = 1:4, BLA=LETTERS[1:4],
12 |                  chromosome = c("chr1", "chr1", "chr1", "chr2"),
13 |                  start = c(220, 210, 300, 400),
14 |                  end = c(225, 240, 320, 415))
15 | 
16 | test_that("Joining with closest works as expected", {
17 |   j <- genome_join_closest(x1, x2, by=c("chromosome", "start", "end"), distance_column_name="distance", mode="left")
18 |   print(j)
19 |   expect_equal(colnames(j), c("id.x", "bla", "chromosome.x", "start.x", "end.x",
20 |                               "id.y", "BLA", "chromosome.y", "start.y", "end.y", "distance"))
21 |   expect_equal(j$start.y, c(210, 220, 210, 400, NA))
22 |   expect_equal(j$distance, c(59, 0, 0, 49, NA))
23 | })
24 | 
25 | 
26 | 


--------------------------------------------------------------------------------
/tests/testthat/test_subtract.R:
--------------------------------------------------------------------------------
 1 | 
 2 | context("genome_subtract")
 3 | 
 4 | 
 5 | suppressPackageStartupMessages(library(dplyr))
 6 | 
 7 | x1 <- tibble(id = 1:4, bla=letters[1:4],
 8 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
 9 |                  start = c(100, 200, 300, 400),
10 |                  end = c(150, 250, 350, 450))
11 | 
12 | x2 <- tibble(id = 1:4, BLA=LETTERS[1:4],
13 |                  chromosome = c("chr1", "chr2", "chr1", "chr1"),
14 |                  start = c(120, 210, 300, 400),
15 |                  end = c(125, 240, 320, 415))
16 | 
17 | test_that("Subtraction of 2 data frames works as expected", {
18 |   j <- genome_subtract(x1, x2, by=c("chromosome", "start", "end"))
19 |   # print(j)
20 |   expect_equal(colnames(j), c("id", "bla", "chromosome", "start", "end"))
21 |   expect_equal(j$start, c(100, 126, 200, 300, 416))
22 |   expect_equal(j$end,   c(119, 150, 250, 350, 450))
23 | })
24 | 
25 | 
26 | 
27 | test_that("Edge cases of subtraction of 2 data frames works as expected", {
28 |   x1 <- tibble(id = 1:2, bla=letters[1:2],
29 |                    chromosome = c("chr1", "chr1"),
30 |                    start = c(100, 200),
31 |                    end = c(150, 250))
32 | 
33 |   x2 <- tibble(id = 1:4, BLA=LETTERS[1:4],
34 |                    chromosome = c("chr1", "chr1", "chr1", "chr1"),
35 |                    start = c(120, 110, 190, 400),
36 |                    end = c(125, 122, 320, 415))
37 | 
38 |   j <- genome_subtract(x1, x2, by=c("chromosome", "start", "end"))
39 |   print(j)
40 |   expect_equal(colnames(j), c("id", "bla", "chromosome", "start", "end"))
41 |   expect_equal(j$start, c(100, 126))
42 |   expect_equal(j$end,   c(109, 150))
43 | })
44 | 
45 | 
46 | test_that("during subtraction the intervals are not unified", {
47 |   x1 <- tibble(id = 1:3, bla=letters[1:3],
48 |                    chromosome = c("chr1", "chr1", "chr1"),
49 |                    start = c(100, 115, 200),
50 |                    end = c(150, 160, 250))
51 | 
52 |   x2 <- tibble(id = 1, BLA=LETTERS[1],
53 |                    chromosome = c("chr1"),
54 |                    start = c(110),
55 |                    end = c(130))
56 | 
57 |   j <- genome_subtract(x1, x2, by=c("chromosome", "start", "end"))
58 |   print(j)
59 |   expect_equal(colnames(j), c("id", "bla", "chromosome", "start", "end"))
60 |   expect_equal(j$start, c(100, 131, 131, 200))
61 |   expect_equal(j$end,   c(109, 150, 160, 250))
62 | })
63 | 


--------------------------------------------------------------------------------
/tidygenomics.Rproj:
--------------------------------------------------------------------------------
 1 | Version: 1.0
 2 | 
 3 | RestoreWorkspace: Default
 4 | SaveWorkspace: Default
 5 | AlwaysSaveHistory: Default
 6 | 
 7 | EnableCodeIndexing: Yes
 8 | UseSpacesForTab: Yes
 9 | NumSpacesForTab: 2
10 | Encoding: UTF-8
11 | 
12 | RnwWeave: Sweave
13 | LaTeX: pdfLaTeX
14 | 
15 | AutoAppendNewline: Yes
16 | StripTrailingWhitespace: Yes
17 | 
18 | BuildType: Package
19 | PackageUseDevtools: Yes
20 | PackageInstallArgs: --no-multiarch --with-keep.source
21 | 


--------------------------------------------------------------------------------
/vignettes/intro.Rmd:
--------------------------------------------------------------------------------
  1 | ---
  2 | title: "Tidy Genomics"
  3 | author: "Constantin Ahlmann-Eltze"
  4 | date: "`r Sys.Date()`"
  5 | output: 
  6 |   rmarkdown::html_vignette:
  7 |         fig_caption: yes
  8 | vignette: >
  9 |   %\VignetteIndexEntry{Tidy Genomics}
 10 |   %\VignetteEngine{knitr::rmarkdown}
 11 |   %\VignetteEncoding{UTF-8}
 12 | ---
 13 | 
 14 | The most dramatic impact on programming in R in recent years was the development of the [tidyverse](http://tidyverse.org/) by Hadley Wickham et al.
 15 | which, combined with the ingenious `%>%` from magrittr, provides a uniform philosophy for handling data.
 16 | 
 17 | The genomics community has an alternative set of approaches, for which [bioconductor](http://bioconductor.org/) and the 
 18 | [GenomicRanges](http://bioconductor.org/packages/release/bioc/html/GenomicRanges.html) package provide the basis. The `GenomicRanges` and
 19 | the underlying `IRanges` package provide a great set of methods for dealing with intervals as they are typically encountered in genomics.
 20 | 
 21 | Unfortunately, it is not always easy to combine those two worlds: many common operations in `GenomicRanges` focus solely on the
 22 | ranges and lose the additional metadata columns. On the other hand the `tidyverse` does not provide a unified set of methods
 23 | to do common set operations with intervals.
 24 | 
 25 | At least until recently, when the [fuzzyjoin](https://github.com/dgrtwo/fuzzyjoin) package was extended with the `genome_join`
 26 | method for combining genomic data stored in a `data.frame`. It demonstrated that genomic data could appropriately be handled
 27 | with the _tidy_-philosophy.
 28 | 
 29 | The `tidygenomics` package extends the limited set of methods provided by the `fuzzyjoin` package for dealing with genomic
 30 | data. Its API is inspired by the very popular [bedtools](http://bedtools.readthedocs.io/en/latest/index.html):
 31 | 
 32 | 
 33 | - `genome_intersect`
 34 | - `genome_subtract`
 35 | - `genome_join_closest`
 36 | - `genome_cluster`
 37 | - `genome_complement`
 38 | - `genome_join` _Provided by the fuzzyjoin package_
 39 | 
 40 | ```{r, message=FALSE, warning=FALSE, echo=FALSE}
 41 | library(dplyr)
 42 | library(tidygenomics)
 43 | ```
 44 | 
 45 | 
 46 | ## genome_intersect
 47 | 
 48 | Joins 2 data frames based on their genomic overlap. Unlike the `genome_join` function it updates the boundaries to reflect
 49 | the overlap of the regions.
 50 | 
 51 | <img src="resources/genome_intersect_docu.png" alt="genome_intersect" style="width: 100%;"/>
 52 | 
 53 | 
 54 | ```{r}
 55 | x1 <- data.frame(id = 1:4, 
 56 |                 chromosome = c("chr1", "chr1", "chr2", "chr2"),
 57 |                 start = c(100, 200, 300, 400),
 58 |                 end = c(150, 250, 350, 450))
 59 | 
 60 | x2 <- data.frame(id = 1:4,
 61 |                  chromosome = c("chr1", "chr2", "chr2", "chr1"),
 62 |                  start = c(140, 210, 400, 300),
 63 |                  end = c(160, 240, 415, 320))
 64 | 
 65 | genome_intersect(x1, x2, by=c("chromosome", "start", "end"), mode="both")
 66 | ```
 67 | 
 68 | 
 69 | ## genome_subtract
 70 | 
 71 | Subtracts one data frame from the other. This can be used to split the x data frame into smaller areas.
 72 | 
 73 | <img src="resources/genome_subtract_docu.png" alt="genome_subtract" style="width: 100%;"/>
 74 | 
 75 | ```{r}
 76 | x1 <- data.frame(id = 1:4,
 77 |                 chromosome = c("chr1", "chr1", "chr2", "chr1"),
 78 |                 start = c(100, 200, 300, 400),
 79 |                 end = c(150, 250, 350, 450))
 80 | 
 81 | x2 <- data.frame(id = 1:4,
 82 |                 chromosome = c("chr1", "chr2", "chr1", "chr1"),
 83 |                 start = c(120, 210, 300, 400),
 84 |                 end = c(125, 240, 320, 415))
 85 | 
 86 | genome_subtract(x1, x2, by=c("chromosome", "start", "end"))
 87 | ```
 88 | 
 89 | 
 90 | 
 91 | 
 92 | ## genome_join_closest
 93 | 
 94 | Joins 2 data frames based on their genomic location. If no exact overlap is found the next closest interval is used.
 95 | 
 96 | <img src="resources/genome_join_closest_docu.png" alt="genome_join_closest" style="width: 100%;"/>
 97 | 
 98 | ```{r}
 99 | x1 <- tibble(id = 1:4, 
100 |              chr = c("chr1", "chr1", "chr2", "chr3"),
101 |              start = c(100, 200, 300, 400),
102 |              end = c(150, 250, 350, 450))
103 | 
104 | x2 <- tibble(id = 1:4,
105 |              chr = c("chr1", "chr1", "chr1", "chr2"),
106 |              start = c(220, 210, 300, 400),
107 |              end = c(225, 240, 320, 415))
108 | genome_join_closest(x1, x2, by=c("chr", "start", "end"), distance_column_name="distance", mode="left")
109 | ```
110 | 
111 | 
112 | ## genome_cluster
113 | 
114 | Adds a new column with a cluster id. Intervals that overlap or are within `max_distance` of each other get the same id.
115 | 
116 | <img src="resources/genome_cluster_docu.png" alt="genome_cluster" style="width: 100%;"/>
117 | 
118 | ```{r}
119 | x1 <- data.frame(id = 1:4, bla=letters[1:4],
120 |                 chromosome = c("chr1", "chr1", "chr2", "chr1"),
121 |                 start = c(100, 120, 300, 260),
122 |                 end = c(150, 250, 350, 450))
123 | genome_cluster(x1, by=c("chromosome", "start", "end"))
124 | genome_cluster(x1, by=c("chromosome", "start", "end"), max_distance=10)
125 | ```
126 | 
127 | ## genome_complement
128 | 
129 | Calculates the complement of a genomic region.
130 | 
131 | <img src="resources/genome_complement_docu.png" alt="genome_complement" style="width: 100%;"/>
132 | 
133 | ```{r}
134 | x1 <- data.frame(id = 1:4,
135 |                  chromosome = c("chr1", "chr1", "chr2", "chr1"),
136 |                  start = c(100, 200, 300, 400),
137 |                  end = c(150, 250, 350, 450))
138 | 
139 | genome_complement(x1, by=c("chromosome", "start", "end"))
140 | ```
141 | 
142 | 
143 | 
144 | ## genome_join
145 | 
146 | Classical join function based on the overlap of the interval. Implemented and maintained in the
147 | [fuzzyjoin](https://github.com/dgrtwo/fuzzyjoin) package and documented here only for completeness.
148 | 
149 | <img src="resources/genome_join_docu.png" alt="genome_join" style="width: 100%;"/>
150 | 
151 | ```{r}
152 | x1 <- tibble(id = 1:4, 
153 |              chr = c("chr1", "chr1", "chr2", "chr3"),
154 |              start = c(100, 200, 300, 400),
155 |              end = c(150, 250, 350, 450))
156 | 
157 | x2 <- tibble(id = 1:4,
158 |              chr = c("chr1", "chr1", "chr1", "chr2"),
159 |              start = c(220, 210, 300, 400),
160 |              end = c(225, 240, 320, 415))
161 | fuzzyjoin::genome_join(x1, x2, by=c("chr", "start", "end"), mode="inner")
162 | 
163 | fuzzyjoin::genome_join(x1, x2, by=c("chr", "start", "end"), mode="left")
164 | 
165 | fuzzyjoin::genome_join(x1, x2, by=c("chr", "start", "end"), mode="anti")
166 | ```
167 | 
168 | 
169 | 
170 | 


--------------------------------------------------------------------------------
/vignettes/resources/genome_cluster_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/vignettes/resources/genome_cluster_docu.png


--------------------------------------------------------------------------------
/vignettes/resources/genome_complement_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/vignettes/resources/genome_complement_docu.png


--------------------------------------------------------------------------------
/vignettes/resources/genome_intersect_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/vignettes/resources/genome_intersect_docu.png


--------------------------------------------------------------------------------
/vignettes/resources/genome_join_closest_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/vignettes/resources/genome_join_closest_docu.png


--------------------------------------------------------------------------------
/vignettes/resources/genome_join_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/vignettes/resources/genome_join_docu.png


--------------------------------------------------------------------------------
/vignettes/resources/genome_subtract_docu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/const-ae/tidygenomics/23737e99f7ff9893f485e2b6b48c1d15c13a5623/vignettes/resources/genome_subtract_docu.png


--------------------------------------------------------------------------------