Introduction

Chromatin interactions are involved in the precise quantitative and spatiotemporal control of gene expression. High-throughput experimental techniques, such as HiC-seq, HiCAR-seq, and InTAC-seq, have been developed to analyze both the higher-order structure of chromatin and the interactions between proteins and their nearby and remote regulatory elements, in order to reveal how gene expression is controlled genome-wide.

The interaction data are saved as paired genomic coordinates together with an interaction score. The popular formats are .validPairs, .hic, and .cool. The trackViewer package can be used to handle these data and plot them as a heatmap or as interaction links.

Plot chromatin interactions data in linear layout

Plot chromatin interactions tracks as heatmap.

library(trackViewer)
library(InteractionSet)
## Read the example interaction data (an .rds file shipped in trackViewer's
## "extdata" folder) and preview its first rows.
gi <- readRDS(
  system.file(
    "extdata", "nij.chr6.51120000.53200000.gi.rds",
    package = "trackViewer"
  )
)
head(gi)
## GInteractions object with 6 interactions and 1 metadata column:
##       seqnames1           ranges1     seqnames2           ranges2 |     score
##           <Rle>         <IRanges>         <Rle>         <IRanges> | <numeric>
##   [1]      chr6 51120000-51160000 ---      chr6 51120000-51160000 |   45.1227
##   [2]      chr6 51120000-51160000 ---      chr6 51160000-51200000 |   35.0006
##   [3]      chr6 51120000-51160000 ---      chr6 51200000-51240000 |   44.7322
##   [4]      chr6 51120000-51160000 ---      chr6 51240000-51280000 |   29.3507
##   [5]      chr6 51120000-51160000 ---      chr6 51280000-51320000 |   38.8417
##   [6]      chr6 51120000-51160000 ---      chr6 51320000-51360000 |   31.7063
##   -------
##   regions: 53 ranges and 0 metadata columns
##   seqinfo: 1 sequence from an unspecified genome; no seqlengths
## hicexplorer:hicConvertFormat tool can be used to convert other formats into GInteractions
## eg: hicConvertFormat -m mESC_rep.hic --inputFormat hic --outputFormat cool -o mESC_rep.mcool
##     hicConvertFormat -m mESC_rep.mcool::resolutions/10000 --inputFormat cool --outputFormat ginteractions -o mESC_rep.ginteractions --resolutions 10000
## Please note that the metadata column `score` is used for plotting.
## Highlight some cells: `border_color` is NA for every interaction except
## 20 randomly chosen ones, which receive a colour index between 1 and 7.
gi$border_color <- NA
## Seed the RNG so that the same cells are highlighted on every run; without
## it the figure changes each time the document is built.
set.seed(123)
gi$border_color[sample(seq_along(gi), 20)] <- sample(1:7, 20, replace = TRUE)
## The TADs will be drawn as lines at points start(first), center point,
## end(second).
tads <- GInteractions(
  GRanges("chr6",
          IRanges(c(51130001, 51130001, 51450001, 52210001), width = 20000)),
  GRanges("chr6",
          IRanges(c(51530001, 52170001, 52210001, 53210001), width = 20000)))
## Genomic window to display.
## NOTE(review): `range` and `heatmap` shadow base::range() and
## stats::heatmap(); the names are kept because later code refers to them.
range <- GRanges("chr6", IRanges(51120000, 53200000))
## Convert the interactions into a track object that viewTracks() can draw.
heatmap <- gi2track(gi)
ctcf <- readRDS(system.file("extdata", "ctcf.sample.rds",
                            package = "trackViewer"))
## Draw the CTCF track above the interaction heatmap (height ratio 1:3).
viewTracks(trackList(ctcf, heatmap, heightDist = c(1, 3)),
           gr = range, autoOptimizeStyle = TRUE)
## Add TAD information.
## NOTE(review): the string "heatmap" presumably selects the track by the
## variable name passed to trackList() -- verify before renaming `heatmap`.
addInteractionAnnotation(tads, "heatmap", grid.lines,
                         gp = gpar(col = "#E69F00", lwd = 3, lty = 3))
## Highlight regions of interest: take the five highest-scoring interactions
## whose anchors are more than 200 kb apart ...
gi_sub <- gi[order(gi$score, decreasing = TRUE)]
gi_sub <- head(gi_sub[distance(first(gi_sub), second(gi_sub)) > 200000],
               n = 5)
## ... widen their regions by 40 kb on each side, and outline them.
start(regions(gi_sub)) <- start(regions(gi_sub)) - 40000
end(regions(gi_sub)) <- end(regions(gi_sub)) + 40000
addInteractionAnnotation(gi_sub, "heatmap", grid.polygon,
                         gp = gpar(col = "red", lwd = 2, lty = 2, fill = NA))
## Add anchor lines at a given coordinate.
## NOTE(review): the sign of the coordinate appears to select the direction
## of the line -- confirm in ?addInteractionAnnotation.
addInteractionAnnotation(52900000, "heatmap",
                         gp = gpar(col = "blue", lwd = 3))
addInteractionAnnotation(-52900000, "heatmap",
                         gp = gpar(col = "cyan", lwd = 3, lty = 4))

## Show two interaction data sets back to back in a single track.
## Both data sets should be normalized before they are compared.
## The second data set is simulated here: a copy of `gi` whose scores get
## Gaussian noise with the same standard deviation as the original scores.
set.seed(123)
gi2 <- gi
gi2$score <- gi$score + rnorm(n = length(gi), mean = 0, sd = sd(gi$score))
back2back <- gi2track(gi, gi2)
## Colour scale: break points and the colours to use.
setTrackStyleParam(
  back2back, "breaks",
  c(seq(0, 50, by = 10), 200)
)
setTrackStyleParam(
  back2back, "color",
  c("lightblue", "yellow", "red")
)
## Change the limits of the y-axis (by default, [0, 1]).
setTrackStyleParam(back2back, "ylim", c(0, 0.5))
## Draw the CTCF track above the back-to-back track (height ratio 1:5).
viewTracks(
  trackList(ctcf, back2back, heightDist = c(1, 5)),
  gr = range,
  autoOptimizeStyle = TRUE
)
## Overlay the TADs, then one anchor line per panel.
## NOTE(review): the string "back2back" presumably selects the track by the
## variable name passed to trackList() -- verify before renaming it.
addInteractionAnnotation(
  tads, "back2back", grid.lines,
  gp = gpar(col = "cyan", lwd = 3, lty = 2)
)
addInteractionAnnotation(
  -52208000, "back2back",
  gp = gpar(col = "blue", lwd = 3),
  panel = "top"
)
addInteractionAnnotation(
  51508000, "back2back",
  gp = gpar(col = "gray", lwd = 3, lty = 2),
  panel = "bottom"
)

Plot chromatin interactions track as links.

## Reuse the `heatmap` track, but draw it with track type "link".
setTrackStyleParam(heatmap, "tracktype", "link")
## Colour scale: break points and the colours to use.
setTrackStyleParam(
  heatmap, "breaks",
  c(seq(0, 50, by = 10), 200)
)
setTrackStyleParam(
  heatmap, "color",
  c("lightblue", "yellow", "red")
)
## Filter the links to simulate real data: keep only pairs with a score
## above 20 whose two anchors are more than 500 kb apart.
keep <- heatmap$dat$score > 20 &
  distance(heatmap$dat, heatmap$dat2) > 5e5
## Apply the same filter to both anchor sets.
heatmap$dat <- heatmap$dat[keep]
heatmap$dat2 <- heatmap$dat2[keep]
viewTracks(
  trackList(heatmap),
  gr = range,
  autoOptimizeStyle = TRUE
)

Interaction data can be imported from “.hic” files (for reference, see the hic-straw script and its documentation). The function importGInteractions (trackViewer version>=1.27.6) can be used to import data from a .hic format file.

## Path to the example .hic file shipped with trackViewer; mustWork = TRUE
## makes system.file() fail with an error if the file is missing.
hic <- system.file(
  "extdata", "test_chr22.hic",
  package = "trackViewer",
  mustWork = TRUE
)
## The import is skipped on Windows.
if (.Platform$OS.type != "windows") {
  importGInteractions(
    file = hic,
    format = "hic",
    ranges = GRanges("22", IRanges(50000000, 100000000)),
    out = "GInteractions"
  )
}
## GInteractions object with 70 interactions and 1 metadata column:
##        seqnames1           ranges1     seqnames2           ranges2 |     score
##            <Rle>         <IRanges>         <Rle>         <IRanges> | <numeric>
##    [1]        22 50000001-50100000 ---        22 50000001-50100000 |        26
##    [2]        22 50000001-50100000 ---        22 50100001-50200000 |         2
##    [3]        22 50100001-50200000 ---        22 50100001-50200000 |        22
##    [4]        22 50100001-50200000 ---        22 50200001-50300000 |         7
##    [5]        22 50200001-50300000 ---        22 50200001-50300000 |        31
##    ...       ...               ... ...       ...               ... .       ...
##   [66]        22 50400001-50500000 ---        22 51200001-51300000 |         1
##   [67]        22 50500001-50600000 ---        22 51200001-51300000 |         2
##   [68]        22 50800001-50900000 ---        22 51200001-51300000 |         2
##   [69]        22 51100001-51200000 ---        22 51200001-51300000 |         3
##   [70]        22 51200001-51300000 ---        22 51200001-51300000 |         5
##   -------
##   regions: 13 ranges and 0 metadata columns
##   seqinfo: 1 sequence from an unspecified genome; no seqlengths

Another widely used genomic interaction data format is the .cool file. The cooler index contains analyzed HiC data for hg19 and mm9 from many different sources. Those files can be used as data resources for visualizations and annotations (see ChIPpeakAnno::findEnhancers). The importGInteractions function can also be used to import data from the .cool format (trackViewer version>=1.27.6).

## Path to the example .mcool file shipped with trackViewer; mustWork = TRUE
## makes system.file() fail with an error if the file is missing.
cool <- system.file(
  "extdata", "test.mcool",
  package = "trackViewer",
  mustWork = TRUE
)
## Import the interactions within chr1:10-28 at resolution 2.
importGInteractions(
  file = cool,
  format = "cool",
  resolution = 2,
  ranges = GRanges("chr1", IRanges(10, 28)),
  out = "GInteractions"
)

Session Info

## Print the R version, platform, locale and package versions of this session.
sessionInfo()

R version 4.4.1 (2024-06-14) Platform: x86_64-pc-linux-gnu Running under: Ubuntu 24.04.1 LTS

Matrix products: default BLAS: /home/biocbuild/bbs-3.20-bioc/R/lib/libRblas.so LAPACK: /usr/lib/x86_64-linux-gnu/lapack/liblapack.so.3.12.0

locale: [1] LC_CTYPE=en_US.UTF-8 LC_NUMERIC=C
[3] LC_TIME=en_GB LC_COLLATE=C
[5] LC_MONETARY=en_US.UTF-8 LC_MESSAGES=en_US.UTF-8
[7] LC_PAPER=en_US.UTF-8 LC_NAME=C
[9] LC_ADDRESS=C LC_TELEPHONE=C
[11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C

time zone: America/New_York tzcode source: system (glibc)

attached base packages: [1] grid stats4 stats graphics grDevices utils datasets [8] methods base

other attached packages: [1] InteractionSet_1.34.0
[2] motifStack_1.50.0
[3] httr_1.4.7
[4] VariantAnnotation_1.52.0
[5] Rsamtools_2.22.0
[6] Biostrings_2.74.0
[7] XVector_0.46.0
[8] SummarizedExperiment_1.36.0
[9] MatrixGenerics_1.18.0
[10] matrixStats_1.4.1
[11] org.Hs.eg.db_3.20.0
[12] TxDb.Hsapiens.UCSC.hg19.knownGene_3.2.2 [13] GenomicFeatures_1.58.0
[14] AnnotationDbi_1.68.0
[15] Biobase_2.66.0
[16] Gviz_1.50.0
[17] rtracklayer_1.66.0
[18] trackViewer_1.42.0
[19] GenomicRanges_1.58.0
[20] GenomeInfoDb_1.42.0
[21] IRanges_2.40.0
[22] S4Vectors_0.44.0
[23] BiocGenerics_0.52.0

loaded via a namespace (and not attached): [1] BiocIO_1.16.0 bitops_1.0-9
[3] filelock_1.0.3 R.oo_1.26.0
[5] tibble_3.2.1 XML_3.99-0.17
[7] rpart_4.1.23 DirichletMultinomial_1.48.0 [9] lifecycle_1.0.4 httr2_1.0.5
[11] pwalign_1.2.0 lattice_0.22-6
[13] ensembldb_2.30.0 MASS_7.3-61
[15] backports_1.5.0 magrittr_2.0.3
[17] Hmisc_5.2-0 sass_0.4.9
[19] rmarkdown_2.28 jquerylib_0.1.4
[21] yaml_2.3.10 grImport2_0.3-3
[23] DBI_1.2.3 CNEr_1.42.0
[25] RColorBrewer_1.1-3 ade4_1.7-22
[27] abind_1.4-8 zlibbioc_1.52.0
[29] R.utils_2.12.3 AnnotationFilter_1.30.0
[31] biovizBase_1.54.0 RCurl_1.98-1.16
[33] nnet_7.3-19 pracma_2.4.4
[35] rappdirs_0.3.3 GenomeInfoDbData_1.2.13
[37] grImport_0.9-7 seqLogo_1.72.0
[39] BiocStyle_2.34.0 annotate_1.84.0
[41] codetools_0.2-20 DelayedArray_0.32.0
[43] xml2_1.3.6 tidyselect_1.2.1
[45] UCSC.utils_1.2.0 BiocFileCache_2.14.0
[47] base64enc_0.1-3 GenomicAlignments_1.42.0
[49] jsonlite_1.8.9 Formula_1.2-5
[51] tools_4.4.1 progress_1.2.3
[53] strawr_0.0.92 TFMPvalue_0.0.9
[55] Rcpp_1.0.13 glue_1.8.0
[57] gridExtra_2.3 SparseArray_1.6.0
[59] xfun_0.48 dplyr_1.1.4
[61] BiocManager_1.30.25 fastmap_1.2.0
[63] latticeExtra_0.6-30 rhdf5filters_1.18.0
[65] fansi_1.0.6 caTools_1.18.3
[67] digest_0.6.37 R6_2.5.1
[69] colorspace_2.1-1 Cairo_1.6-2
[71] GO.db_3.20.0 gtools_3.9.5
[73] poweRlaw_0.80.0 jpeg_0.1-10
[75] dichromat_2.0-0.1 biomaRt_2.62.0
[77] RSQLite_2.3.7 R.methodsS3_1.8.2
[79] utf8_1.2.4 generics_0.1.3
[81] data.table_1.16.2 prettyunits_1.2.0
[83] htmlwidgets_1.6.4 S4Arrays_1.6.0
[85] TFBSTools_1.44.0 pkgconfig_2.0.3
[87] gtable_0.3.6 blob_1.2.4
[89] htmltools_0.5.8.1 ProtGenerics_1.38.0
[91] scales_1.3.0 png_0.1-8
[93] knitr_1.48 rstudioapi_0.17.1
[95] tzdb_0.4.0 reshape2_1.4.4
[97] rjson_0.2.23 checkmate_2.3.2
[99] curl_5.2.3 cachem_1.1.0
[101] rhdf5_2.50.0 stringr_1.5.1
[103] parallel_4.4.1 foreign_0.8-87
[105] restfulr_0.0.15 pillar_1.9.0
[107] vctrs_0.6.5 dbplyr_2.5.0
[109] xtable_1.8-4 cluster_2.1.6
[111] htmlTable_2.4.3 evaluate_1.0.1
[113] readr_2.1.5 cli_3.6.3
[115] compiler_4.4.1 rlang_1.1.4
[117] crayon_1.5.3 interp_1.1-6
[119] plyr_1.8.9 stringi_1.8.4
[121] deldir_2.0-4 BiocParallel_1.40.0
[123] txdbmaker_1.2.0 munsell_0.5.1
[125] lazyeval_0.2.2 Matrix_1.7-1
[127] BSgenome_1.74.0 hms_1.1.3
[129] bit64_4.5.2 ggplot2_3.5.1
[131] Rhdf5lib_1.28.0 KEGGREST_1.46.0
[133] highr_0.11 memoise_2.0.1
[135] bslib_0.8.0 bit_4.5.0

  翻译: