RNAmodR.Data contains example data for the RNAmodR and related packages. The data is provided as gff3, fasta and bam files.

Four sets of data, each comprising multiple files, are included:

# Create the hub object, then list the resources registered under the
# package name "RNAmodR.Data".
eh <- ExperimentHub::ExperimentHub()
ExperimentHub::listResources(eh, "RNAmodR.Data")
##  [1] "RNAmodR.Data.example.fasta"     "RNAmodR.Data.example.gff3"     
##  [3] "RNAmodR.Data.example.bam.1"     "RNAmodR.Data.example.bam.2"    
##  [5] "RNAmodR.Data.example.bam.3"     "RNAmodR.Data.example.RMS.fasta"
##  [7] "RNAmodR.Data.example.RMS.gff3"  "RNAmodR.Data.example.RMS.1"    
##  [9] "RNAmodR.Data.example.RMS.2"     "RNAmodR.Data.example.AAS.fasta"
## [11] "RNAmodR.Data.example.AAS.gff3"  "RNAmodR.Data.example.bud23.1"  
## [13] "RNAmodR.Data.example.bud23.2"   "RNAmodR.Data.example.trm8.1"   
## [15] "RNAmodR.Data.example.trm8.2"    "RNAmodR.Data.example.wt.1"     
## [17] "RNAmodR.Data.example.wt.2"      "RNAmodR.Data.example.wt.3"     
## [19] "" "" 
## [21] "RNAmodR.Data.snoRNAdb"

These resources are grouped based on topic. Please have a look at the following man pages:

2 snoRNAdb

RNAmodR.Data.snoRNAdb consists of a table containing the published data from the snoRNAdb [@Lestrade.2006]. The table can be loaded as a GRanges object.

# Read the snoRNAdb resource into a data.frame, keeping text columns as
# character vectors rather than factors.
table <- read.csv2(
  file = RNAmodR.Data.snoRNAdb(),
  stringsAsFactors = FALSE
)
# Preview the first two rows.
head(x = table, n = 2)
##   hgnc_id start end hgnc_symbol modification position   guide old.transcript
## 1   53533     1 157   RNA5-8SN5           Um       14 SNORD71         U13369
## 2   53533     1 157   RNA5-8SN5            Y       55 SNORA72         U13369
##   old.start old.end old.position
## 1      6623    6779           14
## 2      6623    6779           55
# keep only the current coordinates (drops the trailing old.* columns)
table <- table[, 1:7]
# One single-nucleotide range per annotated modification, placed at
# `position` on the sequence named by `hgnc_symbol`. Comma-separated guide
# names are split so that each range carries a CharacterList entry.
snoRNAdb <- GRanges(
  seqnames = table$hgnc_symbol,
  ranges = IRanges(start = table$position, width = 1),
  strand = "+",
  type = "RNAMOD",
  mod = table$modification,
  Parent = table$hgnc_symbol,
  Activity = CharacterList(strsplit(table$guide, ","))
)
# Drop every modification that has an "unknown" guide entry. The comparison
# yields a LogicalList; all() is evaluated per list element and returns one
# logical value per range.
snoRNAdb <- snoRNAdb[all(snoRNAdb$Activity != "unknown")]
# Group the remaining modifications by their parent RNA.
snoRNAdb <- split(snoRNAdb, snoRNAdb$Parent)
## GRangesList object of length 6:
## $RNA18SN5
## GRanges object with 69 ranges and 4 metadata columns:
##        seqnames    ranges strand |        type         mod      Parent
##           <Rle> <IRanges>  <Rle> | <character> <character> <character>
##    [1] RNA18SN5        27      + |      RNAMOD          Am    RNA18SN5
##    [2] RNA18SN5        34      + |      RNAMOD           Y    RNA18SN5
##    [3] RNA18SN5        36      + |      RNAMOD           Y    RNA18SN5
##    [4] RNA18SN5        93      + |      RNAMOD           Y    RNA18SN5
##    [5] RNA18SN5        99      + |      RNAMOD          Am    RNA18SN5
##    ...      ...       ...    ... .         ...         ...         ...
##   [65] RNA18SN5      1643      + |      RNAMOD           Y    RNA18SN5
##   [66] RNA18SN5      1678      + |      RNAMOD          Am    RNA18SN5
##   [67] RNA18SN5      1692      + |      RNAMOD           Y    RNA18SN5
##   [68] RNA18SN5      1703      + |      RNAMOD          Cm    RNA18SN5
##   [69] RNA18SN5      1804      + |      RNAMOD          Um    RNA18SN5
##                              Activity
##                       <CharacterList>
##    [1]                        SNORD27
##    [2]               SNORA50A,SNORA76
##    [3]                SNORA69,SNORA55
##    [4]                        SNORA75
##    [5]                        SNORD57
##    ...                            ...
##   [65]                        SNORA41
##   [66]                        SNORD82
##   [67] SNORD70A,SNORD70B,SNORD70C,...
##   [68]                        SNORD43
##   [69]                        SNORD20
##   -------
##   seqinfo: 9 sequences from an unspecified genome; no seqlengths
## ...
## <5 more elements>

