MsDataHub 1.0.0
The MsDataHub
package provides example mass spectrometry data,
peptide spectrum matches or quantitative data from proteomics and
metabolomics experiments. The data are served through the
ExperimentHub
infrastructure, which allows users to download them only once
and cache them for further use. Currently available data are summarised
in the table below and detailed in the next section.
library("MsDataHub")
## Warning: replacing previous import 'utils::findMatches' by
## 'S4Vectors::findMatches' when loading 'AnnotationDbi'
DT::datatable(MsDataHub())
To install the package:
if (!require("BiocManager"))
install.packages("BiocManager")
BiocManager::install("MsDataHub")
PestMix1_DDA.mzML
and PestMix1_SWATH.mzML
?TripleTOF
Load with
f <- PestMix1_DDA.mzML()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
library(Spectra)
Spectra(f)
## MSn data (Spectra) with 7602 spectra in a MsBackendMzR backend:
## msLevel rtime scanIndex
## <integer> <numeric> <integer>
## 1 1 0.231 1
## 2 1 0.351 2
## 3 1 0.471 3
## 4 1 0.591 4
## 5 1 0.711 5
## ... ... ... ...
## 7598 1 899.491 7598
## 7599 1 899.613 7599
## 7600 1 899.747 7600
## 7601 1 899.872 7601
## 7602 1 899.993 7602
## ... 33 more variables/columns.
##
## file(s):
## 33d2621e24639d_7861
f <- PestMix1_SWATH.mzML()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
Spectra(f)
## MSn data (Spectra) with 8999 spectra in a MsBackendMzR backend:
## msLevel rtime scanIndex
## <integer> <numeric> <integer>
## 1 2 0.203 1
## 2 2 0.300 2
## 3 2 0.397 3
## 4 2 0.494 4
## 5 2 0.591 5
## ... ... ... ...
## 8995 2 899.527 8995
## 8996 2 899.624 8996
## 8997 2 899.721 8997
## 8998 2 899.818 8998
## 8999 2 899.915 8999
## ... 33 more variables/columns.
##
## file(s):
## 33d26214a335e3_7862
20171016_POOL_POS_1_105-134.mzML
and 20171016_POOL_POS_3_105-134.mzML
?sciex
Load with
f <- X20171016_POOL_POS_1_105.134.mzML()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
Spectra(f)
## MSn data (Spectra) with 931 spectra in a MsBackendMzR backend:
## msLevel rtime scanIndex
## <integer> <numeric> <integer>
## 1 1 0.280 1
## 2 1 0.559 2
## 3 1 0.838 3
## 4 1 1.117 4
## 5 1 1.396 5
## ... ... ... ...
## 927 1 258.641 927
## 928 1 258.920 928
## 929 1 259.199 929
## 930 1 259.478 930
## 931 1 259.757 931
## ... 33 more variables/columns.
##
## file(s):
## 33d262208ac2f9_7859
f <- X20171016_POOL_POS_3_105.134.mzML()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
Spectra(f)
## MSn data (Spectra) with 931 spectra in a MsBackendMzR backend:
## msLevel rtime scanIndex
## <integer> <numeric> <integer>
## 1 1 0.275 1
## 2 1 0.554 2
## 3 1 0.833 3
## 4 1 1.112 4
## 5 1 1.391 5
## ... ... ... ...
## 927 1 258.636 927
## 928 1 258.915 928
## 929 1 259.194 929
## 930 1 259.473 930
## 931 1 259.752 931
## ... 33 more variables/columns.
##
## file(s):
## 33d2624c28adfa_7860
TMT_Erwinia_1uLSike_Top10HCD_isol2_45stepped_60min_01-20141210.mzML.gz
and
TMT_Erwinia_1uLSike_Top10HCD_isol2_45stepped_60min_01-20141210.mzid
?PDX000001
Load with
f <- TMT_Erwinia_1uLSike_Top10HCD_isol2_45stepped_60min_01.20141210.mzML.gz()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
Spectra(f)
## MSn data (Spectra) with 7534 spectra in a MsBackendMzR backend:
## msLevel rtime scanIndex
## <integer> <numeric> <integer>
## 1 1 0.4584 1
## 2 1 0.9725 2
## 3 1 1.8524 3
## 4 1 2.7424 4
## 5 1 3.6124 5
## ... ... ... ...
## 7530 2 3600.47 7530
## 7531 2 3600.83 7531
## 7532 2 3601.18 7532
## 7533 2 3601.57 7533
## 7534 2 3601.98 7534
## ... 33 more variables/columns.
##
## file(s):
## 33d262170f6aa7_7858
f <- TMT_Erwinia_1uLSike_Top10HCD_isol2_45stepped_60min_01.20141210.mzid()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
library(PSMatch)
PSM(f)
## PSM with 5802 rows and 35 columns.
## names(35): sequence spectrumID ... subReplacementResidue subLocation
cptac_a_b_c_peptides.txt
, cptac_a_b_peptides.txt
and
cptac_peptides.txt
?cptac
Load with
library(QFeatures)
f <- cptac_peptides.txt()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
ecols <- grep("Intensity\\.", names(read.delim(f)))
readSummarizedExperiment(f, ecols, sep = "\t")
## class: SummarizedExperiment
## dim: 11466 45
## metadata(0):
## assays(1): ''
## rownames(11466): 1 2 ... 11465 11466
## rowData names(143): Sequence N.term.cleavage.window ...
## Oxidation..M..site.IDs MS.MS.Count
## colnames(45): Intensity.6A_1 Intensity.6A_2 ... Intensity.6E_8
## Intensity.6E_9
## colData names(0):
cptac_a_b_c_peptides.txt()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
## EH7804
## "/home/biocbuild/.cache/R/ExperimentHub/33d2626c4b9398_7854"
cptac_a_b_peptides.txt()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
## EH7805
## "/home/biocbuild/.cache/R/ExperimentHub/33d2625d5bd72b_7855"
ko15.CDF
?cdf
Load with
f <- ko15.CDF()
## see ?MsDataHub and browseVignettes('MsDataHub') for documentation
## loading from cache
Spectra(f)
## MSn data (Spectra) with 1278 spectra in a MsBackendMzR backend:
## msLevel rtime scanIndex
## <integer> <numeric> <integer>
## 1 1 2501.38 1
## 2 1 2502.94 2
## 3 1 2504.51 3
## 4 1 2506.07 4
## 5 1 2507.64 5
## ... ... ... ...
## 1274 1 4493.56 1274
## 1275 1 4495.13 1275
## 1276 1 4496.69 1276
## 1277 1 4498.26 1277
## 1278 1 4499.82 1278
## ... 33 more variables/columns.
##
## file(s):
## 33d262241e102b_7853
MsDataHub
To contribute new data to MsDataHub, start by opening an issue
in the package’s GitHub repository and describe the new data. In
particular, provide information about its provenance, its use, its
format(s) and acknowledge that the data may be shared freely with
the community without any restrictions. You may provide an open
licence specifying the terms under which it can be re-used, typically a
CC-BY-SA license.
If you are familiar with ExperimentHub
packages and GitHub pull requests, you may
directly send one that adds your data to the package. Make sure (1)
to add appropriate references in the manual page and (2) to add
yourself as a contributor of the package in the DESCRIPTION file.
## R version 4.3.0 RC (2023-04-13 r84269)
## Platform: x86_64-pc-linux-gnu (64-bit)
## Running under: Ubuntu 22.04.2 LTS
##
## Matrix products: default
## BLAS: /home/biocbuild/bbs-3.17-bioc/R/lib/libRblas.so
## LAPACK: /usr/lib/x86_64-linux-gnu/lapack/liblapack.so.3.10.0
##
## locale:
## [1] LC_CTYPE=en_US.UTF-8 LC_NUMERIC=C
## [3] LC_TIME=en_GB LC_COLLATE=C
## [5] LC_MONETARY=en_US.UTF-8 LC_MESSAGES=en_US.UTF-8
## [7] LC_PAPER=en_US.UTF-8 LC_NAME=C
## [9] LC_ADDRESS=C LC_TELEPHONE=C
## [11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C
##
## time zone: America/New_York
## tzcode source: system (glibc)
##
## attached base packages:
## [1] stats4 stats graphics grDevices utils datasets methods
## [8] base
##
## other attached packages:
## [1] MsDataHub_1.0.0 QFeatures_1.10.0
## [3] MultiAssayExperiment_1.26.0 SummarizedExperiment_1.30.0
## [5] Biobase_2.60.0 GenomicRanges_1.52.0
## [7] GenomeInfoDb_1.36.0 IRanges_2.34.0
## [9] MatrixGenerics_1.12.0 matrixStats_0.63.0
## [11] PSMatch_1.4.0 Spectra_1.10.0
## [13] ProtGenerics_1.32.0 BiocParallel_1.34.0
## [15] S4Vectors_0.38.0 BiocGenerics_0.46.0
## [17] BiocStyle_2.28.0
##
## loaded via a namespace (and not attached):
## [1] tidyselect_1.2.0 dplyr_1.1.2
## [3] blob_1.2.4 Biostrings_2.68.0
## [5] filelock_1.0.2 bitops_1.0-7
## [7] fastmap_1.1.1 lazyeval_0.2.2
## [9] RCurl_1.98-1.12 BiocFileCache_2.8.0
## [11] promises_1.2.0.1 digest_0.6.31
## [13] mime_0.12 lifecycle_1.0.3
## [15] cluster_2.1.4 ellipsis_0.3.2
## [17] KEGGREST_1.40.0 interactiveDisplayBase_1.38.0
## [19] RSQLite_2.3.1 magrittr_2.0.3
## [21] compiler_4.3.0 rlang_1.1.0
## [23] sass_0.4.5 tools_4.3.0
## [25] igraph_1.4.2 utf8_1.2.3
## [27] yaml_2.3.7 knitr_1.42
## [29] htmlwidgets_1.6.2 bit_4.0.5
## [31] curl_5.0.0 DelayedArray_0.26.0
## [33] withr_2.5.0 purrr_1.0.1
## [35] grid_4.3.0 fansi_1.0.4
## [37] ExperimentHub_2.8.0 xtable_1.8-4
## [39] MASS_7.3-59 cli_3.6.1
## [41] mzR_2.34.0 crayon_1.5.2
## [43] rmarkdown_2.21 generics_0.1.3
## [45] httr_1.4.5 ncdf4_1.21
## [47] DBI_1.1.3 cachem_1.0.7
## [49] zlibbioc_1.46.0 parallel_4.3.0
## [51] AnnotationDbi_1.62.0 AnnotationFilter_1.24.0
## [53] BiocManager_1.30.20 XVector_0.40.0
## [55] vctrs_0.6.2 Matrix_1.5-4
## [57] jsonlite_1.8.4 bookdown_0.33
## [59] bit64_4.0.5 clue_0.3-64
## [61] crosstalk_1.2.0 jquerylib_0.1.4
## [63] glue_1.6.2 codetools_0.2-19
## [65] DT_0.27 later_1.3.0
## [67] BiocVersion_3.17.1 tibble_3.2.1
## [69] pillar_1.9.0 rappdirs_0.3.3
## [71] htmltools_0.5.5 GenomeInfoDbData_1.2.10
## [73] R6_2.5.1 dbplyr_2.3.2
## [75] evaluate_0.20 shiny_1.7.4
## [77] lattice_0.21-8 AnnotationHub_3.8.0
## [79] png_0.1-8 memoise_2.0.1
## [81] httpuv_1.6.9 bslib_0.4.2
## [83] Rcpp_1.0.10 xfun_0.39
## [85] MsCoreUtils_1.12.0 fs_1.6.2
## [87] pkgconfig_2.0.3