--- title: "Basic R-Usage Guide for rMZQC" author: "Chris Bielow " date: '`r Sys.Date()`' output: html_document: default pdf_document: null vignette: > %\VignetteIndexEntry{Basic R-Usage Guide for rMZQC} %\VignetteEngine{knitr::rmarkdown} \usepackage[utf8]{inputenc} --- # Basic R-Usage Guide for rMZQC This vignette serves as a quickstart guide for R users to create and save an mzQC document. **Target Audience:** R users ## Read an mzQC file and extract some data ```{r, eval=TRUE} library(rmzqc) data = readMZQC(system.file("./testdata/test.mzQC", package = "rmzqc", mustWork = TRUE)) cat("This file has ", length(data$runQualities), " runqualities\n") cat(" - file: ", data$runQualities[[1]]$metadata$inputFiles[[1]]$name, "\n") cat(" - # of metrics: ", length(data$runQualities[[1]]$qualityMetrics), "\n") cat(" - metric #1 name: ", data$runQualities[[1]]$qualityMetrics[[1]]$name, "\n") cat(" - metric #1 value: ", data$runQualities[[1]]$qualityMetrics[[1]]$value, "\n") ``` Hint: if you receive an error such as ``` Error in parse_con(txt, bigint_as_char) : lexical error: invalid char in json text. cursor_int": [ NaN,NaN,NaN,NaN,825282.0,308263 (right here) ------^ ``` when calling`readMZQC` this indicates that the mzQC is not valid JSON, since `NaN` values should be quoted (`"NaN"`) or replaced by `null` (unquoted), depending on context. In short: `null` may become an `NA` in R if part of an array, see https://github.com/jeroen/jsonlite/issues/70#issuecomment-431433773. ## Create a minial mzQC document ```{r, eval=TRUE} library(rmzqc) ## we need a proper URI (i.e. no backslashes and a scheme, e.g. 'file:') ## otherwise writing will fail raw_file = localFileToURI("c:\\data\\special.raw", FALSE) file_format = getCVTemplate(accession = filenameToCV(raw_file)) ptxqc_software = toAnalysisSoftware(id = "MS:1003162", version = "1.0.13") ## you could use 'version = packageVersion("PTXQC")' to automate further run1_qc = MzQCrunQuality$new(metadata = MzQCmetadata$new(label = raw_file, inputFiles = list(MzQCinputFile$new(basename(raw_file), raw_file, file_format)), analysisSoftware = list(ptxqc_software)), qualityMetrics = list(toQCMetric(id = "MS:4000059", value = 13405) ## number of MS1 scans ) ) mzQC_document = MzQCmzQC$new(version = "1.0.0", creationDate = MzQCDateTime$new(), contactName = Sys.info()["user"], contactAddress = "test@user.info", description = "A minimal mzQC test document with bogus data", runQualities = list(run1_qc), setQualities = list(), controlledVocabularies = list(getCVInfo())) ## write it out mzqc_filename = paste0(getwd(), "/test.mzQC") writeMZQC(mzqc_filename, mzQC_document) cat(mzqc_filename, "written to disk!\n") ## read it again mq = readMZQC(mzqc_filename) ## print some basic stats gettextf("This mzQC was created on %s and has %d quality metric(s) in total.", dQuote(mq$creationDate$datetime), length(mq$runQualities) + length(mq$setQualities)) ```