Blejec}
%\address{}%
%\email{}%
%
%\thanks{}%
%\subjclass{}%
%\keywords{}%
%\date{}%
%\dedicatory{}%
%\commby{}%
\thispagestyle{empty}
\maketitle
\vfill\hspace{5cm}\parbox{5cm}{
Parameters:\\[20pt]
\Sexpr{paste(names(addArgs),addArgs,collapse="\\\\",sep=" = ")}
}
% ----------------------------------------------------------------
%\begin{abstract}
%
%\end{abstract}
% ----------------------------------------------------------------
\clearpage
\tableofcontents
\clearpage
\listoftables
\clearpage
\listoffigures
% NOTE(review): several chunk headers in this part read '<>=' in the extracted
% source, i.e. their labels/options were lost. They are restored here as empty
% headers so the document parses; the original options (label, echo, results,
% message, ...) are unknown and must be confirmed.
<<>>=
###############################################
##                                           ##
## (c) Andrej Blejec (andrej.blejec@nib.si)  ##
##                                           ##
###############################################
@
% NOTE(review): chunk options lost in extraction (see note above) - confirm.
<<>>=
# Session setup: console width and the packages attached for this report.
options(width=60)
library(Hmisc)
library(amisc)
library(Biobase)
#library(xlsReadWrite)
library(xtable)
#library(MASS)
library(lattice)
library(reshape2)
library(mixOmics)
@
\clearpage
\section{Task}
Analysis of transcriptomics and metabolomics data with canonical correlation.
Main ideas are from package \pkg{mixOmics}.
Final document in folder \file{/reports}:
<<>>=
fileName(outputFile)
@
\clearpage
\section{Information from pISA}
Data directory
<<>>=
.inroot
@
Results directory
<<>>=
.oroot
@
% NOTE(review): chunk options lost in extraction (see note above) - confirm.
<<>>=
# Print the project / investigation / study / assay names.
catln("project:\t", .pName)
catln("Investigation: ",.iName)
catln("Study: ",.sName)
catln("Assay: ",.aName)
@
\clearpage
% NOTE(review): chunk options lost in extraction (see note above) - confirm.
<<>>=
# Global switch read by tst(): when TRUE, tst() prints its argument.
.testing <- TRUE

# Debug helper.
#   x     : any object; it is printed when output is enabled.
#   force : if TRUE, print even when .testing is FALSE.
#   ...   : extra values appended to the "-->" header line via cat().
# When enabled, writes a header "--> <expression as typed by the caller>"
# followed by print(x). Always returns x invisibly.
tst <- function(x, force=FALSE, ...) {
  # Scalar || (not elementwise |): an if() condition must be a single logical.
  if (.testing || force) {
    cat("-->", deparse(substitute(x)),..., "\n")
    print(x)
  }
  invisible(x)
}

# Small demonstration of tst(): first with .testing on, then forced.
coef <- 1:5
tst(coef)
.testing <- FALSE
tst(coef,TRUE,"Za poskus force=TRUE")
@
\clearpage
\section{Data}
Priporočljivo je najprej prebrati phenodata in feature-data, potem pa podatke.
To omogoča izbor spremenljivk in vzorcev takoj za tem, ko podatke preberemo.
%% <>=
%% out <- "From: 10a-ReadData.Rnw\n"
%% out <- paste(out,knit_child(file.path(".","10a-ReadData.Rnw"),quiet=TRUE))
%% @
%
%\Sexpr{out}
% NOTE(review): this chunk header read '<>=' in the extracted source, i.e. its
% label/options were lost. It is restored as an empty header so the document
% parses; since the chunk cat()s the knitted child document, it presumably
% needs results='asis' - confirm against the original file.
<<>>=
# Knit the data-reading child document and emit its output here.
cat(knit_child(file.path("../doc","10a_Read-Data.Rnw"),quiet=TRUE))
@
List of data objects:
<<>>=
my.objects
@
List of interesting genes, based on typification on 50* reports (key: \file{Transcript stats}).
Typification is extracted from the file in the relevant \code{output} directory.
To allow manual curation, the info is extracted from the \code{Type} column.
<<>>=
# File name of the transcript statistics table, looked up under the
# "Transcript stats" key.
tsfn <- getMeta(.adesc,"Transcript stats")
# NOTE(review): read.table() keeps its default quote and comment.char here;
# free-text columns containing ' or # could be mis-parsed - confirm the file.
stat4 <- read.table(file.path(.aroot, tsfn), sep="\t", header=TRUE)
colnames(stat4)
# Use the first column as row names so rows can be selected by identifier.
rownames(stat4) <- stat4[,1]
head(stat4)
@
Select interesting genes
<<>>=
# Here filter holds the identifiers in intgenes; rows are picked by row name.
filter <- unlist(intgenes) #stat4$Type!=""
length(filter)
statig <- stat4[filter,]
dim(statig)
@
<<>>=
(my.objects <- addObject(stat4,"Statistics from transcript analysis (50*)"))
(my.objects <- addObject(statig,"Statistics for interesting genes"))
@
How many interesting genes are in the interesting bins?
<<>>=
# From here on filter is a logical mask over the rows of statig.
filter <- rownames(statig) %in% unlist(intgenes)
sum(filter)
rownames(statig)[filter]
@
<<>>=
head(statig[filter, c("Type","BINCODE","DESCRIPTION")])
@
\clearpage
\subsection{Data overview}
<<>>=
# For every row of my.objects print a banner built from its first two
# columns, the row itself, and the head of the object whose name is stored
# in the first column.
x <- my.objects
x$name[1]
# seq_len() instead of 1:nrow(x): with zero rows 1:0 would run the body
# for i = 1 and i = 0.
for (i in seq_len(nrow(x))) {
  cat("\n\n--------- ", x[i,1],": ",x[i,2], " -------------------------------\n\n",sep="")
  print(x[i,])
  cat("\n")
  # Look the object up by the name stored in column 1.
  print(head(eval(as.name(x[i,1]))))
}
@
Factor for days within the year
<<>>=
pdata1819$day <- factor(as.character(pdata1819$day))
@
\clearpage
\section{Preparation of data for mixOmics}
Data for \pkg{mixOmics} analysis should follow the traditional mathematical orientation: samples in rows, variables in columns.
The matrices must have appropriate dimensions.
Due to different ranges and variability in years 2018 and 2019, we will analyze them separately.
\subsubsection{Selection of samples, transcripts and metabolites}
Common samples in the given year (\Sexpr{.years}).