view Build_tissue-specific_expression_dataset.R @ 1:cfcc7a780991 draft default tip

planemo upload commit c599cfc156c77626df2b674bdfbd437b9f664ab9
author proteore
date Thu, 13 Dec 2018 03:59:41 -0500
parents
children
line wrap: on
line source



select_HPAimmunohisto<-function(hpa_ref, tissue, level, reliability) {
  HPA.normal = read.table(hpa_ref,header=TRUE,sep="\t",stringsAsFactors = FALSE)
  if (tissue == "tissue") {
    tissue <- unique(HPA.normal$Tissue) 
  }
  if (level == "level") {
    level <- unique(HPA.normal$Level)
  }
  if (reliability == "reliability") {
    reliability <- unique(HPA.normal$Reliability)
  }
  res.imm <- subset(HPA.normal, Tissue%in%tissue & Level%in%level & Reliability%in%reliability)
  return(res.imm)
}

    
    
select_HPARNAseq<-function(hpa_ref, sample) {
  HPA.rnaTissue = read.table(hpa_ref,header=TRUE,sep="\t",stringsAsFactors = FALSE)
  res.rna <- subset(HPA.rnaTissue, Sample%in%sample, select = -c(Unit))
  colnames(res.rna)[which(colnames(res.rna) == 'Value')] <- 'Value (TPM unit)'
  return(res.rna)
}

main <- function() {
  args <- commandArgs(TRUE)
  if(length(args)<1) {
    args <- c("--help")
  }
  
  # Help section
  if("--help" %in% args) {
    cat("Selection and Annotation HPA
    Arguments:
        --data_source: immuno/rnaseq
        --hpe_ref: path to reference file normal_tissue.tsv/rna_tissue.tsv)
          if immuno:
            --tissue: list of tissues
            --level: Not detected, Low, Medium, High
            --reliability: Supported, Approved, Enhanced, Uncertain
          if rnaseq:
            --sample: Sample tissues 
        --output: output filename \n")
    q(save="no")
  }
  
  # Parse arguments
  parseArgs <- function(x) strsplit(sub("^--", "", x), "=")
  argsDF <- as.data.frame(do.call("rbind", parseArgs(args)))
  args <- as.list(as.character(argsDF$V2))
  names(args) <- argsDF$V1

  # Extract options
  data_source = args$data_source
  hpa_ref = args$hpa_ref
  if (data_source == "immuno") {
    tissue = strsplit(args$tissue, ",")[[1]]
    level = strsplit(args$level, ",")[[1]]
    reliability = strsplit(args$reliability, ",")[[1]]
    # Calculation
    res = select_HPAimmunohisto(hpa_ref, tissue, level, reliability)
  }
  else if (data_source == "rnaseq") {
    sample = strsplit(args$sample, ",")[[1]]
    # Calculation
    res = select_HPARNAseq(hpa_ref, sample)
  }

  # Write output
  output = args$output
  write.table(res, output, sep = "\t", quote = FALSE, row.names = FALSE)
}

main()