From 85178ec6baba442caef061c19a052e6c265cc2d0 Mon Sep 17 00:00:00 2001 From: Dominik Brilhaus <dominik.brilhaus@hhu.de> Date: Tue, 9 Aug 2022 10:39:36 +0200 Subject: [PATCH] there must be a better way for that arcRoot --- runs/merged_isa_metadata/README.md | 24 ++++++++++++++++++- .../merge_isa_metadata.yml | 2 -- .../merge_isa_metadata_rooted.yml | 8 +++++++ workflows/merge_isa_metadata.R | 17 ++++++------- 4 files changed, 38 insertions(+), 13 deletions(-) create mode 100644 runs/merged_isa_metadata/merge_isa_metadata_rooted.yml diff --git a/runs/merged_isa_metadata/README.md b/runs/merged_isa_metadata/README.md index ceeaf9b..9319c2e 100644 --- a/runs/merged_isa_metadata/README.md +++ b/runs/merged_isa_metadata/README.md @@ -1,4 +1,26 @@ +# cwltool README +## First cd into the (runs) folder, with the .yml file -cwltool ../../workflows/merge_isa_metadata.cwl merge_isa_metadata.yml \ No newline at end of file +cd /Users/dominikbrilhaus/03_DataPLANT_gitlab/samplearc_rnaseq/runs/merged_isa_metadata + +## Let it flow + +```bash + +### store arc root (two levels up from here) as variable +arc_root=$(echo ${PWD%/*/*}) + +# arc_root=/Users/dominikbrilhaus/03_DataPLANT_gitlab/samplearc_rnaseq/ + +### write a temporary yml +cat merge_isa_metadata.yml > merge_isa_metadata_rooted.yml + +### add the arc root to that yml +printf "\narc_root: $arc_root\n" >> merge_isa_metadata_rooted.yml + +### run with cwltool +cwltool ../../workflows/merge_isa_metadata.cwl merge_isa_metadata_rooted.yml + +``` diff --git a/runs/merged_isa_metadata/merge_isa_metadata.yml b/runs/merged_isa_metadata/merge_isa_metadata.yml index 0a2a9fd..450d89f 100644 --- a/runs/merged_isa_metadata/merge_isa_metadata.yml +++ b/runs/merged_isa_metadata/merge_isa_metadata.yml @@ -2,8 +2,6 @@ cores: 1 r_script: class: File path: ../../workflows/merge_isa_metadata.R -# arc_root: ../ -arc_root: /Users/dominikbrilhaus/03_DataPLANT_gitlab/samplearc_rnaseq/ in_isa_study: studies/TalinumFacultativeCAM/isa.study.xlsx:plant_growth in_isa_assay: assays/Talinum_RNASeq_minimal/isa.assay.xlsx:2EXT01_RNA:3ASY01_RNASeq out_folder: runs/merged_isa_metadata \ No newline at end of file diff --git a/runs/merged_isa_metadata/merge_isa_metadata_rooted.yml b/runs/merged_isa_metadata/merge_isa_metadata_rooted.yml new file mode 100644 index 0000000..2f282e0 --- /dev/null +++ b/runs/merged_isa_metadata/merge_isa_metadata_rooted.yml @@ -0,0 +1,8 @@ +cores: 1 +r_script: + class: File + path: ../../workflows/merge_isa_metadata.R +in_isa_study: studies/TalinumFacultativeCAM/isa.study.xlsx:plant_growth +in_isa_assay: assays/Talinum_RNASeq_minimal/isa.assay.xlsx:2EXT01_RNA:3ASY01_RNASeq +out_folder: runs/merged_isa_metadata +arc_root: /Users/dominikbrilhaus/03_DataPLANT_gitlab/samplearc_rnaseq diff --git a/workflows/merge_isa_metadata.R b/workflows/merge_isa_metadata.R index c629683..50746cd 100644 --- a/workflows/merge_isa_metadata.R +++ b/workflows/merge_isa_metadata.R @@ -26,8 +26,6 @@ in_isa_study <- args[2] in_isa_assay <- args[3] out_folder <- args[4] -# setwd(arc_root) - ################################################ #### Read metadata from isa excel workbooks ################################################ @@ -36,12 +34,12 @@ isa_study <- unlist(strsplit(paste(arc_root, in_isa_study, sep = "/"), split = " isa_assay <- unlist(strsplit(paste(arc_root, in_isa_assay, sep = "/"), split = ":")) isa_sheets <- list() -for(i in 2:length(isa_study)) +for (i in 2:length(isa_study)) { isa_sheets[[length(isa_sheets) + 1]] <- readWorkbook(isa_study[1], isa_study[i], startRow = 1) } -for(i in 2:length(isa_assay)) +for (i in 2:length(isa_assay)) { isa_sheets[[length(isa_sheets) + 1]] <- readWorkbook(isa_assay[1], isa_assay[i], startRow = 1) } @@ -52,20 +50,19 @@ for(i in 2:length(isa_assay)) isa_merged <- isa_sheets[[1]] -for(j in 2:length(isa_sheets)) +for (j in 2:length(isa_sheets)) # for(j in 2) { isa_merged <- merge(isa_merged, - isa_sheets[[j]], - by.x = "Sample.Name", - by.y = "Source.Name", + isa_sheets[[j]], + by.x = "Sample.Name", + by.y = "Source.Name", ) # Rename duplicated Sample.Name column colnames(isa_merged)[which(colnames(isa_merged) == "Sample.Name")] <- paste("Sample.Name", j, sep = ".") colnames(isa_merged)[which(colnames(isa_merged) == "Sample.Name.y")] <- "Sample.Name" - } @@ -87,4 +84,4 @@ dir.create(paste(arc_root, out_folder, sep = "/"), recursive = T, showWarnings = #### Write table to file ################################################ -write.table(isa_merged, file = paste(arc_root, out_folder, "merged_isa.tsv", sep = "/"), sep = "\t") \ No newline at end of file +write.table(isa_merged, file = paste(arc_root, out_folder, "merged_isa.tsv", sep = "/"), sep = "\t") -- GitLab