From 643960967a3468165c68998bf13eebbdfcd3456a Mon Sep 17 00:00:00 2001 From: coolneng Date: Mon, 29 Mar 2021 20:30:16 +0200 Subject: [PATCH] Remove redundant sequencing runs argument --- generation.sh | 2 +- src/repertoire.r | 32 +++++++++----------------------- 2 files changed, 10 insertions(+), 24 deletions(-) diff --git a/generation.sh b/generation.sh index 9853ac2..b1aa319 100755 --- a/generation.sh +++ b/generation.sh @@ -20,5 +20,5 @@ filename="sequence" prefix="curesim_" Rscript src/repertoire.r "$sequences" "$sequencing_runs" -java -jar tools/CuReSim.jar -m "$read_mean_size" -sd "$read_variance_size" -f "$data_directory$filename$fasta" -o "$data_directory$prefix$filename$fastq" +java -jar tools/CuReSim.jar -n "$sequencing_runs" -m "$read_mean_size" -sd "$read_variance_size" -f "$data_directory$filename$fasta" -o "$data_directory$prefix$filename$fastq" rm "$data_directory/log.txt" diff --git a/src/repertoire.r b/src/repertoire.r index dcf2909..7a1273e 100644 --- a/src/repertoire.r +++ b/src/repertoire.r @@ -10,15 +10,6 @@ generate_repertoire <- function(number_of_sequences) { )) } -amplify_rows <- function(data, column, factor) { - if (column == "sequence") { - dna_string <- Biostrings::DNAStringSet(data) - reverse_complement <- Biostrings::reverseComplement(dna_string) - return(rep(reverse_complement, factor)) - } - return(rep(data, factor)) -} - save_data <- function(data) { Biostrings::writeXStringSet(data$sequence, "data/sequence.fasta") vdj_sequences <- data[-1] @@ -31,23 +22,18 @@ process_data <- function(repertoire, sequencing_runs) { "d_sequence_alignment", "j_sequence_alignment" ) data <- repertoire[, columns] - amplified_data <- mapply(data, names(data), - sequencing_runs, - FUN = amplify_rows - ) - save_data(amplified_data) + data$sequence <- Biostrings::reverseComplement(data$sequence) + save_data(data) } -parse_cli_arguments <- function(args) { - if (length(args) != 2) { - stop("usage: repertoire.r ") +parse_cli_arguments <- function() { + args <- commandArgs(trailingOnly = TRUE) + if (length(args) != 1) { + stop("usage: repertoire.r ") } - return(c(args[1], args[2])) + return(args[1]) } -args <- commandArgs(trailingOnly = TRUE) -arguments <- parse_cli_arguments(args) -number_of_sequences <- as.integer(arguments[1]) -sequencing_runs <- as.integer(arguments[2]) -repertoire <- generate_repertoire(number_of_sequences) +arguments <- parse_cli_arguments(commandArgs(trailing)) +repertoire <- generate_repertoire(number_of_sequences = arguments[1]) process_data(repertoire, sequencing_runs) \ No newline at end of file