Compare commits

...

2 Commits

Author SHA1 Message Date
d2e45bc00f
Change output format to FASTA 2021-03-02 20:08:14 +01:00
deb1066982
Set CuReSim read size to 350 bases 2021-03-02 20:07:05 +01:00
3 changed files with 12 additions and 11 deletions

2
.gitignore vendored
View File

@@ -1,2 +1,2 @@
*.txt *.txt
*.fastq *.fasta

View File

@@ -11,9 +11,11 @@ fi
sequences=$1 sequences=$1
sequencing_runs=$2 sequencing_runs=$2
read_mean_size=350
read_variance_size=0.0
data_directory="data/" data_directory="data/"
file="sequence.fastq" file="sequence.fasta"
prefix="curesim_" prefix="curesim_"
Rscript src/repertoire.r "$sequences" "$sequencing_runs" Rscript src/repertoire.r "$sequences" "$sequencing_runs"
java -jar tools/CuReSim.jar -f "$data_directory$file" -o "$data_directory$prefix$file" java -jar tools/CuReSim.jar -m "$read_mean_size" -sd "$read_variance_size" -f "$data_directory$file" -o "$data_directory$prefix$file"

View File

@@ -1,7 +1,7 @@
library(immuneSIM) library(immuneSIM)
library(Biostrings) library(Biostrings)
generate_repertoires <- function(number_of_sequences) { generate_repertoire <- function(number_of_sequences) {
b_chain <- immuneSIM( b_chain <- immuneSIM(
number_of_seqs = number_of_sequences, number_of_seqs = number_of_sequences,
species = "hs", species = "hs",
@@ -22,9 +22,8 @@ preprocess_data <- function(repertoire, sequencing_runs) {
} }
save_data <- function(repertoire) { save_data <- function(repertoire) {
file_name <- "data/sequence.fastq" file_name <- "data/sequence.fasta"
# TODO Change format to fasta Biostrings::writeXStringSet(repertoire, file_name, format = "fasta")
Biostrings::writeXStringSet(repertoire, file_name, format = "fastq")
} }
parse_cli_arguments <- function(args) { parse_cli_arguments <- function(args) {
@@ -35,9 +34,9 @@ parse_cli_arguments <- function(args) {
} }
args <- commandArgs(trailingOnly = TRUE) args <- commandArgs(trailingOnly = TRUE)
parameters <- parse_cli_arguments(args) arguments <- parse_cli_arguments(args)
number_of_sequences <- as.integer(parameters[1]) number_of_sequences <- as.integer(arguments[1])
sequencing_runs <- as.integer(parameters[2]) sequencing_runs <- as.integer(arguments[2])
repertoire <- generate_repertoires(number_of_sequences) repertoire <- generate_repertoire(number_of_sequences)
processed_data <- preprocess_data(repertoire, sequencing_runs) processed_data <- preprocess_data(repertoire, sequencing_runs)
save_data(processed_data) save_data(processed_data)