Implement HVR sequence alignment
This commit is contained in:
parent
3a10380d8c
commit
c5f28ea3bf
|
@ -5,7 +5,8 @@ construct_dataframe <- function(data) {
|
|||
vdj_string_set <- lapply(data, FUN = Biostrings::DNAStringSet)
|
||||
vdj_dataframe <- as.data.frame(vdj_string_set)
|
||||
vdj_dataframe$hvr_region <- paste(vdj_dataframe$v_sequence,
|
||||
vdj_dataframe$d_sequence, vdj_dataframe$j_sequence,
|
||||
vdj_dataframe$d_sequence,
|
||||
vdj_dataframe$j_sequence,
|
||||
sep = ""
|
||||
)
|
||||
return(vdj_dataframe)
|
||||
|
@ -18,11 +19,27 @@ parse_data <- function(files) {
|
|||
vdj_dataframe <- construct_dataframe(vdj_alignment)
|
||||
return(list(sequences, vdj_dataframe))
|
||||
}
|
||||
|
||||
#' Align a single sequence against a single VDJ segment
#'
#' Thin wrapper around `Biostrings::pairwiseAlignment()` that fixes the
#' alignment type to "global-local" and the gap-opening penalty to 1.
#'
#' @param sequence Forwarded as the `pattern` argument.
#' @param vdj_segment Forwarded as the `subject` argument.
#' @return The value produced by `Biostrings::pairwiseAlignment()` for
#'   this pattern/subject pair.
align_sequence <- function(sequence, vdj_segment) {
  alignment <- Biostrings::pairwiseAlignment(
    pattern = sequence,
    subject = vdj_segment,
    gapOpening = 1,
    type = "global-local"
  )
  alignment
}
|
||||
|
||||
align_sequences <- function(sequences, vdj_segments) {
|
||||
|
||||
#' Align every sequence against its paired HVR region in parallel
#'
#' Walks `sequences` and `vdj_segments$hvr_region` element-wise and calls
#' `align_sequence()` on each pair through `parallel::mcmapply()`.
#'
#' @param sequences Sequences to align; iterated one element at a time.
#' @param vdj_segments Object exposing an `hvr_region` element whose entries
#'   are paired with `sequences` (inputs of unequal length are recycled, as
#'   with `mapply()`).
#' @param cores Number of worker processes passed to `mc.cores`. Defaults to
#'   4, the value that was previously hard-coded. Use 1 on Windows, where
#'   forking (and therefore `mc.cores > 1`) is not supported.
#' @return The value of `parallel::mcmapply()`: one `align_sequence()` result
#'   per pair, simplified with the default `SIMPLIFY` rules.
perform_alignment <- function(sequences, vdj_segments, cores = 4L) {
  # Namespace-qualified so the call works without a prior library(parallel).
  parallel::mcmapply(
    FUN = align_sequence,
    sequences,
    vdj_segments$hvr_region,
    mc.cores = cores
  )
}
|
||||
|
||||
# Script entry point: parse the inputs, align the sequences, print the result.
input_files <- c("data/curesim_sequence.fastq", "data/vdj_alignment.csv")

# parse_data() returns list(sequences, vdj_dataframe); parse once and reuse
# the result instead of reading both files a second time.
data <- parse_data(input_files)

alignment <- perform_alignment(sequences = data[[1]], vdj_segments = data[[2]])
print(alignment)
|
Loading…
Reference in New Issue