diff --git a/pvacseq/lib/pipeline.py b/pvacseq/lib/pipeline.py index 4c562fe..6a2b4ee 100644 --- a/pvacseq/lib/pipeline.py +++ b/pvacseq/lib/pipeline.py @@ -154,8 +154,10 @@ def split_tsv_file(self, total_row_count): def generate_fasta(self): pass - def split_fasta_basename(self): - return os.path.join(self.tmp_dir, self.sample_name + "_" + str(self.peptide_sequence_length) + ".fa.split") + def split_fasta_file_path(self, split_start, split_end): + basename = os.path.join(self.tmp_dir, self.sample_name + "_" + str(self.peptide_sequence_length) + ".fa.split") + fasta_chunk = "%d-%d" % (split_start*2-1, split_end*2) + return "%s_%s" % (basename, fasta_chunk) @abstractmethod def call_iedb_and_parse_outputs(self, chunks): @@ -312,7 +314,7 @@ def generate_fasta(self, chunks): for (split_start, split_end) in chunks: fasta_chunk = "%d-%d" % (split_start*2-1, split_end*2) split_tsv_file_path = self.split_tsv_file_path(split_start, split_end) - split_fasta_file_path = "%s_%s" % (self.split_fasta_basename(), fasta_chunk) + split_fasta_file_path = self.split_fasta_file_path(split_start, split_end) if os.path.exists(split_fasta_file_path): status_message("Split FASTA file for Entries %s already exists. Skipping." % (fasta_chunk)) continue @@ -336,7 +338,7 @@ def call_iedb_and_parse_outputs(self, chunks): fasta_chunk = "%d-%d" % (split_start*2-1, split_end*2) for a in self.alleles: for epl in self.epitope_lengths: - split_fasta_file_path = "%s_%s"%(self.split_fasta_basename(), fasta_chunk) + split_fasta_file_path = self.split_fasta_file_path(split_start, split_end) split_iedb_output_files = [] status_message("Processing entries for Allele %s and Epitope Length %s - Entries %s" % (a, epl, fasta_chunk)) for method in self.prediction_algorithms: @@ -404,7 +406,7 @@ def generate_fasta(self, chunks): for (split_start, split_end) in chunks: fasta_chunk = "%d-%d" % (split_start*2-1, split_end*2) split_tsv_file_path = self.split_tsv_file_path(split_start, split_end) - split_fasta_file_path = "%s_%s" % (self.split_fasta_basename(), fasta_chunk) + split_fasta_file_path = self.split_fasta_file_path(split_start, split_end) if os.path.exists(split_fasta_file_path): status_message("Split FASTA file for Entries %s already exists. Skipping." % (fasta_chunk)) continue @@ -427,7 +429,7 @@ def call_iedb_and_parse_outputs(self, chunks): for (split_start, split_end) in chunks: fasta_chunk = "%d-%d" % (split_start*2-1, split_end*2) for a in self.alleles: - split_fasta_file_path = "%s_%s"%(self.split_fasta_basename(), fasta_chunk) + split_fasta_file_path = self.split_fasta_file_path(split_start, split_end) split_iedb_output_files = [] status_message("Processing entries for Allele %s - Entries %s" % (a, fasta_chunk)) for method in self.prediction_algorithms: