@@ -157,28 +157,6 @@ def _prepare_seq(
157157 seq = cut_transcript_seq (seq , tag )
158158 return seq
159159
160- # def extract(self, intervals: List[Interval], **kwargs) -> str:
161- # """
162- # Extract and concatenate the sequence for a list of intervals
163- # :param intervals: list of intervals
164- # :param kwargs: will be passed on to `_prepare_seq()`
165- # :return: concatenated dna sequence of the intervals
166- # """
167- # seqs = [self.extractor.extract(i) for i in intervals]
168- #
169- # reverse_strand = False
170- # if self.use_strand:
171- # reverse_strand = intervals[0].neg_strand
172- # if self.extractor.use_strand:
173- # # If the fasta extractor already does the reversion, we do not have to do it manually.
174- # # Instead, we need to reverse the list of sequences.
175- # seqs.reverse()
176- # reverse_strand = False
177- #
178- # tag = intervals[0].attrs["tag"]
179- #
180- # return self._prepare_seq(seqs, reverse_strand, tag=tag, **kwargs)
181-
182160 def get_protein_seq (self , transcript_id : str ):
183161 """
184162 Extract amino acid sequence for given transcript_id
@@ -268,24 +246,6 @@ def _prepare_seq(cls, *args, **kwargs):
268246 """
269247 return translate (super ()._prepare_seq (* args , ** kwargs ), hg38 = True )
270248
271- # def extract(
272- # self,
273- # intervals: List[Interval],
274- # sample_id: List[str] = None,
275- # **kwargs
276- # ):
277- # reverse_complement = intervals[0].neg_strand
278- # tag = intervals[0].attrs["tag"]
279- # # remove strand information
280- # intervals = [i.unstrand() for i in intervals]
281- #
282- # variant_interval_queryable = self.multi_sample_VCF.query_variants(intervals, sample_id=sample_id)
283- #
284- # iter_seqs = self.extract_query(variant_interval_queryable, sample_id=sample_id)
285- # for seqs, variant_info in iter_seqs:
286- # # 1st seq, 2nd variant info
287- # yield ProteinSeqExtractor._prepare_seq(seqs, reverse_complement, tag=tag), variant_info
288-
289249 def _filter_snv (self , variants ):
290250 for variant in variants :
291251 if len (variant .ref ) == len (variant .alt ) == 1 : # only SOVs supported
@@ -300,45 +260,6 @@ def _filter_snv(self, variants):
300260
301261class SingleSeqProteinVCFSeqExtractor (SingleSeqExtractorMixin , ProteinVCFSeqExtractor ):
302262 pass
303- # def extract_query(
304- # self,
305- # variant_interval_queryable,
306- # ref_seqs,
307- # reverse_complement,
308- # sample_id=None
309- # ):
310- # """
311- # Iterate through all intervals and extract dna sequence with all variants inserted into it
312- # :return: dna sequence with all variants. If no variants match, will return the reference sequence.
313- # """
314- # """
315- # Iterate through all intervals and extract dna sequence with all
316- # variants inserted into it
317- # :param variant_interval_queryable: Object which contains information
318- # about the variants for current sequence
319- # :param sample_id:
320- # :return: dna sequence with all variants. If no variants match, will return the reference sequence.
321- # """
322- # seqs = []
323- # variants_info = []
324- # for variants, interval in variant_interval_queryable.variant_intervals:
325- # variants = list(self._filter_snv(variants))
326- # if len(variants) > 0:
327- # flag = False
328- # variants_info.extend(variants)
329- # seqs.append(
330- # self.variant_seq_extractor.extract(interval, variants, anchor=0)
331- # )
332- #
333- # alt_seq = "".join(seqs)
334- # variants_info = self._prepare_variants(variants_info)
335- # return (
336- # alt_seq, # the final sequence
337- # variants_info, # dictionary of variants
338- # )
339- #
340- # # cds_seqs = list(self._extract_query(variant_interval_queryable, sample_id=sample_id))
341- # # return cds_seqs
342263
343264
344265class SingleVariantProteinVCFSeqExtractor (SingleVariantExtractorMixin , ProteinVCFSeqExtractor ):
0 commit comments