Move get_permutations from reporting.py to primers.py and make the qpcr --threshold argument required

jonas-fuchs · jonas-fuchs · commit e52f5581aae3 · 2026-01-29T12:12:37.000+01:00
diff --git a/varvamp/command.py b/varvamp/command.py
@@ -46,7 +46,7 @@ def get_args(sysargs):
     QPCR_parser = mode_parser.add_parser(
         "qpcr",
         help="design qPCR primers",
-        usage="varvamp qpcr [optional arguments] <alignment> <output dir>"
+        usage="varvamp qpcr -t [optional arguments] <alignment> <output dir>"
     )
     parser.add_argument(
         "input",
@@ -145,9 +145,8 @@ def get_args(sysargs):
     QPCR_parser.add_argument(
         "-t",
         "--threshold",
-        metavar="0.9",
+        required=True,
         type=float,
-        default=0.9,
         help="consensus threshold (0-1) - higher values result in higher specificity at the expense of found primers"
     )
     QPCR_parser.add_argument(
diff --git a/varvamp/scripts/primers.py b/varvamp/scripts/primers.py
@@ -3,7 +3,7 @@
 """
 
 # BUILTIN
-from itertools import chain
+import itertools
 import re
 import multiprocessing
 
@@ -13,7 +13,7 @@
 import primer3 as p3
 
 # varVAMP
-from varvamp.scripts import config, reporting
+from varvamp.scripts import config
 
 
 def calc_gc(seq):
@@ -476,6 +476,21 @@ def find_best_primers(left_primer_candidates, right_primer_candidates, high_cons
     return all_primers
 
 
+def get_permutations(seq):
+    """
+    expand an ambiguous sequence into all sequences it can
+    represent (one per combination of the per-position options).
+    """
+    # per position: the options listed in config.AMBIG_NUCS for an
+    # ambiguous char, otherwise just the char itself
+    options = [
+        config.AMBIG_NUCS[char] if char in config.AMBIG_NUCS else [char]
+        for char in seq
+    ]
+    # cartesian product over all positions, joined back into strings
+    return [''.join(combo) for combo in itertools.product(*options)]
+
+
 def parse_primer_fasta(fasta_path):
     """
     Parse a primer FASTA file and return a list of sequences using BioPython.
@@ -487,9 +502,9 @@ def parse_primer_fasta(fasta_path):
         seq = str(record.seq).lower()
         # Only include primers up to 40 nucleotides
         if len(seq) <= 40:
-            sequences.append(reporting.get_permutations(seq))
+            sequences.append(get_permutations(seq))
 
-    return list(chain.from_iterable(sequences))
+    return list(itertools.chain.from_iterable(sequences))
 
 
 def check_primer_against_externals(args):
@@ -538,4 +553,4 @@ def filter_non_dimer_candidates(primer_candidates, external_sequences, n_threads
         filtered_results = [result for result in results if result is not None]
         return {name: data for name, data in filtered_results}
     else:
-        return [primer for primer in results if primer is not None]
+        return [primer for primer in results if primer is not None]
diff --git a/varvamp/scripts/qpcr.py b/varvamp/scripts/qpcr.py
@@ -61,8 +61,7 @@ def _process_kmer_batch_probes(args):
     probe_idx = 0
 
     for kmer in kmers:
-        if not primers.filter_kmer_direction_independent(kmer[0], config.QPROBE_TMP, config.QPROBE_GC_RANGE,
-                                                         config.QPROBE_SIZES):
+        if not primers.filter_kmer_direction_independent(kmer[0], config.QPROBE_TMP, config.QPROBE_GC_RANGE, config.QPROBE_SIZES):
             continue
         if ambiguous_ends(ambiguous_consensus[kmer[1]:kmer[2]]):
             continue
@@ -112,6 +111,8 @@ def get_qpcr_probes(kmers, ambiguous_consensus, alignment_cleaned, num_processes
     probe_candidates = {}
     probe_idx = 0
     for batch_probes in results:
+        if batch_probes is None:
+            continue
         for probe_name, probe_data in batch_probes.items():
             # Extract direction from original probe name
             direction = "LEFT" if "LEFT" in probe_name else "RIGHT"
@@ -175,9 +176,9 @@ def dimer_in_combinations(right_primer, left_primer, probe, ambiguous_consensus)
     # for the probe check all permutations and possible overhangs to ensure
     # that none of the primers could cause unspecific probe binding.
     # first get all permutations
-    probe_per = reporting.get_permutations(ambiguous_consensus[probe[1]:probe[2]])
-    left_per = reporting.get_permutations(ambiguous_consensus[left_primer[1]:left_primer[2]])
-    right_per = reporting.get_permutations(ambiguous_consensus[right_primer[1]:right_primer[2]])
+    probe_per = primers.get_permutations(ambiguous_consensus[probe[1]:probe[2]])
+    left_per = primers.get_permutations(ambiguous_consensus[left_primer[1]:left_primer[2]])
+    right_per = primers.get_permutations(ambiguous_consensus[right_primer[1]:right_primer[2]])
     # then check all permutations
     for combination in [(probe_per, left_per), (probe_per, right_per)]:
         for oligo1 in combination[0]:
diff --git a/varvamp/scripts/reporting.py b/varvamp/scripts/reporting.py
@@ -4,7 +4,6 @@
 # BUILT-INS
 import os
 import math
-import itertools
 
 # LIBS
 import pandas as pd
@@ -94,20 +93,6 @@ def write_all_primers(path, scheme_name, all_primers):
             write_primers_to_bed(outfile, scheme_name, primer, all_primers[direction][primer], round(all_primers[direction][primer][3], 2), direction)
 
 
-def get_permutations(seq):
-    """
-    get all permutations of an ambiguous sequence. needed to
-    correctly report the gc and the temperature.
-    """
-    groups = itertools.groupby(seq, lambda char: char not in config.AMBIG_NUCS)
-    splits = []
-    for b, group in groups:
-        if b:
-            splits.extend([[g] for g in group])
-        else:
-            for nuc in group:
-                splits.append(config.AMBIG_NUCS[nuc])
-    return[''.join(p) for p in itertools.product(*splits)]
 
 
 def calc_mean_stats(permutations):
@@ -190,7 +175,7 @@ def write_qpcr_to_files(path, final_schemes, ambiguous_consensus, scheme_name, l
                 else:
                     direction = "+"
 
-                permutations = get_permutations(seq)
+                permutations = primers.get_permutations(seq)
                 gc, temp = calc_mean_stats(permutations)
                 primer_name = f"{amp_name}_{oligo_type}"
 
@@ -295,7 +280,7 @@ def write_scheme_to_files(path, amplicon_scheme, ambiguous_consensus, scheme_nam
                         # write primers to fasta pool file
                         print(f">{primer_name}\n{seq.upper()}", file=primer_fasta)
                         # calc primer parameters for all permutations
-                        permutations = get_permutations(seq)
+                        permutations = primers.get_permutations(seq)
                         gc, temp = calc_mean_stats(permutations)
                         # write tsv file
                         print(