Skip to content

Commit 6d61210

Browse files
defunktcaenrigen
authored and committed
Fix max_seqlets_subsample bug
Mirror the fix in: jmschrei/tfmodisco-lite#60
1 parent 2cb3294 commit 6d61210

File tree

3 files changed

+5
-6
lines changed

3 files changed

+5
-6
lines changed

examples/MergeMotifsAcrossRuns.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -628,7 +628,7 @@
628628
"min_num = 30 # also called min_num_to_trim_to\n",
629629
"flank_to_add = 5 # also called initial_flank_to_add\n",
630630
"window_size = 20 # also called trim_to_window_size\n",
631-
"max_seqlets_subsample = 300 # also called merging_max_seqlets_subsample\n",
631+
"max_seqlets_subsample = 1000 # also called merging_max_seqlets_subsample\n",
632632
"\n",
633633
"pattern_group = 'pos_patterns' #pos_patterns or neg_patterns\n",
634634
"\n",

modiscolite/aggregator.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -186,7 +186,7 @@ def _detect_spurious_merging(patterns, track_set, perplexity,
186186
prob_and_pertrack_sim_merge_thresholds=prob_and_pertrack_sim_merge_thresholds,
187187
prob_and_pertrack_sim_dealbreaker_thresholds=prob_and_pertrack_sim_dealbreaker_thresholds,
188188
min_frac=min_frac, min_num=min_num, flank_to_add=flank_to_add, window_size=window_size,
189-
bg_freq=bg_freq, max_seqlets_subsample=1000)
189+
bg_freq=bg_freq, max_seqlets_subsample=max_seqlets_subsample)
190190

191191
to_return.extend(refined_subpatterns[0])
192192
else:
@@ -197,7 +197,7 @@ def _detect_spurious_merging(patterns, track_set, perplexity,
197197
prob_and_pertrack_sim_merge_thresholds=prob_and_pertrack_sim_merge_thresholds,
198198
prob_and_pertrack_sim_dealbreaker_thresholds=prob_and_pertrack_sim_dealbreaker_thresholds,
199199
min_frac=min_frac, min_num=min_num, flank_to_add=flank_to_add, window_size=window_size,
200-
bg_freq=bg_freq, max_seqlets_subsample=1000)
200+
bg_freq=bg_freq, max_seqlets_subsample=max_seqlets_subsample)
201201

202202
def SimilarPatternsCollapser(patterns, track_set,
203203
min_overlap, prob_and_pertrack_sim_merge_thresholds,

modiscolite/tfmodisco.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,6 @@
77
import scipy
88
import scipy.sparse
99

10-
from collections import OrderedDict
1110
from collections import defaultdict
1211

1312
from . import affinitymat
@@ -161,7 +160,7 @@ def seqlets_to_patterns(seqlets, track_set, track_signs=None,
161160
final_flank_to_add=0,
162161
prob_and_pertrack_sim_merge_thresholds=[(0.8,0.8), (0.5, 0.85), (0.2, 0.9)],
163162
prob_and_pertrack_sim_dealbreaker_thresholds=[(0.4, 0.75), (0.2,0.8), (0.1, 0.85), (0.0,0.9)],
164-
subcluster_perplexity=50, merging_max_seqlets_subsample=300,
163+
subcluster_perplexity=50, merging_max_seqlets_subsample=1000,
165164
final_min_cluster_size=20,min_ic_in_window=0.6, min_ic_windowsize=6,
166165
ppm_pseudocount=0.001):
167166

@@ -275,7 +274,7 @@ def TFMoDISco(one_hot, hypothetical_contribs, sliding_window_size=21,
275274
initial_flank_to_add=10, final_flank_to_add=0,
276275
prob_and_pertrack_sim_merge_thresholds=[(0.8,0.8), (0.5, 0.85), (0.2, 0.9)],
277276
prob_and_pertrack_sim_dealbreaker_thresholds=[(0.4, 0.75), (0.2,0.8), (0.1, 0.85), (0.0,0.9)],
278-
subcluster_perplexity=50, merging_max_seqlets_subsample=300,
277+
subcluster_perplexity=50, merging_max_seqlets_subsample=1000,
279278
final_min_cluster_size=20, min_ic_in_window=0.6, min_ic_windowsize=6,
280279
ppm_pseudocount=0.001, verbose=False):
281280

0 commit comments

Comments
 (0)