Skip to content

Commit 47c4442

Browse files
committed
Add linclust2 and cluster2 regression
1 parent 3e2ca8c commit 47c4442

File tree

4 files changed

+42
-0
lines changed

4 files changed

+42
-0
lines changed

regression/run_cluster2.sh

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,14 @@
1+
#!/bin/sh
# Regression test for the cascaded `cluster` workflow using the version-2
# code paths (--linclust-version 2 --cluster-version 2).
#
# Required environment (read here, never assigned):
#   MMSEQS   command used to run createdb / cluster / createtsv
#   DATADIR  directory that contains clu.fasta
#   RESULTS  output prefix: intermediate files are written below "$RESULTS/",
#            the verdict is written to "${RESULTS}.report"
#
# Output: "${RESULTS}.report" whose first line is GOOD when the number of
# clusters equals TARGET and BAD otherwise, followed by both values.

# Options are set here instead of on the shebang line so they also apply when
# the script is started as `sh run_cluster2.sh`. -u makes an unset
# MMSEQS/DATADIR/RESULTS an immediate error instead of letting it expand to
# an empty string (which would turn "$RESULTS/clu" into "/clu").
set -eu

CLUDB="${RESULTS}/clu"
"${MMSEQS}" createdb "${DATADIR}/clu.fasta" "${CLUDB}" --shuffle 0

"${MMSEQS}" cluster "${CLUDB}" "$RESULTS/results_clu" "$RESULTS/tmp" --min-seq-id 0.3 -s 2 --cluster-steps 3 --linclust-version 2 --cluster-version 2
"${MMSEQS}" createtsv "${CLUDB}" "${CLUDB}" "$RESULTS/results_clu" "$RESULTS/results_cluster.tsv"

# Summarise the TSV as "<clusters>\t<rows>\t<rows per cluster>".
# A new cluster is counted every time column 1 differs from the previous row.
# The counters are initialised and the division is guarded so that an empty
# TSV yields "0\t0\t0" (reported as BAD below) instead of a fatal awk
# division-by-zero that would abort the script before any report is written.
awk '
    BEGIN { l = ""; cnt = 0; t = 0 }
    l != $1 { l = $1; cnt++ }
    { t++ }
    END {
        avg = (cnt > 0) ? t / cnt : 0
        print cnt "\t" t "\t" avg
    }
' "$RESULTS/results_cluster.tsv" > "$RESULTS/results_summary.tsv"

# Column 1 of the summary is the observed number of clusters.
ACTUAL="$(cut -f1 "$RESULTS/results_summary.tsv")"
TARGET="13620"
awk -v actual="$ACTUAL" -v target="$TARGET" \
    'BEGIN { print (actual == target) ? "GOOD" : "BAD"; print "Expected: ", target; print "Actual: ", actual; }' \
    > "${RESULTS}.report"

regression/run_linclust2.sh

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
#!/bin/sh
# Regression test for `linclust` using the version-2 code path
# (--linclust-version 2).
#
# Required environment (read here, never assigned):
#   MMSEQS   command used to run createdb / linclust / createtsv
#   DATADIR  directory that contains clu.fasta
#   RESULTS  output prefix: intermediate files are written below "$RESULTS/",
#            the verdict is written to "${RESULTS}.report"
#
# Output: "${RESULTS}.report" whose first line is GOOD when the number of
# clusters equals TARGET and BAD otherwise, followed by both values.

# Options are set here instead of on the shebang line so they also apply when
# the script is started as `sh run_linclust2.sh`. -u makes an unset
# MMSEQS/DATADIR/RESULTS an immediate error instead of letting it expand to
# an empty string (which would turn "$RESULTS/clu" into "/clu").
set -eu

# Sequence database path. Previously this variable was assigned an empty
# value and never used while the path was spelled out three times; it now
# holds the path and is used by every step.
CLUDB="${RESULTS}/clu"
"${MMSEQS}" createdb "${DATADIR}/clu.fasta" "${CLUDB}"

"${MMSEQS}" linclust "${CLUDB}" "$RESULTS/results_clu" "$RESULTS/tmp" --cov-mode 1 --cluster-mode 0 -c 0.90 --min-seq-id 0.50 --linclust-version 2
"${MMSEQS}" createtsv "${CLUDB}" "${CLUDB}" "$RESULTS/results_clu" "$RESULTS/results_cluster.tsv"

# Summarise the TSV as "<clusters>\t<rows>\t<rows per cluster>".
# A new cluster is counted every time column 1 differs from the previous row.
# The counters are initialised and the division is guarded so that an empty
# TSV yields "0\t0\t0" (reported as BAD below) instead of a fatal awk
# division-by-zero that would abort the script before any report is written.
awk '
    BEGIN { l = ""; cnt = 0; t = 0 }
    l != $1 { l = $1; cnt++ }
    { t++ }
    END {
        avg = (cnt > 0) ? t / cnt : 0
        print cnt "\t" t "\t" avg
    }
' "$RESULTS/results_cluster.tsv" > "$RESULTS/results_summary.tsv"

# Column 1 of the summary is the observed number of clusters.
ACTUAL="$(cut -f1 "$RESULTS/results_summary.tsv")"
TARGET="27153"
awk -v actual="$ACTUAL" -v target="$TARGET" \
    'BEGIN { print (actual == target) ? "GOOD" : "BAD"; print "Expected: ", target; print "Actual: ", actual; }' \
    > "${RESULTS}.report"

regression/run_linclust2_split.sh

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,12 @@
1+
#!/bin/sh
# Regression test for `linclust` using the version-2 code path
# (--linclust-version 2) with --split-memory-limit 10M. TARGET is the same
# cluster count that run_linclust2.sh expects without the memory limit.
#
# Required environment (read here, never assigned):
#   MMSEQS   command used to run createdb / linclust / createtsv
#   DATADIR  directory that contains clu.fasta
#   RESULTS  output prefix: intermediate files are written below "$RESULTS/",
#            the verdict is written to "${RESULTS}.report"
#
# Output: "${RESULTS}.report" whose first line is GOOD when the number of
# clusters equals TARGET and BAD otherwise, followed by both values.

# Options are set here instead of on the shebang line so they also apply when
# the script is started as `sh run_linclust2_split.sh`. -u makes an unset
# MMSEQS/DATADIR/RESULTS an immediate error instead of letting it expand to
# an empty string (which would turn "$RESULTS/clu" into "/clu").
set -eu

# Sequence database path, named once instead of being repeated per step.
CLUDB="${RESULTS}/clu"
"${MMSEQS}" createdb "${DATADIR}/clu.fasta" "${CLUDB}"

"${MMSEQS}" linclust "${CLUDB}" "$RESULTS/results_clu" "$RESULTS/tmp" --cov-mode 1 --cluster-mode 0 -c 0.90 --min-seq-id 0.50 --split-memory-limit 10M --linclust-version 2
"${MMSEQS}" createtsv "${CLUDB}" "${CLUDB}" "$RESULTS/results_clu" "$RESULTS/results_cluster.tsv"

# Summarise the TSV as "<clusters>\t<rows>\t<rows per cluster>".
# A new cluster is counted every time column 1 differs from the previous row.
# The counters are initialised and the division is guarded so that an empty
# TSV yields "0\t0\t0" (reported as BAD below) instead of a fatal awk
# division-by-zero that would abort the script before any report is written.
awk '
    BEGIN { l = ""; cnt = 0; t = 0 }
    l != $1 { l = $1; cnt++ }
    { t++ }
    END {
        avg = (cnt > 0) ? t / cnt : 0
        print cnt "\t" t "\t" avg
    }
' "$RESULTS/results_cluster.tsv" > "$RESULTS/results_summary.tsv"

# Column 1 of the summary is the observed number of clusters.
ACTUAL="$(cut -f1 "$RESULTS/results_summary.tsv")"
TARGET="27153"
awk -v actual="$ACTUAL" -v target="$TARGET" \
    'BEGIN { print (actual == target) ? "GOOD" : "BAD"; print "Expected: ", target; print "Actual: ", actual; }' \
    > "${RESULTS}.report"

run_regression.sh

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -74,11 +74,14 @@ run_test NUCLPROT_SEARCH "run_nuclprot.sh"
7474
# Test registrations: each run_test call pairs a test label with a script
# file name. run_test is defined outside this hunk — presumably it runs the
# named script and collects its report; confirm against its definition.
run_test NUCLNUCL_SEARCH "run_nuclnucl.sh"
7575
run_test NUCLNUCL_TRANS_SEARCH "run_nuclnucl_translated.sh"
7676
run_test CLUSTER "run_cluster.sh"
77+
# run_cluster2.sh runs `cluster` with --linclust-version 2 --cluster-version 2.
run_test CLUSTER2 "run_cluster2.sh"
7778
run_test EASY_CLUSTER "run_easy_cluster.sh"
7879
run_test EASY_NUCL_CLUSTER "run_easy_nuclcluster.sh"
7980
run_test CLUSTER_REASSIGN "run_easy_cluster_reassign.sh"
8081
run_test LINCLUST "run_linclust.sh"
82+
# run_linclust2.sh runs `linclust` with --linclust-version 2.
run_test LINCLUST2 "run_linclust2.sh"
8183
run_test LINCLUST_SPLIT "run_linclust_split.sh"
84+
# run_linclust2_split.sh is the LINCLUST2 invocation plus --split-memory-limit 10M.
run_test LINCLUST2_SPLIT "run_linclust2_split.sh"
8285
run_test EASY_LINCLUST "run_easy_linclust.sh"
8386
run_test CLUSTHASH "run_clusthash.sh"
8487
run_test PROTNUCL_SEARCH "run_protnucl.sh"

0 commit comments

Comments
 (0)