Skip to content

Commit 1b9a49e

Browse files
committed
Merge branch 'mosaic'
2 parents ee21ae4 + 8c21a78 commit 1b9a49e

32 files changed

+5515
-1500
lines changed

.gitignore

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# log file
2-
*.log
2+
*log
33
TODO.md
44
# Prerequisites
55
*.d
@@ -60,6 +60,7 @@ Mkfile.old
6060
dkms.conf
6161

6262
# vscode
63+
.lintr
6364
.vscode
6465

6566
# gprof

.lintr

Lines changed: 0 additions & 2 deletions
This file was deleted.

Makefile

Lines changed: 22 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -4,13 +4,15 @@ UNAME_S := $(shell uname -s)
44

55
# add -fno-tree-vectorize to avoid certain vectorization errors in O3 optimization
66
# right now, we are using -O3 for the best performance, and no vectorization errors were found
7-
EXTRA_FLAGS = -Wall -Wno-unused-function -Wno-misleading-indentation -Wno-unused-variable
8-
9-
# Get the Git commit hash
10-
GIT_COMMIT := $(shell git rev-parse --short HEAD)
7+
EXTRA_FLAGS = -Wall -Wno-unused-function -Wno-misleading-indentation -Wno-unused-variable -Wno-alloc-size-larger-than
118

129
# Define the version number
13-
VERSION = 0.0.4-$(GIT_COMMIT)
10+
LONGCALLD_VERSION =0.0.5
11+
# Get the Git commit hash
12+
GIT_COMMIT := $(shell git rev-parse --short HEAD 2> /dev/null)
13+
ifneq ($(GIT_COMMIT),)
14+
LONGCALLD_VERSION = 0.0.5-$(GIT_COMMIT)
15+
endif
1416

1517
HTSLIB_DIR = ./htslib
1618
HTSLIB = $(HTSLIB_DIR)/libhts.a
@@ -51,22 +53,28 @@ ifneq ($(debug),)
5153
endif
5254

5355
ABPOA_GDB_LIB = ./abPOA/lib/libabpoa_sse41.a
54-
ABPOA_NOR_LIB = ./abPOA/lib/libabpoa.a
56+
ABPOA_NOR_LIB = ./abPOA/lib/libabpoa.a
57+
WFA_GDB_LIB = ./WFA2-lib/lib/libwfa_gdb.a
58+
WFA_NOR_LIB = ./WFA2-lib/lib/libwfa.a
59+
5560
# for gdb
5661
ifneq ($(gdb),)
57-
OPT_FLAGS = -g
62+
OPT_FLAGS = -O0 -g
5863
ABPOA_LIB = $(ABPOA_GDB_LIB)
64+
WFA2_LIB = $(WFA_GDB_LIB)
5965
else
6066
OPT_FLAGS = -O3
6167
ABPOA_LIB = $(ABPOA_NOR_LIB)
68+
WFA2_LIB = $(WFA_NOR_LIB)
6269
endif
6370

64-
CFLAGS = $(OPT_FLAGS) $(EXTRA_FLAGS) -DVERSION=\"$(VERSION)\"
71+
CFLAGS = $(OPT_FLAGS) $(EXTRA_FLAGS) -DLONGCALLD_VERSION=\"$(LONGCALLD_VERSION)\"
6572

6673
# for gprof
6774
ifneq ($(pg),)
68-
PG_FLAG = -pg
69-
CFLAGS += -pg
75+
OPT_FLAGS = -O0
76+
PG_FLAG = -pg
77+
CFLAGS += -pg
7078
endif
7179

7280
ifneq ($(PREFIX),)
@@ -100,18 +108,18 @@ $(HTSLIB): $(HTSLIB_DIR)/configure.ac
100108
cd $(HTSLIB_DIR); autoreconf -i; ./configure; make CC=${CC}
101109

102110
$(ABPOA_GDB_LIB):
103-
cd $(ABPOA_DIR); make clean libabpoa gdb=1 sse41=1
111+
cd $(ABPOA_DIR); make libabpoa gdb=1 sse41=1
104112
$(ABPOA_NOR_LIB):
105-
cd $(ABPOA_DIR); make clean libabpoa
113+
cd $(ABPOA_DIR); make libabpoa
106114

107115
$(ABPOA_ALL): $(ABPOA_LIB)
108116

109117
$(WFA2_LIB):
110-
cd $(WFA2_DIR); make setup lib_wfa
118+
cd $(WFA2_DIR); make setup lib_wfa CC_FLAGS="$(CC_FLAGS) -O3"
111119
$(WFA2_ALL): $(WFA2_LIB)
112120

113121

114-
$(BIN): $(OBJS)
122+
$(BIN): $(OBJS) $(ABPOA_LIB) $(HTSLIB) $(WFA2_LIB)
115123
if [ ! -d $(BIN_DIR) ]; then mkdir $(BIN_DIR); fi
116124
$(CC) $(OBJS) -o $@ $(LIB) $(PG_FLAG)
117125

README.md

Lines changed: 28 additions & 19 deletions
Original file line numberDiff line numberDiff line change
@@ -8,22 +8,31 @@
88
[![License](https://img.shields.io/badge/License-MIT-black.svg)](https://github.com/yangao07/longcallD/blob/main/LICENSE)
99
<!-- [![Published in Bioinformatics](https://img.shields.io/badge/Published%20in-Bioinformatics-blue.svg)](https://dx.doi.org/10.1093/bioinformatics/btaa963) -->
1010
<!-- [![GitHub Issues](https://img.shields.io/github/issues/yangao07/longcallD.svg?label=Issues)](https://github.com/yangao07/longcallD/issues) -->
11-
## Updates (pre-release v0.0.4)
1211

13-
* Use static regions for multi-thread computing
14-
* Extended phase set
15-
* Fixed HP/PS tags in output phased bam
16-
* Fixed a few edge cases
12+
## Updates (pre-release v0.0.5)
13+
14+
* Fix a segmentation fault in ONT mode related to the BAM/SA tag
15+
* Significant speed improvement (fixes a compilation mistake in the last release)
16+
* Add --refine-aln: refine read alignment based on MSA in output BAM/CRAM
17+
* Add -Oz for compressed VCF output
18+
* Add -s/--somatic to output somatic/mosaic variants
19+
* Add --exclude-ctg & --all-ctg; --autosome-XY is now the default
20+
* Add -T/--trans-elem; output TE (transposable/mobile element, Alu/L1/SVA) information for INS/DEL
21+
* Add INFO:TSD;REPNAME in VCF for TE INS/DEL
22+
<!-- * Add INFO:TANDAM in VCF for tandem duplications -->
23+
* Fix handling of lower-case reference bases
24+
* Fix compilation on macOS-x64
25+
1726

1827
## Getting Started
1928
```sh
2029
# Download pre-built executables and test data (recommended)
2130
# Linux-x64
22-
wget https://github.com/yangao07/longcallD/releases/download/v0.0.4/longcallD-v0.0.4_x64-linux.tar.gz
23-
tar -zxvf longcallD-v0.0.4_x64-linux.tar.gz && cd longcallD-v0.0.4_x64-linux
31+
wget https://github.com/yangao07/longcallD/releases/download/v0.0.5/longcallD-v0.0.5_x64-linux.tar.gz
32+
tar -zxvf longcallD-v0.0.5_x64-linux.tar.gz && cd longcallD-v0.0.5_x64-linux
2433
# MacOS-arm64
25-
wget https://github.com/yangao07/longcallD/releases/download/v0.0.4/longcallD-v0.0.4_arm64-macos.tar.gz
26-
tar -zxvf longcallD-v0.0.4_arm64-macos.tar.gz && cd longcallD-v0.0.4_arm64-macos
34+
wget https://github.com/yangao07/longcallD/releases/download/v0.0.5/longcallD-v0.0.5_arm64-macos.tar.gz
35+
tar -zxvf longcallD-v0.0.5_arm64-macos.tar.gz && cd longcallD-v0.0.5_arm64-macos
2736

2837
# PacBio HiFi reads
2938
./longcallD call ./test_data/chr11_2M.fa ./test_data/HG002_chr11_hifi_test.bam --hifi > HG002_hifi_test.vcf
@@ -35,7 +44,7 @@ man ./longcallD.1
3544
``` -->
3645

3746
## Table of Contents
38-
- [Updates (pre-release v0.0.4)](#updates-pre-release-v004)
47+
- [Updates (pre-release v0.0.5)](#updates-pre-release-v005)
3948
- [Getting Started](#getting-started)
4049
- [Table of Contents](#table-of-contents)
4150
- [Introduction](#introduction)
@@ -44,7 +53,7 @@ man ./longcallD.1
4453
- [Bioconda](#bioconda)
4554
- [Build from source](#build-from-source)
4655
- [Usage](#usage)
47-
- [Variant calling with HiFi/Nanopore long reads](#variant-calling-with-hifinanopore-long-reads)
56+
- [Variant calling with PacBio HiFi/Nanopore long reads](#variant-calling-with-pacbio-hifinanopore-long-reads)
4857
- [Region-specific variant calling](#region-specific-variant-calling)
4958
- [Variant calling and output phased long reads](#variant-calling-and-output-phased-long-reads)
5059
- [Variant calling from remote files](#variant-calling-from-remote-files)
@@ -62,13 +71,13 @@ LongcallD phases long reads into haplotypes using SNPs and small indels before c
6271
### Pre-built executables (recommended)
6372
**Linux-x64**
6473
```
65-
wget https://github.com/yangao07/longcallD/releases/download/v0.0.4/longcallD-v0.0.4_x64-linux.tar.gz
66-
tar -zxvf longcallD-v0.0.4_x64-linux.tar.gz
74+
wget https://github.com/yangao07/longcallD/releases/download/v0.0.5/longcallD-v0.0.5_x64-linux.tar.gz
75+
tar -zxvf longcallD-v0.0.5_x64-linux.tar.gz
6776
```
6877
**MacOS-arm64**
6978
```
70-
wget https://github.com/yangao07/longcallD/releases/download/v0.0.4/longcallD-v0.0.4_arm64-macos.tar.gz
71-
tar -zxvf longcallD-v0.0.4_arm64-macos.tar.gz
79+
wget https://github.com/yangao07/longcallD/releases/download/v0.0.5/longcallD-v0.0.5_arm64-macos.tar.gz
80+
tar -zxvf longcallD-v0.0.5_arm64-macos.tar.gz
7281
```
7382

7483
**Linux-arm64/macOS-x64**
@@ -85,14 +94,14 @@ conda install -c bioconda longcalld
8594
To compile longcallD from source, ensure you have **GCC/clang (9.0+)** and **zlib/libbz2/liblzma/libcurl** (for htslib) installed.
8695
It is recommended to use the [latest release](https://github.com/yangao07/longcallD/releases).
8796
```
88-
wget https://github.com/yangao07/longcallD/releases/download/v0.0.4/longcallD-v0.0.4.tar.gz
89-
tar -zxvf longcallD-v0.0.4.tar.gz
90-
cd longcallD-v0.0.4; make
97+
wget https://github.com/yangao07/longcallD/releases/download/v0.0.5/longcallD-v0.0.5.tar.gz
98+
tar -zxvf longcallD-v0.0.5.tar.gz
99+
cd longcallD-v0.0.5; make
91100
```
92101

93102
## Usage
94103
LongcallD requires a **reference genome (FASTA)** and a **long-read BAM/CRAM** file as inputs. It outputs **phased variant calls in VCF format**.
95-
### Variant calling with HiFi/Nanopore long reads
104+
### Variant calling with PacBio HiFi/Nanopore long reads
96105
```
97106
longcallD call -t16 ref.fa hifi.bam > hifi.vcf # default for PacBio HiFi reads (--hifi)
98107
longcallD call -t16 ref.fa ont.bam --ont > ont.vcf # for ONT reads

anno/AluY_L1_SVA_cons_noPA.fa

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
>AluY DF000000002.4 AluY subfamily
2+
GGCCGGGCGCGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGGCGGATCACGAGGTCAGGAGATCGAGACCATCCTGGCTAACACGGTGAAACCCCGTCTCTACTAAAAATACAAAAAATTAGCCGGGCGTGGTGGCGGGCGCCTGTAGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGCGTGAACCCGGGAGGCGGAGCTTGCAGTGAGCCGAGATCGCGCCACTGCACTCCAGCCTGGGCGACAGAGCGAGACTCCGTCTC
3+
>L1HS consensus 43 GRCh38 full-length L1HS
4+
AGAAACAATTAAGAAGGGGAGGAGCCAAGATGGCCGAATAGGAACAGCTCCGGTCTACAGCTCCCAGCGTGAGCGACGCAGAAGACGGTGATTTCTGCATTTCCATCTGAGGTACCGGGTTCATCTCACTAGGGAGTGCCAGACAGTGGGCGCAGGCCAGTGTGTGTGCGCACCGTGCGCGAGCCGAAGCAGGGCGAGGCATTGCCTCACCTGGGAAGCGCAAGGGGTCAGGGAGTTCCCTTTCCGAGTCAAAGAAAGGGGTGACGGACGCACCTGGAAAATCGGGTCACTCCCACCCGAATATTGCGCTTTTCAGACCGGCTTAAGAAACGGCGCACCACGAGACTATATCCCACACCTGGCTCGGAGGGTCCTACGCCCACGGAATCTCGCTGATTGCTAGCACAGCAGTCTGAGATCAAACTGCAAGGCGGCAACGAGGCTGGGGGAGGGGCGCCCGCCATTGCCCAGGCTTGCTTAGGTAAACAAAGCAGCCGGGAAGCTCGAACTGGGTGGAGCCCACCACAGCTCAAGGAGGCCTGCCTGCCTCTGTAGGCTCCACCTCTGGGGGCAGGGCACAGACAAACAAAAAGACAGCAGTAACCTCTGCAGACTTAAGTGTCCCTGTCTGACAGCTTTGAAGAGAGCAGTGGTTCTCCCAGCACGCAGCTGGAGATCTGAGAACGGGCAGACTGCCTCCTCAAGTGGGTCCCTGACCCCTGACCCCCGAGCAGCCTAACTGGGAGGCACCCCCCAGCAGGGGCACACTGACACCTCACACGGCAGGGTATTCCAACAGACCTGCAGCTGAGGGTCCTGTCTGTTAGAAGGAAAACTAACAACCAGAAAGGACATCTACACCGAAAACCCATCTGTACATCACCATCATCAAAGACCAAAAGTAGATAAAACCACAAAGATGGGGAAAAAACAGAACAGAAAAACTGGAAACTCTAAAACGCAGAGCGCCTCTCCTCCTCCAAAGGAACGCAGTTCCTCACCAGCAACAGAACAAAGCTGGATGGAGAATGATTTTGACGAGCTGAGAGAAGAAGGCTTCAGACGATCAAATTACTCTGAGCTACGGGAGGACATTCAAACCAAAGGCAAAGAAGTTGAAAACTTTGAAAAAAATTTAGAAGAATGTATAACTAGAATAACCAATACAGAGAAGTGCTTAAAGGAGCTGATGGAGCTGAAAACCAAGGCTCGAGAACTACGTGAAGAATGCAGAAGCCTCAGGAGCCGATGCGATCAACTGGAAGAAAGGGTATCAGCAATGGAAGATGAAATGAATGAAATGAAGCGAGAAGGGAAGTTTAGAGAAAAAAGAATAAAAAGAAATGAGCAAAGCCTCCAAGAAATATGGGACTATGTGAAAAGACCAAATCTACGTCTGATTGGTGTACCTGAAAGTGATGTGGAGAATGGAACCAAGTTGGAAAACACTCTGCAGGATATTATCCAGGAGAACTTCCCCAATCTAGCAAGGCAGGCCAACGTTCAGATTCAGGAAATACAGAGAACGCCACAAAGATACTCCTCGAGAAGAGCAACTCCAAGACACATAATTGTCAGATTCACCAAAGTTGAAATGAAGGAAAAAATGTTAAGGGCAGCCAGAGAGAAAGGTCGGGTTACCCTCAAAGGAAAGCCCATCAGACTAACAGCGGATCTCTCGGCAGAAACCCTACAAGCCAGAAGAGAGTGGGGGCCAATATTCAACATTCTTAAAGAAAAGAATTTTCAACCCAGAATTTCATATCCAGCCAAACTAAGCTTCATAAGTGAAGGAGAAATAAAATACTTTATAGACAAGCAAATGTTGAGAGATTTTGTCACCACCAGGCCTGCCCTAAAAGAGCTCCTGAAGGAAGCGCTAAACATGGAAAGGAACAACCGGTACCAGCCGCTGCAAAATCATGCCAAAATGTAAAGACCATCGAGACTAGGAAGAAACTGCATCAACTAATGAGCAAAATCACCAGCTAACATCATAA
TGACAGGATCAAATTCACACATAACAATATTAACTTTAAATATAAATGGACTAAATTCTGCAATTAAAAGACACAGACTGGCAAGTTGGATAAAGAGTCAAGACCCATCAGTGTGCTGTATTCAGGAAACCCATCTCACGTGCAGAGACACACATAGGCTCAAAATAAAAGGATGGAGGAAGATCTACCAAGCCAATGGAAAACAAAAAAAGGCAGGGGTTGCAATCCTAGTCTCTGATAAAACAGACTTTAAACCAACAAAGATCAAAAGAGACAAAGAAGGCCATTACATAATGGTAAAGGGATCAATTCAACAAGAGGAGCTAACTATCCTAAATATTTATGCACCCAATACAGGAGCACCCAGATTCATAAAGCAAGTCCTCAGTGACCTACAAAGAGACTTAGACTCCCACACATTAATAATGGGAGACTTTAACACCCCACTGTCAACATTAGACAGATCAACGAGACAGAAAGTCAACAAGGATACCCAGGAATTGAACTCAGCTCTGCACCAAGCAGACCTAATAGACATCTACAGAACTCTCCACCCCAAATCAACAGAATATACATTTTTTTCAGCACCACACCACACCTATTCCAAAATTGACCACATAGTTGGAAGTAAAGCTCTCCTCAGCAAATGTAAAAGAACAGAAATTATAACAAACTATCTCTCAGACCACAGTGCAATCAAACTAGAACTCAGGATTAAGAATCTCACTCAAAGCCGCTCAACTACATGGAAACTGAACAACCTGCTCCTGAATGACTACTGGGTACATAACGAAATGAAGGCAGAAATAAAGATGTTCTTTGAAACCAACGAGAACAAAGACACCACATACCAGAATCTCTGGGACGCATTCAAAGCAGTGTGTAGAGGGAAATTTATAGCACTAAATGCCTACAAGAGAAAGCAGGAAAGATCCAAAATTGACACCCTAACATCACAATTAAAAGAACTAGAAAAGCAAGAGCAAACACATTCAAAAGCTAGCAGAAGGCAAGAAATAACTAAAATCAGAGCAGAACTGAAGGAAATAGAGACACAAAAAACCCTTCAAAAAATCAATGAATCCAGGAGCTGGTTTTTTGAAAGGATCAACAAAATTGATAGACCGCTAGCAAGACTAATAAAGAAAAAAAGAGAGAAGAATCAAATAGACACAATAAAAAATGATAAAGGGGATATCACCACCGATCCCACAGAAATACAAACTACCATCAGAGAATACTACAAACACCTCTACGCAAATAAACTAGAAAATCTAGAAGAAATGGATACATTCCTCGACACATACACTCTCCCAAGACTAAACCAGGAAGAAGTTGAATCTCTGAATAGACCAATAACAGGCTCTGAAATTGTGGCAATAATCAATAGTTTACCAACCAAAAAGAGTCCAGGACCAGATGGATTCACAGCCGAATTCTACCAGAGGTACAAGGAGGAACTGGTACCATTCCTTCTGAAACTATTCCAATCAATAGAAAAAGAGGGAATCCTCCCTAACTCATTTTATGAGGCCAGCATCATTCTGATACCAAAGCCGGGCAGAGACACAACCAAAAAAGAGAATTTTAGACCAATATCCTTGATGAACATTGATGCAAAAATCCTCAATAAAATACTGGCAAACCGAATCCAGCAGCACATCAAAAAGCTTATCCACCATGATCAAGTGGGCTTCATCCCTGGGATGCAAGGCTGGTTCAATATACGCAAATCAATAAATGTAATCCAGCATATAAACAGAGCCAAAGACAAAAACCACATGATTATCTCAATAGATGCAGAAAAAGCCTTTGACAAAATTCAACAACCCTTCATGCTAAAAACTCTCAATAAATTAGGTATTGATGGGACGTATTTCAAAATAATAAGAGCTATCTATGACAAACCCACAGCCAATATCATACTGAATGGGCAAAAACTGGAAGCATTCCCTTTGAAAACTGGCACAAGACAGGGATGCCCTCTCTCACCGCTCCTA
TTCAACATAGTGTTGGAAGTTCTGGCCAGGGCAATCAGGCAGGAGAAGGAAATAAAGGGTATTCAATTAGGAAAAGAGGAAGTCAAATTGTCCCTGTTTGCAGACGACATGATTGTTTATCTAGAAAACCCCATCGTCTCAGCCCAAAATCTCCTTAAGCTGATAAGCAACTTCAGCAAAGTCTCAGGATACAAAATCAATGTACAAAAATCACAAGCATTCTTATACACCAACAACAGACAAACAGAGAGCCAAATCATGGGTGAACTCCCATTCACAATTGCTTCAAAGAGAATAAAATACCTAGGAATCCAACTTACAAGGGATGTGAAGGACCTCTTCAAGGAGAACTACAAACCACTGCTCAAGGAAATAAAAGAGGACACAAACAAATGGAAGAACATTCCATGCTCATGGGTAGGAAGAATCAATATCGTGAAAATGGCCATACTGCCCAAGGTAATTTACAGATTCAATGCCATCCCCATCAAGCTACCAATGACTTTCTTCACAGAATTGGAAAAAACTACTTTAAAGTTCATATGGAACCAAAAAAGAGCCCGCATTGCCAAGTCAATCCTAAGCCAAAAGAACAAAGCTGGAGGCATCACACTACCTGACTTCAAACTATACTACAAGGCTACAGTAACCAAAACAGCATGGTACTGGTACCAAAACAGAGATATAGATCAATGGAACAGAACAGAGCCCTCAGAAATAATGCCGCATATCTACAACTATCTGATCTTTGACAAACCTGAGAAAAACAAGCAATGGGGAAAGGATTCCCTATTTAATAAATGGTGCTGGGAAAACTGGCTAGCCATATGTAGAAAGCTGAAACTGGATCCCTTCCTTACACCTTATACAAAAATCAATTCAAGATGGATTAAAGATTTAAACGTTAAACCTAAAACCATAAAAACCCTAGAAGAAAACCTAGGCATTACCATTCAGGACATAGGCGTGGGCAAGGACTTCATGTCCAAAACACCAAAAGCAATGGCAACAAAAGACAAAATTGACAAATGGGATCTAATTAAACTAAAGAGCTTCTGCACAGCAAAAGAAACTACCATCAGAGTGAACAGGCAACCTACAACATGGGAGAAAATTTTTGCAACCTACTCATCTGACAAAGGGCTAATATCCAGAATCTACAATGAACTCAAACAAATTTACAAGAAAAAAACAAACAACCCCATCAAAAAGTGGGCGAAGGACATGAACAGACACTTCTCAAAAGAAGACATTTATGCAGCCAAAAAACACATGAAGAAATGCTCATCATCACTGGCCATCAGAGAAATGCAAATCAAAACCACTATGAGATATCATCTCACACCAGTTAGAATGGCAATCATTAAAAAGTCAGGAAACAACAGGTGCTGGAGAGGATGCGGAGAAATAGGAACACTTTTACACTGTTGGTGGGACTGTAAACTAGTTCAACCATTGTGGAAGTCAGTGTGGCGATTCCTCAGGGATCTAGAACTAGAAATACCATTTGACCCAGCCATCCCATTACTGGGTATATACCCAAATGAGTATAAATCATGCTGCTATAAAGACACATGCACACGTATGTTTATTGCGGCACTATTCACAATAGCAAAGACTTGGAACCAACCCAAATGTCCAACAATGATAGACTGGATTAAGAAAATGTGGCACATATACACCATGGAATACTATGCAGCCATAAAAAATGATGAGTTCATATCCTTTGTAGGGACATGGATGAAATTGGAAACCATCATTCTCAGTAAACTATCGCAAGAACAAAAAACCAAACACCGCATATTCTCACTCATAGGTGGGAATTGAACAATGAGATCACATGGACACAGGAAGGGGAATATCACACTCTGGGGACTGTGGTGGGGTCGGGGGAGGGGGGAGGGATAGCATTGGGAGATATACCTAATGCTAGATGACACATTAGTGGGTGCAGCGCACCAGCATGGCACATGTATACATATGTAACTAACCTGCACAAT
GTGCACATGTACCCTAAAACTTAGAGTATAAT
5+
>SVA consensus of SVA_A/B/C/D/E/F subfamily
6+
CTCTCCCTCTCCCTCTCCCTCTCCCTCTCCCTCTCCCTCTCCCTCTCCCCTCTTTCCACGGTCTCCCTCTGATGCCGAGCCGAAGCTGGACTGTACTGCTGCCATCTCGGCTCACTGCAACCTCCCTGCCTGATTCTCCTGCCTCAGCCTGCCGAGTGCCTGCGATTGCAGGCGCGCGCCGCCACGCCTGACTGGTTTTCGTATTTTTTTGGTGGAGACGGGGTTTCGCTGTGTTGGCCGGGCTGGTCTCCAGCTCCTAACCGCGAGTGATCCGCCAGCCTCGGCCTCCCGAGGTGCCGGGATTGCAGACGGAGTCTCGTTCACTCAGTGCTCAATGGTGCCCAGGCTGGAGTGCAGTGGCGTGATCTCGGCTCGCTACAACCTCCACCTCCCAGCCGCCTGCCTTGGCCTCCCAAAGTGCCGAGATTGCAGCCTCTGCCCGGCCGCCACCCCGTCTGGGAAGTGAGGAGCGTCTCTGCCCGGCCGCCCATCGTCTGGGANGTGAGGAGCCCCTCTGCCCGGCCGCCCCGTCTGGGAAGTGAGGAGCGCCTCTGCCCGGCCGCCGCCCCGTCTGGGAAGTGAGGAGCGTCTCTGCCCGGCCGCCCATCGTCTGGGANGTGGGGAGCGCCTCCGCCCCGCCGCCCCGTCTGGGANGTGAGGAGCGCCTCCGCCCGGCCAGCCGCCCCGTCCGGGAGGTGGGGGGGTCAGCCCCCCGCCCGGCCAGCCGCCCCGTCCGGGAGGAGGTGGGGGGGTCAGCCCCCCGCCCGGCCAGCCGCCCCGTCCGGGAGGTGAGGGGCGCCTCTGCCCGGCCGCCCCTACTGGGAAGTGAGGAGCCCCTCTGCCCGGCCACCGCCCCGTCCGGGAGGTGTACCCAACAGCTCATTGAGAACGGGCCATGATGACAATGGCGGTTTTGTGGAATAGAAAGGGGGGAAATGTGGGGAAAAGATTGAGAAATCGGATGGTTGCCGTGTCTGTGTAGAAAGAAGTAGACATGGGAGACTTTTCATTTTGTTCTGTACTAAGAAAAATTCTTCTGCCTTGGGATCCTGTTGATCTGTGACCTTACCCCCAACCCTGTGCTCTCTGAAACATGTGCTGTGTCCACTCAGGGTTAAATGGATTAAGGGCGGTGCAAGATGTGCTTTGTTAAACAGATGCTTGAAGGCAGCATGCTCGTTAAGAGTCATCACCACTCCCTAATCTCAAGTACCCAGGGACACAAACACTGCGGAAGGCCGCAGGGTCCTCTGCCTAGGAAAACCAGAGACCTTTGTTCACTTGTTTATCTGCTGACCTTCCCTCCACTATTGTCCTATGACCCTGCCAAATCCCCCTCTGCGAGAAACACCCAAGAATGATCAAT

0 commit comments

Comments
 (0)