Skip to content

Commit 0e051f6

Browse files
authored
Merge pull request #632 from Ecogenomics/staging
New release for R226
2 parents 0f1ae4e + 97b9051 commit 0e051f6

File tree

6 files changed

+51
-10
lines changed

6 files changed

+51
-10
lines changed

docs/src/announcements.rst

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,25 @@
11
Announcements
22
=============
33

4+
GTDB-Tk 2.4.1 available
5+
-----------------------
6+
7+
*April 16, 2024*
8+
9+
* GTDB-Tk version ``2.4.1`` is now available.
10+
* This version of GTDB-Tk compatible with the new version of the GTDB-Tk reference package (Release 226).
11+
`gtdbtk_r226_data.tar.gz <https://data.gtdb.ecogenomic.org/releases/release220/220.0/auxillary_files/gtdbtk_package/>`_.
12+
13+
14+
GTDB R226 available
15+
-----------------------
16+
17+
*April 16, 2025*
18+
19+
* GTDB Release 226 is now available and will be used from version ``2.4.1`` and up.
20+
* This version of GTDB-Tk is compatible with both release220 and release226 of the GTDB-Tk reference package.
21+
`gtdbtk_r226_data.tar.gz <https://data.gtdb.ecogenomic.org/releases/release226/226.0/auxillary_files/>`_.
22+
423
GTDB-Tk 2.4.0 available
524
-----------------------
625

docs/src/changelog.rst

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,12 @@
22
Change log
33
==========
44

5+
2.4.1
6+
-----
7+
8+
Bug Fixes:
9+
* (`#630 <https://github.com/Ecogenomics/GTDBTk/issues/630>`_) Fixed SyntaxWarning in Python 3.12 by using raw strings for regex in HMMResultsIO.py
10+
511

612
2.4.0
713
-----

docs/src/installing/index.rst

Lines changed: 9 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -34,11 +34,11 @@ Hardware requirements
3434
- Time
3535
* - Archaea
3636
- ~60 GB
37-
- ~106 GB
37+
- ~140 GB
3838
- ~90 minutes / 1,000 genomes @ 64 CPUs
3939
* - Bacteria
40-
- ~90GB (545 GB when using --full_tree)
41-
- ~106 GB
40+
- ~110GB (690 GB when using --full_tree)
41+
- ~140 GB
4242
- ~90 minutes / 1,000 genomes @ 64 CPUs
4343

4444
.. note::
@@ -117,7 +117,7 @@ Please cite these tools if you use GTDB-Tk in your work.
117117
GTDB-Tk reference data
118118
----------------------
119119

120-
GTDB-Tk requires ~110G of external data that needs to be downloaded and unarchived:
120+
GTDB-Tk requires ~140G of external data that needs to be downloaded and unarchived:
121121

122122
**For full package:**
123123

@@ -154,7 +154,11 @@ https://data.ace.uq.edu.au/public/gtdb/data/releases/release220/220.0/auxillary_
154154
- Minimum version
155155
- Maximum version
156156
- MD5
157-
* - `R220 <https://data.ace.uq.edu.au/public/gtdb/data/releases/latest/auxillary_files/gtdbtk_package/full_package/gtdbtk_data.tar.gz>`_
157+
* - `R226 <https://data.gtdb.ecogenomic.org/releases/release220/226.0/auxillary_files/gtdbtk_package/full_package/gtdbtk_r226_data.tar.gz>`_
158+
- 2.4.0
159+
- Current
160+
- 24b476ea5a4ef30519d461e56cc4a27f
161+
* - `R220 <https://data.gtdb.ecogenomic.org/releases/release220/220.0/auxillary_files/gtdbtk_package/full_package/gtdbtk_r220_data.tar.gz>`_
158162
- 2.4.0
159163
- Current
160164
- 5aafa1b9c27ceda003d75adf238ed9e0

gtdbtk/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -29,4 +29,4 @@
2929
__status__ = 'Production'
3030
__title__ = 'GTDB-Tk'
3131
__url__ = 'https://github.com/Ecogenomics/GTDBTk'
32-
__version__ = '2.4.0'
32+
__version__ = '2.4.1'

gtdbtk/config/common.py

Lines changed: 14 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ class __GTDBTkCommonConfig:
1212
"""
1313

1414
MIN_REF_DATA_VERSION = 'r220'
15-
COMPATIBLE_REF_DATA_VERSIONS = ['r220']
15+
COMPATIBLE_REF_DATA_VERSIONS = ['r220','r226']
1616

1717
BACKBONE_PPLACER_REF_PKG = 'gtdbtk_package_backbone.refpkg'
1818
CLASS_LEVEL_PPLACER_REF_PKG = 'gtdbtk.package.{iter}.refpkg'
@@ -332,8 +332,20 @@ def get_REF_HASHES(self,version=None):
332332
compatible_versions = [int(x.replace('r','')) for x in CONFIG.COMPATIBLE_REF_DATA_VERSIONS]
333333
if version is not None and version not in compatible_versions:
334334
raise ValueError(f"Version {version} is not compatible with this version of GTDB-Tk. Compatible versions are {compatible_versions}")
335+
if version is None or version==226:
336+
return {
337+
self.PPLACER_DIR: '40d242bd5b84d4b2218586390220e6f741191804',
338+
self.MASK_DIR: 'beb296ca29ffadf2d5b86f4160f2a525c5954185',
339+
self.MARKER_DIR: '163f542c3f0a40f59df45d453aa235b39aa96e27',
340+
self.RADII_DIR: '577663ffcd7892551a0f8cb2864fb80544c3bfcd',
341+
self.MSA_FOLDER: '1d47808337897c2965cfc8a101df5e4813ce1581',
342+
self.METADATA_DIR: '56b3a753b0cec1f0ac983fea4c7db32a160d00cb',
343+
self.TAX_FOLDER: 'ea99878828e0baffe8977c7371ce7b7d5109c1e1',
344+
self.SKANI_DIR: '8100f226743d74572fa726ac3ea358c34d5b8222',
345+
self.RED_DIR: 'bd8cfe5c4f5b8fc180cebf974713194395efbc00'
346+
}
335347

336-
if version is None or version==220:
348+
elif version==220:
337349
return {
338350
self.PPLACER_DIR: '75fdd0e093c9af6a73cb510c3d0cd2041265e093',
339351
self.MASK_DIR: 'f4b8ebfa59526a7a86f09752b47e8de1efc384c7',

gtdbtk/external/pypfam/HMM/HMMResultsIO.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -331,15 +331,15 @@ def _readUnitData(self, seqId, fh, hmmRes):
331331
if hmmName and hmmRes.program == 'hmmsearch':
332332

333333
pattern1 = re.compile(r'^\s+%s\s+\d+\s+(\S+)\s+\d+' % hmmName)
334-
seqId = re.sub('(\W)', r'\\\1', seqId)
334+
seqId = re.sub(r'(\W)', r'\\\1', seqId)
335335
# $id =~ s/\|/\\|/g; #Escape '|', '[' and ']' characters
336336
# $id =~ s/\[/\\[/g;
337337
# $id =~ s/\]/\\]/g;
338338
pattern2 = re.compile(r'^\s+%s\s+\d+\s+(\S+)\s+\d+' % seqId)
339339

340340
elif seqName and hmmRes.program == 'hmmscan':
341341
tmpSeqName = seqName
342-
tmpSeqName = re.sub('(\W)', r'\\\1', tmpSeqName)
342+
tmpSeqName = re.sub(r'(\W)', r'\\\1', tmpSeqName)
343343

344344
pattern1 = re.compile(r'^\s+%s\s+\d+\s+(\S+)\s+\d+' % seqId)
345345
pattern2 = re.compile(r'^\s+%s\s+\d+\s+(\S+)\s+\d+' % tmpSeqName)

0 commit comments

Comments
 (0)