Skip to content

Commit 6b5a235

Browse files
authored
Merge pull request #315 from OpenTreeOfLife/3-0-release-notes
initial checkin of 3.0 release notes
2 parents c0cf724 + 9ae063e commit 6b5a235

File tree

4 files changed

+283
-7
lines changed

4 files changed

+283
-7
lines changed

doc/method/to_cite.bib

Lines changed: 92 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,6 @@ @article{10.1371/journal.pone.0119248
5555
volume = {10},
5656
url = {http://dx.doi.org/10.1371%2Fjournal.pone.0119248},
5757
pages = {1--60},
58-
abstract = {<p>We present a consensus classification of life to embrace the more than 1.6 million species already provided by more than 3,000 taxonomists’ expert opinions in a unified and coherent, hierarchically ranked system known as the Catalogue of Life (CoL). The intent of this collaborative effort is to provide a hierarchical classification serving not only the needs of the CoL’s database providers but also the diverse public-domain user community, most of whom are familiar with the Linnaean conceptual system of ordering taxon relationships. This classification is neither phylogenetic nor evolutionary but instead represents a consensus view that accommodates taxonomic choices and practical compromises among diverse expert opinions, public usages, and conflicting evidence about the boundaries between taxa and the ranks of major taxa, including kingdoms. Certain key issues, some not fully resolved, are addressed in particular. Beyond its immediate use as a management tool for the CoL and ITIS (Integrated Taxonomic Information System), it is immediately valuable as a reference for taxonomic and biodiversity research, as a tool for societal communication, and as a classificatory “backbone” for biodiversity databases, museum collections, libraries, and textbooks. Such a modern comprehensive hierarchy has not previously existed at this level of specificity.</p>},
5958
number = {4},
6059
doi = {10.1371/journal.pone.0119248}
6160
}
@@ -67,6 +66,80 @@ @article{10.11646/bionomina.4.1.3
6766
doi = {10.11646/bionomina.4.1.3}
6867
}
6968

69+
@article{10.3897/BDJ.2.e1079,
70+
author = {Cynthia S. Parr and Nathan Wilson and Patrick Leary and Katja Schulz and Kristen Lans and Lisa Walley and Jennifer Hammock and Anthony Goddard and Jeremy Rice and Marie Studer and Jeffrey Holmes and Corrigan, Jr., Robert},
71+
title = {The Encyclopedia of Life v2: Providing Global Access to Knowledge About Life on Earth},
72+
volume = {2},
73+
year = {2014},
74+
doi = {10.3897/BDJ.2.e1079},
75+
publisher = {Pensoft Publishers},
76+
issn = {1314-2836},
77+
pages = {e1079},
78+
URL = {https://doi.org/10.3897/BDJ.2.e1079},
79+
eprint = {https://doi.org/10.3897/BDJ.2.e1079},
80+
journal = {Biodiversity Data Journal}
81+
}
82+
83+
@article{redelings2017,
84+
author = {Redelings, BD AND Holder, MT},
85+
year = {2017},
86+
title = {A supertree pipeline for summarizing
87+
phylogenetic and taxonomic information for millions of species},
88+
journal = {PeerJ},
89+
volume = {5}, pages = {e3058},
90+
url = {https://doi.org/10.7717/peerj.3058}
91+
}
92+
93+
@article{col2016,
94+
author = {Roskov, Y. AND Abucay L. AND Orrell T. AND Nicolson D. AND Flann C. AND Bailly
95+
N. AND Kirk P. AND Bourgoin T. AND DeWalt R.E. AND Decock W. AND De Wever A., editors},
96+
year = {2016},
97+
title = {Species 2000 \& ITIS Catalogue of Life, 2016 Annual Checklist},
98+
url = {http://www.catalogueoflife.org/annual-checklist/2016},
99+
publisher = {Species 2000: Naturalis, Leiden, the Netherlands},
100+
issn = {2405-884X},
101+
note = {Accessed: 1 March 2017}
102+
}
103+
104+
@unpublished{newick,
105+
year = {1990},
106+
author = {Gary Olsen},
107+
title = {Interpretation of the "Newick's 8:45" Tree Format Standard},
108+
url = {http://evolution.genetics.washington.edu/phylip/newick_doc.html},
109+
note = {Accessed: 1 March 2017}
110+
}
111+
112+
@unpublished{redlist,
113+
author = {{International Union for Conservation of Nature and Natural Resources}},
114+
title = {The IUCN Red List of Threatened Species, version 2016-3},
115+
url = {http://www.iucnredlist.org/},
116+
year = {2016},
117+
note = {Accessed: 1 March 2017}
118+
}
119+
120+
@article{10.1371/journal.pone.0029715,
121+
author = {J Wieczorek AND D Bloom AND R Guralnick AND S Blum AND M Döring AND R Giovanni AND others},
122+
year = {2012},
123+
title = {Darwin Core: An evolving community-developed biodiversity data standard},
124+
journal = {PLoS ONE},
125+
volume = {7},
126+
number = {1},
127+
pages = {e29715}
128+
}
129+
130+
@article{10.3897/rio.2.e10610,
131+
author = {Nico Franz and Edward Gilbert and Bertram Ludäscher and Alan Weakley},
132+
title = {Controlling the taxonomic variable: Taxonomic concept resolution for a southeastern United States herbarium portal},
133+
volume = {2},
134+
year = {2016},
135+
doi = {10.3897/rio.2.e10610},
136+
publisher = {Pensoft Publishers},
137+
pages = {e10610},
138+
URL = {https://doi.org/10.3897/rio.2.e10610},
139+
eprint = {https://doi.org/10.3897/rio.2.e10610},
140+
journal = {Research Ideas and Outcomes}
141+
}
142+
70143
@article{10.1016/j.mycres.2007.03.004,
71144
author = {DS Hibbett AND M Binder AND JF Bischoff AND M Blackwell AND others},
72145
title = {A higher-level phylogenetic classification of the Fungi},
@@ -102,10 +175,11 @@ @misc{silva115
102175
author = {The SILVA rRNA database project},
103176
title = {SSURef_NR99_115_tax_silva.fasta.tgz},
104177
url = {ftp://ftp.arb-silva.de/release_115/Exports/SSURef_NR99_115_tax_silva.fasta.tgz},
105-
note = {Accessed: 2013-09-07}
178+
note = {Accessed: 2013-09-07},
179+
year = {2013}
106180
}
107181

108-
misc{fungorum2014site,
182+
@misc{fungorum2014site,
109183
title = {Index Fungorum},
110184
author = {Index Fungorum Partnership},
111185
url = {http://www.indexfungorum.org},
@@ -160,6 +234,18 @@ @misc{ncbi2016
160234
note = {Accessed: 2016-11-09}
161235
}
162236

237+
@article{gbif2004,
238+
author = {Edwards, James L.},
239+
title = {Research and societal benefits of the global biodiversity information facility},
240+
journal = {BioScience},
241+
volume = {54},
242+
number = {6},
243+
year = {2004},
244+
pages = {485},
245+
url = {http://go.galegroup.com/ps/i.do?p=EAIM&sw=w&u=duke_perkins&v=2.1&it=r&id=GALE%7CA118544173&asid=e4d38732723588b8a2dfd99b42f87626},
246+
note = {Accessed: 1 March 2017}
247+
}
248+
163249
@article{markus2016april,
164250
title = {Updating the GBIF Backbone},
165251
author = {M Döring},
@@ -180,7 +266,8 @@ @misc{gbifbackbone2016
180266
title = {GBIF Backbone Taxonomy},
181267
author = {GBIF Secretariat},
182268
url = {http://www.gbif.org/dataset/d7dddbf4-2cf0-4f39-9b2a-bb099caae36c},
183-
note = {Accessed: 2016-07-29}
269+
year = {2016},
270+
note = {Accessed: 2016-11-11}
184271
}
185272

186273
@inproceedings{irmng,
@@ -196,7 +283,7 @@ @inproceedings{irmng
196283
}
197284
@unpublished{irmng2014,
198285
author = {Rees, Tony (compile)},
199-
title = {The Interim Registry of Marine and Nonmarine Genera},
286+
title = {The Interim Register of Marine and Nonmarine Genera},
200287
year = 2014,
201288
url = {http://www.cmar.csiro.au/datacentre/downloads/IRMNG_DWC.zip},
202289
note = {Accessed: 2017-02-21. File dated 2014-01-31. Current searchable version

doc/ott2.10.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -121,7 +121,7 @@ retrieved.
121121
<br />
122122
Download location: [http://purl.org/opentree/ott/ott2.8/inputs/lamiales-20140118.tsv](http://purl.org/opentree/ott/ott2.8/inputs/lamiales-20140118.tsv)
123123

124-
1. [World Registry of Marine Species (WoRMS)](http://www.marinespecies.org/aphia.php) - harvested from web site using web API over several days ending around 1 October 2015.
124+
1. [World Register of Marine Species (WoRMS)](http://www.marinespecies.org/aphia.php) - harvested from web site using web API over several days ending around 1 October 2015.
125125
Download location: [http://files.opentreeoflife.org/worms/worms-1/worms-1-ot.tgz](http://files.opentreeoflife.org/worms/worms-1/worms-1-ot.tgz)
126126

127127
1. NCBI Taxonomy, from the

doc/ott2.9.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -86,7 +86,7 @@ retrieved.
8686
<br />
8787
Download location: [http://purl.org/opentree/ott/ott2.8/inputs/lamiales-20140118.tsv](http://purl.org/opentree/ott/ott2.8/inputs/lamiales-20140118.tsv)
8888

89-
1. World Registry of Marine Species (WoRMS) - harvested from web site using web API over several days ending around 1 October 2015.
89+
1. World Register of Marine Species (WoRMS) - harvested from web site using web API over several days ending around 1 October 2015.
9090
[http://www.marinespecies.org/aphia.php](http://www.marinespecies.org/aphia.php)
9191

9292
1. NCBI Taxonomy, from the

doc/ott3.0.md

Lines changed: 189 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,3 +2,192 @@
22
* Small improvements to treatment of containers (X incertae sedis, samples)
33

44
Note that SILVA precedes Hibbett in the load order
5+
6+
7+
# Open Tree of Life reference taxonomy version 3.0
8+
9+
Version 3.0 draft 6 was generated on 26 February 2017.
10+
11+
## Download
12+
13+
[Download](http://files.opentreeoflife.org/ott/ott3.0/ott3.0.tgz)
14+
15+
## Major changes since OTT 2.10
16+
17+
* Updated to NCBI Taxonomy dated 9 November 2016.
18+
* Updated to GBIF backbone dated 29 July 2016. Unfortunately, as a
19+
consequence, about 200 species, mostly birds, have been renamed with
20+
no known link to the previous name. (Example: Collocalia ocista,
21+
formerly known as Aerodramus ocistus.) This means occurrences of
22+
these species in previously curated studies will not be recognized
23+
in synthesis runs. It is hoped that this is a temporary problem.
24+
* Cnidaria now gets its taxonomy from WoRMS instead of NCBI.
25+
* Removed Viruses
26+
* A number of taxa whose OTT id unnecessarily changed in the past have
27+
had their OTT ids restored, with the newer id as an id alias.
28+
This change should not have any ill effects for clients that are
29+
aware of id aliases (forwards.tsv).
30+
31+
## Statistics
32+
33+
* OTT identifiers ('taxa'): 3594550
34+
* Visible: [TBD]
35+
* Synonyms: 1842403 (big increase)
36+
* Deprecated/hidden ids occurring in phylesystem: total 3686,
37+
but only 586 if lumped ids are excluded
38+
* Deprecated/hidden ids occurring in studies in synthesis: total 1097,
39+
but only 118 if lumped ids are excluded
40+
* Source taxa dissolved due to conflict (conflicts.tsv): 1171
41+
42+
## Contents of download
43+
44+
All files use UTF-8 character encoding. For documentation about file formats, see [the documentation in the reference taxonomy
45+
wiki](https://github.com/OpenTreeOfLife/reference-taxonomy/wiki/Interim-taxonomy-file-format),
46+
on github.
47+
48+
**taxonomy.tsv**: The file that contains the taxonomy.
49+
50+
**synonyms.tsv**: The list of synonyms.
51+
52+
**forwards.tsv**: Aliases ('forwarding pointers') - a list of OTT ids that are
53+
retired and should be replaced by new ones (usually due to
54+
'lumping')
55+
56+
**conflicts.tsv**: Report on taxa from input taxonomies that are
57+
hidden because they are paraphyletic with respect to a higher
58+
taxon from a higher priority input taxonomy.
59+
Since this file is mainly for debugging purposes I change
60+
it from time to time without notice. The format used in 3.0
61+
is very different from that used in 2.10.
62+
63+
**deprecated.tsv**: List of all taxon ids occurring in phylesystem
64+
studies that have been deprecated or suppressed since previous version. This
65+
includes ids that no longer identify any taxon, those that have been
66+
'lumped' with other ids, and those for taxa that are suppressed in
67+
synthesis but weren't suppressed in the previous version.
68+
69+
**version.tsv**: The version of OTT.
70+
71+
**transcript.out**: Console debugging output generated during the taxonomy build process.
72+
73+
**log.tsv**: Debugging information related to homonym resolution.
74+
75+
**otu_differences.tsv**: list of differences with OTT 2.10, restricted
76+
to ids used in phylesystem
77+
78+
There are some new .json files in the dump containing metrics, created for
79+
the purpose of the taxonomy method writeup. Not documented as of
80+
this writing.
81+
82+
## Build script
83+
84+
The reference taxonomy is an algorithmic combination of several
85+
source taxonomies. For code,
86+
see <a href="https://github.com/OpenTreeOfLife/reference-taxonomy">the
87+
source code repository</a>.
88+
Version 3.0 draft 6 was generated using
89+
<a href="https://github.com/OpenTreeOfLife/reference-taxonomy/commit/fc5cb5c2749e9e986749281a3284d2c1df42b58d">commit fc5cb5c</a>.
90+
91+
## Sources
92+
93+
Any errors in OTT
94+
should be assumed to have been introduced by the Open Tree of Life
95+
project until confirmed as originating in the source taxonomy.
96+
97+
Download locations are for the particular versions used to construct
98+
OTT 3.0. For new work, current versions of these sources should be
99+
retrieved.
100+
101+
1. Curated additions from the Open Tree amendments-1 repository, commit [bcafdea](https://github.com/OpenTreeOfLife/amendments-1/commit/bcafdea7f2e9231274cae2df2beed7d732ca46c5). These taxa are added during OTU mapping using the curator application.
102+
103+
1. Taxonomy from:
104+
DS Hibbett, M Binder, JF Bischoff, M Blackwell, et al.
105+
A higher-level phylogenetic classification of the <i>Fungi</i>.
106+
[<i>Mycological Research</i> <b>111</b>(5):509-547, 2007](http://dx.doi.org/10.1016/j.mycres.2007.03.004).
107+
Newick string with revisions
108+
archived at [http://figshare.com/articles/Fungal\_Classification\_2015/1465038](http://figshare.com/articles/Fungal_Classification_2015/1465038).
109+
<br />
110+
Download location: [https://github.com/OpenTreeOfLife/reference-taxonomy/tree/ott2.10draft11/feed/h2007](https://github.com/OpenTreeOfLife/reference-taxonomy/tree/ott2.10draft11/feed/h2007)
111+
112+
1. Taxonomy from: SILVA 16S ribosomal RNA database, version 115.
113+
See: Quast C, Pruesse E, Yilmaz P, Gerken J, Schweer T, Yarza P, Peplies J,
114+
Gl&ouml;ckner FO (2013) The SILVA ribosomal RNA gene database project:
115+
improved data processing and web-based tools.
116+
[<i>Nucleic Acids Research</i> 41 (D1): D590-D596](http://dx.doi.org/10.1093/nar/gks1219).
117+
Web site: [http://www.arb-silva.de/](http://www.arb-silva.de/).
118+
<br />
119+
Download location: [ftp://ftp.arb-silva.de/release\_115/Exports/tax\_ranks\_ssu\_115.csv](ftp://ftp.arb-silva.de/release_115/Exports/tax_ranks_ssu_115.csv).
120+
121+
1. Index Fungorum.
122+
Download location: derived from database query result files provided by Paul
123+
Kirk, 7 April 2014 (personal communication).
124+
Web site: [http://www.indexfungorum.org/](http://www.indexfungorum.org/).
125+
<br />
126+
Download location (converted to OTT format): [http://files.opentreeoflife.org/fung/fung-9/fung-9-ot.tgz](http://files.opentreeoflife.org/fung/fung-9/fung-9-ot.tgz).
127+
128+
1. Taxonomy from:
129+
Sch&auml;ferhoff, B., Fleischmann, A., Fischer, E., Albach, D. C., Borsch,
130+
T., Heubl, G., and M&uuml;ller, K. F. (2010). Towards resolving Lamiales
131+
relationships: insights from rapidly evolving chloroplast
132+
sequences.
133+
[<i>BMC evolutionary biology</i> 10(1), 352.](http://dx.doi.org/10.1186/1471-2148-10-352).
134+
Manually transcribed from the paper and converted to OTT format.
135+
<br />
136+
Download location: [http://purl.org/opentree/ott/ott2.8/inputs/lamiales-20140118.tsv](http://purl.org/opentree/ott/ott2.8/inputs/lamiales-20140118.tsv)
137+
138+
1. [World Register of Marine Species (WoRMS)](http://www.marinespecies.org/aphia.php) - harvested from web site using web API over several days ending around 1 October 2015.
139+
Download location: [http://files.opentreeoflife.org/worms/worms-1/worms-1-ot.tgz](http://files.opentreeoflife.org/worms/worms-1/worms-1-ot.tgz)
140+
141+
1. NCBI Taxonomy, from the
142+
[US National Center for Biotechnology Information](http://www.ncbi.nlm.nih.gov/).
143+
Web site: [http://www.ncbi.nlm.nih.gov/Taxonomy/](http://www.ncbi.nlm.nih.gov/Taxonomy/).
144+
<br />
145+
We used a version dated 9 November 2016.
146+
Archived location: [http://files.opentreeoflife.org/ncbi/ncbi-20161109/ncbi-20161109.tgz](http://files.opentreeoflife.org/ncbi/ncbi-20161109/ncbi-20161109.tgz).
147+
<br />
148+
Current version download location:
149+
[ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/taxdump.tar.gz](ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/taxdump.tar.gz)
150+
151+
1. GBIF Backbone Taxonomy, from the
152+
[Global Biodiversity Information Facility](http://www.gbif.org/).
153+
<br />
154+
We used a version dated 2016-07-29.
155+
Download location: [http://files.opentreeoflife.org/gbif/gbif-20160729/gbif-201609729.zip](http://files.opentreeoflife.org/gbif/gbif-20160729/gbif-201609729.zip).
156+
<br />
157+
Current version download location (unverified):
158+
[http://www.gbif.org/dataset/d7dddbf4-2cf0-4f39-9b2a-bb099caae36c](http://www.gbif.org/dataset/d7dddbf4-2cf0-4f39-9b2a-bb099caae36c).
159+
160+
1. [Interim Register of Marine and Nonmarine Genera (IRMNG)](http://irmng.org/).
161+
<br />
162+
We used a version dated 2014-01-31. Download location:
163+
[http://purl.org/opentree/ott/ott2.8/inputs/IRMNG\_DWC-2014-01-30.zip](http://purl.org/opentree/ott/ott2.8/inputs/IRMNG_DWC-2014-01-30.zip).
164+
165+
1. Taxon identifiers are carried over from [OTT 2.10](http://files.opentreeoflife.org/ott/ott2.10/) when possible
166+
167+
It has been requested that we relay the following statement:
168+
169+
> REUSE OF IRMNG CONTENT:
170+
> IRMNG (the Interim Register of Marine and Nonmarine Genera) is assembled, with permission, from a range of third party data sources, certain of which permit data reuse only under specific conditions. In particular, for data originating from the Catalogue of Life (CoL), please refer to the relevant terms and conditions for reuse of CoL data as available at [http://www.catalogueoflife.org/content/terms-use](http://www.catalogueoflife.org/content/terms-use), and for data originating from the World Register of Marine Species (WoRMS) refer the paragraph "Terms of Use and Citation" at [http://www.marinespecies.org/about.php](http://www.marinespecies.org/about.php). The compilers of IRMNG accept no liability for any reuse of IRMNG content by downstream users which may be construed by the original data providers to violate their publicly available conditions of use.
171+
172+
The Open Tree Taxonomy does not reproduce its sources in their
173+
entirety or in their original form of expression, but only uses
174+
limited information expressed in them. See "[Scientific names of
175+
organisms: attribution, rights, and licensing](http://dx.doi.org/10.1186/1756-0500-7-79)" ([http://dx.doi.org/10.1186/1756-0500-7-79](http://dx.doi.org/10.1186/1756-0500-7-79))
176+
regarding use of taxonomic information and attribution.
177+
178+
## Priority
179+
180+
Where taxonomies conflict regarding taxon relationships, they are
181+
resolved in favor of the higher priority taxonomy. The priority
182+
ordering is as given above, with the following exceptions:
183+
184+
The non-Fungi content of Index Fungorum is separated from the Fungi
185+
content and given a priority lower than NCBI and GBIF.
186+
187+
The non-Malacostraca, non-Ctenophora content of WoRMS is separated from the
188+
Malacostraca and Ctenophora content and given a priority lower than NCBI but higher
189+
than GBIF.
190+
191+
## Previous versions
192+
193+
See <a href="http://files.opentreeoflife.org/ott/">http://files.opentreeoflife.org/ott/</a>

0 commit comments

Comments
 (0)