Skip to content

Commit 68908b9

Browse files
authored
Merge branch 'master' into pf8-url-update
2 parents 61e6f9b + a7bb710 commit 68908b9

29 files changed

+3777
-20
lines changed

README.md

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -128,6 +128,17 @@ the documentation via GitHub Actions.
128128
The version switcher for the documentation can then be updated by
129129
modifying the `docs/source/_static/switcher.json` file accordingly.
130130

131+
## Citation
132+
133+
If you use the `malariagen_data` package in a publication
134+
or include any of its functions or code in other materials (_e.g._ training resources),
135+
please cite: [doi.org/10.5281/zenodo.11173411](doi.org/10.5281/zenodo.11173411)
136+
137+
Some functions may require additional citations to acknowledge specific contributions. These are indicated in the description for each relevant function.
138+
139+
For any questions, please feel free to contact us at: [[email protected]](mailto:[email protected])
140+
141+
131142
## Sponsorship
132143

133144
This project is currently supported by the following grants:

malariagen_data/af1.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@
99
MAJOR_VERSION_PATH = "v1.0"
1010
CONFIG_PATH = "v1.0-config.json"
1111
GCS_DEFAULT_URL = "gs://vo_afun_release_master_us_central1/"
12+
GCS_DEFAULT_PUBLIC_URL = "gs://vo_anoph_temp_us_central1/vo_agam_release/"
1213
GCS_REGION_URLS = {
1314
"us-central1": "gs://vo_afun_release_master_us_central1",
1415
}
@@ -78,6 +79,7 @@ class Af1(AnophelesDataResource):
7879
def __init__(
7980
self,
8081
url=None,
82+
public_url=GCS_DEFAULT_PUBLIC_URL,
8183
bokeh_output_notebook=True,
8284
results_cache=None,
8385
log=sys.stdout,
@@ -93,6 +95,7 @@ def __init__(
9395
):
9496
super().__init__(
9597
url=url,
98+
public_url=public_url,
9699
config_path=CONFIG_PATH,
97100
cohorts_analysis=cohorts_analysis,
98101
aim_analysis=None,

malariagen_data/ag3.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,7 @@
1515
MAJOR_VERSION_PATH = "v3"
1616
CONFIG_PATH = "v3-config.json"
1717
GCS_DEFAULT_URL = "gs://vo_agam_release_master_us_central1/"
18+
GCS_DEFAULT_PUBLIC_URL = "gs://vo_anoph_temp_us_central1/vo_agam_release/"
1819
GCS_REGION_URLS = {
1920
"us-central1": "gs://vo_agam_release_master_us_central1",
2021
}
@@ -138,6 +139,7 @@ class Ag3(AnophelesDataResource):
138139
def __init__(
139140
self,
140141
url=None,
142+
public_url=GCS_DEFAULT_PUBLIC_URL,
141143
bokeh_output_notebook=True,
142144
results_cache=None,
143145
log=sys.stdout,
@@ -154,6 +156,7 @@ def __init__(
154156
):
155157
super().__init__(
156158
url=url,
159+
public_url=public_url,
157160
config_path=CONFIG_PATH,
158161
cohorts_analysis=cohorts_analysis,
159162
aim_analysis=aim_analysis,

malariagen_data/anoph/base.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -47,6 +47,7 @@ def __init__(
4747
self,
4848
*,
4949
url: str,
50+
public_url: str,
5051
config_path: str,
5152
pre: bool,
5253
major_version_number: int,
@@ -117,6 +118,8 @@ def __init__(
117118
raise ValueError("A value for the `url` parameter must be provided.")
118119
del url
119120

121+
self._public_url = public_url
122+
120123
# Set up fsspec filesystem. N.B., we use fsspec here to allow for
121124
# accessing different types of storage - fsspec will automatically
122125
# detect which type of storage to use based on the URL provided.

malariagen_data/anoph/dipclust.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -47,7 +47,7 @@ def __init__(
4747
summary=""""
4848
Hierarchically cluster diplotypes in region and produce an interactive plot.
4949
50-
If you use this function in a publication, please cite the original manuscript: doi.org/10.1093/molbev/msae140
50+
If you use this function in a publication, please cite both this package and the original manuscript: doi.org/10.1093/molbev/msae140
5151
""",
5252
)
5353
def plot_diplotype_clustering(
@@ -598,7 +598,7 @@ def _insert_dipclust_snp_trace(
598598
summary=""""
599599
Perform diplotype clustering, annotated with heterozygosity, gene copy number and amino acid variants.
600600
601-
If you use this function in a publication, please cite the original manuscript: doi.org/10.1093/molbev/msae140
601+
If you use this function in a publication, please cite both this package and the original manuscript: doi.org/10.1093/molbev/msae140
602602
""",
603603
parameters=dict(
604604
heterozygosity="Plot heterozygosity track.",

malariagen_data/anoph/igv.py

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -31,20 +31,21 @@ def _igv_config(
3131
"reference": {
3232
"id": self._genome_ref_id,
3333
"name": self._genome_ref_name,
34-
"fastaURL": f"{self._url}{self._genome_fasta_path}",
35-
"indexURL": f"{self._url}{self._genome_fai_path}",
34+
"fastaURL": f"{self._public_url}{self._genome_fasta_path}",
35+
"indexURL": f"{self._public_url}{self._genome_fai_path}",
3636
"tracks": [
3737
{
3838
"name": "Genes",
3939
"type": "annotation",
4040
"format": "gff3",
41-
"url": f"{self._url}{self._geneset_gff3_path}",
41+
"url": f"{self._public_url}{self._geneset_gff3_path}",
4242
"indexed": False,
4343
}
4444
],
4545
},
4646
"locus": str(region),
4747
}
48+
4849
if tracks:
4950
config["tracks"] = tracks
5051

@@ -58,7 +59,7 @@ def _igv_site_filters_tracks(
5859
):
5960
tracks = []
6061
for site_mask in self.site_mask_ids:
61-
site_filters_vcf_url = f"{self._url}{self._major_version_path}/site_filters/{self._site_filters_analysis}/vcf/{site_mask}/{contig}_sitefilters.vcf.gz" # noqa
62+
site_filters_vcf_url = f"{self._public_url}{self._major_version_path}/site_filters/{self._site_filters_analysis}/vcf/{site_mask}/{contig}_sitefilters.vcf.gz" # f"{self._url}{self._major_version_path}/site_filters/{self._site_filters_analysis}/vcf/{site_mask}/{contig}_sitefilters.vcf.gz" # noqa
6263
track_config = {
6364
"name": f"Filters - {site_mask}",
6465
"url": site_filters_vcf_url,

malariagen_data/anopheles.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -101,6 +101,7 @@ class AnophelesDataResource(
101101
def __init__(
102102
self,
103103
url,
104+
public_url,
104105
config_path,
105106
cohorts_analysis: Optional[str],
106107
aim_analysis: Optional[str],
@@ -135,6 +136,7 @@ def __init__(
135136
):
136137
super().__init__(
137138
url=url,
139+
public_url=public_url,
138140
config_path=config_path,
139141
bokeh_output_notebook=bokeh_output_notebook,
140142
log=log,

0 commit comments

Comments
 (0)