Skip to content

Commit a62c577

Browse files
committed
modified pub
1 parent 4daa81c commit a62c577

File tree

86 files changed

+2024
-40
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

86 files changed

+2024
-40
lines changed

script/process_markdown.ipynb

Lines changed: 63 additions & 40 deletions
Original file line numberDiff line numberDiff line change
@@ -2,17 +2,17 @@
22
"cells": [
33
{
44
"cell_type": "code",
5-
"execution_count": 26,
5+
"execution_count": 1,
66
"metadata": {},
77
"outputs": [],
88
"source": [
99
"import pandas as pd\n",
10-
"from uuid import uuid5, NAMESPACE_URL\n"
10+
"import yaml"
1111
]
1212
},
1313
{
1414
"cell_type": "code",
15-
"execution_count": 5,
15+
"execution_count": 2,
1616
"metadata": {},
1717
"outputs": [
1818
{
@@ -182,7 +182,7 @@
182182
"089d8d63-3364-526f-9706-80d62d0ec88c True "
183183
]
184184
},
185-
"execution_count": 5,
185+
"execution_count": 2,
186186
"metadata": {},
187187
"output_type": "execute_result"
188188
}
@@ -195,12 +195,12 @@
195195
},
196196
{
197197
"cell_type": "code",
198-
"execution_count": 15,
198+
"execution_count": 5,
199199
"metadata": {},
200200
"outputs": [],
201201
"source": [
202202
"for i, row in dccs.iterrows():\n",
203-
"\tmeta = [\"layout: ../../layouts/DCC.astro\"]\n",
203+
"\tyml = {\"layout\": \"../../layouts/DCC.astro\"}\n",
204204
"\tif row['active']:\n",
205205
"\t\tdescription = ''\n",
206206
"\t\tfor k,v in row.items():\n",
@@ -209,19 +209,19 @@
209209
"\t\t\t\t\tif k == 'icon' and v.startswith('/img'):\n",
210210
"\t\t\t\t\t\tv = \"https://cfde-drc.s3.amazonaws.com/assets\" + v\n",
211211
"\n",
212-
"\t\t\t\t\tmeta.append(\"%s: %s\"%(k, v))\n",
212+
"\t\t\t\t\tyml[k] = v\n",
213213
"\t\t\telse:\n",
214214
"\t\t\t\tdescription = v\n",
215215
"\t\twith open('out/dccs/%s.md'%row['short_label'], 'w') as o:\n",
216216
"\t\t\to.write('---\\n')\n",
217-
"\t\t\to.write(\"\\n\".join(meta))\n",
218-
"\t\t\to.write('\\n---\\n')\n",
217+
"\t\t\to.write(yaml.dump(yml))\n",
218+
"\t\t\to.write('---\\n')\n",
219219
"\t\t\to.write(description)"
220220
]
221221
},
222222
{
223223
"cell_type": "code",
224-
"execution_count": 17,
224+
"execution_count": 6,
225225
"metadata": {},
226226
"outputs": [
227227
{
@@ -447,7 +447,7 @@
447447
"[5 rows x 22 columns]"
448448
]
449449
},
450-
"execution_count": 17,
450+
"execution_count": 6,
451451
"metadata": {},
452452
"output_type": "execute_result"
453453
}
@@ -461,63 +461,86 @@
461461
},
462462
{
463463
"cell_type": "code",
464-
"execution_count": 22,
464+
"execution_count": 13,
465+
"metadata": {},
466+
"outputs": [],
467+
"source": [
468+
"for i, row in publications.iterrows():\n",
469+
"\tyml = {\"layout\": \"../../layouts/Publication.astro\"}\n",
470+
"\tfor k,v in row.items():\n",
471+
"\t\tif not v == '':\n",
472+
"\t\t\tif k == 'dccs':\n",
473+
"\t\t\t\tv = v.split(\"; \")\n",
474+
"\t\t\tif k == \"pmid\":\n",
475+
"\t\t\t\tv = int(v)\n",
476+
"\t\t\tyml[k] = v\n",
477+
"\tfilename = \"PMID: %s\"%str(int(yml['pmid'])) if \"pmid\" in yml else \"DOI: %s\"%yml['doi'].replace(\"/\", \"-\")\n",
478+
"\twith open('out/publications/%s.md'%filename, 'w') as o:\n",
479+
"\t\to.write('---\\n')\n",
480+
"\t\to.write(yaml.dump(yml))\n",
481+
"\t\to.write('\\n---')"
482+
]
483+
},
484+
{
485+
"cell_type": "code",
486+
"execution_count": 7,
465487
"metadata": {},
466488
"outputs": [
467489
{
468490
"data": {
469491
"text/plain": [
470-
"((85, 22), 85)"
492+
"100"
471493
]
472494
},
473-
"execution_count": 22,
495+
"execution_count": 7,
474496
"metadata": {},
475497
"output_type": "execute_result"
476498
}
477499
],
478500
"source": [
479-
"publications.shape, publications.doi.nunique()"
501+
"int(100.0)"
480502
]
481503
},
482504
{
483505
"cell_type": "code",
484-
"execution_count": 24,
506+
"execution_count": 11,
485507
"metadata": {},
486508
"outputs": [
487509
{
488510
"data": {
489511
"text/plain": [
490-
"np.int64(1)"
512+
"title Predictive analyses of regulatory sequences wi...\n",
513+
"journal Nature Computational Science\n",
514+
"authors Klie A; Laub D; Talwar JV; Stites H; Jores T; ...\n",
515+
"year 2023\n",
516+
"page 946-956\n",
517+
"volume 3\n",
518+
"issue 11\n",
519+
"pmid 38177592.0\n",
520+
"pmcid PMC10768637\n",
521+
"doi 10.1038/s43588-023-00544-w\n",
522+
"landmark False\n",
523+
"tool_id \n",
524+
"dccs \n",
525+
"partnerships \n",
526+
"carousel False\n",
527+
"carousel_title \n",
528+
"carousel_link \n",
529+
"carousel_description \n",
530+
"image \n",
531+
"featured False\n",
532+
"r03 \n",
533+
"keywords [\"Workflow\", \"Genome\", \"Genomics\", \"Software\"]\n",
534+
"Name: 84, dtype: object"
491535
]
492536
},
493-
"execution_count": 24,
537+
"execution_count": 11,
494538
"metadata": {},
495539
"output_type": "execute_result"
496540
}
497541
],
498542
"source": [
499-
"(publications.pmid == '').sum()"
500-
]
501-
},
502-
{
503-
"cell_type": "code",
504-
"execution_count": 28,
505-
"metadata": {},
506-
"outputs": [],
507-
"source": [
508-
"for i, row in publications.iterrows():\n",
509-
"\tmeta = [\"layout: ../../layouts/Publication.astro\"]\n",
510-
"\tfor k,v in row.items():\n",
511-
"\t\tif not v == '':\n",
512-
"\t\t\tif k == 'dccs':\n",
513-
"\t\t\t\tv = v.split(\"; \")\n",
514-
"\n",
515-
"\t\t\tmeta.append(\"%s: %s\"%(k, v))\n",
516-
"\tuid = str(uuid5(NAMESPACE_URL, row['title']))\n",
517-
"\twith open('out/publications/%s.md'%uid, 'w') as o:\n",
518-
"\t\to.write('---\\n')\n",
519-
"\t\to.write(\"\\n\".join(meta))\n",
520-
"\t\to.write('\\n---')"
543+
"row"
521544
]
522545
},
523546
{
Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
---
2+
authors: Higgins D, Thibert JP, Mattioni M, DiGiovanna J, Grossman RL, Farrow BK,
3+
Wenger E, Volchenboum S, Carroll RJ, Haendel MA, Taylor DM, Zhu Y, Ferretti V,
4+
Resnick AC, Heath AP
5+
carousel: false
6+
dccs:
7+
- Kids First
8+
doi: 10.1158/1538-7445.AM2023-6576
9+
featured: false
10+
issue: '83'
11+
journal: Cancer Research
12+
landmark: true
13+
layout: ../../layouts/Publication.astro
14+
page: '6576'
15+
title: 'Gabriella Miller Kids First Data Resource Center (KFDRC): Empowering discovery
16+
across germline and somatic variation in pediatric cancer.'
17+
volume: 7_Supplement
18+
year: 2023
19+
20+
---
Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
1+
---
2+
authors: Human Microbiome Project Consortium
3+
carousel: false
4+
dccs:
5+
- HMP
6+
doi: 10.1038/nature11234
7+
featured: false
8+
issue: '7402'
9+
journal: Nature
10+
keywords: '["Male", "Metagenomics", "RNA, Ribosomal, 16S", "Phenotype", "Young Adult",
11+
"Biodiversity", "Adult", "Bacteria", "Metabolic Networks and Pathways", "Metagenome",
12+
"Female", "Ecosystem", "Health", "Adolescent", "Humans"]'
13+
landmark: true
14+
layout: ../../layouts/Publication.astro
15+
page: 207-14
16+
pmcid: PMC3564958
17+
pmid: 22699609
18+
title: Structure, function and diversity of the healthy human microbiome.
19+
volume: '486'
20+
year: 2012
21+
22+
---
Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
1+
---
2+
authors: Human Microbiome Project Consortium
3+
carousel: false
4+
dccs:
5+
- HMP
6+
doi: 10.1038/nature11209
7+
featured: false
8+
issue: '7402'
9+
journal: Nature
10+
keywords: '["Statistics as Topic", "Male", "Metagenomics", "RNA, Ribosomal, 16S",
11+
"Young Adult", "Adult", "Metagenome", "Bacteria", "Reference Standards", "Female",
12+
"Adolescent", "Humans"]'
13+
landmark: true
14+
layout: ../../layouts/Publication.astro
15+
page: 215-21
16+
pmcid: PMC3377744
17+
pmid: 22699610
18+
title: A framework for human microbiome research.
19+
volume: '486'
20+
year: 2012
21+
22+
---
Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
---
2+
authors: GTEx Consortium
3+
carousel: false
4+
dccs:
5+
- GTEx
6+
doi: 10.1038/ng.2653
7+
featured: false
8+
issue: '6'
9+
journal: Nature genetics
10+
keywords: '["Gene Expression Profiling", "Gene Expression", "Government Programs",
11+
"Organ Specificity", "Tissue Banks", "Molecular Sequence Annotation", "Consensus
12+
Development Conferences, NIH as Topic", "Quantitative Trait Loci", "United States",
13+
"Genome-Wide Association Study", "Humans"]'
14+
landmark: true
15+
layout: ../../layouts/Publication.astro
16+
page: 580-5
17+
pmcid: PMC4010069
18+
pmid: 23715323
19+
title: The Genotype-Tissue Expression (GTEx) project.
20+
volume: '45'
21+
year: 2013
22+
23+
---
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
---
2+
authors: GTEx Consortium
3+
carousel: false
4+
dccs:
5+
- GTEx
6+
doi: 10.1126/science.1262110
7+
featured: false
8+
issue: '6235'
9+
journal: Science (New York, N.Y.)
10+
keywords: '["RNA, Untranslated", "Sequence Analysis, RNA", "ARHGAP42 protein, human",
11+
"Transcriptome", "Tibial Arteries", "Blood Pressure", "GTPase-Activating Proteins",
12+
"Disease", "Genotype", "Humans", "Pilot Projects", "RNA Splicing", "Genetic Variation",
13+
"Organ Specificity", "Gene Regulatory Networks", "Quantitative Trait Loci", "Genome,
14+
Human", "Multigene Family", "Gene Expression Regulation", "Alleles", "Genome-Wide
15+
Association Study"]'
16+
landmark: true
17+
layout: ../../layouts/Publication.astro
18+
page: 648-60
19+
pmcid: PMC4547484
20+
pmid: 25954001
21+
title: 'Human genomics. The Genotype-Tissue Expression (GTEx) pilot analysis: multitissue
22+
gene regulation in humans.'
23+
volume: '348'
24+
year: 2015
25+
26+
---
Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,21 @@
1+
---
2+
authors: Ainsztein AM, Brooks PJ, Dugan VG, Ganguly A, Guo M, Howcroft TK, Kelley
3+
CA, Kuo LS, Labosky PA, Lenzi R, McKie GA, Mohla S, Procaccini D, Reilly M, Satterlee
4+
JS, Srinivas PR, Church ES, Sutherland M, Tagle DA, Tucker JM, Venkatachalam S
5+
carousel: false
6+
dccs:
7+
- ExRNA
8+
doi: 10.3402/jev.v4.27493
9+
featured: false
10+
journal: Journal of extracellular vesicles
11+
keywords: '["exRNA", "extracellular RNA", "ERCC"]'
12+
landmark: true
13+
layout: ../../layouts/Publication.astro
14+
page: '27493'
15+
pmcid: PMC4553264
16+
pmid: 26320938
17+
title: The NIH Extracellular RNA Communication Consortium.
18+
volume: '4'
19+
year: 2015
20+
21+
---
Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
---
2+
authors: Sud M, Fahy E, Cotter D, Azam K, Vadivelu I, Burant C, Edison A, Fiehn O,
3+
Higashi R, Nair KS, Sumner S, Subramaniam S
4+
carousel: false
5+
dccs:
6+
- Metabolomics
7+
doi: 10.1093/nar/gkv1042
8+
featured: false
9+
issue: D1
10+
journal: Nucleic acids research
11+
keywords: '["Databases, Chemical", "User-Computer Interface", "Mass Spectrometry",
12+
"Metabolomics", "Molecular Structure", "Magnetic Resonance Spectroscopy", "Reference
13+
Standards", "Software", "Animals", "Humans"]'
14+
landmark: true
15+
layout: ../../layouts/Publication.astro
16+
page: D463-70
17+
pmcid: PMC4702780
18+
pmid: 26467476
19+
title: 'Metabolomics Workbench: An international repository for metabolomics data
20+
and metadata, metabolite standards, protocols, tutorials and training, and analysis
21+
tools.'
22+
volume: '44'
23+
year: 2016
24+
25+
---

0 commit comments

Comments
 (0)