|
2 | 2 | "cells": [ |
3 | 3 | { |
4 | 4 | "cell_type": "code", |
5 | | - "execution_count": 26, |
| 5 | + "execution_count": 1, |
6 | 6 | "metadata": {}, |
7 | 7 | "outputs": [], |
8 | 8 | "source": [ |
9 | 9 | "import pandas as pd\n", |
10 | | - "from uuid import uuid5, NAMESPACE_URL\n" |
| 10 | + "import yaml" |
11 | 11 | ] |
12 | 12 | }, |
13 | 13 | { |
14 | 14 | "cell_type": "code", |
15 | | - "execution_count": 5, |
| 15 | + "execution_count": 2, |
16 | 16 | "metadata": {}, |
17 | 17 | "outputs": [ |
18 | 18 | { |
|
182 | 182 | "089d8d63-3364-526f-9706-80d62d0ec88c True " |
183 | 183 | ] |
184 | 184 | }, |
185 | | - "execution_count": 5, |
| 185 | + "execution_count": 2, |
186 | 186 | "metadata": {}, |
187 | 187 | "output_type": "execute_result" |
188 | 188 | } |
|
195 | 195 | }, |
196 | 196 | { |
197 | 197 | "cell_type": "code", |
198 | | - "execution_count": 15, |
| 198 | + "execution_count": 5, |
199 | 199 | "metadata": {}, |
200 | 200 | "outputs": [], |
201 | 201 | "source": [ |
202 | 202 | "for i, row in dccs.iterrows():\n", |
203 | | - "\tmeta = [\"layout: ../../layouts/DCC.astro\"]\n", |
| 203 | + "\tyml = {\"layout\": \"../../layouts/DCC.astro\"}\n", |
204 | 204 | "\tif row['active']:\n", |
205 | 205 | "\t\tdescription = ''\n", |
206 | 206 | "\t\tfor k,v in row.items():\n", |
|
209 | 209 | "\t\t\t\t\tif k == 'icon' and v.startswith('/img'):\n", |
210 | 210 | "\t\t\t\t\t\tv = \"https://cfde-drc.s3.amazonaws.com/assets\" + v\n", |
211 | 211 | "\n", |
212 | | - "\t\t\t\t\tmeta.append(\"%s: %s\"%(k, v))\n", |
| 212 | + "\t\t\t\t\tyml[k] = v\n", |
213 | 213 | "\t\t\telse:\n", |
214 | 214 | "\t\t\t\tdescription = v\n", |
215 | 215 | "\t\twith open('out/dccs/%s.md'%row['short_label'], 'w') as o:\n", |
216 | 216 | "\t\t\to.write('---\\n')\n", |
217 | | - "\t\t\to.write(\"\\n\".join(meta))\n", |
218 | | - "\t\t\to.write('\\n---\\n')\n", |
| 217 | + "\t\t\to.write(yaml.dump(yml))\n", |
| 218 | + "\t\t\to.write('---\\n')\n", |
219 | 219 | "\t\t\to.write(description)" |
220 | 220 | ] |
221 | 221 | }, |
222 | 222 | { |
223 | 223 | "cell_type": "code", |
224 | | - "execution_count": 17, |
| 224 | + "execution_count": 6, |
225 | 225 | "metadata": {}, |
226 | 226 | "outputs": [ |
227 | 227 | { |
|
447 | 447 | "[5 rows x 22 columns]" |
448 | 448 | ] |
449 | 449 | }, |
450 | | - "execution_count": 17, |
| 450 | + "execution_count": 6, |
451 | 451 | "metadata": {}, |
452 | 452 | "output_type": "execute_result" |
453 | 453 | } |
|
461 | 461 | }, |
462 | 462 | { |
463 | 463 | "cell_type": "code", |
464 | | - "execution_count": 22, |
| 464 | + "execution_count": 13, |
| 465 | + "metadata": {}, |
| 466 | + "outputs": [], |
| 467 | + "source": [ |
# Export every publication as a Markdown file that consists solely of YAML
# front matter (there is no body text), to be rendered by the Publication layout.
for i, row in publications.iterrows():
    # Every page starts from the layout key; the row's columns are added on top.
    yml = {"layout": "../../layouts/Publication.astro"}
    for k, v in row.items():
        # Blank cells are stored as '' in this table; NaN (the only float that
        # is not equal to itself) is treated the same way so that a missing
        # value never reaches the front matter or the int() conversion below.
        if v == '' or (isinstance(v, float) and v != v):
            continue
        if k == 'dccs':
            # Multiple DCCs are packed into one cell, separated by "; ".
            v = v.split("; ")
        if k == "pmid":
            # PMIDs show up in float form (e.g. 38177592.0). Going through
            # float() first also accepts the text "38177592.0", which a bare
            # int() would reject with ValueError.
            v = int(float(v))
        yml[k] = v

    # Name the file after the PMID when there is one, otherwise after the DOI
    # with "/" replaced so it cannot be read as a directory separator.
    # NOTE(review): the ": " in these names is kept for compatibility with the
    # files already generated, but ":" is not a legal file-name character on
    # Windows -- confirm before running this anywhere but Linux/macOS.
    if "pmid" in yml:
        filename = "PMID: %s" % yml['pmid']
    elif "doi" in yml:
        filename = "DOI: %s" % yml['doi'].replace("/", "-")
    else:
        # Same exception type the bare yml['doi'] lookup used to raise, but
        # with enough context to find the offending row.
        raise KeyError("publication at index %s has neither a pmid nor a doi" % i)

    with open('out/publications/%s.md' % filename, 'w') as o:
        o.write('---\n')
        # yaml.dump() output already ends with a newline, so the closing
        # delimiter follows directly and the file ends with a newline,
        # exactly as the DCC export cell writes it.
        o.write(yaml.dump(yml))
        o.write('---\n')
| 482 | + ] |
| 483 | + }, |
| 484 | + { |
| 485 | + "cell_type": "code", |
| 486 | + "execution_count": 7, |
465 | 487 | "metadata": {}, |
466 | 488 | "outputs": [ |
467 | 489 | { |
468 | 490 | "data": { |
469 | 491 | "text/plain": [ |
470 | | - "((85, 22), 85)" |
| 492 | + "100" |
471 | 493 | ] |
472 | 494 | }, |
473 | | - "execution_count": 22, |
| 495 | + "execution_count": 7, |
474 | 496 | "metadata": {}, |
475 | 497 | "output_type": "execute_result" |
476 | 498 | } |
477 | 499 | ], |
478 | 500 | "source": [ |
479 | | - "publications.shape, publications.doi.nunique()" |
| 501 | + "int(100.0)" |
480 | 502 | ] |
481 | 503 | }, |
482 | 504 | { |
483 | 505 | "cell_type": "code", |
484 | | - "execution_count": 24, |
| 506 | + "execution_count": 11, |
485 | 507 | "metadata": {}, |
486 | 508 | "outputs": [ |
487 | 509 | { |
488 | 510 | "data": { |
489 | 511 | "text/plain": [ |
490 | | - "np.int64(1)" |
| 512 | + "title Predictive analyses of regulatory sequences wi...\n", |
| 513 | + "journal Nature Computational Science\n", |
| 514 | + "authors Klie A; Laub D; Talwar JV; Stites H; Jores T; ...\n", |
| 515 | + "year 2023\n", |
| 516 | + "page 946-956\n", |
| 517 | + "volume 3\n", |
| 518 | + "issue 11\n", |
| 519 | + "pmid 38177592.0\n", |
| 520 | + "pmcid PMC10768637\n", |
| 521 | + "doi 10.1038/s43588-023-00544-w\n", |
| 522 | + "landmark False\n", |
| 523 | + "tool_id \n", |
| 524 | + "dccs \n", |
| 525 | + "partnerships \n", |
| 526 | + "carousel False\n", |
| 527 | + "carousel_title \n", |
| 528 | + "carousel_link \n", |
| 529 | + "carousel_description \n", |
| 530 | + "image \n", |
| 531 | + "featured False\n", |
| 532 | + "r03 \n", |
| 533 | + "keywords [\"Workflow\", \"Genome\", \"Genomics\", \"Software\"]\n", |
| 534 | + "Name: 84, dtype: object" |
491 | 535 | ] |
492 | 536 | }, |
493 | | - "execution_count": 24, |
| 537 | + "execution_count": 11, |
494 | 538 | "metadata": {}, |
495 | 539 | "output_type": "execute_result" |
496 | 540 | } |
497 | 541 | ], |
498 | 542 | "source": [ |
499 | | - "(publications.pmid == '').sum()" |
500 | | - ] |
501 | | - }, |
502 | | - { |
503 | | - "cell_type": "code", |
504 | | - "execution_count": 28, |
505 | | - "metadata": {}, |
506 | | - "outputs": [], |
507 | | - "source": [ |
508 | | - "for i, row in publications.iterrows():\n", |
509 | | - "\tmeta = [\"layout: ../../layouts/Publication.astro\"]\n", |
510 | | - "\tfor k,v in row.items():\n", |
511 | | - "\t\tif not v == '':\n", |
512 | | - "\t\t\tif k == 'dccs':\n", |
513 | | - "\t\t\t\tv = v.split(\"; \")\n", |
514 | | - "\n", |
515 | | - "\t\t\tmeta.append(\"%s: %s\"%(k, v))\n", |
516 | | - "\tuid = str(uuid5(NAMESPACE_URL, row['title']))\n", |
517 | | - "\twith open('out/publications/%s.md'%uid, 'w') as o:\n", |
518 | | - "\t\to.write('---\\n')\n", |
519 | | - "\t\to.write(\"\\n\".join(meta))\n", |
520 | | - "\t\to.write('\\n---')" |
| 543 | + "row" |
521 | 544 | ] |
522 | 545 | }, |
523 | 546 | { |
|
0 commit comments