Skip to content

Commit 4671bf5

Browse files
committed
updated outreach
1 parent 6e743c0 commit 4671bf5

13 files changed

+74
-53
lines changed

script/ingestion/outreach.py

Lines changed: 52 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,13 +15,24 @@
1515
for k,v in dccs.iterrows():
1616
dcc_mapper[v["short_label"]] = k
1717

18-
outreach_columns = ["title", "short_description", "description", "tags", "agenda", "featured", "active", "start_date", "end_date", "application_start", "application_end", "link", "image", "carousel", "carousel_description", "cfde_specific", "flyer"]
18+
centers = pd.read_csv('https://cfde-drc.s3.amazonaws.com/database/files/current_centers.tsv', sep="\t", index_col=0, header=0)
19+
# map dcc names to their respective ids
20+
center_mapper = {}
21+
for k,v in centers.iterrows():
22+
center_mapper[v["short_label"]] = k
23+
24+
25+
outreach_columns = ["title", "short_description", "description", "tags", "agenda", "featured", "active", "start_date", "end_date", "application_start", "application_end", "link", "image", "carousel", "carousel_description", "cfde_specific", "flyer", "recurring", "ical", "schedule"]
1926
dcc_outreach_columns = ["outreach_id", "dcc_id"]
27+
center_outreach_columns = ["outreach_id", "center_id"]
2028

2129
outreach_df = pd.DataFrame("-", index=[], columns=outreach_columns)
2230
outreach_df.index.name = 'id'
2331
dcc_outreach_df = pd.DataFrame("-", index=[], columns=dcc_outreach_columns)
2432
ind = 0
33+
34+
center_outreach_df = pd.DataFrame("-", index=[], columns=center_outreach_columns)
35+
cind = 0
2536
outreach_df = outreach_df.fillna('')
2637

2738
for filename in glob('../../src/pages/outreach/*.md'):
@@ -51,6 +62,12 @@
5162
dcc_id = dcc_mapper[dcc]
5263
dcc_outreach_df.loc[ind] = [uid, dcc_mapper[dcc]]
5364
ind += 1
65+
if val.get('center'):
66+
for center in val["center"]:
67+
center_id = center_mapper[center]
68+
center_outreach_df.loc[cind] = [uid, center_mapper[center]]
69+
cind += 1
70+
5471

5572
# webinars
5673
webinars = {}
@@ -79,16 +96,22 @@
7996
outreach_df['active'] = outreach_df['active'].fillna(0).astype(bool)
8097
outreach_df['featured'] = outreach_df['featured'].fillna(0).astype(bool)
8198
outreach_df['carousel'] = outreach_df['carousel'].fillna(0).astype(bool)
99+
outreach_df['recurring'] = outreach_df['recurring'].fillna(0).astype(bool)
82100
outreach_df['cfde_specific'] = outreach_df['cfde_specific'].fillna(0).astype(bool)
83101
backup_file(outreach_df, "outreach", quoting=False)
84102
backup_file(dcc_outreach_df, "dcc_outreach", False)
103+
backup_file(center_outreach_df, "center_outreach", False)
85104

86105
cur = connection.cursor()
87106

88107
cur.execute('''
89108
DELETE FROM dcc_outreach;
90109
''')
91110

111+
cur.execute('''
112+
DELETE FROM center_outreach;
113+
''')
114+
92115
cur.execute('''
93116
DELETE FROM outreach;
94117
''')
@@ -146,6 +169,34 @@
146169
;
147170
''')
148171
cur.execute('drop table dcc_outreach_tmp;')
172+
173+
# centers
174+
175+
cur = connection.cursor()
176+
cur.execute('''
177+
create table center_outreach_tmp
178+
as table center_outreach
179+
with no data;
180+
''')
181+
c_buf = io.StringIO()
182+
center_outreach_df.to_csv(c_buf, header=True, sep="\t", index=None)
183+
c_buf.seek(0)
184+
columns = next(c_buf).strip().split('\t')
185+
cur.copy_from(c_buf, 'center_outreach_tmp',
186+
columns=center_outreach_columns,
187+
null='',
188+
sep='\t',
189+
)
190+
191+
cur.execute('''
192+
insert into center_outreach (outreach_id, center_id)
193+
select outreach_id, center_id
194+
from center_outreach_tmp
195+
on conflict
196+
do nothing
197+
;
198+
''')
199+
cur.execute('drop table center_outreach_tmp;')
149200
connection.commit()
150201

151202
print("Ingested outreach and webinars")

src/pages/outreach/Accepting Application for the 2025 Summer Research Training Program in Biomedical Big Data Science 2025-02-01.md

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,6 @@ carousel: true
55
cfde_specific: true
66
dcc:
77
- LINCS
8-
end_date: '2025-02-01T17:00:00-04:00'
98
featured: true
109
image: https://cfde-drc.s3.us-east-2.amazonaws.com/assets/img/Maayan_program.png
1110
layout: '@/layouts/Outreach.astro'
@@ -17,7 +16,7 @@ short_description: "The LINCS DCC Summer Research Training Program in Biomedical
1716
\ in the areas: data harmonization, machine learning, cloud computing, and dynamic\
1817
\ data visualization. <br/><br /> Application Deadline: February 1, 2025 <br />Program\
1918
\ Dates: June 2, 2025 \u2013 August 8, 2025 "
20-
start_date: '2024-10-01T12:00:00-05:00'
19+
application_start: '2024-10-01T12:00:00-05:00'
2120
tags: '["training program", "application deadline"]'
2221
title: Accepting Application for the 2025 Summer Research Training Program in Biomedical
2322
Big Data Science

src/pages/outreach/CFDE Centers 2025-12-31.md

Lines changed: 0 additions & 14 deletions
This file was deleted.

src/pages/outreach/CFDE Webinar Series 2025-01-23.md

Lines changed: 0 additions & 13 deletions
This file was deleted.

src/pages/outreach/Coursera Course: Big Data Science with the BD2K-LINCS Data Coordination and Integration Center.md

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -14,5 +14,7 @@ short_description: 'In this course the LINCS DCC covers computational methods in
1414
tags: '["course"]'
1515
title: 'Coursera Course: Big Data Science with the BD2K-LINCS Data Coordination and
1616
Integration Center'
17+
recurring: true
18+
start_date: '2025-04-30T00:00:00-04:00'
1719
---
1820
In this course the LINCS DCC introduces the data generation centers that collected data for the LINCS program. Then, the course covers metadata and how metadata is linked to ontologies. The course then introduces data processing methods used to clean and harmonize the LINCS data. This is followed by discussions about how data is served as RESTful APIs. Most importantly, the course covers computational methods including: clustering, gene-set enrichment analysis, interactive data visualization, and supervised learning.

src/pages/outreach/HuBMAP Visible Human MOOC (VHMOOC).md

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,8 @@ link: https://expand.iu.edu/browse/sice/cns/courses/hubmap-visible-human-mooc
1111
short_description: This 10h course introduces the HuBMAP project which aims to create
1212
an open, global reference atlas of the human body at the cellular level.
1313
tags: '["course"]'
14+
recurring: true
15+
start_date: '2020-08-04T00:00:00-04:00'
1416
title: HuBMAP Visible Human MOOC (VHMOOC)
1517
---
1618
This 10h course introduces the HuBMAP project which aims to create an open, global reference atlas of the human body at the cellular level. Among others, the course describes the compilation and coverage of HuBMAP data, demonstrates new single-cell analysis and mapping techniques, and introduces major features of the HuBMAP portal.

src/pages/outreach/MoTrPAC Office Hours.md

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,14 +5,16 @@ cfde_specific: false
55
dcc:
66
- MoTrPAC
77
featured: false
8-
image: https://cfde-drc.s3.us-east-2.amazonaws.com/assets/img/MoTrPAC.png
8+
image: https://cfde-drc.s3.us-east-2.amazonaws.com/assets/img/motrpac-office-hours.png
99
layout: '@/layouts/Outreach.astro'
1010
link: https://motrpac-data.org/
1111
short_description: The MoTrPAC Bioinformatics Center (BIC) hosts monthly open office
1212
hours to support the scientific community. Each session is hosted by one member
1313
from our infrastructure team and one from our bioinformatics team with a focus on
1414
the discussions of MoTrPAC data.
1515
tags: '["office hours"]'
16+
start_date: '2025-05-08T00:00:00-07:00'
1617
title: MoTrPAC Office Hours
18+
recurring: true
1719
---
1820
The MoTrPAC Bioinformatics Center (BIC) hosts monthly open office hours to support the scientific community. Each session is hosted by one member from our infrastructure team and one from our bioinformatics team with a focus on the discussions of MoTrPAC data.

src/pages/outreach/Multi-Omics AI-Driven Gene Set Analysis with GeneSetCart 2025-01-23.md

Lines changed: 0 additions & 17 deletions
This file was deleted.

src/pages/outreach/Omics Tools Webinar Series: ARCHS4 2025-02-27.md

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,9 @@ short_description: The webinar featured ARCHS, a resource that provides access
1616
to gene and transcript counts uniformly processed from all the human and mouse RNA-seq
1717
experiments deposited by the community in the NCBI Gene Expression Omnibus (GEO).
1818
start_date: '2025-02-27T14:00:00-05:00'
19-
tags: '["workshop"]'
19+
tags: '["webinar"]'
20+
center:
21+
- DRC
2022
title: 'Omics Tools Webinar Series: ARCHS4'
2123
---
2224
The webinar featured [ARCHS4](https://maayanlab.cloud/archs4/), a resource that provides access to gene and transcript counts uniformly processed from all the human and mouse RNA-seq experiments deposited by the community in the NCBI Gene Expression Omnibus (GEO). Watch recording [here](https://www.youtube.com/watch?v=BSz4XWFmfkg).

src/pages/outreach/Omics Tools Webinar Series: GeneSetCart 2025-01-23.md

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,9 @@ image: /img/genesetcart_webinar.png
1010
layout: '@/layouts/Outreach.astro'
1111
link: https://mountsinai.zoom.us/webinar/register/WN_ZXBJyN0SRuCj5LaYoGeXuw#/registration
1212
short_description: In this lecture, Giacomo Marino, a Bioinformatics Software Engineer in the Ma'ayan Lab at the Icahn School of Medicine at Mount Sinai, describes a new platform for assembling, augmenting, combining, visualizing, and analyzing gene sets. The platform utilizes LLMs to form hypotheses from datasets produced by NIH Common Fund programs.
13-
tags: '["workshop"]'
13+
tags: '["webinar"]'
14+
center:
15+
- DRC
1416
title: 'Omics Tools Webinar Series: GeneSetCart
1517
'
1618
---

0 commit comments

Comments
 (0)