@@ -977,38 +977,38 @@ job::job({
977977
978978 # Perform optimised joins within DuckDB
# Build the DuckDB statement that assembles per-cell metadata and exports it.
# Starting from cell_to_refined_sample_from_Mengyuan, the query LEFT JOINs
# cell_ids_for_metadata (on cell_, observation_joinid, dataset_id), then
# sample_metadata (on sample_, donor_id, dataset_id), then age_days_tbl (on
# development_stage) and tissue_grouped (on tissue), and COPYs the result to a
# gzip-compressed Parquet file.
# The -/+ lines below are identical except for the output path, which changes
# from cell_metadata_new .parquet to cell_metadata .parquet.
# NOTE(review): both file names are shown with a space before ".parquet";
# confirm this is intended, since the read_parquet() call further down must
# match the path exactly.
# NOTE(review): dataset_id is selected explicitly and is also a column of
# sample_metadata (it is used as a join key), so sample_metadata.* brings it in
# a second time - verify how the duplicate column name ends up in the output.
979979 copy_query <- "
980- COPY (
981- SELECT
982- cell_to_refined_sample_from_Mengyuan.cell_,
983- cell_to_refined_sample_from_Mengyuan.observation_joinid,
984- cell_to_refined_sample_from_Mengyuan.dataset_id,
985- cell_to_refined_sample_from_Mengyuan.sample_id,
986- cell_to_refined_sample_from_Mengyuan.cell_type,
987- cell_to_refined_sample_from_Mengyuan.cell_type_ontology_term_id,
988- sample_metadata.*,
989- age_days_tbl.age_days,
990- tissue_grouped.tissue_groups
991-
992- FROM cell_to_refined_sample_from_Mengyuan
993-
994- LEFT JOIN cell_ids_for_metadata
995- ON cell_ids_for_metadata.cell_ = cell_to_refined_sample_from_Mengyuan.cell_
996- AND cell_ids_for_metadata.observation_joinid = cell_to_refined_sample_from_Mengyuan.observation_joinid
997- AND cell_ids_for_metadata.dataset_id = cell_to_refined_sample_from_Mengyuan.dataset_id
998-
999- LEFT JOIN sample_metadata
1000- ON cell_ids_for_metadata.sample_ = sample_metadata.sample_
1001- AND cell_ids_for_metadata.donor_id = sample_metadata.donor_id
1002- AND cell_ids_for_metadata.dataset_id = sample_metadata.dataset_id
1003-
1004- LEFT JOIN age_days_tbl
1005- ON age_days_tbl.development_stage = sample_metadata.development_stage
1006-
1007- LEFT JOIN tissue_grouped
1008- ON tissue_grouped.tissue = sample_metadata.tissue
1009-
1010- ) TO '/vast/projects/cellxgene_curated/metadata_cellxgenedp_Apr_2024/cell_metadata_new .parquet'
1011- (FORMAT PARQUET, COMPRESSION 'gzip');
980+ COPY (
981+ SELECT
982+ cell_to_refined_sample_from_Mengyuan.cell_,
983+ cell_to_refined_sample_from_Mengyuan.observation_joinid,
984+ cell_to_refined_sample_from_Mengyuan.dataset_id,
985+ cell_to_refined_sample_from_Mengyuan.sample_id,
986+ cell_to_refined_sample_from_Mengyuan.cell_type,
987+ cell_to_refined_sample_from_Mengyuan.cell_type_ontology_term_id,
988+ sample_metadata.*,
989+ age_days_tbl.age_days,
990+ tissue_grouped.tissue_groups
991+
992+ FROM cell_to_refined_sample_from_Mengyuan
993+
994+ LEFT JOIN cell_ids_for_metadata
995+ ON cell_ids_for_metadata.cell_ = cell_to_refined_sample_from_Mengyuan.cell_
996+ AND cell_ids_for_metadata.observation_joinid = cell_to_refined_sample_from_Mengyuan.observation_joinid
997+ AND cell_ids_for_metadata.dataset_id = cell_to_refined_sample_from_Mengyuan.dataset_id
998+
999+ LEFT JOIN sample_metadata
1000+ ON cell_ids_for_metadata.sample_ = sample_metadata.sample_
1001+ AND cell_ids_for_metadata.donor_id = sample_metadata.donor_id
1002+ AND cell_ids_for_metadata.dataset_id = sample_metadata.dataset_id
1003+
1004+ LEFT JOIN age_days_tbl
1005+ ON age_days_tbl.development_stage = sample_metadata.development_stage
1006+
1007+ LEFT JOIN tissue_grouped
1008+ ON tissue_grouped.tissue = sample_metadata.tissue
1009+
1010+ ) TO '/vast/projects/cellxgene_curated/metadata_cellxgenedp_Apr_2024/cell_metadata .parquet'
1011+ (FORMAT PARQUET, COMPRESSION 'gzip');
10121012"
10131013
10141014 # Execute the final query to write the result to a Parquet file
@@ -1024,7 +1024,7 @@ job::job({
10241024
# Expose the exported Parquet file as a table: tbl() receives a newly opened
# DuckDB connection plus a SQL query that reads the file with read_parquet().
# The -/+ pair below only switches the input from cell_metadata_new .parquet to
# cell_metadata .parquet, matching the renamed COPY target earlier in the file.
# NOTE(review): the dbdir literal is shown as " :memory:" with a leading space;
# presumably ":memory:" is intended - confirm against the real file.
# NOTE(review): the connection is created inline and not bound to a name in
# this statement, so there is no handle here to disconnect it later.
10251025cell_metadata = tbl(
10261026 dbConnect(duckdb :: duckdb(), dbdir = " :memory:" ),
1027- sql(" SELECT * FROM read_parquet('/vast/projects/cellxgene_curated/metadata_cellxgenedp_Apr_2024/cell_metadata_new .parquet')" )
1027+ sql(" SELECT * FROM read_parquet('/vast/projects/cellxgene_curated/metadata_cellxgenedp_Apr_2024/cell_metadata .parquet')" )
10281028)
10291029
# Tissue grouping table; get_tissue_grouped() is not defined in this excerpt.
10301030tissues_grouped = get_tissue_grouped()
@@ -1081,7 +1081,7 @@ dbDisconnect(con, shutdown = TRUE)
# Read the non-immune cell-type harmonisation CSV into non_immune_harmonisation.
10811081non_immune_harmonisation =
10821082 read_csv(" /vast/projects/mangiola_immune_map/PostDoc/CuratedAtlasQueryR/dev/cell_type_harmonisation_non_immune.csv" )
10831083
# The -/+ pair below disables the rclone copy of that same CSV to the
# box_adelaide remote by turning the system() call into a comment.
1084- system(" ~/bin/rclone copy /vast/projects/mangiola_immune_map/PostDoc/CuratedAtlasQueryR/dev/cell_type_harmonisation_non_immune.csv box_adelaide:/Mangiola_ImmuneAtlas/reannotation_consensus/" )
1084+ # system("~/bin/rclone copy /vast/projects/mangiola_immune_map/PostDoc/CuratedAtlasQueryR/dev/cell_type_harmonisation_non_immune.csv box_adelaide:/Mangiola_ImmuneAtlas/reannotation_consensus/")
10851085
10861086
10871087tbl(
0 commit comments