diff --git a/common b/common index 876036f71..f01ff2170 160000 --- a/common +++ b/common @@ -1 +1 @@ -Subproject commit 876036f71713cbd79285b108ab0a9a8238f2b5e1 +Subproject commit f01ff2170161295e89014ee5453c61b29b4e4e77 diff --git a/docs/build/doctrees/dataset.doctree b/docs/build/doctrees/dataset.doctree index 3ea7f7bad..b39003cbc 100644 Binary files a/docs/build/doctrees/dataset.doctree and b/docs/build/doctrees/dataset.doctree differ diff --git a/docs/build/doctrees/environment.pickle b/docs/build/doctrees/environment.pickle index 68395e875..02d83a60b 100644 Binary files a/docs/build/doctrees/environment.pickle and b/docs/build/doctrees/environment.pickle differ diff --git a/docs/build/doctrees/evaluation.doctree b/docs/build/doctrees/evaluation.doctree index 43a7d2af9..44a3e89d8 100644 Binary files a/docs/build/doctrees/evaluation.doctree and b/docs/build/doctrees/evaluation.doctree differ diff --git a/docs/build/doctrees/extending.doctree b/docs/build/doctrees/extending.doctree index 1a657e459..5b3375b48 100644 Binary files a/docs/build/doctrees/extending.doctree and b/docs/build/doctrees/extending.doctree differ diff --git a/docs/build/doctrees/index.doctree b/docs/build/doctrees/index.doctree index 283a92c78..21de8b4e6 100644 Binary files a/docs/build/doctrees/index.doctree and b/docs/build/doctrees/index.doctree differ diff --git a/docs/build/doctrees/inference.doctree b/docs/build/doctrees/inference.doctree index 2fe1018d1..cfd503de4 100644 Binary files a/docs/build/doctrees/inference.doctree and b/docs/build/doctrees/inference.doctree differ diff --git a/docs/build/doctrees/leaderboard.doctree b/docs/build/doctrees/leaderboard.doctree index b8230257f..3dca66a90 100644 Binary files a/docs/build/doctrees/leaderboard.doctree and b/docs/build/doctrees/leaderboard.doctree differ diff --git a/docs/build/doctrees/repo/objects.doctree b/docs/build/doctrees/repo/objects.doctree index b0bc255df..e18920ea4 100644 Binary files 
a/docs/build/doctrees/repo/objects.doctree and b/docs/build/doctrees/repo/objects.doctree differ diff --git a/docs/build/html/_images/datasets.png b/docs/build/html/_images/datasets.png index b08a554c9..9ac5c6238 100644 Binary files a/docs/build/html/_images/datasets.png and b/docs/build/html/_images/datasets.png differ diff --git a/docs/build/html/_images/datasets_metrics.png b/docs/build/html/_images/datasets_metrics.png deleted file mode 100644 index cdec25940..000000000 Binary files a/docs/build/html/_images/datasets_metrics.png and /dev/null differ diff --git a/docs/build/html/_images/grn_models.png b/docs/build/html/_images/grn_models.png deleted file mode 100644 index a7d9c7d69..000000000 Binary files a/docs/build/html/_images/grn_models.png and /dev/null differ diff --git a/docs/build/html/_images/metric_quality_evaluation.png b/docs/build/html/_images/metric_quality_evaluation.png new file mode 100644 index 000000000..d321fc49e Binary files /dev/null and b/docs/build/html/_images/metric_quality_evaluation.png differ diff --git a/docs/build/html/_images/metrics.png b/docs/build/html/_images/metrics.png index f5c2fd02c..2f9e1bd36 100644 Binary files a/docs/build/html/_images/metrics.png and b/docs/build/html/_images/metrics.png differ diff --git a/docs/build/html/_images/raw_scores_300BCG.png b/docs/build/html/_images/raw_scores_300BCG.png index f4b06b0cf..cec454d14 100644 Binary files a/docs/build/html/_images/raw_scores_300BCG.png and b/docs/build/html/_images/raw_scores_300BCG.png differ diff --git a/docs/build/html/_images/raw_scores_adamson.png b/docs/build/html/_images/raw_scores_adamson.png deleted file mode 100644 index 53a2614f1..000000000 Binary files a/docs/build/html/_images/raw_scores_adamson.png and /dev/null differ diff --git a/docs/build/html/_images/raw_scores_ibd.png b/docs/build/html/_images/raw_scores_ibd.png deleted file mode 100644 index cc4e8bf19..000000000 Binary files a/docs/build/html/_images/raw_scores_ibd.png and /dev/null differ 
diff --git a/docs/build/html/_images/raw_scores_ibd_cd.png b/docs/build/html/_images/raw_scores_ibd_cd.png new file mode 100644 index 000000000..968629360 Binary files /dev/null and b/docs/build/html/_images/raw_scores_ibd_cd.png differ diff --git a/docs/build/html/_images/raw_scores_ibd_uc.png b/docs/build/html/_images/raw_scores_ibd_uc.png new file mode 100644 index 000000000..1d402ed77 Binary files /dev/null and b/docs/build/html/_images/raw_scores_ibd_uc.png differ diff --git a/docs/build/html/_images/raw_scores_nakatake.png b/docs/build/html/_images/raw_scores_nakatake.png index 0da93a104..4fed0c14f 100644 Binary files a/docs/build/html/_images/raw_scores_nakatake.png and b/docs/build/html/_images/raw_scores_nakatake.png differ diff --git a/docs/build/html/_images/raw_scores_norman.png b/docs/build/html/_images/raw_scores_norman.png index 538446d00..b3611239b 100644 Binary files a/docs/build/html/_images/raw_scores_norman.png and b/docs/build/html/_images/raw_scores_norman.png differ diff --git a/docs/build/html/_images/raw_scores_op.png b/docs/build/html/_images/raw_scores_op.png index b55325147..7228b96c7 100644 Binary files a/docs/build/html/_images/raw_scores_op.png and b/docs/build/html/_images/raw_scores_op.png differ diff --git a/docs/build/html/_images/raw_scores_parsebioscience.png b/docs/build/html/_images/raw_scores_parsebioscience.png index 723d508b6..3c382b4f6 100644 Binary files a/docs/build/html/_images/raw_scores_parsebioscience.png and b/docs/build/html/_images/raw_scores_parsebioscience.png differ diff --git a/docs/build/html/_images/raw_scores_replogle.png b/docs/build/html/_images/raw_scores_replogle.png index ab0d3a5ef..76915237e 100644 Binary files a/docs/build/html/_images/raw_scores_replogle.png and b/docs/build/html/_images/raw_scores_replogle.png differ diff --git a/docs/build/html/_images/raw_scores_xaira_HCT116.png b/docs/build/html/_images/raw_scores_xaira_HCT116.png index 946595ffd..307473dd8 100644 Binary files 
a/docs/build/html/_images/raw_scores_xaira_HCT116.png and b/docs/build/html/_images/raw_scores_xaira_HCT116.png differ diff --git a/docs/build/html/_images/raw_scores_xaira_HEK293T.png b/docs/build/html/_images/raw_scores_xaira_HEK293T.png index c451309a2..ec5856c85 100644 Binary files a/docs/build/html/_images/raw_scores_xaira_HEK293T.png and b/docs/build/html/_images/raw_scores_xaira_HEK293T.png differ diff --git a/docs/build/html/_images/summary_figure.pdf b/docs/build/html/_images/summary_figure.pdf new file mode 100644 index 000000000..a151e4a0d Binary files /dev/null and b/docs/build/html/_images/summary_figure.pdf differ diff --git a/docs/build/html/_images/summary_figure.png b/docs/build/html/_images/summary_figure.png new file mode 100644 index 000000000..5c13b7046 Binary files /dev/null and b/docs/build/html/_images/summary_figure.png differ diff --git a/docs/build/html/_images/table_datasets_summary.pdf b/docs/build/html/_images/table_datasets_summary.pdf new file mode 100644 index 000000000..edbe45376 Binary files /dev/null and b/docs/build/html/_images/table_datasets_summary.pdf differ diff --git a/docs/build/html/_images/table_datasets_summary.png b/docs/build/html/_images/table_datasets_summary.png new file mode 100644 index 000000000..27fcd22b9 Binary files /dev/null and b/docs/build/html/_images/table_datasets_summary.png differ diff --git a/docs/build/html/_sources/dataset.rst.txt b/docs/build/html/_sources/dataset.rst.txt index 8d1b096c0..9bfcb6ad5 100644 --- a/docs/build/html/_sources/dataset.rst.txt +++ b/docs/build/html/_sources/dataset.rst.txt @@ -1,13 +1,16 @@ Datasets ======== -The list of datasets integrated into geneRNIB is provided below with their perturbation signatures as well as the type of perturbation used in each dataset. +The list of datasets integrated into geneRNIB is provided below: .. 
image:: images/datasets.png - :width: 80% + :width: 50% :align: center ---- -All datasets provide RNA data, while the `OPSCA` and `IBD` datasets also includes scATAC data. +.. image:: images/table_datasets_summary.png + :width: 100% + :align: center +---- You need `awscli` to download the datasets. diff --git a/docs/build/html/_sources/evaluation.rst.txt b/docs/build/html/_sources/evaluation.rst.txt index cccc945ba..6c420b546 100644 --- a/docs/build/html/_sources/evaluation.rst.txt +++ b/docs/build/html/_sources/evaluation.rst.txt @@ -9,13 +9,14 @@ The evaluation metrics used in geneRNIB are summarized below. :align: center ---- -.. image:: images/datasets_metrics.png - :width: 90% +.. image:: images/metric_quality_evaluation.png + :width: 100% :align: center ---- -For a detailed description of each metric, refer to the geneRNIB paper. +For a detailed description of each metric, refer to the geneRNIB paper. Not all the metrics were applicable to all datasets, as shown in the table. In addition, only those datasets with * passed the applicability criteria for a given metric, which includes minimal variability and performance threshold set for each metric. +In addition, not all metrics passed the additional criteria for inclusion in the final score calculation, as explained in the paper, and marked with ** in the table. This includes context specificity and robustness in stability analysis. The evaluation metrics expect the inferred network to be in the form of an AnnData object with specific format as explained here. It should be noted that the metric currently evaluate only the **top TF-gene pairs**, currently limited to **50,000 edges**, ranked by their assigned weight. @@ -28,32 +29,42 @@ The inferred network should have a tabular format with the following columns: See `resources/grn_benchmark/prior/collectri.h5ad` for an example of the expected format. 
-Running GRN evaluation using standard pipeline ----------------------------------------- -To run the evalution for a given GRN and dataset, use the following command: + +Running GRN evaluation without docker +---------------------------------------- +Considering that Docker is not supported by certtain systems, you can run the evaluation without Docker by following these steps: ```bash -bash scripts/run_grn_evaluation.sh --prediction= --save_dir= --dataset= --build_images= +bash src/metrics/all_metrics/run_local.sh --dataset --prediction= --score --num_workers ``` example command: ```bash -bash scripts/run_grn_evaluation.sh --prediction=resources/grn_models/op/collectri.h5ad --save_dir=output/ --dataset=op --build_images=true +bash src/metrics/all_metrics/run_local.sh --dataset op --prediction=resources/grn_models/op/collectri.h5ad --score=output_score_file.h5ad --num_workers=20 ``` +If you are evaluating a new GRN model, which is not part of geneRNIB, make you to generate the consensus prior file for the dataset you are evaluating on. -Running GRN evaluation without docker +```bash +bash scripts/prior/run_consensus.sh --dataset op --new_model {new_grn_model_file.h5ad} +``` + +This will add your model to the previous ones and create the new consensus prior file needed for evaluation. 
+ +Running GRN evaluation using standard pipeline ---------------------------------------- -Considering that Docker is not supported by certtain systems, you can run the evaluation without Docker by following these steps: + +To run the evalution for a given GRN and dataset, use the following command: ```bash -bash src/metrics/all_metrics/run_local.sh --dataset --prediction= --score --num_workers +bash scripts/run_grn_evaluation.sh --prediction= --save_dir= --dataset= --build_images= ``` example command: ```bash -bash src/metrics/all_metrics/run_local.sh --dataset op --prediction=resources/grn_models/op/collectri.h5ad --score=output_score_file.h5ad --num_workers=20 -``` \ No newline at end of file +bash scripts/run_grn_evaluation.sh --prediction=resources/grn_models/op/collectri.h5ad --save_dir=output/ --dataset=op --build_images=true +``` + diff --git a/docs/build/html/_sources/installation.rst.txt b/docs/build/html/_sources/installation.rst.txt deleted file mode 100644 index e69de29bb..000000000 diff --git a/docs/build/html/_sources/leaderboard.rst.txt b/docs/build/html/_sources/leaderboard.rst.txt index 2130ba971..0ee707263 100644 --- a/docs/build/html/_sources/leaderboard.rst.txt +++ b/docs/build/html/_sources/leaderboard.rst.txt @@ -1,14 +1,14 @@ Leaderboard ================= -.. The overal comparitive performance of the integrated GRN inference methods is summarized in the leaderboard below. +The overal comparitive performance of the integrated GRN inference methods is summarized in the leaderboard below. It should be noted that not all metrics count towards the final score, as some metrics did not pass the applicability criteria. See `here `_ for more details on the metrics applicability. -.. .. image:: images/leaderboard.png -.. :width: 90% -.. :align: center -.. ---- +.. image:: images/summary_figure.png + :width: 100% + :align: center +---- -The individual performance of the methods on each dataset is summarized below. 
+The individual performance of the methods on each dataset is summarized below. .. image:: images/raw_scores_op.png :width: 70% @@ -16,7 +16,7 @@ The individual performance of the methods on each dataset is summarized below. ---- .. image:: images/raw_scores_nakatake.png - :width: 60% + :width: 70% :align: center ---- @@ -25,10 +25,6 @@ The individual performance of the methods on each dataset is summarized below. :align: center ---- -.. image:: images/raw_scores_adamson.png - :width: 70% - :align: center ----- .. image:: images/raw_scores_replogle.png :width: 70% @@ -45,8 +41,13 @@ The individual performance of the methods on each dataset is summarized below. :align: center ---- -.. image:: images/raw_scores_ibd.png - :width: 90% +.. image:: images/raw_scores_ibd_uc.png + :width: 70% + :align: center +---- + +.. image:: images/raw_scores_ibd_cd.png + :width: 70% :align: center ---- diff --git a/docs/build/html/_sources/overview.rst.txt b/docs/build/html/_sources/overview.rst.txt deleted file mode 100644 index eadc7f5b6..000000000 --- a/docs/build/html/_sources/overview.rst.txt +++ /dev/null @@ -1,102 +0,0 @@ -Overview -======== - -Overview of geneRNIB - - -geneRNIB is a cloud-hosted platform designed to evaluate gene regulatory network (GRN) inference methods in a standardized and reproducible way. It brings together datasets, GRN models, evaluation metrics, and a dynamic leaderboard to track the latest advancements in GRN benchmarks. - -To ensure fair comparisons, geneRNIB provides five benchmark datasets, each tailored to assess different aspects of GRN inference. These datasets originate from the same cell types and experiments, allowing context-specific evaluations. The platform supports both transcriptomics-based GRN inference, which relies solely on gene expression data, and multi-omics approaches that integrate chromatin accessibility and gene expression to uncover regulatory interactions. 
- -Evaluating GRN performance is challenging due to the lack of a definitive “ground truth” network. To address this, geneRNIB employs eight standardized evaluation metrics that use perturbation data to assess inferred interactions. The Wasserstein (WS) distance measures shifts in gene expression after perturbations, helping to determine how well a model captures true regulatory effects. Additionally, regression-based metrics (R₁ and R₂) assess predictive accuracy, ensuring that inferred regulatory links contribute to meaningful predictions. - -To put GRN models into context, geneRNIB also includes three control models. A simple baseline computes Pearson correlations between genes, serving as a quick reference for benchmarking. A positive control model sets an upper bound by incorporating all available variation, while a negative control model generates random networks to ensure meaningful performance comparisons. - -Built with modern computational tools like Docker and Viash, geneRNIB prioritizes scalability and reproducibility. It provides a structured framework for integrating new datasets, inference methods, and evaluation metrics, making it a powerful resource for advancing GRN research. - - -#TODO: Fig of the datasts and the table that shows inference and evaluation datassts -#TODO: Fig of the evaluation metrics and explain - - -Installation ------------- - -For installation, follow the `task_gen_benchmark `_. - -Once the repository is cloned and the required software installed, proceed to the next steps. - -Download resources for GRN inference and evalation: ------------------- - -.. code-block:: bash - - cd task_grn_benchmark - - # download resources - scripts/download_resources.sh - -The full resources is acceesible - -Infer a GRN ------------ - -.. 
code-block:: bash - - viash run src/methods/dummy/config.vsh.yaml -- --multiomics_rna resources/grn-benchmark/multiomics_rna.h5ad --multiomics_atac resources/grn-benchmark/multiomics_atac.h5ad --prediction output/dummy.csv - - -Similarly, run the command for other methods. - -Evaluate a GRN --------------- - -.. code-block:: bash - - scripts/run_evaluation.sh --grn resources/grn-benchmark/grn_models/collectri.csv - -Similarly, run the command for other GRN models. - - -See examples of interacting with the framework can be found in section :doc:`examples`. - - ----- TODO: improve this with info given above - -The pipeline can evaluate algorithms that leverage only one of the multi-omic data types (RNA-Seq or ATAC-Seq) or both. -It also evaluates the performance of two controls: - -#. As a *negative control*, the pipeline evaluates the performance of a random network. -#. As a *positive control*, the pipeline evaluates the performance of a network derived from correlation of genes in the perturbation dataset used for evaluation. - -The two types of regression models are: - -#. Regression from GRN regulations to target expression -#. Regression from TF expression of predicted regulators to target expression - -The evaluation is done with the help of pertubation data, using two different approaches: - -#. Regression from GRN regulations to target expression -#. Regression from TF expression of predicted regulators to target expression - -| - -.. image:: images/regressions.png - :width: 100 % - :alt: overview of the two regression evaluation approaches - :align: center - -| -| - - -Evaluation 1: Regression from GRN regulations to target expression ------------------------------------------------------------------- -The first approach we used is similar to GRaNPA and the multivariate decision tree in Decoupler, where regulatory weights from the GRN form the feature space to predict perturbation data. In this method, we train one model per sample. 
The feature space matrix has dimensions of genes by transcription factors (TFs), with values being the regulatory weights from the GRN or 0 if the link is absent. The target space matrix represents the perturbation data for each sample. We evaluate the model's predictive performance using a 5-fold cross-validation scheme and the coefficient of determination (R²) as the metric. LightGBM is used for computational efficiency. - - -Evaluation 2: Regression from TF expression of predicted regulators to target expression ----------------------------------------------------------------------------------------- -In the second approach, instead of using regulatory weights, we utilized the expression of putative regulators (TFs) from the perturbation data to construct the feature space. We fit one model per gene, selecting regulators based on the regulatory weights suggested by the GRNs. This method is similar to many modern GRN inference techniques. - - diff --git a/docs/build/html/dataset.html b/docs/build/html/dataset.html index 49f90320e..76e640288 100644 --- a/docs/build/html/dataset.html +++ b/docs/build/html/dataset.html @@ -3,7 +3,7 @@ - + Datasets — OpenProblems GRN benchmarking 0.1 documentation @@ -82,10 +82,13 @@

Datasets

-

The list of datasets integrated into geneRNIB is provided below with their perturbation signatures as well as the type of perturbation used in each dataset.

-_images/datasets.png +

The list of datasets integrated into geneRNIB is provided below:

+_images/datasets.png + +
+_images/table_datasets_summary.png +
-

All datasets provide RNA data, while the OPSCA and IBD datasets also includes scATAC data.

You need awscli to download the datasets.

Downloading the main datasets

diff --git a/docs/build/html/evaluation.html b/docs/build/html/evaluation.html index 0a6ed1712..37dae3ead 100644 --- a/docs/build/html/evaluation.html +++ b/docs/build/html/evaluation.html @@ -3,7 +3,7 @@ - + GRN evaluation — OpenProblems GRN benchmarking 0.1 documentation @@ -46,8 +46,8 @@
  • Datasets
  • GRN Inference
  • GRN evaluation
  • Extending
  • @@ -81,11 +81,14 @@

    GRN evaluation

    The evaluation metrics used in geneRNIB are summarized below.

    -_images/metrics.png +_images/metrics.png +
    -_images/datasets_metrics.png +_images/metric_quality_evaluation.png +
    -

    For a detailed description of each metric, refer to the geneRNIB paper.

    +

    For a detailed description of each metric, refer to the geneRNIB paper. Not all the metrics were applicable to all datasets, as shown in the table. In addition, only those datasets with * passed the applicability criteria for a given metric, which includes minimal variability and performance threshold set for each metric. +In addition, not all metrics passed the additional criteria for inclusion in the final score calculation, as explained in the paper, and marked with ** in the table. This includes context specificity and robustness in stability analysis.

    The evaluation metrics expect the inferred network to be in the form of an AnnData object with specific format as explained here. It should be noted that the metric currently evaluate only the top TF-gene pairs, currently limited to 50,000 edges, ranked by their assigned weight.

    The inferred network should have a tabular format with the following columns:

    @@ -97,26 +100,31 @@

    GRN evaluation -

    Running GRN evaluation using standard pipeline

    -

    To run the evalution for a given GRN and dataset, use the following command:

    +
    +

    Running GRN evaluation without docker

    +

    Considering that Docker is not supported by certain systems, you can run the evaluation without Docker by following these steps:

    `bash -bash scripts/run_grn_evaluation.sh --prediction=<inferred GRN (e.g.collectri.h5ad)> --save_dir=<e.g.output/> --dataset=<e.g. replogle> --build_images=<true or false. true for the first time running> +bash src/metrics/all_metrics/run_local.sh --dataset <dataset_name> --prediction=<inferred GRN (e.g.collectri.h5ad)> --score <output_score_file.h5ad> --num_workers <number_of_workers> `

    example command:

    `bash -bash scripts/run_grn_evaluation.sh --prediction=resources/grn_models/op/collectri.h5ad --save_dir=output/ --dataset=op --build_images=true +bash src/metrics/all_metrics/run_local.sh --dataset op --prediction=resources/grn_models/op/collectri.h5ad --score=output_score_file.h5ad --num_workers=20 `

    +

    If you are evaluating a new GRN model that is not part of geneRNIB, make sure to generate the consensus prior file for the dataset you are evaluating on.

    +

    `bash +bash scripts/prior/run_consensus.sh --dataset op --new_model {new_grn_model_file.h5ad} +`

    +

    This will add your model to the previous ones and create the new consensus prior file needed for evaluation.

    -
    -

    Running GRN evaluation without docker

    -

    Considering that Docker is not supported by certtain systems, you can run the evaluation without Docker by following these steps:

    +
    +

    Running GRN evaluation using standard pipeline

    +

    To run the evaluation for a given GRN and dataset, use the following command:

    `bash -bash src/metrics/all_metrics/run_local.sh --dataset <dataset_name> --prediction=<inferred GRN (e.g.collectri.h5ad)> --score <output_score_file.h5ad> --num_workers <number_of_workers> +bash scripts/run_grn_evaluation.sh --prediction=<inferred GRN (e.g.collectri.h5ad)> --save_dir=<e.g.output/> --dataset=<e.g. replogle> --build_images=<true or false. true for the first time running> `

    example command:

    `bash -bash src/metrics/all_metrics/run_local.sh --dataset op --prediction=resources/grn_models/op/collectri.h5ad --score=output_score_file.h5ad --num_workers=20 +bash scripts/run_grn_evaluation.sh --prediction=resources/grn_models/op/collectri.h5ad --save_dir=output/ --dataset=op --build_images=true `

    diff --git a/docs/build/html/extending.html b/docs/build/html/extending.html index 44729c935..6cad5d6ec 100644 --- a/docs/build/html/extending.html +++ b/docs/build/html/extending.html @@ -3,7 +3,7 @@ - + Extending — OpenProblems GRN benchmarking 0.1 documentation diff --git a/docs/build/html/index.html b/docs/build/html/index.html index 8b77f1e8a..478251dfb 100644 --- a/docs/build/html/index.html +++ b/docs/build/html/index.html @@ -3,7 +3,7 @@ - + geneRNIB: A living benchmark for gene regulatory network inference — OpenProblems GRN benchmarking 0.1 documentation @@ -79,7 +79,8 @@

    geneRNIB: A living benchmark for gene regulatory network inference_images/overview.png +_images/overview.png +

    This documentation is supplementary to:

      @@ -114,8 +115,8 @@

      Contents

  • GRN evaluation
  • Extending
      diff --git a/docs/build/html/inference.html b/docs/build/html/inference.html index 689bfe218..e5035f54b 100644 --- a/docs/build/html/inference.html +++ b/docs/build/html/inference.html @@ -3,7 +3,7 @@ - + GRN Inference — OpenProblems GRN benchmarking 0.1 documentation diff --git a/docs/build/html/installation.html b/docs/build/html/installation.html deleted file mode 100644 index e7f000560..000000000 --- a/docs/build/html/installation.html +++ /dev/null @@ -1,102 +0,0 @@ - - - - - - - - - <no title> — OpenProblems GRN benchmarking 0.1 documentation - - - - - - - - - - - - - - - -
      - - -
      - -
      -
      -
      - -
      -
      -
      -
      - - - -
      -
      - -
      -
      -
      -
      - - - - \ No newline at end of file diff --git a/docs/build/html/leaderboard.html b/docs/build/html/leaderboard.html index 0f547f774..599c02e72 100644 --- a/docs/build/html/leaderboard.html +++ b/docs/build/html/leaderboard.html @@ -3,7 +3,7 @@ - + Leaderboard — OpenProblems GRN benchmarking 0.1 documentation @@ -75,26 +75,40 @@

      Leaderboard

      +

      The overall comparative performance of the integrated GRN inference methods is summarized in the leaderboard below. It should be noted that not all metrics count towards the final score, as some metrics did not pass the applicability criteria. See here for more details on the metrics applicability.

      +_images/summary_figure.png + +

      The individual performance of the methods on each dataset is summarized below.

      -_images/raw_scores_op.png +_images/raw_scores_op.png +
      -_images/raw_scores_nakatake.png +_images/raw_scores_nakatake.png +
      -_images/raw_scores_norman.png +_images/raw_scores_norman.png +
      -_images/raw_scores_adamson.png +_images/raw_scores_replogle.png +
      -_images/raw_scores_replogle.png +_images/raw_scores_300BCG.png +
      -_images/raw_scores_300BCG.png +_images/raw_scores_parsebioscience.png +
      -_images/raw_scores_parsebioscience.png +_images/raw_scores_ibd_uc.png +
      -_images/raw_scores_ibd.png +_images/raw_scores_ibd_cd.png +
      -_images/raw_scores_xaira_HEK293T.png +_images/raw_scores_xaira_HEK293T.png +
      -_images/raw_scores_xaira_HCT116.png +_images/raw_scores_xaira_HCT116.png +
      diff --git a/docs/build/html/overview.html b/docs/build/html/overview.html deleted file mode 100644 index eb24f9bf2..000000000 --- a/docs/build/html/overview.html +++ /dev/null @@ -1,177 +0,0 @@ - - - - - - - - - Overview — OpenProblems GRN benchmarking 0.1 documentation - - - - - - - - - - - - - - - -
      - - -
      - -
      -
      -
      - -
      -
      -
      -
      - -
      -

      Overview

      -

      Overview of geneRNIB

      -

      geneRNIB is a cloud-hosted platform designed to evaluate gene regulatory network (GRN) inference methods in a standardized and reproducible way. It brings together datasets, GRN models, evaluation metrics, and a dynamic leaderboard to track the latest advancements in GRN benchmarks.

      -

      To ensure fair comparisons, geneRNIB provides five benchmark datasets, each tailored to assess different aspects of GRN inference. These datasets originate from the same cell types and experiments, allowing context-specific evaluations. The platform supports both transcriptomics-based GRN inference, which relies solely on gene expression data, and multi-omics approaches that integrate chromatin accessibility and gene expression to uncover regulatory interactions.

      -

      Evaluating GRN performance is challenging due to the lack of a definitive “ground truth” network. To address this, geneRNIB employs eight standardized evaluation metrics that use perturbation data to assess inferred interactions. The Wasserstein (WS) distance measures shifts in gene expression after perturbations, helping to determine how well a model captures true regulatory effects. Additionally, regression-based metrics (R₁ and R₂) assess predictive accuracy, ensuring that inferred regulatory links contribute to meaningful predictions.

      -

      To put GRN models into context, geneRNIB also includes three control models. A simple baseline computes Pearson correlations between genes, serving as a quick reference for benchmarking. A positive control model sets an upper bound by incorporating all available variation, while a negative control model generates random networks to ensure meaningful performance comparisons.

      -

      Built with modern computational tools like Docker and Viash, geneRNIB prioritizes scalability and reproducibility. It provides a structured framework for integrating new datasets, inference methods, and evaluation metrics, making it a powerful resource for advancing GRN research.

      -

      #TODO: Fig of the datasts and the table that shows inference and evaluation datassts -#TODO: Fig of the evaluation metrics and explain

      -
      -

      Installation

      -

      For installation, follow the task_gen_benchmark.

      -

      Once the repository is cloned and the required software installed, proceed to the next steps.

      -
      -
      -

      Download resources for GRN inference and evalation:

      -
      cd task_grn_benchmark
      -
      -# download resources
      -scripts/download_resources.sh
      -
      -
      -

      The full resources is acceesible

      -
      -
      -

      Infer a GRN

      -
      viash run src/methods/dummy/config.vsh.yaml -- --multiomics_rna resources/grn-benchmark/multiomics_rna.h5ad --multiomics_atac resources/grn-benchmark/multiomics_atac.h5ad --prediction output/dummy.csv
      -
      -
      -

      Similarly, run the command for other methods.

      -
      -
      -

      Evaluate a GRN

      -
      scripts/run_evaluation.sh --grn resources/grn-benchmark/grn_models/collectri.csv
      -
      -
      -

      Similarly, run the command for other GRN models.

      -

      See examples of interacting with the framework can be found in section examples.

      -

      —- TODO: improve this with info given above

      -

      The pipeline can evaluate algorithms that leverage only one of the multi-omic data types (RNA-Seq or ATAC-Seq) or both. -It also evaluates the performance of two controls:

      -
        -
      1. As a negative control, the pipeline evaluates the performance of a random network.

      2. -
      3. As a positive control, the pipeline evaluates the performance of a network derived from correlation of genes in the perturbation dataset used for evaluation.

      4. -
      -

      The two types of regression models are:

      -
        -
      1. Regression from GRN regulations to target expression

      2. -
      3. Regression from TF expression of predicted regulators to target expression

      4. -
      -

      The evaluation is done with the help of perturbation data, using two different approaches:

      -
        -
      1. Regression from GRN regulations to target expression

      2. -
      3. Regression from TF expression of predicted regulators to target expression

      4. -
      -
      -

      -
      -overview of the two regression evaluation approaches - -
      -

      -

      -
      -
      -
      -

      Evaluation 1: Regression from GRN regulations to target expression

      -

      The first approach we used is similar to GRaNPA and the multivariate decision tree in Decoupler, where regulatory weights from the GRN form the feature space to predict perturbation data. In this method, we train one model per sample. The feature space matrix has dimensions of genes by transcription factors (TFs), with values being the regulatory weights from the GRN or 0 if the link is absent. The target space matrix represents the perturbation data for each sample. We evaluate the model’s predictive performance using a 5-fold cross-validation scheme and the coefficient of determination (R²) as the metric. LightGBM is used for computational efficiency.

      -
      -
      -

      Evaluation 2: Regression from TF expression of predicted regulators to target expression

      -

      In the second approach, instead of using regulatory weights, we utilized the expression of putative regulators (TFs) from the perturbation data to construct the feature space. We fit one model per gene, selecting regulators based on the regulatory weights suggested by the GRNs. This method is similar to many modern GRN inference techniques.

      -
      -
      - - -
      -
      - -
      -
      -
      -
      - - - - \ No newline at end of file diff --git a/docs/build/html/repo/objects.html b/docs/build/html/repo/objects.html index 27b963c00..7bb339eec 100644 --- a/docs/build/html/repo/objects.html +++ b/docs/build/html/repo/objects.html @@ -3,7 +3,7 @@ - + Objects — OpenProblems GRN benchmarking 0.1 documentation diff --git a/docs/build/html/searchindex.js b/docs/build/html/searchindex.js index a24f5b86d..a2c88acdb 100644 --- a/docs/build/html/searchindex.js +++ b/docs/build/html/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"Add a GRN evaluation metric": [[2, "add-a-grn-evaluation-metric"]], "Add a GRN inference and evalaution dataset": [[2, "add-a-grn-inference-and-evalaution-dataset"]], "Add a GRN inference method": [[2, "add-a-grn-inference-method"]], "AnnData object": [[6, "id1"], [6, "id4"], [6, "id5"], [6, "id6"]], "Contents": [[3, "contents"]], "Control Method": [[6, "control-method"]], "Datasets": [[0, null]], "Downloading the extended datasets": [[0, "downloading-the-extended-datasets"]], "Downloading the main datasets": [[0, "downloading-the-main-datasets"]], "Downloading the raw/unprocessed data": [[0, "downloading-the-raw-unprocessed-data"]], "Downloading the results": [[0, "downloading-the-results"]], "Extending": [[2, null]], "GRN": [[6, "grn"]], "GRN Inference": [[4, null]], "GRN evaluation": [[1, null]], "GRN inference using integrated methods": [[4, "grn-inference-using-integrated-methods"]], "GRN inference without method integration": [[4, "grn-inference-without-method-integration"]], "Getting started": [[3, "getting-started"]], "Label": [[6, "label"]], "Leaderboard": [[5, null]], "Method": [[6, "method"]], "Multiomics ATAC": [[6, "multiomics-atac"]], "Multiomics RNA": [[6, "multiomics-rna"]], "Objects": [[6, null]], "Perturbation": [[6, "perturbation"]], "Prior data": [[6, "prior-data"]], "Running GRN evaluation using standard pipeline": [[1, "running-grn-evaluation-using-standard-pipeline"]], "Running GRN evaluation without 
docker": [[1, "running-grn-evaluation-without-docker"]], "Score": [[6, "score"]], "Tabular data": [[6, "id2"], [6, "id3"]], "geneRNIB: A living benchmark for gene regulatory network inference": [[3, null]]}, "docnames": ["dataset", "evaluation", "extending", "index", "inference", "leaderboard", "repo/objects"], "envversion": {"sphinx": 64, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1}, "filenames": ["dataset.rst", "evaluation.rst", "extending.rst", "index.rst", "inference.rst", "leaderboard.rst", "repo/objects.rst"], "indexentries": {}, "objects": {}, "objnames": {}, "objtypes": {}, "terms": {"0": [2, 4], "000": [1, 4], "1": [2, 6], "2": 2, "20": 1, "3": [], "4": 2, "5": [], "50": [1, 4], "50k": 2, "6": 6, "80": [], "A": [2, 6], "For": [1, 2, 4], "If": 4, "In": 2, "It": [1, 2, 3], "The": [0, 1, 2, 3, 4, 5, 6], "There": 2, "These": 0, "To": [0, 1, 3, 4], "__merge__": 2, "_viash": [], "about": 2, "access": 0, "accordingli": 3, "accuraci": 6, "activ": [], "ad": [2, 3, 4], "adamson": [], "add": 3, "addit": 2, "addition": [0, 2], "aertslab": 6, "after": 4, "aim": [], "algorithm": 4, "align": [], "all": [0, 2], "all_metr": 1, "alreadi": [], "also": [0, 2], "amazon": [], "among": [], "an": [1, 4, 6], "anndata": [1, 2, 4], "annot": 6, "api": 2, "applic": [], "approach": [4, 6], "ar": [0, 1, 2, 3], "argument": 6, "art": 3, "assess": 3, "assign": [1, 4], "astyp": [2, 4], "atac": [], "attribut": 6, "avail": 0, "aw": [0, 2], "awscli": 0, "base": [2, 6], "base_python": 2, "base_r": [], "base_requir": 2, "baselin": [], "bash": 1, "below": [0, 1, 5], "benchmark": 6, "better": 2, "between": [], "beyond": 0, "bio": 2, "biorxiv": 3, "bioscienc": 0, "block": [], "both": [2, 3], "build_imag": 1, "bulk": 2, "c": 4, "call": 2, "can": 
[1, 2, 4], "categori": [], "causal": [], "cell": [0, 2, 6], "cell_count": 6, "cell_typ": 6, "celloracl": 2, "center": [], "certtain": 1, "chang": 2, "charact": 4, "check": 2, "choic": 2, "chosen": 6, "cistarget": 6, "cli": [], "cloud": 3, "code": 2, "collectri": [1, 4, 6], "column": [1, 4, 6], "com": [], "combin": 0, "command": [0, 1, 2, 4], "common": 2, "comp_method": 2, "comparison": [0, 3], "comparit": [], "competit": 3, "complet": 6, "complic": 2, "compon": [], "compound": 6, "compress": 4, "comput": [0, 3], "config": [2, 4], "connect": 6, "consensu": 0, "consid": [1, 4], "consist": [], "construct": [], "contact": 0, "contain": 0, "content": [], "control": 0, "control_method": [], "core": 0, "correct": [], "correl": 4, "could": 2, "csv": [2, 4, 6], "curat": 3, "current": [1, 2, 4], "data": [2, 3], "datafram": [2, 4], "dataset": [1, 3, 4, 5, 6], "dataset_id": [2, 4], "dataset_nam": [1, 2, 4], "datasets_raw": 0, "de": 2, "default": [0, 6], "defin": [], "definit": 2, "depend": 2, "descript": [1, 2, 6], "design": 3, "detail": 1, "develop": 3, "did": [], "differ": 2, "differenti": 2, "direct": 2, "directori": 0, "distanc": [], "distribut": [], "do": 2, "docker": [2, 3], "document": [2, 3], "documentation_url": 2, "don": [], "done": 2, "donor": 6, "donor_id": 6, "dont": 2, "doubl": 6, "download": [2, 3, 4], "draft": [], "drawn": 6, "dtype": 2, "due": 0, "dummpi": [], "dure": [], "dynam": 3, "e": [1, 2, 4], "each": [0, 1, 2, 4, 5, 6], "edg": [1, 2, 4], "effect": [], "effici": 0, "eight": [], "end": 2, "engin": 2, "enhanc": [], "ensur": [2, 4], "essenti": 2, "etc": 1, "evalaut": 3, "evalu": [0, 3, 4, 6], "evaluation_data": 2, "evalut": 1, "exampl": [1, 2, 4, 6], "except": [], "execut": 2, "expect": [1, 2, 4], "experi": 6, "explain": [1, 2], "explan": 6, "express": [2, 6], "extend": 3, "extended_data": 0, "extra": 2, "factor": 4, "fals": 1, "far": [], "featur": [2, 3], "few": [0, 2], "file": [0, 2, 6], "filter": 2, "find": [0, 6], "first": 1, "float": 6, "folder": [0, 
2], "follow": [1, 2, 4], "form": 1, "format": [1, 2, 4, 6], "format_save_scor": 2, "found": 2, "from": [2, 4, 6], "full": 0, "further": 0, "futur": 3, "g": [1, 2, 4], "gene": [1, 2, 4, 6], "gene1": 2, "gene2": 2, "genernbi": 4, "genernib": [0, 1, 2, 4], "get": 2, "ghcr": 2, "github": 3, "given": [1, 4], "grn": [0, 3], "grn_benchmark": [0, 1, 2, 4], "grn_method": 2, "grn_model": 1, "grnboost2": [2, 4], "group": [], "guidelin": [], "gzip": 4, "h5ad": [1, 2, 4, 6], "ha": 2, "have": [0, 1, 2, 4], "hct116": [], "hek293t": [], "helper": 2, "here": [1, 2], "how": 2, "howev": 2, "http": 6, "i": [0, 1, 2, 3, 4, 5, 6], "ibd": 0, "id": [2, 6], "identifi": 2, "imag": 2, "implement": [], "import": [1, 2, 4], "improv": [], "includ": [0, 2], "incorpor": 0, "indic": 6, "individu": 5, "infer": [0, 1, 6], "inference_data": [2, 4], "info": 2, "inform": 2, "infrastructur": 3, "initi": [], "instal": [2, 3, 4], "instruct": 2, "integ": 6, "integr": [0, 2, 3], "io": 2, "know": [], "known": [0, 6], "label": 2, "labels_tw": 2, "larg": 0, "latest": [], "layer": [2, 6], "leaderboard": [0, 3], "let": [], "level": 6, "librari": [2, 4], "likelihood": [1, 4], "limit": [1, 4], "linc": 6, "link": 2, "list": [0, 2, 4, 6], "live": [], "load": 2, "loadtxt": 2, "locat": 2, "logarithm": 6, "lognorm": [2, 6], "main": [2, 3], "make": [], "manuscript": [], "map": 6, "mask": [], "matrix": 4, "me": [], "mean": 6, "measur": [], "mention": 0, "merg": 2, "method": [0, 3, 5], "method_id": [2, 4], "method_nam": 2, "metric": [0, 1, 3, 6], "metric_key_1": 2, "metric_key_2": 2, "metric_value_1": 2, "metric_value_2": 2, "midcpu": 2, "midmem": 2, "midtim": 2, "modal": 3, "model": [], "more": [2, 4], "most": [], "multi": 3, "multiom": [], "multiomics_atac": 6, "multiomics_rna": 6, "n_count": 6, "nakatak": [], "name": [1, 2, 6], "namespac": 2, "nativ": [], "ncol": 4, "necessari": 2, "necessarili": [], "need": [0, 2], "neg": [], "net": [2, 4], "network": [1, 2, 4], "new": [2, 3], "next": 4, "nextflow": 2, "none": [2, 4], 
"normal": [2, 6], "norman": [], "note": 1, "novel": 3, "np": 2, "nrow": 4, "num_work": 1, "number": 6, "number_of_work": 1, "numpi": 2, "ob": 6, "object": 1, "observ": [], "obtain": 6, "offer": 3, "omic": 3, "omit": 2, "onc": [2, 4], "one": 4, "onli": [1, 2, 4], "op": [1, 4], "op_rna": 4, "openproblem": [0, 2, 3], "opsca": 0, "option": [2, 6], "org": 6, "organ": 2, "origin": [], "other": 0, "our": [3, 4], "out": [], "outperform": [], "output": [1, 2, 4, 6], "output_score_fil": 1, "over": 3, "overlook": 2, "overview": 6, "own": [], "packag": 2, "page": [3, 4], "pair": [1, 2, 4], "panda": [2, 4], "paper": [0, 1, 3], "par": 2, "param": 2, "paramet": 2, "parent": 6, "pars": 0, "parsebiosci": [], "pass": 2, "path": [2, 6], "pd": 2, "peak": 6, "pearson": [4, 6], "pearson_corr": 4, "per": [], "perform": [3, 4, 5, 6], "permit": [], "perturb": 0, "perturbation_data": 6, "pip": [], "pipelin": [2, 3], "pl": 0, "place": 2, "plate": 6, "plate_nam": 6, "platform": [2, 3], "pleas": [], "png": [], "posit": 0, "possibl": [], "power": [], "predict": [1, 2, 4, 6], "prerequisit": 2, "pretti": 2, "previou": 0, "previous": [0, 3], "primari": 6, "prior": [0, 1, 2, 4], "prior_data": 6, "proce": 4, "process": 0, "project": [], "protocol": 3, "prove": [], "provid": [0, 2, 3, 6], "pseudo": 2, "pseudobulk": [0, 6], "pull": 2, "py": 2, "python": 2, "python_script": 2, "r": [2, 4], "r_script": 2, "randomli": 6, "rank": [1, 4], "raw": 3, "re": 3, "reach": [], "read": 2, "read_h5ad": 2, "read_predict": 2, "readabl": [], "recent": 0, "reduc": [], "refer": [1, 2], "refin": [], "reflect": 3, "reg_typ": 6, "regress": 6, "regul": 6, "regulatori": [1, 4], "relationship": 6, "remov": [], "replac": 2, "replogl": [0, 1, 4], "repositori": 2, "repres": 0, "represent": 6, "request": [0, 2], "requir": 2, "residu": 6, "resourc": [0, 1, 2, 4, 6], "resources_test": [2, 4], "result": [2, 3], "ridg": 6, "rna": [0, 2, 4], "rna_op": 2, "row": 6, "run": [0, 2, 3, 4], "run_grn_evalu": 1, "run_loc": 1, "run_test": [], 
"runner": 2, "s3": [0, 2], "same": 2, "sampl": 6, "save": [2, 4], "save_dir": 1, "save_to_fil": 4, "scatac": 0, "scenic": 2, "schema": 2, "scheme": 2, "score": [1, 2, 3, 4], "score_fil": 2, "script": [1, 2], "section": [2, 4], "see": [1, 2, 3, 4], "set": [], "setup": 2, "sh": 1, "shift": 6, "should": [1, 2, 4], "sign": [0, 2], "signatur": 0, "similar": 2, "sinc": 4, "singl": [0, 2, 3, 6], "size": 0, "slot": 6, "sm_name": 6, "so": 2, "some": [2, 6], "sourc": [1, 2, 4, 6], "space": [], "specif": 1, "src": [1, 2, 4, 6], "standard": [0, 3, 6], "start": 2, "state": 3, "step": 1, "still": [], "store": [2, 3, 4], "str": [2, 4], "string": [2, 4, 6], "structur": 2, "submetr": 2, "submit": 2, "subsampl": 6, "substanti": [], "success": 2, "summar": [1, 5], "summari": 2, "supplementari": [0, 3], "support": [1, 3], "sy": 2, "sync": [0, 2], "system": 1, "t": [], "tabular": 1, "tag": 0, "target": [1, 2, 4, 6], "task": 6, "terminologi": [], "test": 2, "test_run": [], "tf": [0, 1, 2, 4, 6], "tf1": 2, "tf2": 2, "tf_all": [2, 4], "tf_list": 6, "thei": [], "them": 3, "thi": [0, 2, 3, 4, 6], "those": [], "three": [2, 4], "thu": [], "time": [1, 3], "tip": 2, "togeth": 2, "top": [1, 2, 4], "track": 3, "transcript": 4, "transcriptom": [], "true": 1, "type": [0, 2, 6], "typo": [], "u": 0, "un": [2, 4, 6], "under": [], "uniqu": 2, "unprocess": 3, "updat": [2, 3], "us": [0, 2, 3, 6], "util": 2, "valu": [2, 6], "variat": 0, "veri": 0, "version": 0, "viash": [2, 4], "view": 3, "vsh": [2, 4], "wa": [], "wasserstein": [], "we": [0, 2, 4], "weight": [1, 2, 4, 6], "well": [0, 6], "were": 0, "when": 3, "where": 2, "which": [0, 2, 6], "while": [0, 2], "width": [], "within": 0, "without": 3, "work": [2, 4], "write": [2, 4], "write_h5ad": 4, "x": [2, 4], "xaira": 0, "xaira_hct116": [], "xaira_hek293t": [], "yaml": [2, 4], "yet": [], "you": [0, 1, 2, 4], "your": [2, 4], "your_method": 2, "your_method_nam": 4, "zellkonvert": 4}, "titles": ["Datasets", "GRN evaluation", "Extending", "geneRNIB: A living 
benchmark for gene regulatory network inference", "GRN Inference", "Leaderboard", "Objects"], "titleterms": {"A": 3, "ad": [], "add": 2, "anndata": 6, "atac": 6, "benchmark": 3, "content": 3, "control": 6, "data": [0, 6], "dataset": [0, 2], "docker": 1, "document": [], "download": 0, "evalaut": 2, "evalu": [1, 2], "extend": [0, 2], "gene": 3, "genernib": 3, "get": 3, "grn": [1, 2, 4, 6], "infer": [2, 3, 4], "integr": 4, "label": 6, "leaderboard": 5, "live": 3, "main": 0, "method": [2, 4, 6], "metric": 2, "model": [], "multiom": 6, "network": 3, "object": 6, "perturb": 6, "pipelin": 1, "prior": 6, "raw": 0, "regulatori": 3, "result": 0, "rna": 6, "run": 1, "score": 6, "standard": 1, "start": 3, "tabular": 6, "test": [], "unprocess": 0, "us": [1, 4], "without": [1, 4]}}) \ No newline at end of file +Search.setIndex({"alltitles": {"Add a GRN evaluation metric": [[2, "add-a-grn-evaluation-metric"]], "Add a GRN inference and evalaution dataset": [[2, "add-a-grn-inference-and-evalaution-dataset"]], "Add a GRN inference method": [[2, "add-a-grn-inference-method"]], "AnnData object": [[6, "id1"], [6, "id4"], [6, "id5"], [6, "id6"]], "Contents": [[3, "contents"]], "Control Method": [[6, "control-method"]], "Datasets": [[0, null]], "Downloading the extended datasets": [[0, "downloading-the-extended-datasets"]], "Downloading the main datasets": [[0, "downloading-the-main-datasets"]], "Downloading the raw/unprocessed data": [[0, "downloading-the-raw-unprocessed-data"]], "Downloading the results": [[0, "downloading-the-results"]], "Extending": [[2, null]], "GRN": [[6, "grn"]], "GRN Inference": [[4, null]], "GRN evaluation": [[1, null]], "GRN inference using integrated methods": [[4, "grn-inference-using-integrated-methods"]], "GRN inference without method integration": [[4, "grn-inference-without-method-integration"]], "Getting started": [[3, "getting-started"]], "Label": [[6, "label"]], "Leaderboard": [[5, null]], "Method": [[6, "method"]], "Multiomics ATAC": [[6, 
"multiomics-atac"]], "Multiomics RNA": [[6, "multiomics-rna"]], "Objects": [[6, null]], "Perturbation": [[6, "perturbation"]], "Prior data": [[6, "prior-data"]], "Running GRN evaluation using standard pipeline": [[1, "running-grn-evaluation-using-standard-pipeline"]], "Running GRN evaluation without docker": [[1, "running-grn-evaluation-without-docker"]], "Score": [[6, "score"]], "Tabular data": [[6, "id2"], [6, "id3"]], "geneRNIB: A living benchmark for gene regulatory network inference": [[3, null]]}, "docnames": ["dataset", "evaluation", "extending", "index", "inference", "leaderboard", "repo/objects"], "envversion": {"sphinx": 64, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1}, "filenames": ["dataset.rst", "evaluation.rst", "extending.rst", "index.rst", "inference.rst", "leaderboard.rst", "repo/objects.rst"], "indexentries": {}, "objects": {}, "objnames": {}, "objtypes": {}, "terms": {"0": [2, 4], "000": [1, 4], "1": [2, 6], "2": 2, "20": 1, "4": 2, "50": [1, 4], "50k": 2, "6": 6, "A": [2, 6], "For": [1, 2, 4], "If": [1, 4], "In": [1, 2], "It": [1, 2, 3, 5], "Not": 1, "The": [0, 1, 2, 3, 4, 5, 6], "There": 2, "These": 0, "To": [0, 1, 3, 4], "__merge__": 2, "about": 2, "access": 0, "accordingli": 3, "accuraci": 6, "ad": [2, 3, 4], "add": [1, 3], "addit": [1, 2], "addition": [0, 2], "aertslab": 6, "after": 4, "algorithm": 4, "all": [0, 1, 2, 5], "all_metr": 1, "also": 2, "an": [1, 4, 6], "analysi": 1, "anndata": [1, 2, 4], "annot": 6, "api": 2, "applic": [1, 5], "approach": [4, 6], "ar": [0, 1, 2, 3], "argument": 6, "art": 3, "assess": 3, "assign": [1, 4], "astyp": [2, 4], "attribut": 6, "avail": 0, "aw": [0, 2], "awscli": 0, "base": [2, 6], "base_python": 2, "base_requir": 2, "bash": 1, "below": [0, 1, 5], 
"benchmark": 6, "better": 2, "beyond": 0, "bio": 2, "biorxiv": 3, "bioscienc": 0, "both": [2, 3], "build_imag": 1, "bulk": 2, "c": 4, "calcul": 1, "call": 2, "can": [1, 2, 4], "cell": [0, 2, 6], "cell_count": 6, "cell_typ": 6, "celloracl": 2, "certtain": 1, "chang": 2, "charact": 4, "check": 2, "choic": 2, "chosen": 6, "cistarget": 6, "cloud": 3, "code": 2, "collectri": [1, 4, 6], "column": [1, 4, 6], "combin": 0, "command": [0, 1, 2, 4], "common": 2, "comp_method": 2, "comparison": [0, 3], "comparit": 5, "competit": 3, "complet": 6, "complic": 2, "compound": 6, "compress": 4, "comput": [0, 3], "config": [2, 4], "connect": 6, "consensu": [0, 1], "consid": [1, 4], "contact": 0, "contain": 0, "context": 1, "control": 0, "core": 0, "correl": 4, "could": 2, "count": 5, "creat": 1, "criteria": [1, 5], "csv": [2, 4, 6], "curat": 3, "current": [1, 2, 4], "data": [2, 3], "datafram": [2, 4], "dataset": [1, 3, 4, 5, 6], "dataset_id": [2, 4], "dataset_nam": [1, 2, 4], "datasets_raw": 0, "de": 2, "default": [0, 6], "definit": 2, "depend": 2, "descript": [1, 2, 6], "design": 3, "detail": [1, 5], "develop": 3, "did": 5, "differ": 2, "differenti": 2, "direct": 2, "directori": 0, "do": 2, "docker": [2, 3], "document": [2, 3], "documentation_url": 2, "done": 2, "donor": 6, "donor_id": 6, "dont": 2, "doubl": 6, "download": [2, 3, 4], "drawn": 6, "dtype": 2, "due": 0, "dynam": 3, "e": [1, 2, 4], "each": [1, 2, 4, 5, 6], "edg": [1, 2, 4], "effici": 0, "end": 2, "engin": 2, "ensur": [2, 4], "essenti": 2, "etc": 1, "evalaut": 3, "evalu": [0, 3, 4, 6], "evaluation_data": 2, "evalut": 1, "exampl": [1, 2, 4, 6], "execut": 2, "expect": [1, 2, 4], "experi": 6, "explain": [1, 2], "explan": 6, "express": [2, 6], "extend": 3, "extended_data": 0, "extra": 2, "factor": 4, "fals": 1, "featur": [2, 3], "few": [0, 2], "file": [0, 1, 2, 6], "filter": 2, "final": [1, 5], "find": [0, 6], "first": 1, "float": 6, "folder": [0, 2], "follow": [1, 2, 4], "form": 1, "format": [1, 2, 4, 6], 
"format_save_scor": 2, "found": 2, "from": [2, 4, 6], "full": 0, "further": 0, "futur": 3, "g": [1, 2, 4], "gene": [1, 2, 4, 6], "gene1": 2, "gene2": 2, "gener": 1, "genernbi": 4, "genernib": [0, 1, 2, 4], "get": 2, "ghcr": 2, "github": 3, "given": [1, 4], "grn": [0, 3, 5], "grn_benchmark": [0, 1, 2, 4], "grn_method": 2, "grn_model": 1, "grnboost2": [2, 4], "gzip": 4, "h5ad": [1, 2, 4, 6], "ha": 2, "have": [0, 1, 2, 4], "helper": 2, "here": [1, 2, 5], "how": 2, "howev": 2, "http": 6, "i": [0, 1, 2, 3, 4, 5, 6], "id": [2, 6], "identifi": 2, "imag": 2, "import": [1, 2, 4], "includ": [0, 1, 2], "inclus": 1, "incorpor": 0, "indic": 6, "individu": 5, "infer": [0, 1, 5, 6], "inference_data": [2, 4], "info": 2, "inform": 2, "infrastructur": 3, "instal": [2, 3, 4], "instruct": 2, "integ": 6, "integr": [0, 2, 3, 5], "io": 2, "known": [0, 6], "label": 2, "labels_tw": 2, "larg": 0, "layer": [2, 6], "leaderboard": [0, 3], "level": 6, "librari": [2, 4], "likelihood": [1, 4], "limit": [1, 4], "linc": 6, "link": 2, "list": [0, 2, 4, 6], "load": 2, "loadtxt": 2, "locat": 2, "logarithm": 6, "lognorm": [2, 6], "main": [2, 3], "make": 1, "map": 6, "mark": 1, "matrix": 4, "mean": 6, "mention": 0, "merg": 2, "method": [0, 3, 5], "method_id": [2, 4], "method_nam": 2, "metric": [0, 1, 3, 5, 6], "metric_key_1": 2, "metric_key_2": 2, "metric_value_1": 2, "metric_value_2": 2, "midcpu": 2, "midmem": 2, "midtim": 2, "minim": 1, "modal": 3, "model": 1, "more": [2, 4, 5], "multi": 3, "multiomics_atac": 6, "multiomics_rna": 6, "n_count": 6, "name": [1, 2, 6], "namespac": 2, "ncol": 4, "necessari": 2, "need": [0, 1, 2], "net": [2, 4], "network": [1, 2, 4], "new": [1, 2, 3], "new_grn_model_fil": 1, "new_model": 1, "next": 4, "nextflow": 2, "none": [2, 4], "normal": [2, 6], "note": [1, 5], "novel": 3, "np": 2, "nrow": 4, "num_work": 1, "number": 6, "number_of_work": 1, "numpi": 2, "ob": 6, "object": 1, "obtain": 6, "offer": 3, "omic": 3, "omit": 2, "onc": [2, 4], "one": 4, "ones": 1, "onli": [1, 2, 
4], "op": [1, 4], "op_rna": 4, "openproblem": [0, 2, 3], "option": [2, 6], "org": 6, "organ": 2, "other": 0, "our": [3, 4], "output": [1, 2, 4, 6], "output_score_fil": 1, "over": [3, 5], "overlook": 2, "overview": 6, "packag": 2, "page": [3, 4], "pair": [1, 2, 4], "panda": [2, 4], "paper": [0, 1, 3], "par": 2, "param": 2, "paramet": 2, "parent": 6, "pars": 0, "part": 1, "pass": [1, 2, 5], "path": [2, 6], "pd": 2, "peak": 6, "pearson": [4, 6], "pearson_corr": 4, "perform": [1, 3, 4, 5, 6], "perturb": 0, "perturbation_data": 6, "pipelin": [2, 3], "pl": 0, "place": 2, "plate": 6, "plate_nam": 6, "platform": [2, 3], "posit": 0, "predict": [1, 2, 4, 6], "prerequisit": 2, "pretti": 2, "previou": [0, 1], "previous": [0, 3], "primari": 6, "prior": [0, 1, 2, 4], "prior_data": 6, "proce": 4, "process": 0, "protocol": 3, "provid": [0, 2, 3, 6], "pseudo": 2, "pseudobulk": [0, 6], "pull": 2, "py": 2, "python": 2, "python_script": 2, "r": [2, 4], "r_script": 2, "randomli": 6, "rank": [1, 4], "raw": 3, "re": 3, "read": 2, "read_h5ad": 2, "read_predict": 2, "recent": 0, "refer": [1, 2], "reflect": 3, "reg_typ": 6, "regress": 6, "regul": 6, "regulatori": [1, 4], "relationship": 6, "replac": 2, "replogl": [0, 1, 4], "repositori": 2, "repres": 0, "represent": 6, "request": [0, 2], "requir": 2, "residu": 6, "resourc": [0, 1, 2, 4, 6], "resources_test": [2, 4], "result": [2, 3], "ridg": 6, "rna": [2, 4], "rna_op": 2, "robust": 1, "row": 6, "run": [0, 2, 3, 4], "run_consensu": 1, "run_grn_evalu": 1, "run_loc": 1, "runner": 2, "s3": [0, 2], "same": 2, "sampl": 6, "save": [2, 4], "save_dir": 1, "save_to_fil": 4, "scenic": 2, "schema": 2, "scheme": 2, "score": [1, 2, 3, 4, 5], "score_fil": 2, "script": [1, 2], "section": [2, 4], "see": [1, 2, 3, 4, 5], "set": 1, "setup": 2, "sh": 1, "shift": 6, "should": [1, 2, 4, 5], "shown": 1, "sign": [0, 2], "similar": 2, "sinc": 4, "singl": [0, 2, 3, 6], "size": 0, "slot": 6, "sm_name": 6, "so": 2, "some": [2, 5, 6], "sourc": [1, 2, 4, 6], "specif": 
1, "src": [1, 2, 4, 6], "stabil": 1, "standard": [0, 3, 6], "start": 2, "state": 3, "step": 1, "store": [2, 3, 4], "str": [2, 4], "string": [2, 4, 6], "structur": 2, "submetr": 2, "submit": 2, "subsampl": 6, "success": 2, "summar": [1, 5], "summari": 2, "supplementari": [0, 3], "support": [1, 3], "sy": 2, "sync": [0, 2], "system": 1, "tabl": 1, "tabular": 1, "tag": 0, "target": [1, 2, 4, 6], "task": 6, "test": 2, "tf": [0, 1, 2, 4, 6], "tf1": 2, "tf2": 2, "tf_all": [2, 4], "tf_list": 6, "them": 3, "thi": [0, 1, 2, 3, 4, 6], "those": 1, "three": [2, 4], "threshold": 1, "time": [1, 3], "tip": 2, "togeth": 2, "top": [1, 2, 4], "toward": 5, "track": 3, "transcript": 4, "true": 1, "type": [2, 6], "u": 0, "un": [2, 4, 6], "uniqu": 2, "unprocess": 3, "updat": [2, 3], "us": [0, 2, 3, 6], "util": 2, "valu": [2, 6], "variabl": 1, "variat": 0, "veri": 0, "version": 0, "viash": [2, 4], "view": 3, "vsh": [2, 4], "we": [0, 2, 4], "weight": [1, 2, 4, 6], "well": 6, "were": [0, 1], "when": 3, "where": 2, "which": [0, 1, 2, 6], "while": 2, "within": 0, "without": 3, "work": [2, 4], "write": [2, 4], "write_h5ad": 4, "x": [2, 4], "xaira": 0, "yaml": [2, 4], "you": [0, 1, 2, 4], "your": [1, 2, 4], "your_method": 2, "your_method_nam": 4, "zellkonvert": 4}, "titles": ["Datasets", "GRN evaluation", "Extending", "geneRNIB: A living benchmark for gene regulatory network inference", "GRN Inference", "Leaderboard", "Objects"], "titleterms": {"A": 3, "add": 2, "anndata": 6, "atac": 6, "benchmark": 3, "content": 3, "control": 6, "data": [0, 6], "dataset": [0, 2], "docker": 1, "download": 0, "evalaut": 2, "evalu": [1, 2], "extend": [0, 2], "gene": 3, "genernib": 3, "get": 3, "grn": [1, 2, 4, 6], "infer": [2, 3, 4], "integr": 4, "label": 6, "leaderboard": 5, "live": 3, "main": 0, "method": [2, 4, 6], "metric": 2, "multiom": 6, "network": 3, "object": 6, "perturb": 6, "pipelin": 1, "prior": 6, "raw": 0, "regulatori": 3, "result": 0, "rna": 6, "run": 1, "score": 6, "standard": 1, "start": 3, 
"tabular": 6, "unprocess": 0, "us": [1, 4], "without": [1, 4]}}) \ No newline at end of file diff --git a/docs/source/dataset.rst b/docs/source/dataset.rst index 8d1b096c0..9bfcb6ad5 100644 --- a/docs/source/dataset.rst +++ b/docs/source/dataset.rst @@ -1,13 +1,16 @@ Datasets ======== -The list of datasets integrated into geneRNIB is provided below with their perturbation signatures as well as the type of perturbation used in each dataset. +The list of datasets integrated into geneRNIB is provided below: .. image:: images/datasets.png - :width: 80% + :width: 50% :align: center ---- -All datasets provide RNA data, while the `OPSCA` and `IBD` datasets also includes scATAC data. +.. image:: images/table_datasets_summary.png + :width: 100% + :align: center +---- You need `awscli` to download the datasets. diff --git a/docs/source/evaluation.rst b/docs/source/evaluation.rst index cccc945ba..6c420b546 100644 --- a/docs/source/evaluation.rst +++ b/docs/source/evaluation.rst @@ -9,13 +9,14 @@ The evaluation metrics used in geneRNIB are summarized below. :align: center ---- -.. image:: images/datasets_metrics.png - :width: 90% +.. image:: images/metric_quality_evaluation.png + :width: 100% :align: center ---- -For a detailed description of each metric, refer to the geneRNIB paper. +For a detailed description of each metric, refer to the geneRNIB paper. Not all the metrics were applicable to all datasets, as shown in the table. In addition, only those datasets with * passed the applicability criteria for a given metric, which includes minimal variability and performance threshold set for each metric. +In addition, not all metrics passed the additional criteria for inclusion in the final score calculation, as explained in the paper, and marked with ** in the table. This includes context specificity and robustness in stability analysis. The evaluation metrics expect the inferred network to be in the form of an AnnData object with specific format as explained here. 
It should be noted that the metric currently evaluate only the **top TF-gene pairs**, currently limited to **50,000 edges**, ranked by their assigned weight. @@ -28,32 +29,42 @@ The inferred network should have a tabular format with the following columns: See `resources/grn_benchmark/prior/collectri.h5ad` for an example of the expected format. -Running GRN evaluation using standard pipeline ----------------------------------------- -To run the evalution for a given GRN and dataset, use the following command: + +Running GRN evaluation without docker +---------------------------------------- +Considering that Docker is not supported by certtain systems, you can run the evaluation without Docker by following these steps: ```bash -bash scripts/run_grn_evaluation.sh --prediction= --save_dir= --dataset= --build_images= +bash src/metrics/all_metrics/run_local.sh --dataset --prediction= --score --num_workers ``` example command: ```bash -bash scripts/run_grn_evaluation.sh --prediction=resources/grn_models/op/collectri.h5ad --save_dir=output/ --dataset=op --build_images=true +bash src/metrics/all_metrics/run_local.sh --dataset op --prediction=resources/grn_models/op/collectri.h5ad --score=output_score_file.h5ad --num_workers=20 ``` +If you are evaluating a new GRN model, which is not part of geneRNIB, make you to generate the consensus prior file for the dataset you are evaluating on. -Running GRN evaluation without docker +```bash +bash scripts/prior/run_consensus.sh --dataset op --new_model {new_grn_model_file.h5ad} +``` + +This will add your model to the previous ones and create the new consensus prior file needed for evaluation. 
+ +Running GRN evaluation using standard pipeline ---------------------------------------- -Considering that Docker is not supported by certtain systems, you can run the evaluation without Docker by following these steps: + +To run the evalution for a given GRN and dataset, use the following command: ```bash -bash src/metrics/all_metrics/run_local.sh --dataset --prediction= --score --num_workers +bash scripts/run_grn_evaluation.sh --prediction= --save_dir= --dataset= --build_images= ``` example command: ```bash -bash src/metrics/all_metrics/run_local.sh --dataset op --prediction=resources/grn_models/op/collectri.h5ad --score=output_score_file.h5ad --num_workers=20 -``` \ No newline at end of file +bash scripts/run_grn_evaluation.sh --prediction=resources/grn_models/op/collectri.h5ad --save_dir=output/ --dataset=op --build_images=true +``` + diff --git a/docs/source/images/datasets.png b/docs/source/images/datasets.png index b08a554c9..9ac5c6238 100644 Binary files a/docs/source/images/datasets.png and b/docs/source/images/datasets.png differ diff --git a/docs/source/images/datasets_metrics.png b/docs/source/images/datasets_metrics.png deleted file mode 100644 index cdec25940..000000000 Binary files a/docs/source/images/datasets_metrics.png and /dev/null differ diff --git a/docs/source/images/metric_quality_evaluation.png b/docs/source/images/metric_quality_evaluation.png new file mode 100644 index 000000000..d321fc49e Binary files /dev/null and b/docs/source/images/metric_quality_evaluation.png differ diff --git a/docs/source/images/metrics.png b/docs/source/images/metrics.png index f5c2fd02c..2f9e1bd36 100644 Binary files a/docs/source/images/metrics.png and b/docs/source/images/metrics.png differ diff --git a/docs/source/images/raw_scores_300BCG.png b/docs/source/images/raw_scores_300BCG.png index b6ef7f7ed..cec454d14 100644 Binary files a/docs/source/images/raw_scores_300BCG.png and b/docs/source/images/raw_scores_300BCG.png differ diff --git 
a/docs/source/images/raw_scores_adamson.png b/docs/source/images/raw_scores_adamson.png deleted file mode 100644 index 2fdfd1794..000000000 Binary files a/docs/source/images/raw_scores_adamson.png and /dev/null differ diff --git a/docs/source/images/raw_scores_ibd.png b/docs/source/images/raw_scores_ibd.png deleted file mode 100644 index 6774168b0..000000000 Binary files a/docs/source/images/raw_scores_ibd.png and /dev/null differ diff --git a/docs/source/images/raw_scores_ibd_cd.png b/docs/source/images/raw_scores_ibd_cd.png new file mode 100644 index 000000000..968629360 Binary files /dev/null and b/docs/source/images/raw_scores_ibd_cd.png differ diff --git a/docs/source/images/raw_scores_ibd_uc.png b/docs/source/images/raw_scores_ibd_uc.png new file mode 100644 index 000000000..1d402ed77 Binary files /dev/null and b/docs/source/images/raw_scores_ibd_uc.png differ diff --git a/docs/source/images/raw_scores_nakatake.png b/docs/source/images/raw_scores_nakatake.png index be958d245..4fed0c14f 100644 Binary files a/docs/source/images/raw_scores_nakatake.png and b/docs/source/images/raw_scores_nakatake.png differ diff --git a/docs/source/images/raw_scores_norman.png b/docs/source/images/raw_scores_norman.png index a5f14c27d..b3611239b 100644 Binary files a/docs/source/images/raw_scores_norman.png and b/docs/source/images/raw_scores_norman.png differ diff --git a/docs/source/images/raw_scores_op.png b/docs/source/images/raw_scores_op.png index feb142808..7228b96c7 100644 Binary files a/docs/source/images/raw_scores_op.png and b/docs/source/images/raw_scores_op.png differ diff --git a/docs/source/images/raw_scores_parsebioscience.png b/docs/source/images/raw_scores_parsebioscience.png index 0a0571644..3c382b4f6 100644 Binary files a/docs/source/images/raw_scores_parsebioscience.png and b/docs/source/images/raw_scores_parsebioscience.png differ diff --git a/docs/source/images/raw_scores_replogle.png b/docs/source/images/raw_scores_replogle.png index ec79345c7..76915237e 
100644 Binary files a/docs/source/images/raw_scores_replogle.png and b/docs/source/images/raw_scores_replogle.png differ diff --git a/docs/source/images/raw_scores_xaira_HCT116.png b/docs/source/images/raw_scores_xaira_HCT116.png index 8f02270f4..307473dd8 100644 Binary files a/docs/source/images/raw_scores_xaira_HCT116.png and b/docs/source/images/raw_scores_xaira_HCT116.png differ diff --git a/docs/source/images/raw_scores_xaira_HEK293T.png b/docs/source/images/raw_scores_xaira_HEK293T.png index 3d181dce7..ec5856c85 100644 Binary files a/docs/source/images/raw_scores_xaira_HEK293T.png and b/docs/source/images/raw_scores_xaira_HEK293T.png differ diff --git a/docs/source/images/summary_figure.png b/docs/source/images/summary_figure.png new file mode 100644 index 000000000..5c13b7046 Binary files /dev/null and b/docs/source/images/summary_figure.png differ diff --git a/docs/source/images/table_datasets_summary.png b/docs/source/images/table_datasets_summary.png new file mode 100644 index 000000000..27fcd22b9 Binary files /dev/null and b/docs/source/images/table_datasets_summary.png differ diff --git a/docs/source/leaderboard.rst b/docs/source/leaderboard.rst index 2130ba971..0ee707263 100644 --- a/docs/source/leaderboard.rst +++ b/docs/source/leaderboard.rst @@ -1,14 +1,14 @@ Leaderboard ================= -.. The overal comparitive performance of the integrated GRN inference methods is summarized in the leaderboard below. +The overal comparitive performance of the integrated GRN inference methods is summarized in the leaderboard below. It should be noted that not all metrics count towards the final score, as some metrics did not pass the applicability criteria. See `here `_ for more details on the metrics applicability. -.. .. image:: images/leaderboard.png -.. :width: 90% -.. :align: center -.. ---- +.. image:: images/summary_figure.png + :width: 100% + :align: center +---- -The individual performance of the methods on each dataset is summarized below. 
+The individual performance of the methods on each dataset is summarized below. .. image:: images/raw_scores_op.png :width: 70% @@ -16,7 +16,7 @@ The individual performance of the methods on each dataset is summarized below. ---- .. image:: images/raw_scores_nakatake.png - :width: 60% + :width: 70% :align: center ---- @@ -25,10 +25,6 @@ The individual performance of the methods on each dataset is summarized below. :align: center ---- -.. image:: images/raw_scores_adamson.png - :width: 70% - :align: center ----- .. image:: images/raw_scores_replogle.png :width: 70% @@ -45,8 +41,13 @@ The individual performance of the methods on each dataset is summarized below. :align: center ---- -.. image:: images/raw_scores_ibd.png - :width: 90% +.. image:: images/raw_scores_ibd_uc.png + :width: 70% + :align: center +---- + +.. image:: images/raw_scores_ibd_cd.png + :width: 70% :align: center ---- diff --git a/jobs.sh b/jobs.sh deleted file mode 100644 index 06f785dee..000000000 --- a/jobs.sh +++ /dev/null @@ -1,5 +0,0 @@ -sbatch src/metrics/regression_r/run_global.sh -sbatch src/metrics/regression_r/run_local.sh - -sbatch src/metrics/experimental/annotation/run_global.sh -sbatch src/metrics/experimental/annotation/run_local.sh \ No newline at end of file diff --git a/scripts/local_workflows/run_grn_evaluation.sh b/scripts/local_workflows/run_grn_evaluation.sh new file mode 100755 index 000000000..a2e8966b9 --- /dev/null +++ b/scripts/local_workflows/run_grn_evaluation.sh @@ -0,0 +1,288 @@ +#!/bin/bash +# Local GRN Evaluation Script +# This script evaluates all GRN predictions for all datasets using local SLURM jobs +# +# set -e +# Default parameters +RUN_CONSENSUS=false +RUN_METRICS=false +PROCESS_RESULTS=false +TEMP_DIR="output/evaluation" +RESULTS_FILE="resources/results/all_scores.csv" + + +LAYER="lognorm" +NUM_WORKERS=20 + +# get the arguments +while [[ $# -gt 0 ]]; do + key="$1" + + case $key in + --run_consensus) + RUN_CONSENSUS=true + shift + ;; + --run_consensus) + 
RUN_CONSENSUS=true + shift + ;; + --run_metrics) + RUN_METRICS=true + shift + ;; + --no_run_metrics) + RUN_METRICS=false + shift + ;; + --process_results) + PROCESS_RESULTS=true + shift + ;; + --no_process_results) + PROCESS_RESULTS=false + shift + ;; + --temp_dir) + TEMP_DIR="$2" + shift + shift + ;; + --results_file) + RESULTS_FILE="$2" + shift + shift + ;; + --num_workers) + NUM_WORKERS="$2" + shift + shift + ;; + *) + echo "Unknown option: $key" + exit 1 + ;; + esac +done + + +echo "==========================================" +echo "GRN Evaluation Configuration" +echo "==========================================" +echo "Run consensus: $RUN_CONSENSUS" +echo "Run metrics: $RUN_METRICS" +echo "Output directory: $TEMP_DIR" +echo "Results file: $RESULTS_FILE" +echo "Process results: $PROCESS_RESULTS" +echo "Number of workers: $NUM_WORKERS" +echo "==========================================" + +# Create output directory +mkdir -p "$TEMP_DIR" + +# Generate and source dataset configuration +echo "Generating dataset configuration..." 
+python src/utils/config.py +source src/utils/config.env + +# Get list of datasets from config +DATASETS=(${DATASETS//,/ }) +METHODS=(${METHODS//,/ }) + +# Function to submit a metric evaluation job +submit_metric_job() { + local dataset=$1 + local method=$2 + local prediction_file=$3 + + local job_name="${dataset}_${method}" + local score_file="${TEMP_DIR}/${dataset}_${method}_score.h5ad" + + # Skip if score file already exists + if [[ -f "$score_file" ]]; then + echo " Skipping ${job_name} - score file already exists" + return + fi + + echo " Submitting job: ${job_name}" + + + sbatch \ + --job-name="${job_name}" \ + src/metrics/all_metrics/run_local.sh \ + --dataset "${dataset}" \ + --prediction "${prediction_file}" \ + --score "${score_file}" \ + --num_workers "${NUM_WORKERS}" || echo " [ERROR] Failed to submit job for ${job_name}" +} + +# Function to process all results into a single CSV +process_all_results() { + echo "" + echo "==========================================" + echo "Processing Results" + echo "==========================================" + + local results_file="${RESULTS_FILE}" + + # Get list of datasets for parsing + local datasets_list=$(python -c "from src.utils.config import DATASET_GROUPS; print(','.join(DATASET_GROUPS.keys()))") + + # Create Python script to aggregate results + python - "$TEMP_DIR" "$RESULTS_FILE" "$datasets_list" << 'EOF' +import sys +import os +import pandas as pd +import anndata as ad +from pathlib import Path + +temp_dir = sys.argv[1] +results_file = sys.argv[2] +datasets_str = sys.argv[3] +scores_dir = Path(temp_dir) + +# Parse datasets list +known_datasets = datasets_str.split(',') + +print(f"Looking for score files in: {scores_dir}") +print(f"Will save results to: {results_file}") +print(f"Known datasets: {known_datasets[:5]}...") + +all_results = [] + +# Iterate through all score files +for score_file in scores_dir.glob("*_score.h5ad"): + try: + # Parse filename: {dataset}_{method}_score.h5ad + filename = 
score_file.stem # Remove .h5ad + + # Remove _score suffix + if filename.endswith('_score'): + filename = filename[:-6] # Remove last 6 characters '_score' + + # Try to match against known datasets - find which dataset this file belongs to + dataset = None + method = None + + for ds in known_datasets: + if filename.startswith(ds + '_'): + dataset = ds + method = filename[len(ds) + 1:] # Everything after dataset_ + break + + if not dataset or not method: + print(f"Warning: Could not parse filename {score_file.name}") + continue + + # Load score file + adata = ad.read_h5ad(score_file) + + # Extract metric scores from uns + if 'metric_ids' in adata.uns and 'metric_values' in adata.uns: + metric_ids = adata.uns['metric_ids'] + metric_values = adata.uns['metric_values'] + + # Create row for each metric + for metric_id, metric_value in zip(metric_ids, metric_values): + # Convert metric_value to float if it's a string + try: + score_value = float(metric_value) if isinstance(metric_value, str) else metric_value + except (ValueError, TypeError): + score_value = metric_value + + all_results.append({ + 'dataset': dataset, + 'method': method, + 'metric': metric_id, + 'score': score_value + }) + + print(f"Processed: {dataset} - {method} ({len(metric_ids)} metrics)") + else: + print(f"Warning: No metric data in {score_file.name}") + + except Exception as e: + print(f"Error processing {score_file.name}: {e}") + +# Create DataFrame +if all_results: + df = pd.DataFrame(all_results) + + # Pivot to wide format: rows=dataset+method, columns=metrics + df_wide = df.pivot_table( + index=['dataset', 'method'], + columns='metric', + values='score' + ).reset_index() + + # Save results (create directory if needed) + results_path = Path(results_file) + results_path.parent.mkdir(parents=True, exist_ok=True) + df_wide.to_csv(results_file, index=False) + print(f"\n{'='*50}") + print(f"Results saved to: {results_file}") + print(f"Total evaluations: {len(df_wide)}") + print(f"Datasets: 
{df_wide['dataset'].nunique()}") + print(f"Methods: {df_wide['method'].nunique()}") + print(f"Metrics: {len([c for c in df_wide.columns if c not in ['dataset', 'method']])}") + print(f"{'='*50}") +else: + print("No results found to process!") +EOF +} + +# Function to run consensus for a dataset +run_consensus() { + local dataset=$1 + bash scripts/prior/run_consensus.sh --dataset "$dataset" +} + +# Main execution +if [[ "$RUN_CONSENSUS" == "true" ]]; then + echo "" + echo "==========================================" + echo "Running Consensus for All Datasets" + echo "==========================================" + + for dataset in "${DATASETS[@]}"; do + run_consensus "$dataset" + done +fi + +if [[ "$RUN_METRICS" == "true" ]]; then + echo "" + echo "==========================================" + echo "Submitting Metric Evaluation Jobs" + echo "==========================================" + + job_count=0 + + for dataset in "${DATASETS[@]}"; do + echo "" + echo "Dataset: $dataset" + echo "----------------------------------------" + + models_folder="resources/results/${dataset}/" + # echo "Looking in: $models_folder" + + # Check each method for this dataset + for method in "${METHODS[@]}"; do + prediction_file="${models_folder}/${dataset}.${method}.${method}.prediction.h5ad" + + if [[ -f "$prediction_file" ]]; then + submit_metric_job "$dataset" "$method" "$prediction_file" + ((job_count++)) + else + echo " [NOT FOUND] ${prediction_file}" + fi + done + done + +fi + +if [[ "$PROCESS_RESULTS" == "true" ]]; then + process_all_results +fi + +echo "" +echo "Done!" 
diff --git a/src/local_workflows/run.sh b/scripts/local_workflows/run_grn_inference.sh similarity index 64% rename from src/local_workflows/run.sh rename to scripts/local_workflows/run_grn_inference.sh index 35775bba9..0baab01a8 100644 --- a/src/local_workflows/run.sh +++ b/scripts/local_workflows/run_grn_inference.sh @@ -3,11 +3,14 @@ set -e run_prefix='sbatch' #bash -DATASETS=('op' 'adamson' 'replogle' 'norman' 'nakatake' 'parsebioscience' '300BCG' 'xaira_HCT116' 'xaira_HEK293T') #'op' 'adamson' 'replogle' 'norman' 'nakatake' 'parsebioscience' '300BCG' 'xaira_HCT116' 'xaira_HEK293T' 'ibd_uc' 'ibd_cd' -DATASETS=('ibd_uc' 'ibd_cd') +python src/utils/config.py +source src/utils/config.env -# METHODS=('negative_control' 'positive_control' 'pearson_corr' 'portia' 'ppcor' 'grnboost' 'scenic' 'scenicplus' 'scglue' 'figr' 'granie') -METHODS=( 'ppcor' ) #'negative_control' 'positive_control' 'pearson_corr' 'portia' 'ppcor' 'grnboost' 'scenic' 'scenicplus' 'scglue' 'figr' 'granie' +DATASETS=(${DATASETS//,/ }) +# DATASETS=('parsebioscience') #'op' 'adamson' 'replogle' 'norman' 'nakatake' 'parsebioscience' '300BCG' 'xaira_HCT116' 'xaira_HEK293T' 'ibd_uc' 'ibd_cd' + +METHODS=(${METHODS//,/ }) +# METHODS=( 'scenic' 'grnboost') #'negative_control' 'positive_control' 'pearson_corr' 'portia' 'ppcor' 'grnboost' 'scenic' 'scenicplus' 'scglue' 'figr' 'granie' methods_dir='src/methods/' ctr_methods_dir='src/methods/' @@ -33,10 +36,8 @@ run_func() { if [[ "$run_prefix" == "bash" ]]; then bash "$script" $arguments elif [[ "$run_prefix" == "sbatch" ]]; then - # submit the job and capture the job ID output=$(sbatch "$script" $arguments) echo "$output" - # sbatch usually returns: "Submitted batch job 12345678" jobid=$(echo "$output" | awk '{print $4}') echo "Job ID: $jobid" else diff --git a/scripts/prior/run_consensus.sh b/scripts/prior/run_consensus.sh index 2c8622bf0..6f891ace2 100644 --- a/scripts/prior/run_consensus.sh +++ b/scripts/prior/run_consensus.sh @@ -13,21 +13,55 @@ set -e 
-DATASET=$1 +DATASET="" +NEW_MODEL_PATH="" + +while [[ $# -gt 0 ]]; do + case $1 in + --dataset) + DATASET="$2" + shift 2 + ;; + --new_model) + NEW_MODEL_PATH="$2" + shift 2 + ;; + *) + echo "Unknown option: $1" + echo "Usage: sbatch run_consensus.sh --dataset [--new_model ]" + exit 1 + ;; + esac +done + if [ -z "$DATASET" ]; then - echo "Usage: sbatch run_consensus.sh " + echo "Usage: sbatch run_consensus.sh --dataset [--new_model ]" exit 1 fi models_dir="resources/results/$DATASET" models=("pearson_corr" "positive_control" "portia" "ppcor" "scenic" "scprint" "grnboost" "scenicplus" "scglue" "granie" "figr" "celloracle" "scgpt" "geneformer" "spearman_corr") +python src/utils/config.py +source src/utils/config.env +METHODS=(${METHODS//,/ }) + predictions=() -for model in "${models[@]}"; do +for model in "${METHODS[@]}"; do file="${models_dir}/${DATASET}.${model}.${model}.prediction.h5ad" if [ -e "$file" ]; then predictions+=("$file") fi done + +if [ -n "$NEW_MODEL_PATH" ]; then + if [ -e "$NEW_MODEL_PATH" ]; then + echo "Adding new model: $NEW_MODEL_PATH" + predictions+=("$NEW_MODEL_PATH") + else + echo "Warning: New model path does not exist: $NEW_MODEL_PATH" + fi +fi + printf '%s\n' "${predictions[@]}" echo "Running consensus for Regression" diff --git a/scripts/process_data/rest.sh b/scripts/process_data/rest.sh index 7935f22e4..9d4fb4230 100755 --- a/scripts/process_data/rest.sh +++ b/scripts/process_data/rest.sh @@ -15,7 +15,7 @@ set -e # python src/process_data/main/adamson/script.py # python src/process_data/main/nakatake/script.py -# python src/process_data/main/norman/script.py +python src/process_data/main/norman/script.py # echo "Processing opsca" # python src/process_data/main/opsca/script.py @@ -27,5 +27,5 @@ set -e # echo "Processing 300BCG" # python src/process_data/main/300BCG/script.py -echo "Processing IBD" -python src/process_data/main/ibd/script.py +# echo "Processing IBD" +# python src/process_data/main/ibd/script.py diff --git 
a/scripts/run_all.sh b/scripts/run_all.sh index 32b3ac925..cf6fbcb61 100644 --- a/scripts/run_all.sh +++ b/scripts/run_all.sh @@ -1,17 +1,19 @@ set -e -# datasets=( 'replogle' 'op' 'nakatake' 'adamson' 'norman' 'xaira_HEK293T' 'xaira_HCT116' 'parsebioscience' 'ibd_uc' 'ibd_cd' '300BCG' ) #'replogle' 'op' 'nakatake' 'adamson' 'norman' 'xaira_HEK293T' 'xaira_HCT116' 'parsebioscience' 'ibd_uc' 'ibd_cd' '300BCG') # -datasets=( 'ibd_uc' 'ibd_cd' ) #'replogle' 'op' 'nakatake' 'adamson' 'norman' 'xaira_HEK293T' 'xaira_HCT116' 'parsebioscience' 'ibd_uc' 'ibd_cd' '300BCG') # -run_local=false # set to true to run locally, false to run on AWS +python src/utils/config.py +source src/utils/config.env +DATASETS=(${DATASETS//,/ }) -run_grn_inference=true -run_grn_evaluation=false -run_download=false +run_local=false +run_grn_inference=false #arg +run_consensus=true +run_grn_evaluation=true #arg +run_sync=false num_workers=20 -for dataset in "${datasets[@]}"; do +for dataset in "${DATASETS[@]}"; do trace_file="resources/results/$dataset/trace.txt" if [ "$run_grn_inference" = true ]; then @@ -48,12 +50,14 @@ for dataset in "${datasets[@]}"; do # fi - if [ "$run_local" = false ]; then - echo "Downloading inference results from AWS" - aws s3 sync s3://openproblems-data/resources/grn/results/$dataset resources/results/$dataset + # if [ "$run_local" = false ]; then + # echo "Downloading inference results from AWS" + # aws s3 sync s3://openproblems-data/resources/grn/results/$dataset resources/results/$dataset + # fi + if [ "$run_consensus" = true ]; then + echo "Running consensus for dataset: $dataset" + bash scripts/prior/run_consensus.sh --dataset $dataset # run consensus for Regression and ws distance -> needs to be run after adding each method and dataset fi - echo "Running consensus for dataset: $dataset" - bash scripts/prior/run_consensus.sh $dataset # run consensus for Regression and ws distance -> needs to be run after adding each method and dataset if [ "$run_local" = false ]; 
then echo "Syncing prior results to AWS" @@ -64,7 +68,7 @@ for dataset in "${datasets[@]}"; do bash scripts/run_grn_evaluation.sh --dataset=$dataset --run_local=$run_local --build_images=false --num_workers=$num_workers fi - if [ "$run_download" = true ]; then + if [ "$run_sync" = true ]; then if [ "$run_local" = false ]; then echo "Downloading evaluation results from AWS" aws s3 sync s3://openproblems-data/resources/grn/results/$dataset resources/results/$dataset diff --git a/scripts/run_consensus.sh b/scripts/run_consensus.sh new file mode 100644 index 000000000..b1a8d6b2b --- /dev/null +++ b/scripts/run_consensus.sh @@ -0,0 +1,118 @@ +#!/bin/bash +# Consensus Calculation Script +# This script runs consensus calculations for both Regression and WS distance metrics +# Usage: bash scripts/run_consensus.sh [run_mode] +# dataset: name of the dataset (e.g., replogle, op, norman) +# run_mode: 'local' (default) or 'aws' + +set -e + +DATASET=$1 + +if [ -z "$DATASET" ]; then + echo "Usage: bash scripts/run_consensus.sh [run_mode]" + echo " dataset: name of the dataset (required)" + echo " run_mode: 'local' (default) or 'aws'" + exit 1 +fi + +echo "==========================================" +echo "Running Consensus Calculation" +echo "Dataset: $DATASET" +echo "Run mode: $RUN_MODE" +echo "==========================================" + +# Set paths based on run mode +resources_dir="./resources" +models_dir="${resources_dir}/results/$DATASET" + +# Get available methods from config +echo "Checking available methods..." 
+available_methods=$(python -c " +from src.utils.config import METHODS +import os +methods = [] +for method in METHODS: + file = f'resources/results/$DATASET/$DATASET.{method}.{method}.prediction.h5ad' + if os.path.exists(file): + methods.append(method) +print(' '.join(methods)) +") + +if [ -z "$available_methods" ]; then + echo "No prediction files found for dataset: $DATASET" + exit 1 +fi + +echo "Available methods: $available_methods" + +# Convert space-separated list to array +methods_array=($available_methods) + +# Build predictions list +predictions=() +for method in "${methods_array[@]}"; do + file="resources/results/${DATASET}/${DATASET}.${method}.${method}.prediction.h5ad" + if [ -e "$file" ]; then + predictions+=("$file") + fi +done + +if [ ${#predictions[@]} -eq 0 ]; then + echo "No prediction files found for consensus calculation" + exit 1 +fi + +echo "Found ${#predictions[@]} prediction files for consensus calculation" +printf '%s\n' "${predictions[@]}" + +# Run Regression consensus +echo "" +echo "Running Regression consensus..." +python src/metrics/regression/consensus/script.py \ + --dataset "$DATASET" \ + --regulators_consensus "resources/grn_benchmark/prior/regulators_consensus_${DATASET}.json" \ + --evaluation_data "resources/grn_benchmark/evaluation_data/${DATASET}_bulk.h5ad" \ + --predictions "${predictions[@]}" + +echo "Regression consensus completed successfully" + +# Run WS distance consensus (only for applicable datasets) +applicable_datasets=("norman" "adamson" "replogle" "xaira_HEK293T" "xaira_HCT116") +skip_ws=true +for d in "${applicable_datasets[@]}"; do + if [[ "$DATASET" == "$d" ]]; then + skip_ws=false + break + fi +done + +if [ "$skip_ws" = true ]; then + echo "" + echo "Skipping WS distance consensus (not applicable for dataset: $DATASET)" +else + echo "" + echo "Running WS distance consensus..." 
+ python src/metrics/ws_distance/consensus/script.py \ + --dataset "$DATASET" \ + --models_dir "resources/results/$DATASET" \ + --ws_consensus "resources/grn_benchmark/prior/ws_consensus_${DATASET}.csv" \ + --tf_all "resources/grn_benchmark/prior/tf_all.csv" \ + --evaluation_data_sc "resources/processed_data/${DATASET}_evaluation_sc.h5ad" \ + --models "${methods_array[@]}" + + echo "WS distance consensus completed successfully" +fi + +# Sync results to AWS if needed +if [ "$RUN_MODE" = "aws" ]; then + echo "" + echo "Syncing consensus results to AWS..." + aws s3 sync resources/grn_benchmark/prior s3://openproblems-data/resources/grn/grn_benchmark/prior + echo "Sync completed" +fi + +echo "" +echo "==========================================" +echo "Consensus calculation completed for $DATASET" +echo "==========================================" diff --git a/scripts/run_grn_evaluation.sh b/scripts/run_grn_evaluation.sh index 79b7f7241..c4dc0bd6a 100755 --- a/scripts/run_grn_evaluation.sh +++ b/scripts/run_grn_evaluation.sh @@ -106,8 +106,8 @@ param_aws="s3://openproblems-data/resources/grn/results/params/${RUN_ID}_param_l # Generate and source config file echo "Generating dataset configuration..." 
-python src/utils/config.py --output src/utils/dataset_config.env -source src/utils/dataset_config.env +python src/utils/config.py +source src/utils/config.env if [ "$RUN_LOCAL" = true ]; then @@ -181,29 +181,13 @@ HERE if [ "$PREDICTION" != "none" ]; then append_entry "single_run" $PREDICTION "$DATASET" else - grn_names=( - "positive_control" - "pearson_corr" - "negative_control" - "spearman_corr" - "scglue" - "scenicplus" - "celloracle" - "granie" - "figr" - "grnboost" - "portia" - "scenic" - "scprint" - "geneformer" - "scgpt" - ) + METHODS =(${METHODS//,/ }) grn_models_folder="${resources_dir}/results/${models_folder}/" grn_models_folder_local="./resources/results/${models_folder}/" # just to control the hetergenity of the models for different datasets # Iterate over GRN models available_methods=() - for grn_name in "${grn_names[@]}"; do + for grn_name in "${METHODS[@]}"; do prediction_file="${grn_models_folder_local}/${DATASET}.${grn_name}.${grn_name}.prediction.h5ad" if [[ -f "${prediction_file}" ]]; then prediction_file=${grn_models_folder}/${DATASET}.${grn_name}.${grn_name}.prediction.h5ad diff --git a/scripts/run_grn_inference.sh b/scripts/run_grn_inference.sh index d95691305..2772f4397 100755 --- a/scripts/run_grn_inference.sh +++ b/scripts/run_grn_inference.sh @@ -87,13 +87,12 @@ append_entry() { else layer_="$layer" fi - + group_id="${dataset}" if [ "$use_train_sc" = true ]; then rna_file="${resources_dir}/extended_data/${dataset}_train_sc.h5ad" - group_id="${dataset}_sc" else rna_file="${resources_dir}/grn_benchmark/inference_data/${dataset}_rna.h5ad" - group_id="${dataset}" + fi cat >> "$param_local" << HERE diff --git a/scripts/sync_resources.sh b/scripts/sync_resources.sh index 4f27282a8..75d1b3c24 100755 --- a/scripts/sync_resources.sh +++ b/scripts/sync_resources.sh @@ -22,14 +22,14 @@ set -e # aws s3 sync s3://openproblems-data/resources/grn/grn_benchmark resources/grn_benchmark/ --no-sign-request # aws s3 sync resources/grn_benchmark/prior 
s3://openproblems-data/resources/grn/grn_benchmark/prior --delete -aws s3 sync resources/extended_data/ s3://openproblems-data/resources/grn/extended_data --delete +# aws s3 sync resources/extended_data/ s3://openproblems-data/resources/grn/extended_data --delete # aws s3 sync resources/results/experiment s3://openproblems-data/resources/grn/results/experiment --delete # aws s3 sync resources_test s3://openproblems-data/resources_test/grn/ --delete # aws s3 sync s3://openproblems-data/resources_test/grn/ resources_test --delete # aws s3 sync s3://openproblems-data/resources/grn/grn_benchmark/ground_truth resources_test/grn_benchmark/ground_truth # aws s3 sync resources/grn_benchmark/ground_truth s3://openproblems-data/resources/grn/grn_benchmark/ground_truth -aws s3 sync resources/grn_benchmark/ s3://openproblems-data/resources/grn/grn_benchmark/ --delete -# aws s3 sync resources/results/ibd_uc s3://openproblems-data/resources/grn/results/ibd_uc +# aws s3 sync resources/grn_benchmark/ s3://openproblems-data/resources/grn/grn_benchmark/ --delete +aws s3 sync s3://openproblems-data/resources/grn/results/ resources/results/ --delete # aws s3 sync resources/results/ibd_cd s3://openproblems-data/resources/grn/results/ibd_cd # aws s3 sync s3://openproblems-data/resources/grn/grn_benchmark/ground_truth resources/grn_benchmark/ground_truth --no-sign-request diff --git a/src/metrics/all_metrics/helper.py b/src/metrics/all_metrics/helper.py index ec5756750..659f9ac1d 100644 --- a/src/metrics/all_metrics/helper.py +++ b/src/metrics/all_metrics/helper.py @@ -10,7 +10,7 @@ from regression.helper import main as regression from ws_distance.helper import main as ws_distance from sem.helper import main as sem -from anchor_regression.helper import main as anchor_regression +# from anchor_regression.helper import main as anchor_regression from tf_recovery.helper import main as tf_recovery from tf_binding.helper import main as tf_binding from rc_tf_act.helper import main as rc_tf_act 
@@ -23,7 +23,7 @@ 'regression': regression, 'ws_distance': ws_distance, 'sem': sem, - 'anchor_regression': anchor_regression, + # 'anchor_regression': anchor_regression, 'tf_recovery': tf_recovery, 'tf_binding': tf_binding, 'rc_tf_act': rc_tf_act, diff --git a/src/metrics/all_metrics/run_all.sh b/src/metrics/all_metrics/run_all.sh deleted file mode 100644 index a40711e08..000000000 --- a/src/metrics/all_metrics/run_all.sh +++ /dev/null @@ -1,20 +0,0 @@ -run_type='sbatch' - -metrics=( - rc_tf_act - regression - tf_recovery - ar - rc_tf_act - tf_binding - vc - ws_distance - sem - gs_recovery -) -for metric in "${metrics[@]}"; do - echo "Running metric: ${metric}" - ${run_type} src/metrics/${metric}/run_local.sh - echo "----------------------------------------" -done - diff --git a/src/metrics/all_metrics/run_local.sh b/src/metrics/all_metrics/run_local.sh index 00a69707d..2f3cd28c4 100644 --- a/src/metrics/all_metrics/run_local.sh +++ b/src/metrics/all_metrics/run_local.sh @@ -5,7 +5,7 @@ #SBATCH --ntasks=1 #SBATCH --cpus-per-task=20 #SBATCH --time=2:00:00 -#SBATCH --mem=120GB +#SBATCH --mem=60GB #SBATCH --partition=gpu #SBATCH --gres=gpu:1 #SBATCH --mail-type=END,FAIL @@ -77,7 +77,7 @@ fi # exit 1 # fi -source src/utils/dataset_config.env +source src/utils/config.env cell_type_var="CELLTYPE_${dataset}" cell_type="${!cell_type_var}" diff --git a/src/metrics/anchor_regression/config.vsh.yaml b/src/metrics/experimental/anchor_regression/config.novsh.yaml similarity index 100% rename from src/metrics/anchor_regression/config.vsh.yaml rename to src/metrics/experimental/anchor_regression/config.novsh.yaml diff --git a/src/metrics/anchor_regression/helper.py b/src/metrics/experimental/anchor_regression/helper.py similarity index 100% rename from src/metrics/anchor_regression/helper.py rename to src/metrics/experimental/anchor_regression/helper.py diff --git a/src/metrics/anchor_regression/run_global.sh b/src/metrics/experimental/anchor_regression/run_global.sh similarity 
index 100% rename from src/metrics/anchor_regression/run_global.sh rename to src/metrics/experimental/anchor_regression/run_global.sh diff --git a/src/metrics/anchor_regression/run_local.sh b/src/metrics/experimental/anchor_regression/run_local.sh similarity index 100% rename from src/metrics/anchor_regression/run_local.sh rename to src/metrics/experimental/anchor_regression/run_local.sh diff --git a/src/metrics/anchor_regression/script.py b/src/metrics/experimental/anchor_regression/script.py similarity index 100% rename from src/metrics/anchor_regression/script.py rename to src/metrics/experimental/anchor_regression/script.py diff --git a/src/metrics/rc_tf_act/run_local.sh b/src/metrics/rc_tf_act/run_local.sh index 6e961cf41..a1240c000 100755 --- a/src/metrics/rc_tf_act/run_local.sh +++ b/src/metrics/rc_tf_act/run_local.sh @@ -14,9 +14,9 @@ set -euo pipefail save_dir="output/rc_tf_act" mkdir -p "$save_dir" - + # Datasets to process (only those with rc_tf_ac grouping defined) -datasets=('300BCG' 'parsebioscience' 'op') +datasets=('ibd_uc') # datasets=('op' ) # Methods to process methods=("grnboost" "pearson_corr" "negative_control" "positive_control" "ppcor" "portia" "scenic" "scprint" "scenicplus" "celloracle" "scglue" "figr" "granie") diff --git a/src/metrics/regression/helper.py b/src/metrics/regression/helper.py index 7a07d3186..4aad5eafd 100644 --- a/src/metrics/regression/helper.py +++ b/src/metrics/regression/helper.py @@ -336,10 +336,23 @@ def main(par: Dict[str, Any]) -> Tuple[pd.DataFrame, pd.DataFrame]: # Load data prturb_adata = ad.read_h5ad(par['evaluation_data']) layer = manage_layer(prturb_adata, par) - gene_names = prturb_adata.var.index.to_numpy() + all_gene_names = prturb_adata.var.index.to_numpy() with open(par['regulators_consensus'], 'r') as f: data = json.load(f) - print(len(data), len(gene_names)) + + # Filter genes to only include those in consensus + gene_names = np.array([gene for gene in all_gene_names if gene in data]) + missing_genes = 
set(all_gene_names) - set(gene_names) + + if len(missing_genes) > 0: + print(f"Warning: {len(missing_genes)} genes not in consensus data and will be omitted from evaluation") + print(f"Missing genes: {sorted(list(missing_genes))[:10]}..." if len(missing_genes) > 10 else f"Missing genes: {sorted(list(missing_genes))}") + + # Filter the adata to only include genes in consensus + gene_mask = prturb_adata.var.index.isin(gene_names) + prturb_adata = prturb_adata[:, gene_mask] + + print(f"Evaluating {len(gene_names)} genes (consensus data available for all)") n_features_theta_025 = np.asarray([data[gene_name]['0.25'] for gene_name in gene_names], dtype=int) n_features_theta_075 = np.asarray([data[gene_name]['0.75'] for gene_name in gene_names], dtype=int) diff --git a/src/metrics/regression/run_local.sh b/src/metrics/regression/run_local.sh index 3e3c1d7fc..c008e80f3 100644 --- a/src/metrics/regression/run_local.sh +++ b/src/metrics/regression/run_local.sh @@ -17,7 +17,7 @@ mkdir -p "$save_dir" # datasets to process datasets=('ibd_uc' 'ibd_cd' 'op' 'parsebioscience' "300BCG" "adamson" "replogle" "xaira_HEK293T" "xaira_HCT116" "nakatake" "norman" ) #"300BCG" "ibd" 'parsebioscience', 'xaira_HEK293T' -# datasets=('xaira_HEK293T' ) #"300BCG" "ibd" 'parsebioscience', 'xaira_HEK293T' +datasets=('norman' ) #"300BCG" "ibd" 'parsebioscience', 'xaira_HEK293T' # methods to process methods=( "pearson_corr" "positive_control" "negative_control" "ppcor" "portia" "scenic" "grnboost" "scprint" "scenicplus" "celloracle" "scglue" "figr" "granie") diff --git a/src/metrics/sem/helper.py b/src/metrics/sem/helper.py index c74022b06..840b2c4da 100644 --- a/src/metrics/sem/helper.py +++ b/src/metrics/sem/helper.py @@ -510,8 +510,8 @@ def main(par): print(f"SEM HVG score (max): {np.max(valid_scores_hvg):.4f}") results = { - 'sem_grn': [float(sem_grn_score)], - 'sem_hvg': [float(sem_hvg_score)], + # 'sem_grn': [float(sem_grn_score)], + # 'sem_hvg': [float(sem_hvg_score)], 'sem': 
[float((sem_grn_score + sem_hvg_score) / 2)] } diff --git a/src/metrics/vc/analyze_permutation.py b/src/metrics/vc/analyze_permutation.py deleted file mode 100644 index 520ea135c..000000000 --- a/src/metrics/vc/analyze_permutation.py +++ /dev/null @@ -1,153 +0,0 @@ -""" -Analyze how vc metric scores change when GRN structure is permuted. -Tests robustness by shuffling TF-gene pairs in the network. -""" - -import numpy as np -import pandas as pd -import anndata as ad -from helper import main as main_vc -import sys - -def permute_grn_edges(net_df, permutation_degree=1.0, seed=42): - """ - Permute the GRN by shuffling TF-gene pairs. - - Args: - net_df: DataFrame with 'source', 'target', 'weight' columns - permutation_degree: Fraction of edges to permute (0.0 to 1.0) - seed: Random seed - - Returns: - Permuted network DataFrame - """ - np.random.seed(seed) - net_permuted = net_df.copy() - - n_edges = len(net_df) - n_to_permute = int(n_edges * permutation_degree) - - if n_to_permute == 0: - return net_permuted - - # Select random edges to permute - indices = np.random.choice(n_edges, n_to_permute, replace=False) - - # Shuffle the targets for selected edges - targets = net_permuted.loc[indices, 'target'].values - np.random.shuffle(targets) - net_permuted.loc[indices, 'target'] = targets - - return net_permuted - - -def run_permutation_analysis(par, permutation_degrees=[0.0, 0.2, 0.5, 0.8, 1.0]): - """ - Run vc metric with different levels of GRN permutation. 
- - Args: - par: Parameters dict with paths to data and prediction - permutation_degrees: List of permutation fractions to test - - Returns: - DataFrame with results for each permutation level - """ - results = [] - - # Load original prediction - read as DataFrame from var - pred_adata = ad.read_h5ad(par['prediction']) - original_net = pred_adata.var.copy() - - if 'source' not in original_net.columns or 'target' not in original_net.columns: - # Try to get from varm - if 'skeleton' in pred_adata.varm: - original_net = pd.DataFrame(pred_adata.varm['skeleton'], columns=['source', 'target', 'weight']) - else: - raise ValueError("Cannot find GRN data in prediction file") - - for degree in permutation_degrees: - print(f"\n{'='*60}") - print(f"Testing permutation degree: {degree:.0%}") - print(f"{'='*60}") - - # Permute network - if degree > 0: - permuted_net = permute_grn_edges(original_net, degree, seed=42) - - # Create permuted anndata with same structure - permuted_adata = ad.AnnData(uns=pred_adata.uns.copy()) - permuted_adata.var = permuted_net - - permuted_path = par['prediction'].replace('.h5ad', f'_perm{int(degree*100)}.h5ad') - permuted_adata.write_h5ad(permuted_path) - - # Update parameter - par_temp = par.copy() - par_temp['prediction'] = permuted_path - else: - par_temp = par.copy() - - # Run evaluation - try: - df_result = main_vc(par_temp) - r2_score = df_result['vc'].values[0] - - results.append({ - 'permutation_degree': degree, - 'r2_score': r2_score - }) - - print(f"R² score: {r2_score:.4f}") - - except Exception as e: - print(f"Error at permutation degree {degree}: {e}") - import traceback - traceback.print_exc() - results.append({ - 'permutation_degree': degree, - 'r2_score': np.nan - }) - - return pd.DataFrame(results) - - -if __name__ == '__main__': - # Configuration - dataset = 'op' # Changed from 'replogle' to 'op' - method = 'grnboost' - - par = { - 'prediction': f'resources/results/{dataset}/{dataset}.{method}.{method}.prediction.h5ad', - 
'evaluation_data': f'resources/grn_benchmark/evaluation_data/{dataset}_bulk.h5ad', - 'score': f'output/vc/vc_{dataset}_{method}_permutation.h5ad' - } - - print(f"Dataset: {dataset}") - print(f"Method: {method}") - - # Run permutation analysis - results_df = run_permutation_analysis( - par, - permutation_degrees=[0.0, 0.2, 0.5, 0.8, 1.0] - ) - - # Save results - output_path = f'output/vc/permutation_analysis_{dataset}_{method}.csv' - results_df.to_csv(output_path, index=False) - - print(f"\n{'='*60}") - print("Permutation Analysis Results") - print(f"{'='*60}") - print(results_df.to_string(index=False)) - print(f"\nResults saved to: {output_path}") - - # Calculate score degradation - if len(results_df) > 0 and not results_df['r2_score'].isna().all(): - original_score = results_df.loc[results_df['permutation_degree'] == 0.0, 'r2_score'].values[0] - final_score = results_df.loc[results_df['permutation_degree'] == 1.0, 'r2_score'].values[0] - - if not np.isnan(original_score) and not np.isnan(final_score): - degradation = (original_score - final_score) / original_score * 100 - print(f"\nScore degradation with 100% permutation: {degradation:.1f}%") - print(f"Original R²: {original_score:.4f}") - print(f"Permuted R²: {final_score:.4f}") diff --git a/src/metrics/vc/analyze_robustness.py b/src/metrics/vc/analyze_robustness.py index be8021b45..04e266544 100644 --- a/src/metrics/vc/analyze_robustness.py +++ b/src/metrics/vc/analyze_robustness.py @@ -21,7 +21,7 @@ sys.path.append('src/utils') from helper import main as main_vc -from util import process_links +from util import process_links, parse_args def permute_grn(prediction: pd.DataFrame, degree: float, noise_type: str) -> pd.DataFrame: @@ -316,6 +316,7 @@ def create_robustness_plot(df_results, output_dir): help='Path to evaluation data h5ad file') parser.add_argument('--output_dir', type=str, required=True, help='Output directory for results') + parser.add_argument('--n_top_genes', type=int, default=3000) 
parser.add_argument('--degrees', type=float, nargs='+', default=[0.0, 0.2, 0.5, 1.0], help='Permutation degrees (0.0 to 1.0)') @@ -332,7 +333,8 @@ def create_robustness_plot(df_results, output_dir): 'output_dir': args.output_dir, 'degrees': args.degrees, 'noise_types': args.noise_types, - 'score': f"{args.output_dir}/vc_score.h5ad" + 'score': f"{args.output_dir}/vc_score.h5ad", + 'n_top_genes': args.n_top_genes } # Run analysis diff --git a/src/metrics/vc/helper.py b/src/metrics/vc/helper.py index f0c5cdd1d..7a933b51d 100644 --- a/src/metrics/vc/helper.py +++ b/src/metrics/vc/helper.py @@ -499,7 +499,8 @@ def main(par): gene_mask_grn = np.logical_or(np.any(A_full, axis=1), np.any(A_full, axis=0)) in_degrees = np.sum(A_full != 0, axis=0) out_degrees = np.sum(A_full != 0, axis=1) - n_genes_grn = par['n_top_genes'] + # n_genes_grn = par['n_top_genes'] + n_genes_grn = 1000 # Select top n_genes_grn by connectivity gene_connectivity = in_degrees + out_degrees @@ -621,9 +622,10 @@ def main(par): print(f"VC HVG: {vc_hvg_score:.4f}") print(f"VC (average): {(vc_grn_score + vc_hvg_score) / 2:.4f}") + # add baseline grn that has same target genes -> assumption: cetrain genes are easy to predict results = { - 'vc_grn': [vc_grn_score], - 'vc_hvg': [vc_hvg_score], + # 'vc_grn': [vc_grn_score], + # 'vc_hvg': [vc_hvg_score], 'vc': [float((vc_grn_score + vc_hvg_score) / 2)] } diff --git a/src/metrics/vc/run_local.sh b/src/metrics/vc/run_local.sh index 65c0cb377..93fc032f6 100644 --- a/src/metrics/vc/run_local.sh +++ b/src/metrics/vc/run_local.sh @@ -17,7 +17,7 @@ mkdir -p "$save_dir" # datasets to process datasets=( "replogle" "xaira_HEK293T" "xaira_HCT116" "nakatake" "norman" "adamson" 'parsebioscience' 'op' "300BCG" 'ibd_uc' 'ibd_cd') #"300BCG" "ibd" 'parsebioscience', 'xaira_HEK293T' -datasets=( "op" "300BCG" "parsebioscience" "ibd" ) +datasets=( "norman" ) # methods to process methods=( "pearson_corr" "positive_control" "negative_control" "ppcor" "portia" "scenic" "grnboost" 
"scprint" "scenicplus" "celloracle" "scglue" "figr" "granie") # methods=( "grnboost") diff --git a/src/metrics/vc/run_robustness.sh b/src/metrics/vc/run_robustness.sh index ba482e4a9..8ac3c3baf 100644 --- a/src/metrics/vc/run_robustness.sh +++ b/src/metrics/vc/run_robustness.sh @@ -12,7 +12,7 @@ set -euo pipefail # Configuration DATASET="op" -METHOD="grnboost" +METHOD="pearson_corr" OUTPUT_DIR="output/vc/robustness" # Input files @@ -36,7 +36,7 @@ python src/metrics/vc/analyze_robustness.py \ --prediction "${PREDICTION}" \ --evaluation_data "${EVALUATION_DATA}" \ --output_dir "${OUTPUT_DIR}" \ - --degrees 0.0 0.2 0.5 1.0 \ + --degrees 0.0 0.5 1.0 \ --noise_types net echo "" diff --git a/src/process_data/helper_data.py b/src/process_data/helper_data.py index 1e726fcad..43518bcdd 100644 --- a/src/process_data/helper_data.py +++ b/src/process_data/helper_data.py @@ -66,7 +66,7 @@ def normalize_func(adata, log_norm=True, pearson_residual=False, target_sum=1e4) import scipy.sparse as sp counts = adata.layers['counts'].copy() if 'counts' in adata.layers else adata.X.copy() adata.layers['counts'] = sp.csr_matrix(counts) if not sp.issparse(counts) else counts - assert sp.issparse(counts), "Counts matrix must be sparse." + assert sp.issparse(adata.layers['counts']), "Counts matrix must be sparse." 
print("min:", counts.min(), "max:", counts.max(), "mean:", counts.mean()) if pearson_residual: diff --git a/src/process_data/main/ibd/script.py b/src/process_data/main/ibd/script.py index 0259ba581..d34167b1f 100644 --- a/src/process_data/main/ibd/script.py +++ b/src/process_data/main/ibd/script.py @@ -191,5 +191,7 @@ def harmonize(adata_rna, adata_atac): adata_rna_bulk_d = adata_rna_bulk[adata_rna_bulk.obs['disease']==disease] adata_rna_bulk_d.uns['dataset_id'] = f'ibd_{disease.lower()}' adata_rna_bulk_d.write(f'resources/extended_data/ibd_{disease}_bulk.h5ad') +adata_rna_bulk.uns['dataset_id'] = f'ibd' +adata_rna_bulk.write(f'resources/extended_data/ibd_bulk.h5ad') print('Done') \ No newline at end of file diff --git a/src/process_data/main/norman/script.py b/src/process_data/main/norman/script.py index 359f3f474..d88cba64c 100644 --- a/src/process_data/main/norman/script.py +++ b/src/process_data/main/norman/script.py @@ -29,6 +29,7 @@ sys.path.append(meta["resources_dir"]) from helper_data import sum_by +from helper_data import wrapper_large_perturbation_data, split_data_gene_perturbation, split_control_groups def add_metadata(adata): @@ -39,7 +40,7 @@ def add_metadata(adata): adata.uns['dataset_id'] = 'norman' adata.uns['dataset_name'] = 'Norman' adata.uns['dataset_organism'] = 'human' - adata.uns['normalization_id'] = 'X_norm' + adata.uns['normalization_id'] = 'lognorm' return adata if __name__ == '__main__': @@ -62,48 +63,80 @@ def add_metadata(adata): adata.var.index = adata.var.index.astype(str) adata.obs = adata.obs[['perturbation', 'is_control', 'perturbation_type']] - # preprocess - sc.pp.filter_cells(adata, min_genes=100) - sc.pp.filter_genes(adata, min_cells=10) - - # - - adata.layers['X_norm'] = adata.X.copy() - - # - split to inference and evaluation datasets - ctr_pertb = adata[adata.obs['is_control']].obs['perturbation'].unique() - non_ctr_pertubs =adata[~adata.obs['is_control']].obs['perturbation'].unique() - train_perturbs, test_perturbs = 
train_test_split(non_ctr_pertubs, test_size=.5, random_state=32) - train_perturbs = np.concatenate([train_perturbs, ctr_pertb]) # add control perturbations to test set for ws_distance - test_perturbs = np.concatenate([test_perturbs, ctr_pertb]) - - adata_train_sc = adata[adata.obs['perturbation'].isin(train_perturbs)] - adata_test_sc = adata[adata.obs['perturbation'].isin(test_perturbs)] - - - # - filter genes and cells - sc.pp.filter_cells(adata_train_sc, min_genes=100) - sc.pp.filter_genes(adata_train_sc, min_cells=10) - - sc.pp.filter_cells(adata_test_sc, min_genes=100) - sc.pp.filter_genes(adata_test_sc, min_cells=10) - - # - pseudo bulk - adata_bulk = sum_by(adata, unique_mapping=True, col='perturbation') - norman_test_bulk = sum_by(adata_test_sc, unique_mapping=True, col='perturbation') # summing over X_norm - - # - normalize evaluation data - norman_test_bulk.layers['X_norm'] = norman_test_bulk.X.copy() - adata_train_sc.layers['X_norm'] = adata_train_sc.X.copy() - adata_bulk.layers['X_norm'] = adata_bulk.X.copy() - - # - add metadata - adata_bulk = add_metadata(adata_bulk) - norman_test_bulk = add_metadata(norman_test_bulk) - adata_test_sc = add_metadata(adata_test_sc) - adata_train_sc = add_metadata(adata_train_sc) - # - save - print('saving...') - adata_bulk.write(par['norman_bulk']) - adata_test_sc.write(par['norman_test_sc']) - norman_test_bulk.write(par['norman_test_bulk']) - adata_train_sc.write(par['norman_train_sc']) \ No newline at end of file + # preprocess + if False: + sc.pp.filter_cells(adata, min_genes=100) + sc.pp.filter_genes(adata, min_cells=10) + + # - + adata.layers['X_norm'] = adata.X.copy() + + # - split to inference and evaluation datasets + ctr_pertb = adata[adata.obs['is_control']].obs['perturbation'].unique() + non_ctr_pertubs =adata[~adata.obs['is_control']].obs['perturbation'].unique() + train_perturbs, test_perturbs = train_test_split(non_ctr_pertubs, test_size=.5, random_state=32) + train_perturbs = 
np.concatenate([train_perturbs, ctr_pertb]) # add control perturbations to test set for ws_distance + test_perturbs = np.concatenate([test_perturbs, ctr_pertb]) + + adata_train_sc = adata[adata.obs['perturbation'].isin(train_perturbs)] + adata_test_sc = adata[adata.obs['perturbation'].isin(test_perturbs)] + + + # - filter genes and cells + sc.pp.filter_cells(adata_train_sc, min_genes=100) + sc.pp.filter_genes(adata_train_sc, min_cells=10) + + sc.pp.filter_cells(adata_test_sc, min_genes=100) + sc.pp.filter_genes(adata_test_sc, min_cells=10) + + # - pseudo bulk + adata_bulk = sum_by(adata, unique_mapping=True, col='perturbation') + norman_test_bulk = sum_by(adata_test_sc, unique_mapping=True, col='perturbation') # summing over X_norm + + # - normalize evaluation data (proper log normalization to avoid overflow) + # For pseudobulk data, normalize and log transform + sc.pp.normalize_total(norman_test_bulk, target_sum=1e4) + sc.pp.log1p(norman_test_bulk) + norman_test_bulk.layers['X_norm'] = norman_test_bulk.X.copy() + + sc.pp.normalize_total(adata_bulk, target_sum=1e4) + sc.pp.log1p(adata_bulk) + adata_bulk.layers['X_norm'] = adata_bulk.X.copy() + + # For single-cell data, just copy (already filtered and should be reasonable) + adata_train_sc.layers['X_norm'] = adata_train_sc.X.copy() + adata_test_sc.layers['X_norm'] = adata_test_sc.X.copy() + + # - clean infinity values from all layers + for adata_obj, name in [(norman_test_bulk, 'norman_test_bulk'), + (adata_train_sc, 'adata_train_sc'), + (adata_bulk, 'adata_bulk'), + (adata_test_sc, 'adata_test_sc')]: + for layer_name in adata_obj.layers.keys(): + layer_data = adata_obj.layers[layer_name] + if csr_matrix is not None and isinstance(layer_data, csr_matrix): + layer_data = layer_data.toarray() + if np.any(np.isinf(layer_data)): + print(f"Warning: Found {np.sum(np.isinf(layer_data))} infinity values in {name}.layers['{layer_name}']. 
Replacing with 0.") + layer_data[np.isinf(layer_data)] = 0 + adata_obj.layers[layer_name] = csr_matrix(layer_data) if isinstance(adata_obj.layers[layer_name], csr_matrix) else layer_data + + # - add metadata + adata_bulk = add_metadata(adata_bulk) + norman_test_bulk = add_metadata(norman_test_bulk) + adata_test_sc = add_metadata(adata_test_sc) + adata_train_sc = add_metadata(adata_train_sc) + # - save + print('saving...') + adata_bulk.write(par['norman_bulk']) + adata_test_sc.write(par['norman_test_sc']) + norman_test_bulk.write(par['norman_test_bulk']) + adata_train_sc.write(par['norman_train_sc']) + else: + adata = split_control_groups(adata, perturbation_col='perturbation', control_flag_col='is_control', new_col='control_split') + + wrapper_large_perturbation_data(adata, split_func=split_data_gene_perturbation, + covariates=['perturbation', 'control_split'], + qc_perturbation_effect=False, + add_metadata=add_metadata, + save_name='norman') \ No newline at end of file diff --git a/src/utils/config.env b/src/utils/config.env new file mode 100644 index 000000000..7283c74fb --- /dev/null +++ b/src/utils/config.env @@ -0,0 +1,32 @@ +# Auto-generated dataset configuration +# Format: DATASET_VARIABLE=value + +# Global lists (comma-separated) +METHODS="positive_control,pearson_corr,grnboost,ppcor,portia,scenic,geneformer,scgpt,ppcor,scenicplus,celloracle,figr,granie,scglue,scprint,negative_control" +METRICS="r_precision,r_recall,ws_precision,ws_recall,vc,sem,t_rec_precision,t_rec_recall,rc_tf_act,tfb_f1,gs_f1" +DATASETS="op,parsebioscience,300BCG,ibd_uc,ibd_cd,replogle,xaira_HEK293T,xaira_HCT116,nakatake,norman" +FINAL_METRICS="r_precision,r_recall,vc,sem,ws_precision,ws_recall" + +# Cell types +CELLTYPE_replogle="K562" +CELLTYPE_norman="K562" +CELLTYPE_xaira_HEK293T="HEK293T" +CELLTYPE_xaira_HCT116="HCT116" +CELLTYPE_op="PBMC" +CELLTYPE_parsebioscience="PBMC" +CELLTYPE_300BCG="PBMC" +CELLTYPE_ibd_uc="PBMC" +CELLTYPE_ibd_cd="PBMC" +CELLTYPE_nakatake="" + +# Metrics 
(comma-separated) +METRICS_replogle="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery,vc" +METRICS_norman="regression,ws_distance,tf_binding,gs_recovery,vc" +METRICS_nakatake="regression,sem,gs_recovery,vc" +METRICS_op="regression,vc,rc_tf_act,tf_binding,sem,gs_recovery" +METRICS_300BCG="regression,vc,rc_tf_act,tf_binding,sem,gs_recovery" +METRICS_ibd_uc="regression,tf_binding,gs_recovery,rc_tf_act" +METRICS_ibd_cd="regression,tf_binding,gs_recovery,rc_tf_act" +METRICS_parsebioscience="regression,vc,rc_tf_act,tf_binding,sem,gs_recovery" +METRICS_xaira_HEK293T="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery,vc" +METRICS_xaira_HCT116="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery,vc" diff --git a/src/utils/config.py b/src/utils/config.py index 230a51bee..1ad57379b 100644 --- a/src/utils/config.py +++ b/src/utils/config.py @@ -4,6 +4,88 @@ METHODS = ['positive_control', 'pearson_corr', 'grnboost', 'ppcor', 'portia', 'scenic', 'geneformer', 'scgpt', 'ppcor', 'scenicplus', 'celloracle', 'figr', 'granie', 'scglue', 'scprint', 'negative_control'] + + +DATASET_INFO = { + "op": { + "cell_type": "PBMC", + "perturbation_type": "Drugs", + "Inference data": " sc", + 'Measurement time': "24 hours", + "Modality": 'Multiomics' + }, + "ibd_uc": { + "cell_type": "PBMC", + "perturbation_type": "Chemicals/ bacteria", + "Inference data": "sc", + 'Measurement time': "24 hours", + "Modality": 'Multiomics' + }, + "ibd_cd": { + "cell_type": "PBMC", + "perturbation_type": "Chemicals/ bacteria", + "Inference data": "sc", + 'Measurement time': "24 hours", + "Modality": 'Multiomics' + }, + "300BCG": { + "cell_type": "PBMC", + "perturbation_type": "Chemicals", + "Inference data": "sc", + 'Measurement time': 'T0 and 3 months', + "Modality": 'Transcriptmoics' + }, + "parsebioscience": { + "cell_type": "PBMC", + "perturbation_type": "Cytokines", + "Inference data": " sc/bulk", + 'Measurement time': "24 hours", + "Modality": 'Transcriptmoics' + }, + 
"xaira_HEK293T": { + "cell_type": "HEK293T", + "perturbation_type": "Knockout", + "Inference data": " sc/bulk", + 'Measurement time': "7 days", + "Modality": 'Transcriptmoics' + }, + "xaira_HCT116": { + "cell_type": "HCT116", + "perturbation_type": "Knockout", + "Inference data": " sc/bulk", + 'Measurement time': "7 days", + "Modality": 'Transcriptmoics' + }, + "replogle": { + "cell_type": "K562", + "perturbation_type": "Knockout", + "Inference data": " sc/bulk", + 'Measurement time': "7 days", + "Modality": 'Transcriptmoics' + }, + "nakatake": { + "cell_type": "SEES3 (PSC)", + "perturbation_type": "Overexpression", + "Inference data": "bulk", + 'Measurement time': "2 days", + "Modality": 'Transcriptmoics' + }, + "norman": { + "cell_type": "K562", + "perturbation_type": "Activation", + "Inference data": "sc", + 'Measurement time': "7 days", + "Modality": 'Transcriptmoics' + }, + "adamson": { + "cell_type": "K562", + "perturbation_type": "Knockout", + "Inference data": "sc", + 'Measurement time': "7 days", + "Modality": 'Transcriptmoics' + }, + } + DATASET_GROUPS = { "op": { "match": ["plate_name", "donor_id", "cell_type", "well"], @@ -31,12 +113,14 @@ "match": ["donor_id", "cell_type"], "loose_match": ["donor_id", "cell_type"], "cv": ["perturbation", "cell_type"], + "rc_tf_ac": ["perturbation", "cell_type"] }, "ibd_cd": { 'anchors': ['donor_id'], "match": ["donor_id", "cell_type"], "loose_match": ["donor_id", "cell_type"], "cv": ["perturbation", "cell_type"], + "rc_tf_ac": ["perturbation", "cell_type"] }, "replogle": { "match": ["perturbation"], @@ -88,17 +172,17 @@ } DATASETS_METRICS = { - 'replogle': ['regression', 'ws_distance', 'tf_recovery', 'tf_binding', 'sem', 'gs_recovery'], + 'replogle': ['regression', 'ws_distance', 'tf_recovery', 'tf_binding', 'sem', 'gs_recovery', 'vc'], # 'adamson': ['regression', 'tf_binding', 'sem', 'gs_recovery'], - 'norman': ['regression', 'ws_distance', 'tf_binding', 'sem', 'gs_recovery'], - 'nakatake': ['regression', 'sem', 
'gs_recovery'], + 'norman': ['regression', 'ws_distance', 'tf_binding', 'gs_recovery', 'vc'], + 'nakatake': ['regression', 'sem', 'gs_recovery', 'vc'], 'op': ['regression', 'vc', 'rc_tf_act', 'tf_binding', 'sem', 'gs_recovery'], '300BCG': ['regression', 'vc', 'rc_tf_act', 'tf_binding', 'sem', 'gs_recovery'], - 'ibd_uc': ['regression', 'tf_binding', 'gs_recovery'], - 'ibd_cd': ['regression', 'tf_binding', 'gs_recovery'], + 'ibd_uc': ['regression', 'tf_binding', 'gs_recovery', 'rc_tf_act'], + 'ibd_cd': ['regression', 'tf_binding', 'gs_recovery', 'rc_tf_act'], 'parsebioscience': ['regression', 'vc', 'rc_tf_act', 'tf_binding', 'sem', 'gs_recovery'], - 'xaira_HEK293T': ['regression', 'ws_distance', 'tf_recovery', 'tf_binding', 'sem', 'gs_recovery'], - 'xaira_HCT116': ['regression', 'ws_distance', 'tf_recovery', 'tf_binding', 'sem', 'gs_recovery'], + 'xaira_HEK293T': ['regression', 'ws_distance', 'tf_recovery', 'tf_binding', 'sem', 'gs_recovery', 'vc'], + 'xaira_HCT116': ['regression', 'ws_distance', 'tf_recovery', 'tf_binding', 'sem', 'gs_recovery', 'vc'], } @@ -108,27 +192,61 @@ METRICS_DATASETS.setdefault(metric, []).append(dataset) METRICS = [ - 'r_precision', 'r_recall', 'r_f1', - 'ws_precision', 'ws_recall', 'ws_f1', - 'vc', 'vc_raw', 'vc_precision', - 'sem', 'sem_precision', 'sem_raw', - 't_rec_precision', 't_rec_recall', 't_rec_f1', + 'r_precision', 'r_recall', + 'ws_precision', 'ws_recall', + 'vc', + 'sem', + # 'sem_raw', + 't_rec_precision', 't_rec_recall', + # 't_rec_f1', 'rc_tf_act', - 'tfb_precision', 'tfb_recall', 'tfb_f1', - 'gs_precision', 'gs_recall', 'gs_f1', + # 'tfb_precision', 'tfb_recall', + 'tfb_f1', + # 'gs_precision', 'gs_recall', + 'gs_f1', ] FINAL_METRICS = [ - 'r_precision', 'r_recall', + 'r_precision', + 'r_recall', 'vc', 'sem', - 'ws_precision', 'ws_recall', - 't_rec_precision', 't_rec_recall', - 'rc_tf_act', - 'tfb_f1', - 'gs_f1', + 'ws_precision', + 'ws_recall', + # 'tfb_f1', + # 'gs_f1', ] - +METRIC_THRESHOLDS = { + # Regression metrics: 
R2-based, meaningful if > 0.1 + 'r_precision': 0.1, + 'r_recall': 0.1, + + # Wasserstein distance metrics: precision/recall based, meaningful if > 0.05 + 'ws_precision': 0.5, + 'ws_recall': 0.5, + + # Virtual cell: r2 scores + 'vc': 0.1, + + # SEM (Structural Equation Modeling): goodness of fit (0-1), meaningful if > 0.4 + 'sem': 0.1, + + # TF recovery metrics: t-statistics from paired t-test, meaningful if > 2.0 (p<0.05) + 't_rec_precision': 2.0, + 't_rec_recall': 2.0, + + # Replica consistency (RC) for TF activity: consistency score (0-1) based on MAD, meaningful if > 0.3 + # Measures consistency of TF activity across biological replicates (1=perfect, 0=no consistency) + 'rc_tf_act': 0.3, + + # TF binding F1: F1 for TF-target binding, meaningful if > 0.05 + # Based on ChIP-seq or other binding data + 'tfb_f1': 0.05, + + # Gene set recovery F1: F1 for gene set enrichment, meaningful if > 0.1 + # Tests if predicted regulators recover known gene sets + 'gs_f1': 0.1, +} surrogate_names = { 'scprint': 'scPRINT', 'collectri': 'CollectRI', @@ -149,15 +267,17 @@ 'negative_control':'Negative Ctrl', 'scgpt': 'scGPT', 'spearman_corr': 'Spearman Corr.', + 'geneformer': 'GeneFormer', 'regression': 'Regression', 'tf_recovery': 'TF Recovery', - 'r_precision': "R (precision)", - 'r_recall': "R (recall)", - 'r_f1': "R (F1)", - 'r_raw': "R (raw)", + 'r_precision': "Regression (precision)", + 'r_recall': "Regression (recall)", + 'r_f1': "Regression (F1)", + 'r_raw': "Regression (raw)", 'ws_precision': "WS (precision)", 'ws_recall': "WS (recall)", + 'ws_distance': "WS distance", 'ws_f1': "WS (F1)", 'ws_raw': "WS (raw)", 'sem': 'SEM', @@ -170,9 +290,11 @@ 'tfb_precision': 'TF binding (precision)', 'tfb_recall': 'TF binding (recall)', 'tfb_f1': 'TF binding', + 'tf_binding': 'TF binding', 'gs_precision': 'GS (precision)', 'gs_recall': 'GS (recall)', - 'gs_f1': 'Gene sets', + 'gs_f1': 'Gene sets recovery', + 'gs_recovery': 'Gene sets recovery', 'op':'OPSCA', 'nakatake': 'Nakatake', @@ 
-187,15 +309,22 @@ '300BCG': '300BCG' } -def generate_config_env(output_path='src/utils/dataset_config.env'): +def generate_config_env(output_path='src/utils/config.env'): """Generate a simple env-style config file with dataset-specific configurations.""" with open(output_path, 'w') as f: f.write("# Auto-generated dataset configuration\n") f.write("# Format: DATASET_VARIABLE=value\n\n") + # Global lists + f.write("# Global lists (comma-separated)\n") + f.write(f'METHODS="{",".join(METHODS)}"\n') + f.write(f'METRICS="{",".join(METRICS)}"\n') + f.write(f'DATASETS="{",".join(DATASETS)}"\n') + f.write(f'FINAL_METRICS="{",".join(FINAL_METRICS)}"\n') + # Cell types - f.write("# Cell types\n") + f.write("\n# Cell types\n") for dataset, cell_type in DATASETS_CELLTYPES.items(): var_name = f"CELLTYPE_{dataset}" f.write(f'{var_name}="{cell_type}"\n') @@ -214,7 +343,7 @@ def generate_config_env(output_path='src/utils/dataset_config.env'): if __name__ == '__main__': import argparse parser = argparse.ArgumentParser(description='Generate dataset configuration') - parser.add_argument('--output', type=str, default='src/utils/dataset_config.env', + parser.add_argument('--output', type=str, default='src/utils/config.env', help='Output path for the config file') args = parser.parse_args() diff --git a/src/utils/dataset_config.env b/src/utils/dataset_config.env index 861b35c55..c6b08ff4e 100644 --- a/src/utils/dataset_config.env +++ b/src/utils/dataset_config.env @@ -4,7 +4,6 @@ # Cell types CELLTYPE_replogle="K562" CELLTYPE_norman="K562" -CELLTYPE_adamson="K562" CELLTYPE_xaira_HEK293T="HEK293T" CELLTYPE_xaira_HCT116="HCT116" CELLTYPE_op="PBMC" @@ -15,14 +14,13 @@ CELLTYPE_ibd_cd="PBMC" CELLTYPE_nakatake="" # Metrics (comma-separated) -METRICS_replogle="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery" -METRICS_adamson="regression,tf_binding,sem,gs_recovery" -METRICS_norman="regression,ws_distance,tf_binding,sem,gs_recovery" -METRICS_nakatake="regression,sem,gs_recovery" 
+METRICS_replogle="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery,vc" +METRICS_norman="regression,ws_distance,tf_binding,gs_recovery,vc" +METRICS_nakatake="regression,sem,gs_recovery,vc" METRICS_op="regression,vc,rc_tf_act,tf_binding,sem,gs_recovery" METRICS_300BCG="regression,vc,rc_tf_act,tf_binding,sem,gs_recovery" -METRICS_ibd_uc="regression,vc,tf_binding,sem,gs_recovery" -METRICS_ibd_cd="regression,vc,tf_binding,sem,gs_recovery" +METRICS_ibd_uc="regression,tf_binding,gs_recovery,rc_tf_act" +METRICS_ibd_cd="regression,tf_binding,gs_recovery,rc_tf_act" METRICS_parsebioscience="regression,vc,rc_tf_act,tf_binding,sem,gs_recovery" -METRICS_xaira_HEK293T="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery" -METRICS_xaira_HCT116="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery" +METRICS_xaira_HEK293T="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery,vc" +METRICS_xaira_HCT116="regression,ws_distance,tf_recovery,tf_binding,sem,gs_recovery,vc" diff --git a/src/workflows/run_grn_evaluation/config.vsh.yaml b/src/workflows/run_grn_evaluation/config.vsh.yaml index bf3833843..e16609966 100644 --- a/src/workflows/run_grn_evaluation/config.vsh.yaml +++ b/src/workflows/run_grn_evaluation/config.vsh.yaml @@ -145,7 +145,7 @@ dependencies: - name: metrics/vc - name: metrics/rc_tf_act - name: metrics/sem - - name: metrics/anchor_regression + # - name: metrics/anchor_regression - name: metrics/tf_binding - name: metrics/gs_recovery - name: utils/extract_uns_metadata diff --git a/src/workflows/run_grn_evaluation/main.nf b/src/workflows/run_grn_evaluation/main.nf index 5b93c9bf9..0027271d3 100644 --- a/src/workflows/run_grn_evaluation/main.nf +++ b/src/workflows/run_grn_evaluation/main.nf @@ -17,7 +17,7 @@ workflow run_wf { regression, ws_distance, tf_recovery, - anchor_regression, + // anchor_regression, rc_tf_act, sem, vc, diff --git a/test.ipynb b/test.ipynb index 2719ea804..9aaea7f49 100644 --- a/test.ipynb +++ b/test.ipynb @@ 
-50,7 +50,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 7, "metadata": {}, "outputs": [ { @@ -85,9 +85,9 @@ }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ - "
      " + "
      " ] }, "metadata": {}, @@ -115,191 +115,6 @@ " plot_heatmap(df_subset, name='', cmap=\"viridis\", ax=ax)\n", " plt.title(f'{dataset}')" ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Assemble the results from differnet runs" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "!rm -r resources/results/all_main/" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Copied identical file: method_configs.yaml\n", - "Copied identical file: metric_configs.yaml\n", - "Merged: dataset_uns.yaml\n", - "Merged: score_uns.yaml\n", - "Merged: trace.txt (duplicates removed)\n", - "Copied unique file: state.yaml → state.yaml\n", - "Copied unique file: op_.celloracle.celloracle.prediction.h5ad → op_.celloracle.celloracle.prediction.h5ad\n", - "Copied unique file: scplus_mdata.h5mu.2DAaAA8E → scplus_mdata.h5mu.2DAaAA8E\n", - "Copied unique file: op_.negative_control.negative_control.prediction.h5ad → op_.negative_control.negative_control.prediction.h5ad\n", - "Copied unique file: op_.scenicplus.scenicplus.prediction.h5ad → op_.scenicplus.scenicplus.prediction.h5ad\n", - "Copied unique file: op_.portia.portia.prediction.h5ad → op_.portia.portia.prediction.h5ad\n", - "Copied unique file: op_.granie.granie.prediction.h5ad → op_.granie.granie.prediction.h5ad\n", - "Copied unique file: op_.scprint.scprint.prediction.h5ad → op_.scprint.scprint.prediction.h5ad\n", - "Copied unique file: op_.pearson_corr.pearson_corr.prediction.h5ad → op_.pearson_corr.pearson_corr.prediction.h5ad\n", - "Copied unique directory: output → output\n", - "Copied unique file: op_.scglue.scglue.prediction.h5ad → op_.scglue.scglue.prediction.h5ad\n", - "Copied unique file: op_.ppcor.ppcor.prediction.h5ad → op_.ppcor.ppcor.prediction.h5ad\n", - "Copied unique file: 
op_.positive_control.positive_control.prediction.h5ad → op_.positive_control.positive_control.prediction.h5ad\n", - "Copied unique file: op_.scenic.scenic.prediction.h5ad → op_.scenic.scenic.prediction.h5ad\n", - "Copied unique file: op_.figr.figr.prediction.h5ad → op_.figr.figr.prediction.h5ad\n", - "Copied unique file: task_info.yaml → task_info.yaml\n", - "Copied unique file: op_.grnboost2.grnboost2.prediction.h5ad → op_.grnboost2.grnboost2.prediction.h5ad\n", - "Copied unique file: state.yaml → state_nakatake.yaml\n", - "Copied unique file: nakatake_.positive_control.positive_control.prediction.h5ad → nakatake_.positive_control.positive_control.prediction.h5ad\n", - "Copied unique file: nakatake_.portia.portia.prediction.h5ad → nakatake_.portia.portia.prediction.h5ad\n", - "Copied unique file: nakatake_.grnboost.grnboost.prediction.h5ad → nakatake_.grnboost.grnboost.prediction.h5ad\n", - "Copied unique file: nakatake_.ppcor.ppcor.prediction.h5ad → nakatake_.ppcor.ppcor.prediction.h5ad\n", - "Copied unique file: nakatake_.pearson_corr.pearson_corr.prediction.h5ad → nakatake_.pearson_corr.pearson_corr.prediction.h5ad\n", - "Copied unique file: nakatake_.negative_control.negative_control.prediction.h5ad → nakatake_.negative_control.negative_control.prediction.h5ad\n", - "Copied unique file: nakatake_.scenic.scenic.prediction.h5ad → nakatake_.scenic.scenic.prediction.h5ad\n", - "Copied unique file: task_info.yaml → task_info_nakatake.yaml\n", - "Copied unique file: norman_.grnboost2.grnboost2.prediction.h5ad → norman_.grnboost2.grnboost2.prediction.h5ad\n", - "Copied unique file: state.yaml → state_norman.yaml\n", - "Copied unique file: norman_.ppcor.ppcor.prediction.h5ad → norman_.ppcor.ppcor.prediction.h5ad\n", - "Copied unique file: norman_.scprint.scprint.prediction.h5ad → norman_.scprint.scprint.prediction.h5ad\n", - "Copied unique file: norman_.pearson_corr.pearson_corr.prediction.h5ad → norman_.pearson_corr.pearson_corr.prediction.h5ad\n", - "Copied unique 
file: norman_.portia.portia.prediction.h5ad → norman_.portia.portia.prediction.h5ad\n", - "Copied unique file: norman_.negative_control.negative_control.prediction.h5ad → norman_.negative_control.negative_control.prediction.h5ad\n", - "Copied unique file: norman_.scenic.scenic.prediction.h5ad → norman_.scenic.scenic.prediction.h5ad\n", - "Copied unique file: norman_.positive_control.positive_control.prediction.h5ad → norman_.positive_control.positive_control.prediction.h5ad\n", - "Copied unique file: task_info.yaml → task_info_norman.yaml\n", - "Copied unique file: state.yaml → state_replogle.yaml\n", - "Copied unique file: replogle_.pearson_corr.pearson_corr.prediction.h5ad → replogle_.pearson_corr.pearson_corr.prediction.h5ad\n", - "Copied unique file: replogle_.positive_control.positive_control.prediction.h5ad → replogle_.positive_control.positive_control.prediction.h5ad\n", - "Copied unique file: replogle_.portia.portia.prediction.h5ad → replogle_.portia.portia.prediction.h5ad\n", - "Copied unique file: replogle_.grnboost2.grnboost2.prediction.h5ad → replogle_.grnboost2.grnboost2.prediction.h5ad\n", - "Copied unique file: replogle_.negative_control.negative_control.prediction.h5ad → replogle_.negative_control.negative_control.prediction.h5ad\n", - "Copied unique file: replogle_.ppcor.ppcor.prediction.h5ad → replogle_.ppcor.ppcor.prediction.h5ad\n", - "Copied unique file: task_info.yaml → task_info_replogle.yaml\n", - "Copied unique file: replogle_.scenic.scenic.prediction.h5ad → replogle_.scenic.scenic.prediction.h5ad\n", - "Copied unique file: state.yaml → state_adamson.yaml\n", - "Copied unique file: adamson_.portia.portia.prediction.h5ad → adamson_.portia.portia.prediction.h5ad\n", - "Copied unique file: adamson_.negative_control.negative_control.prediction.h5ad → adamson_.negative_control.negative_control.prediction.h5ad\n", - "Copied unique file: adamson_.pearson_corr.pearson_corr.prediction.h5ad → adamson_.pearson_corr.pearson_corr.prediction.h5ad\n", - 
"Copied unique file: adamson_.ppcor.ppcor.prediction.h5ad → adamson_.ppcor.ppcor.prediction.h5ad\n", - "Copied unique file: adamson_.scenic.scenic.prediction.h5ad → adamson_.scenic.scenic.prediction.h5ad\n", - "Copied unique file: adamson_.grnboost2.grnboost2.prediction.h5ad → adamson_.grnboost2.grnboost2.prediction.h5ad\n", - "Copied unique file: adamson_.positive_control.positive_control.prediction.h5ad → adamson_.positive_control.positive_control.prediction.h5ad\n", - "Copied unique file: task_info.yaml → task_info_adamson.yaml\n" - ] - } - ], - "source": [ - "import os\n", - "import shutil\n", - "import yaml\n", - "from pathlib import Path\n", - "from collections import OrderedDict\n", - "\n", - "base_dir = 'resources/results/'\n", - "save_dir = 'resources/results/all_main/'\n", - "runs = ['op', 'nakatake', 'norman', 'replogle', 'adamson']\n", - "\n", - "os.makedirs(save_dir, exist_ok=True)\n", - "\n", - "# 1. Copy one version of the identical files\n", - "identical_files = ['method_configs.yaml', 'metric_configs.yaml']\n", - "for fname in identical_files:\n", - " src = os.path.join(base_dir, f'{runs[0]}_run', fname)\n", - " dst = os.path.join(save_dir, fname)\n", - " shutil.copyfile(src, dst)\n", - " print(f\"Copied identical file: {fname}\")\n", - "\n", - "# 2. Merge dataset_uns.yaml by appending all contents\n", - "merged_uns = []\n", - "for run in runs:\n", - " path = os.path.join(base_dir, f'{run}_run', 'dataset_uns.yaml')\n", - "\n", - " with open(path, 'r') as f:\n", - " data = yaml.safe_load(f)\n", - " merged_uns.extend(data)\n", - " \n", - "with open(os.path.join(save_dir, 'dataset_uns.yaml'), 'w') as f:\n", - " yaml.dump(merged_uns, f)\n", - "print(\"Merged: dataset_uns.yaml\")\n", - "\n", - "# 3. 
Merge score_uns.yaml similarly\n", - "merged_scores = []\n", - "for run in runs:\n", - " path = os.path.join(base_dir, f'{run}_run', 'score_uns.yaml')\n", - "\n", - " with open(path, 'r') as f:\n", - " data = yaml.safe_load(f)\n", - " # - remove those with missing (because of the metric)\n", - " data = [d for d in data if d is not None and 'missing' not in str(d)]\n", - " \n", - " # print(str(data[0]))\n", - " # aa\n", - " # missing\n", - " if data:\n", - " if isinstance(data, dict):\n", - " merged_scores.append(data)\n", - " elif isinstance(data, list):\n", - " merged_scores.extend(data)\n", - " else:\n", - " print(f\"Unexpected format in {path}: {type(data)}\")\n", - "\n", - "with open(os.path.join(save_dir, 'score_uns.yaml'), 'w') as f:\n", - " yaml.dump(merged_scores, f)\n", - "print(\"Merged: score_uns.yaml\")\n", - "\n", - "# 4. Merge trace.txt with deduplication\n", - "seen_lines = OrderedDict()\n", - "for run in runs:\n", - " path = os.path.join(base_dir, f'{run}_run', 'trace.txt')\n", - " \n", - " with open(path, 'r') as f:\n", - " for line in f:\n", - " seen_lines[line] = None\n", - "\n", - "with open(os.path.join(save_dir, 'trace.txt'), 'w') as f:\n", - " for line in seen_lines.keys():\n", - " f.write(line)\n", - "df = pd.read_csv(os.path.join(save_dir, 'trace.txt'), sep='\\t')\n", - "df = df.drop_duplicates(subset=['name'])\n", - "df.to_csv(os.path.join(save_dir, 'trace.txt'), sep='\\t')\n", - "print(\"Merged: trace.txt (duplicates removed)\")\n", - "\n", - "# 5. 
Copy other unknown files/directories\n", - "all_known = set(identical_files + ['dataset_uns.yaml', 'score_uns.yaml', 'trace.txt'])\n", - "\n", - "for run in runs:\n", - " run_dir = Path(base_dir) / f'{run}_run'\n", - " for file_path in run_dir.iterdir():\n", - " if file_path.name in all_known:\n", - " continue\n", - "\n", - " dest_path = Path(save_dir) / file_path.name\n", - "\n", - " if dest_path.exists():\n", - " dest_path = Path(save_dir) / f\"{file_path.stem}_{run}{file_path.suffix}\"\n", - "\n", - " if file_path.is_file():\n", - " shutil.copyfile(file_path, dest_path)\n", - " print(f\"Copied unique file: {file_path.name} → {dest_path.name}\")\n", - " elif file_path.is_dir():\n", - " shutil.copytree(file_path, dest_path)\n", - " print(f\"Copied unique directory: {file_path.name} → {dest_path.name}\")" - ] } ], "metadata": {