Skip to content

Commit 8d3f714

Browse files
committed
add citations, references to libraries used
1 parent 9815080 commit 8d3f714

File tree

2 files changed

+103
-20
lines changed

2 files changed

+103
-20
lines changed

whitepaper/paper.bib

Lines changed: 92 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,34 @@
1-
@article{kalkhof2023m3dnca,
1+
@article{hunter2007matplotlib,
2+
title = {Matplotlib: {{A 2D}} Graphics Environment},
3+
author = {Hunter, J. D.},
4+
year = {2007},
5+
journal = {Computing in Science \& Engineering},
6+
volume = {9},
7+
number = {3},
8+
pages = {90--95},
9+
publisher = {IEEE COMPUTER SOC},
10+
doi = {10.1109/MCSE.2007.55},
11+
abstract = {Matplotlib is a 2D graphics package used for Python for application development, interactive scripting, and publication-quality image generation across user interfaces and operating systems.}
12+
}
13+
14+
@misc{jha2019kvasirseg,
15+
title = {Kvasir-{{SEG}}: {{A Segmented Polyp Dataset}}},
16+
shorttitle = {Kvasir-{{SEG}}},
17+
author = {Jha, Debesh and Smedsrud, Pia H. and Riegler, Michael A. and Halvorsen, P{\aa}l and de Lange, Thomas and Johansen, Dag and Johansen, H{\aa}vard D.},
18+
year = {2019},
19+
month = nov,
20+
number = {arXiv:1911.07069},
21+
eprint = {1911.07069},
22+
primaryclass = {eess},
23+
publisher = {arXiv},
24+
doi = {10.48550/arXiv.1911.07069},
25+
urldate = {2025-08-12},
26+
abstract = {Pixel-wise image segmentation is a highly demanding task in medical-image analysis. In practice, it is difficult to find annotated medical images with corresponding segmentation masks. In this paper, we present Kvasir-SEG: an open-access dataset of gastrointestinal polyp images and corresponding segmentation masks, manually annotated by a medical doctor and then verified by an experienced gastroenterologist. Moreover, we also generated the bounding boxes of the polyp regions with the help of segmentation masks. We demonstrate the use of our dataset with a traditional segmentation approach and a modern deep-learning based Convolutional Neural Network (CNN) approach. The dataset will be of value for researchers to reproduce results and compare methods. By adding segmentation masks to the Kvasir dataset, which only provide frame-wise annotations, we enable multimedia and computer vision researchers to contribute in the field of polyp segmentation and automatic analysis of colonoscopy images.},
27+
archiveprefix = {arXiv},
28+
keywords = {Computer Science - Computer Vision and Pattern Recognition,Electrical Engineering and Systems Science - Image and Video Processing}
29+
}
30+
31+
@article{kalkhof2023m3dncaa,
232
title = {{{M3D-NCA}}: {{Robust 3D Segmentation}} with {{Built-in Quality Control}}},
333
author = {Kalkhof, John and Mukhopadhyay, A.},
434
year = {2023},
@@ -29,10 +59,29 @@ @misc{kalkhof2024frequencytime
2959
urldate = {2025-07-10},
3060
abstract = {Despite considerable success, large Denoising Diffusion Models (DDMs) with UNet backbone pose practical challenges, particularly on limited hardware and in processing gigapixel images. To address these limitations, we introduce two Neural Cellular Automata (NCA)-based DDMs: Diff-NCA and FourierDiff-NCA. Capitalizing on the local communication capabilities of NCA, Diff-NCA significantly reduces the parameter counts of NCA-based DDMs. Integrating Fourier-based diffusion enables global communication early in the diffusion process. This feature is particularly valuable in synthesizing complex images with important global features, such as the CelebA dataset. We demonstrate that even a 331k parameter Diff-NCA can generate 512x512 pathology slices, while FourierDiff-NCA (1.1m parameters) reaches a three times lower FID score of 43.86, compared to the four times bigger UNet (3.94m parameters) with a score of 128.2. Additionally, FourierDiff-NCA can perform diverse tasks such as super-resolution, out-of-distribution image synthesis, and inpainting without explicit training.},
3161
archiveprefix = {arXiv},
32-
keywords = {Application:Medical Imaging,Dataset:CelebA,Neural Cellular Automata,Subject:Digital Pathology,Task:Synthesis},
62+
keywords = {Application:Medical Imaging,Dataset:CelebA,Neural Cellular Automata,Subject:Digital Pathology,Task:Synthesis}
63+
}
64+
65+
@article{kalkhof2025parameterefficient,
66+
title = {Parameter-Efficient Diffusion with Neural Cellular Automata},
67+
author = {Kalkhof, John and K{\"u}hn, Arlene and Frisch, Yannik and Mukhopadhyay, Anirban},
68+
year = {2025},
69+
month = may,
70+
journal = {npj Unconventional Computing},
71+
volume = {2},
72+
number = {1},
73+
pages = {10},
74+
publisher = {Nature Publishing Group},
75+
issn = {3004-8672},
76+
doi = {10.1038/s44335-025-00026-4},
77+
urldate = {2025-07-10},
78+
abstract = {Traditional Denoising Diffusion Models (DDMs) with UNet backbones are over-parameterized, compromising their effectiveness on limited hardware and in processing gigapixel images. To address this inefficiency, we introduce two Neural Cellular Automata (NCA)-based DDMs: Diff-NCA and FourierDiff-NCA. Leveraging the efficient local communication of NCA, Diff-NCA drastically reduces parameter counts, effectively generating 512 {\texttimes} 512 pathology slices with just 336k parameters. Extending this approach, FourierDiff-NCA integrates Fourier-based diffusion to facilitate early global communication, essential for handling complex datasets such as CelebA. With only 1.1 m parameters, it achieves a more than two times lower FID score of 49.48 compared to the four times larger UNet, which scores 128.2. This performance disparity underscores the utility of NCA-based methods in enhancing parameter efficiency. FourierDiff-NCA also demonstrates versatility by performing tasks such as super-resolution, out-of-distribution image synthesis, and inpainting without task-specific training.},
79+
copyright = {2025 The Author(s)},
80+
langid = {english},
81+
keywords = {Application:Medical Imaging,Dataset:BCSS,Dataset:CelebA,Neural Cellular Automata,Subject:Digital Pathology,tagme,Task:Image Synthesis}
3382
}
3483

35-
@article{krumb2025encapsulate,
84+
@article{krumb2025encapsulatea,
3685
title = {{{eNCApsulate}}: Neural Cellular Automata for Precision Diagnosis on Capsule Endoscopes},
3786
shorttitle = {{{eNCApsulate}}},
3887
author = {Krumb, Henry John and Mukhopadhyay, Anirban},
@@ -44,7 +93,40 @@ @article{krumb2025encapsulate
4493
urldate = {2025-07-10},
4594
abstract = {Wireless capsule endoscopy (WCE) is a noninvasive imaging method for the entire gastrointestinal tract and is a pain-free alternative to traditional endoscopy. It generates extensive video data that requires significant review time, and localizing the capsule after ingestion is a challenge. Techniques like bleeding detection and depth estimation can help with localization of pathologies, but deep learning models are typically too large to run directly on the capsule.},
4695
langid = {english},
47-
keywords = {Application:Medical Imaging,Dataset:KID2,Dataset:KvasirCapsule,Modality:WCE,Neural Cellular Automata,Subject:Intestine,Task:Depth Estimation,Task:Segmentation},
96+
keywords = {Application:Medical Imaging,Dataset:KID2,Dataset:KvasirCapsule,Modality:WCE,Neural Cellular Automata,Subject:Intestine,Task:Depth Estimation,Task:Segmentation}
97+
}
98+
99+
@article{mordvintsev2020growingb,
100+
title = {Growing {{Neural Cellular Automata}}},
101+
author = {Mordvintsev, Alexander and Randazzo, Ettore and Niklasson, Eyvind and Levin, Michael},
102+
year = {2020},
103+
month = feb,
104+
journal = {Distill},
105+
volume = {5},
106+
number = {2},
107+
pages = {e23},
108+
issn = {2476-0757},
109+
doi = {10.23915/distill.00023},
110+
urldate = {2025-08-12},
111+
abstract = {Training an end-to-end differentiable, self-organising cellular automata model of morphogenesis, able to both grow and regenerate specific patterns.},
112+
langid = {english}
113+
}
114+
115+
@misc{paszke2019pytorch,
116+
title = {{{PyTorch}}: {{An Imperative Style}}, {{High-Performance Deep Learning Library}}},
117+
shorttitle = {{{PyTorch}}},
118+
author = {Paszke, Adam and Gross, Sam and Massa, Francisco and Lerer, Adam and Bradbury, James and Chanan, Gregory and Killeen, Trevor and Lin, Zeming and Gimelshein, Natalia and Antiga, Luca and Desmaison, Alban and K{\"o}pf, Andreas and Yang, Edward and DeVito, Zach and Raison, Martin and Tejani, Alykhan and Chilamkurthy, Sasank and Steiner, Benoit and Fang, Lu and Bai, Junjie and Chintala, Soumith},
119+
year = {2019},
120+
month = dec,
121+
number = {arXiv:1912.01703},
122+
eprint = {1912.01703},
123+
primaryclass = {cs},
124+
publisher = {arXiv},
125+
doi = {10.48550/arXiv.1912.01703},
126+
urldate = {2025-08-12},
127+
abstract = {Deep learning frameworks have often focused on either usability or speed, but not both. PyTorch is a machine learning library that shows that these two goals are in fact compatible: it provides an imperative and Pythonic programming style that supports code as a model, makes debugging easy and is consistent with other popular scientific computing libraries, while remaining efficient and supporting hardware accelerators such as GPUs. In this paper, we detail the principles that drove the implementation of PyTorch and how they are reflected in its architecture. We emphasize that every aspect of PyTorch is a regular Python program under the full control of its user. We also explain how the careful and pragmatic implementation of the key components of its runtime enables them to work together to achieve compelling performance. We demonstrate the efficiency of individual subsystems, as well as the overall speed of PyTorch on several common benchmarks.},
128+
archiveprefix = {arXiv},
129+
keywords = {Computer Science - Machine Learning,Computer Science - Mathematical Software,Statistics - Machine Learning}
48130
}
49131

50132
@article{ranem2024ncamorph,
@@ -55,3 +137,9 @@ @article{ranem2024ncamorph
55137
volume = {abs/2410.22265},
56138
keywords = {Application:Medical Imaging,Neural Cellular Automata,tagme,Task:Registration}
57139
}
140+
141+
@misc{torcheval,
142+
title = {{{TorchEval}} --- {{TorchEval}} Main Documentation},
143+
urldate = {2025-08-12},
144+
howpublished = {https://docs.pytorch.org/torcheval/stable/}
145+
}

whitepaper/paper.md

Lines changed: 11 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,8 @@ authors:
1313
- name: Richard Sattel
1414
orcid: 0009-0003-1060-3462
1515
affiliation: 1
16+
- name: Jonathan Dewenter
17+
affiliation: 1
1618
- name: Dennis Grotz
1719
affiliation: 1
1820
- name: Anirban Mukhopadhyay
@@ -32,26 +34,25 @@ bibliography: paper.bib
3234

3335
# Summary
3436

35-
3637
Neural Cellular Automata (NCA) are lightweight neural network models that can be employed in various image analysis tasks such as image segmentation, classification and generation.
37-
These models are recently getting attention in the medical imaging community, thanks to their small size, their robustness and their overall versatility.
38-
In terms of accuracy, they are often on-par with state-of-the art models, while being orders of magnitude smaller in size.
38+
Initially proposed in 2020 [@mordvintsev2020growingb], these models are recently getting attention thanks to their small size, their robustness and their overall versatility.
39+
In terms of accuracy, they are often on-par with state-of-the art models for the respective downstream task, while being orders of magnitude smaller in size.
3940
However, the training dynamics of NCAs are not yet fully understood, and there is potential for investigating practical tweaks to increase accuracy, reduce VRAM requirements and increase the overall training stability.
4041
`NCALab` provides a unified and extensible research framework for training and evaluating NCAs, conducting hyperparameter searches and prototyping applications that build on NCAs for image processing.
4142

4243

4344
# Statement of Need
4445

45-
NCAs are recently gaining attention in medical imaging, where they are deployed for various modalities in different downstream tasks, including 3D prostate segmentation on MRI [@kalkhof2023mednca] [@kalkhof2023m3dnca], image registration [@ranem2024ncamorph] or image synthesis [@kalkhof2024frequencytime,@kalkhof2025parameterefficient].
46+
NCAs are recently gaining attention especially in medical imaging, where they are deployed for various modalities in different downstream tasks, including 3D prostate segmentation on MRI [@kalkhof2023mednca] [@kalkhof2023m3dncaa], image registration [@ranem2024ncamorph] or image synthesis [@kalkhof2024frequencytime,@kalkhof2025parameterefficient].
4647
In most cases, they outperform other Convolutional Neural Network or Vision Transformer architectures in terms of model size and robustness, while yielding similarly accurate predictions.
4748
However, there is no unified framework or reference implementation for training, evaluating and experimentation with NCAs.
4849

4950
Research code for Neural Cellular Automata is typically organized in individual repositories for each downstream task under investigation.
50-
Code bases often follow different approaches, even though the underlying architecture is universal; in most cases, it can be defined by the number of input channels, hidden channels and output channels and the weights of the trained network.
51+
Code bases often follow different approaches, even though the underlying architecture is in most parts universal; in most cases, it can be defined by the number of input channels, hidden channels and output channels and the weights of the trained network.
5152

5253
The goal of NCALab is to provide a uniform and easy-to-use code base for various downstream tasks with NCAs in a shared project.
5354
Within minutes, researchers and practitioners should be able to create prototypes for their ideas, inspired by the numerous example tasks provided in this code repository.
54-
Code quality is ensured by unit tests and automated static code analysis through mypy (type checking) and flake8 (linting).
55+
Code quality is ensured by unit tests and automated static code analysis through mypy (type checking) and ruff (linting).
5556

5657
# Features
5758

@@ -60,8 +61,7 @@ NCALab provides dedicated models and example tasks for recurring image analysis
6061
* Growing Neural Cellular Automata for emoji generation and other experiments
6162
* Pixel-wise image segmentation
6263
* Image classification
63-
* Per-pixel image classification
64-
* Monocular depth estimation
64+
* Per-pixel image classification (MNIST digits)
6565

6666
Until now, NCALab provides the following key features:
6767

@@ -73,20 +73,15 @@ Until now, NCALab provides the following key features:
7373
* Visualization and animation of the NCA inference process
7474

7575

76-
# Example use case: Training and Fine-Tuning
77-
78-
```python
79-
80-
```
81-
82-
8376
# Ongoing Research
8477

85-
A conference paper utilizing NCALab was recently accepted for presentation in [IPCAI 2025](https://ipcai.org), and was published in the _International Journal of Computer-Assisted Radiology and Surgery_ (@krumb2025encapsulate).
78+
A conference paper utilizing NCALab was recently accepted for presentation in [IPCAI 2025](https://ipcai.org), and was published in the _International Journal of Computer-Assisted Radiology and Surgery_ [@krumb2025encapsulatea].
8679

8780

8881
# Acknowledgements
8982

9083
This work is partially supported by Norwegian Research Council project number 322600 (Capsnetwork).
9184

85+
NCALab depends on pytorch [@paszke2019pytorch], numpy, matplotlib [@hunter2007matplotlib].
86+
9287
# References

0 commit comments

Comments
 (0)