Skip to content

Commit a13d9f8

Browse files
committed
Merge remote-tracking branch 'origin/develop' into develop
2 parents 20ace1d + e1d240f commit a13d9f8

File tree

4 files changed

+29
-1
lines changed

4 files changed

+29
-1
lines changed

source/_data/SymbioticLab.bib

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1957,6 +1957,19 @@ @Article{mercury:arxiv24
19571957
}
19581958
}
19591959
1960+
@InProceedings{autoiac:neurips24,
1961+
author = {Patrick TJ Kon and Jiachen Liu and Yiming Qiu and Weijun Fan and Ting He and Lei Lin and Haoran Zhang and Owen M. Park and George Sajan Elengikal and Yuxin Kang and Ang Chen and Mosharaf Chowdhury and Myungjin Lee and Xinyu Wang},
1962+
title = {{IaC-Eval}: A Code Generation Benchmark for Infrastructure-as-Code Programs},
1963+
year = {2024},
1964+
publist_topic = {Systems + AI},
1965+
publist_confkey = {NeurIPS'24},
1966+
booktitle = {NeurIPS},
1967+
publist_link = {paper || autoiac-neurips24.pdf},
1968+
publist_link = {code || https://github.com/autoiac-project/iac-eval},
1969+
publist_abstract = {
1970+
Infrastructure-as-Code (IaC), an important component of cloud computing, allows the definition of cloud infrastructure in high-level programs. However, developing IaC programs is challenging, complicated by factors that include the burgeoning complexity of the cloud ecosystem (e.g., diversity of cloud services and workloads), and the relative scarcity of IaC-specific code examples and public repositories. While large language models (LLMs) have shown promise in general code generation and could potentially aid in IaC development, no benchmarks currently exist for evaluating their ability to generate IaC code. We present IaC-Eval, a first step in this research direction. IaC-Eval's dataset includes 458 human-curated scenarios covering a wide range of popular AWS services, at varying difficulty levels. Each scenario mainly comprises a natural language IaC problem description and an infrastructure intent specification. The former is fed as user input to the LLM, while the latter is a general notion used to verify if the generated IaC program conforms to the user's intent; by making explicit the problem's requirements that can encompass various cloud services, resources and internal infrastructure details. Our in-depth evaluation shows that contemporary LLMs perform poorly on IaC-Eval, with the top-performing model, GPT-4, obtaining a pass@1 accuracy of 19.36%. In contrast, it scores 86.6% on EvalPlus, a popular Python code generation benchmark, highlighting a need for advancements in this domain. We open-source the IaC-Eval dataset and evaluation framework at https://github.com/autoiac-project/iac-eval to enable future research on LLM-based IaC code generation.}
1971+
}
1972+
19601973
@Article{mordal:arxiv25,
19611974
author = {Shiqi He and Insu Jang and Mosharaf Chowdhury},
19621975
title = {{Mordal}: Automated Pretrained Model Selection for Vision Language Models},
Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,7 @@
1+
---
2+
title: 'Venn Accepted to Appear at MLSys''25. Congrats Jiachen, Eric, and Yiwen!'
3+
categories:
4+
- News
5+
date: 2025-02-11 15:54:37
6+
tags:
7+
---
Binary file not shown.

source/publications/index.md

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -430,11 +430,19 @@ venues:
430430
name: ICLR 23 Workshop on Tackling Climate Change with Machine Learning
431431
date: 2023-05-04
432432
url: https://www.climatechange.ai/events/iclr2023
433+
NeurIPS:
434+
category: Conferences
435+
occurrences:
436+
- key: NeurIPS'24
437+
name: The Thirty-Eighth Conference on Neural Information Processing Systems
438+
date: 2024-12-09
439+
url: https://neurips.cc/Conferences/2024
440+
acceptance: 25.8%
433441
{% endpublist %}
434442

435443
---
436444

437445
{% note default %}
438446
#### Copyright notice
439447
The documents listed above have been provided by the contributing authors as a means to ensure timely dissemination of scholarly and technical work on a noncommercial basis. Copyright and all rights therein are maintained by the authors or by other copyright holders, notwithstanding that they have offered their works here electronically. It is understood that all persons copying this information will adhere to the terms and constraints invoked by each author’s copyright. These works may not be reposted without the explicit permission of the copyright holder.
440-
{% endnote %}
448+
{% endnote %}

0 commit comments

Comments
 (0)