Changes from all commits
61 commits
90cd20d
Add generation of parallel benchmarks and test runs.
Jul 6, 2025
5452dd7
Do not use walltime killer anymore.
Jul 6, 2025
bca1f08
Use --continue-after-unknown.
Jul 6, 2025
6258316
Better status reporting.
Jul 6, 2025
c635d8e
Show contacts only of competitive solvers.
Jul 6, 2025
680a97a
Generate more meaningful YML names.
Jul 6, 2025
ce5b4e7
Update removed benchmarks.
Jul 6, 2025
e12e8a1
Remove benchmarks also for non-AWS tracks.
Jul 6, 2025
0402477
Revert "Do not use walltime killer anymore."
Jul 6, 2025
8800f20
Parse the single query/incremental results without scramble_id.
Jul 7, 2025
b7c46ac
bitwuzla: Change options for parallel track. (#201)
mpreiner Jul 15, 2025
4fddcda
submission: add additional configurations for lower CPU core counts. …
zmylinxi99 Jul 15, 2025
dde119e
Remove unused AWS infrastructure.
Jul 7, 2025
2c57e14
fix: Use LazyFrame during selection of incremental benchmarks.
Jul 16, 2025
f95717c
feat: Do not declare required machines for the parallel track.
Jul 18, 2025
76076e2
feat: Memory limit for parallel track.
Jul 18, 2025
f75b731
Change names of reduced-core parallel solvers.
Jul 18, 2025
96256c6
fix: Correctly recognize out of memory for incremental track.
Jul 23, 2025
8297d7f
feat: Adapt parsing of Incremental results to new YML names.
Jul 23, 2025
9ebce05
fix: Add nb_answers to all results.
Jul 23, 2025
24a718f
feat: Update year.
Jul 23, 2025
f4beace
feat: Better structure of generated result directories.
Jul 23, 2025
f4fa309
present derived solvers' increment over base solver
wintered Jul 30, 2025
9d64aee
cosmetics
wintered Jul 30, 2025
8f1c054
interim
wintered Jul 30, 2025
b338b90
minor
wintered Jul 30, 2025
8b1ec77
fixing CI issues
wintered Jul 30, 2025
509927e
SMTS submission 2025 update (bug fix + 2 more versions) (#203)
Tomaqa Jul 20, 2025
04d8bff
feat: Do not fail on missing runs, only report errors.
Jul 28, 2025
66c5d56
feat: Adapt unsat core and model result parsing to new YML names.
Jul 28, 2025
fc197d5
fix: Unify columns for all tracks to get consistent data set.
Jul 28, 2025
d79ee2b
fix: Drop benchmark_yml only during result processing.
Jul 28, 2025
3640e5d
fix: Initialize unsat core column.
Jul 28, 2025
af6462e
fix: Move previous year.
Jul 28, 2025
5b7bfd4
feat: Allow flushing cache in benchexec conversion.
Jul 31, 2025
811a16b
feat: Model validation with new YML names.
Jul 31, 2025
b0f0ab3
feat: Add 2025 benchmarks
Jul 31, 2025
090e76e
feat: Add preliminary results of all tracks except UnsatCore
Jul 31, 2025
a0a3b52
fix: Result processing.
Jul 31, 2025
1b48b5d
fix: Recognize lexing-error error from Dolmen.
Jul 31, 2025
6f098c1
fix: Progress computation.
Jul 31, 2025
c28a84b
fix: Apply black.
Jul 31, 2025
faf235c
feat: Change unsat core validation resource limits.
Jul 31, 2025
3abd97e
feat: New unsat core validation rules.
Jul 31, 2025
68c0bd6
Merge remote-tracking branch 'origin/2025_final_execution' into prese…
wintered Aug 2, 2025
68cc10a
establishing consistency among submissions with multiple cores
wintered Aug 2, 2025
ba23708
feat: Add preliminary results of UnsatCore track
Aug 2, 2025
12c9977
feat: Adapt unsat core validation to new YML format.
Aug 3, 2025
e1e67d1
fix: Remove join as there are no removed results.
Aug 3, 2025
eb0a5d3
chore: Apply black.
Aug 3, 2025
a17c198
feat: Remove non-competing divisions from results.
Aug 3, 2025
62cf124
fix: Remove debug prints.
Aug 3, 2025
4dd7dfd
feat: Generate results of Parallel track.
Aug 3, 2025
5aef59f
feat: Add BestOverall ranking to certificates.
Aug 3, 2025
424c571
feat: Generate solver data for certificates automatically.
Aug 3, 2025
643a6e7
chore: Update year in certificates.
Aug 3, 2025
7468375
2024 -> 2025
wintered Aug 4, 2025
f4efacf
2024 -> 2025
wintered Aug 4, 2025
7ef410f
target for cleaning up web results
wintered Aug 4, 2025
8bc62ae
Merge remote-tracking branch 'origin/2025_final_execution' into prese…
wintered Aug 4, 2025
71e5365
feat: show legends for base and non-competing only when at least one
wintered Aug 4, 2025
8 changes: 6 additions & 2 deletions Makefile
@@ -31,6 +31,10 @@ build: clean-build ## Build wheel file using poetry
clean-build: ## clean build artifacts
@rm -rf dist

.PHONY: clean-web-results
clean-web-results: ## clean web results
@rm -rf web/content/results

.PHONY: help
help:
@grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[36m%-20s\033[0m %s\n", $$1, $$2}'
@@ -76,8 +80,8 @@ results-generation:
@poetry run smtcomp export-results-pages data Incremental
# @echo "🚀 Generating results to web/content/results for Cloud"
# @poetry run smtcomp export-results-pages data Cloud
# @echo "🚀 Generating results to web/content/results for Parallel"
# @poetry run smtcomp export-results-pages data Parallel
@echo "🚀 Generating results to web/content/results for Parallel"
@poetry run smtcomp export-results-pages data Parallel

cache:
@echo "🚀 Generating cache"
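With the Parallel track now generated like the other tracks, stale pages from earlier runs should be cleared before regenerating; a minimal sketch of driving both targets from Python (the subprocess wrapper is illustrative, the targets are the ones defined above):

```python
import subprocess

# Illustrative driver: drop previously generated web results, then rebuild
# them with the Parallel track now enabled in results-generation.
subprocess.run(["make", "clean-web-results"], check=True)
subprocess.run(["make", "results-generation"], check=True)
```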
2 changes: 1 addition & 1 deletion README.md
@@ -257,7 +257,7 @@ The step from Single Query can be followed with the model validation results whe
Tasks for unsat core validation can be generated by:

```
smtcomp generate-unsatcore-validation-files ../tmp/execution SCRAMBLER_EXECUTABLE UNSAT_CORE_RESULT_DIR/*/*
smtcomp generate-unsatcore-validation-files ../tmp/execution SCRAMBLER_EXECUTABLE UNSAT_CORE_RESULT_DIR
```

---
Binary file added data/benchmarks-2025.json.gz
Binary file not shown.
2 changes: 1 addition & 1 deletion data/latex-certificates/gen_certificates_ornament.tex
@@ -136,7 +136,7 @@
\node [circular drop shadow={shadow scale=1.05},
decorate, decoration=zigzag,
fill=blue!20,draw,thick,circle,text width=3.5cm,align=center,xshift=2cm]
{\large\textbf{SMT-COMP\\ 2024}};
{\large\textbf{SMT-COMP\\ 2025}};
\end{tikzpicture}
\end{minipage}

20 changes: 0 additions & 20 deletions data/latex-certificates/solvers_pretty_name.csv

This file was deleted.

Binary file added data/results-inc-2025.json.gz
Binary file not shown.
Binary file added data/results-mv-2025.json.gz
Binary file not shown.
Binary file added data/results-parallel-2025.json.gz
Binary file not shown.
Binary file added data/results-sq-2025.json.gz
Binary file not shown.
Binary file added data/results-uc-2025.json.gz
Binary file not shown.
50 changes: 35 additions & 15 deletions smtcomp/benchexec.py
@@ -24,8 +24,10 @@ def get_suffix(track: defs.Track) -> str:
return "_unsatcorevalidation"
case defs.Track.SingleQuery:
return ""
case _:
raise ValueError("No Cloud or Parallel")
case defs.Track.Parallel:
return "_parallel"
case defs.Track.Cloud:
return "_cloud"


def get_xml_name(s: defs.Submission, track: defs.Track, division: defs.Division) -> str:
@@ -44,8 +46,9 @@ class CmdTask(BaseModel):
taskdirs: List[str]


def generate_benchmark_yml(benchmark: Path, expected_result: Optional[bool], orig_file: Optional[Path]) -> None:
ymlfile = benchmark.with_suffix(".yml")
def generate_benchmark_yml(
ymlfile: Path, benchmark: Path, expected_result: Optional[bool], orig_file: Optional[Path]
) -> None:
with ymlfile.open("w") as f:
f.write("format_version: '2.0'\n\n")

@@ -103,24 +106,38 @@ def generate_tool_modules(s: defs.Submission, cachedir: Path) -> None:
generate_tool_module(s, cachedir, False)


def generate_xml(config: defs.Config, cmdtasks: List[CmdTask], file: Path, tool_module_name: str) -> None:
def generate_xml(
config: defs.Config, cmdtasks: List[CmdTask], file: Path, tool_module_name: str, track: defs.Track, test: bool
) -> None:
doc, tag, text = Doc().tagtext()

doc.asis('<?xml version="1.0"?>')
doc.asis(
'<!DOCTYPE benchmark PUBLIC "+//IDN sosy-lab.org//DTD BenchExec benchmark 2.3//EN"'
' "https://www.sosy-lab.org/benchexec/benchmark-2.2.3dtd">'
)

timelimit = config.timelimit_s_test if test else config.timelimit_s
cpuCores = config.cpuCores_parallel if track == defs.Track.Parallel else config.cpuCores
memlimit = config.memlimit_M_parallel if track == defs.Track.Parallel else config.memlimit_M

if test:
cpuCores = config.cpuCores_parallel_test if track == defs.Track.Parallel else config.cpuCores_test
memlimit = config.memlimit_M_parallel_test if track == defs.Track.Parallel else config.memlimit_M_test
with tag(
"benchmark",
tool=f"tools.{tool_module_name}",
timelimit=f"{config.timelimit_s * config.cpuCores}s",
walltimelimit=f"{config.timelimit_s}s",
memlimit=f"{config.memlimit_M} MB",
cpuCores=f"{config.cpuCores}",
timelimit=f"{timelimit * cpuCores}s",
walltimelimit=f"{timelimit}s",
memlimit=f"{memlimit} MB",
cpuCores=f"{cpuCores}",
):
with tag("require", cpuModel="Intel Xeon E3-1230 v5 @ 3.40 GHz"):
text()

if track != defs.Track.Parallel:
# we run the test jobs on different machines (main machines are used)
used_cpuModel = "Intel Core i7" if test else "Intel Xeon E3-1230 v5 @ 3.40 GHz"
with tag("require", cpuModel=used_cpuModel):
text()

with tag("resultfiles"):
text("**/error.log")
@@ -222,7 +239,7 @@ def cmdtask_for_submission(
return res


def generate(s: defs.Submission, cachedir: Path, config: defs.Config) -> None:
def generate(s: defs.Submission, cachedir: Path, config: defs.Config, test: bool) -> None:
generate_tool_modules(s, cachedir)

dst = cachedir / "benchmarks"
@@ -241,7 +258,6 @@ def generate(s: defs.Submission, cachedir: Path, config: defs.Config) -> None:
# cloud and parallel tracks are not executed via benchexec
if target_track in (
defs.Track.Cloud,
defs.Track.Parallel,
defs.Track.UnsatCoreValidation,
defs.Track.ProofExhibition,
):
@@ -258,6 +274,8 @@ def generate(s: defs.Submission, cachedir: Path, config: defs.Config) -> None:
cmdtasks=res,
file=file,
tool_module_name=tool_module_name(s, target_track == defs.Track.Incremental),
track=target_track,
test=test,
)
generated_divisions.append(division)

@@ -273,9 +291,11 @@ def generate(s: defs.Submission, cachedir: Path, config: defs.Config) -> None:
out("set -x")
out(f"for DIVISION in {division_list}")
out(" do\n")
out(f' TARGET="../final_results{track_suffix}/$DIVISION/{tool}"')
out(f' TARGET="../results/results{track_suffix}/$DIVISION/{tool}"')
out(" rm -rf $TARGET")
out(" mkdir -p $TARGET")

extra_args = ""
out(
f" PYTHONPATH=$(pwd) benchexec/contrib/vcloud-benchmark.py run_definitions/{tool}{track_suffix}_$DIVISION.xml --read-only-dir / --overlay-dir . --overlay-dir /home --vcloudClientHeap 500 --vcloudPriority URGENT --cgroupAccess -o $TARGET"
)
@@ -319,6 +339,6 @@ def generate_unsatcore_validation(s: defs.Submission, cachedir: Path, config: de
out(" rm -rf $TARGET")
out(" mkdir -p $TARGET")
out(
f" PYTHONPATH=$(pwd) benchexec/contrib/vcloud-benchmark.py run_definitions/{tool}_unsatcorevalidation_$DIVISION.xml --read-only-dir / --overlay-dir . --overlay-dir /home --vcloudClientHeap 500 --vcloudPriority URGENT --cgroupAccess --tryLessMemory -o $TARGET"
f" PYTHONPATH=$(pwd) benchexec/contrib/vcloud-benchmark.py run_definitions/{tool}_unsatcorevalidation_$DIVISION.xml --read-only-dir / --overlay-dir . --overlay-dir /home --vcloudClientHeap 500 --vcloudPriority URGENT --cgroupAccess -o $TARGET"
)
out("done")
26 changes: 16 additions & 10 deletions smtcomp/certificates.py
@@ -10,6 +10,7 @@
import smtcomp.defs as defs
import smtcomp.results as results
import smtcomp.generate_website_page as page
import smtcomp.submission as submission

show_experimental = False

@@ -70,11 +71,13 @@ def withtrack(l: list[str], name: str, category: category) -> None:
class overall:

def __init__(self) -> None:
self.best = category()
self.biggest = category()
self.largest = category()

def latex(self) -> str:
l: list[str] = []
withtrack(l, "Best Overall", self.best)
withtrack(l, "Biggest Lead", self.biggest)
withtrack(l, "Largest Contribution", self.largest)
return ", ".join(l)
@@ -83,7 +86,7 @@ def __str__(self) -> str:
return self.latex()

def isNotEmpty(self) -> bool:
return self.biggest.isNotEmpty() and self.largest.isNotEmpty()
return self.best.isNotEmpty() or self.biggest.isNotEmpty() or self.largest.isNotEmpty()


class info:
@@ -132,7 +135,7 @@ def __repr__(self) -> str:
def update(
solvers: defaultdict[str, info],
select: Callable[[info, str], None],
podium: page.PodiumDivision | page.PodiumBiggestLead | page.PodiumLargestContribution,
podium: page.PodiumDivision | page.PodiumBestOverall | page.PodiumBiggestLead | page.PodiumLargestContribution,
) -> None:
if podium.track == defs.Track.SingleQuery:
select(solvers[podium.winner_seq], "sq_seq")
@@ -173,12 +176,10 @@ def add_logic(logics: dict[Tuple[str, defs.Track], bool], list: dict[str, int],
logics[v, track] = True


def parse_pretty_names(solvers: defaultdict[str, info], pretty_names: Path) -> None:
with open(pretty_names, newline="") as input:
input = csv.DictReader(input) # type: ignore

for row in input:
solvers[row["Solver Name"]].members = int(row["Members"]) # type: ignore
def process_submissions(solvers: defaultdict[str, info], submissions: list[defs.Submission]) -> None:
for s in submissions:
if s.competitive:
solvers[s.name].members = len(s.contributors)


def parse_experimental_division(solvers: Any, experimental_division: Path) -> dict[str, bool]:
@@ -192,11 +193,14 @@ def parse_experimental_division(solvers: Any, experimental_division: Path) -> di


def generate_certificates(
website_results: Path, input_for_certificates: Path, pretty_names: Path, experimental_division: Path
website_results: Path, input_for_certificates: Path, submission_dir: Path, experimental_division: Path
) -> None:
solvers: defaultdict[str, info] = defaultdict(info)

parse_pretty_names(solvers, pretty_names)
submissions = [submission.read_submission_or_exit(f)
for f in submission_dir.glob("*.json")]

process_submissions(solvers, submissions)
solvers["-"].members = 0

# Remove experimental division
@@ -223,6 +227,8 @@
continue
case page.PodiumCrossDivision():
match result.root:
case page.PodiumBestOverall():
update(solvers, (lambda x, k: x.overall.best.update(k, True)), result.root)
case page.PodiumBiggestLead():
update(solvers, (lambda x, k: x.overall.biggest.update(k, True)), result.root)
case page.PodiumLargestContribution():
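The net effect in certificates.py is that team sizes now come from the submission JSON files rather than the deleted solvers_pretty_name.csv. A hedged sketch of the new flow (read_submission_or_exit and the Submission fields are as used in the diff; the submissions directory path is an assumption):

```python
from pathlib import Path

import smtcomp.submission as submission

# Illustrative path; the real caller passes submission_dir into
# generate_certificates.
submission_dir = Path("submissions")
subs = [submission.read_submission_or_exit(f) for f in sorted(submission_dir.glob("*.json"))]

# Mirrors process_submissions: only competitive solvers get member counts.
members = {s.name: len(s.contributors) for s in subs if s.competitive}
```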
53 changes: 36 additions & 17 deletions smtcomp/defs.py
@@ -15,6 +15,17 @@
U = TypeVar("U")


baseMapSMTLIB2025 = {
"Bitwuzla-MachBV": "Bitwuzla-MachBV-base",
"Z3-Inc-Z3++": "Z3-Inc-Z3++-base",
"Z3-Noodler-Mocha": "Z3-Noodler-Mocha-base",
"Z3-Owl": "Z3-Owl-base",
"Z3-Noodler": "Z3-Noodler",
"z3siri": "z3siri-base",
"Z3-alpha": "Z3-alpha-base",
}


class EnumAutoInt(Enum):
"""
Normal enum with strings, but each enum is associated to an int
@@ -135,7 +146,7 @@ def name_is_default_field(cls, data: Any) -> Any:

class SolverType(EnumAutoInt):
wrapped = "wrapped"
derived = "derived"
derived = "derived" # TODO: put a datatype information on base solver
standalone = "Standalone"
portfolio = "Portfolio"

@@ -1317,6 +1328,7 @@ class Submission(BaseModel, extra="forbid"):
website: HttpUrl
system_description: HttpUrl
solver_type: SolverType
# TODO add field base_solver?
participations: Participations
seed: int | None = None
competitive: bool = True
@@ -1325,6 +1337,7 @@
description="Must be set for the final version of the submission. An archive on zenodo is needed in this case.",
)

# TODO: model validator to check the sanity of the new base_solver field
@model_validator(mode="after")
def check_archive(self) -> Submission:
if self.archive is None and not all(p.archive for p in self.participations.root):
@@ -1446,13 +1459,20 @@ class Results(BaseModel):
## Parameters that can change each year
class Config:
__next_id__: ClassVar[int] = 0
current_year = 2024
current_year = 2025
oldest_previous_results = 2018
timelimit_s = 60 * 20
timelimit_s_test = 60 # time limit for test runs
memlimit_M = 1024 * 30
memlimit_M_test = 1024 * 8 # memory limit for test runs
memlimit_M_parallel = 1024 * 1000
memlimit_M_parallel_test = 1024 * 8
cpuCores = 4
unsatcore_validation_timelimit_s = 60 * 5
unsatcore_validation_memlimit_M = 1024 * 30
cpuCores_test = 2
cpuCores_parallel = 128
cpuCores_parallel_test = 8
unsatcore_validation_timelimit_s = 60 * 20
unsatcore_validation_memlimit_M = 1024 * 15
unsatcore_validation_cpuCores = 4
min_used_benchmarks = 300
ratio_of_used_benchmarks = 0.5
@@ -1494,22 +1514,21 @@ class Config:

removed_benchmarks = [
{
"logic": int(Logic.QF_LIA),
"family": "20210219-Dartagnan/ConcurrencySafety-Main",
"name": "39_rand_lock_p0_vs-O0.smt2",
} # scrambler segfault (perhaps stack limit)
"logic": int(Logic.UFDTNIA),
"family": "20241211-verus/verismo",
"name": "tspec__math__nonlinearverismo_tspec.math.nonlinear.proof_mul_pos_neg_rel._01.smt2",
}, # reported by Mathias Preiner as syntactically invalid
{
"logic": int(Logic.UFDTNIA),
"family": "20241211-verus/verismo",
"name": "tspec__math__nonlinearverismo_tspec.math.nonlinear.proof_div_pos_neg_rel._01.smt2",
}, # reported by Mathias Preiner as syntactically invalid
]
"""
Benchmarks to remove before selection (currently just for aws)
Benchmarks to remove before selection
"""

removed_results = [
{
"logic": int(Logic.QF_BV),
"family": "20230221-oisc-gurtner",
"name": "SLL-NESTED-8-32-sp-not-excluded.smt2",
} # wrong status in SMTLIB
]
removed_results = []
"""
Benchmarks to remove after running the solvers. Can be used when the selection has already been done.
"""
Expand Down Expand Up @@ -1537,7 +1556,7 @@ def data(self) -> Path:

@functools.cached_property
def previous_years(self) -> list[int]:
return list(range(self.oldest_previous_results, self.current_year))
return list(range(self.oldest_previous_results, self.current_year - 1))

@functools.cached_property
def previous_results(self) -> list[tuple[int, Path]]:
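Two of the Config changes interact and are easy to misread: current_year moves to 2025, while previous_years now ends at current_year - 1, so the immediately preceding year is excluded (consistent with the "fix: Move previous year" commit). A quick worked check under those defaults:

```python
# Assumes the 2025 Config defaults shown above.
oldest_previous_results = 2018
current_year = 2025

# range() is half-open, so current_year - 1 == 2024 is itself excluded:
previous_years = list(range(oldest_previous_results, current_year - 1))
assert previous_years == [2018, 2019, 2020, 2021, 2022, 2023]

# Per-run CPU-time budget benchexec receives for the Parallel track:
assert (60 * 20) * 128 == 153_600  # timelimit_s * cpuCores_parallel, seconds
```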