aallan
diff --git a/‎.coderabbit.yaml‎
Lines changed: 2 additions & 0 deletions b/‎.coderabbit.yaml‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 3 additions & 0 deletions b/‎.gitignore‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 5 additions & 2 deletions b/‎README.md‎
Lines changed: 5 additions & 2 deletions
diff --git a/‎ROADMAP.md‎
Lines changed: 1 addition & 0 deletions b/‎ROADMAP.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎solutions/ailang/VB_T1_001_absolute_value.ail‎
Lines changed: 15 additions & 0 deletions b/‎solutions/ailang/VB_T1_001_absolute_value.ail‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎solutions/ailang/VB_T1_002_clamp.ail‎
Lines changed: 13 additions & 0 deletions b/‎solutions/ailang/VB_T1_002_clamp.ail‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎solutions/ailang/VB_T1_003_signum.ail‎
Lines changed: 12 additions & 0 deletions b/‎solutions/ailang/VB_T1_003_signum.ail‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎solutions/ailang/VB_T1_004_max_of_two.ail‎
Lines changed: 12 additions & 0 deletions b/‎solutions/ailang/VB_T1_004_max_of_two.ail‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎solutions/ailang/VB_T1_005_min_of_two.ail‎
Lines changed: 11 additions & 0 deletions b/‎solutions/ailang/VB_T1_005_min_of_two.ail‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎solutions/ailang/VB_T1_006_is_positive.ail‎
Lines changed: 10 additions & 0 deletions b/‎solutions/ailang/VB_T1_006_is_positive.ail‎
Lines changed: 10 additions & 0 deletions
@@ -48,11 +48,13 @@ reviews:
   path_filters:
     - "!**/*.vera"
     - "!**/*.av"
+    - "!**/*.ail"
     - "!context/**"
     - "!results/**/*.jsonl"
     - "!solutions/python/**"
     - "!solutions/typescript/**"
     - "!solutions/aver/**"
+    - "!solutions/ailang/**"
 
   path_instructions:
     - path: "vera_bench/**/*.py"
 
@@ -34,3 +34,6 @@ assets/benchmark_*.png
 # Script is committed; rendered PNGs are talk-prep ephemera and go into
 # the speaker's slide deck rather than the repo.
 assets/vera-bench_slide_*.png
+
+# AILANG runtime cache (created by `ailang run` in solutions/ailang/)
+solutions/ailang/.ailang/
@@ -70,7 +70,7 @@ For each problem, we measure:
 - **fix@1** — Given the error message, can the model fix it in one turn?
 - **run_correct** — Does execution produce the correct output?
 
-The same problems are also run in Python, TypeScript, and [Aver](https://github.com/jasisz/aver) as baselines. Aver is a Haskell-inspired language with zero LLM training data, providing a second data point alongside Vera for the zero-training-data thesis.
+The same problems are also run in Python, TypeScript, [Aver](https://github.com/jasisz/aver), and [AILANG](https://ailang.sunholo.com/) as baselines. Aver and AILANG are languages with zero LLM training data, so they provide additional data points alongside Vera for the language-design-vs-training-data thesis.
 
 > **Cross-language comparison:** For cross-language headline rates, use the T1–T4 aggregate. Tier 5 tests Vera's algebraic effect handlers, which other languages solve with fundamentally different native idioms. See [#50](https://github.com/aallan/vera-bench/issues/50).
 
@@ -80,6 +80,7 @@ The same problems are also run in Python, TypeScript, and [Aver](https://github.
 * Git
 * Node.js 22+ *(optional, for TypeScript baselines and generation)*
 * [Aver](https://github.com/jasisz/aver) *(optional, for Aver baselines and generation)*
+* [AILANG](https://ailang.sunholo.com/) *(optional, for AILANG baselines and generation)*
 
 ## Installation
 
@@ -135,15 +136,17 @@ vera-bench run --model claude-sonnet-4-20250514 --problem VB-T1-001
 # Spec-from-NL mode (agent writes its own contracts)
 vera-bench run --model claude-sonnet-4-20250514 --mode spec-from-nl
 
-# Ask the same model to write Python, TypeScript, or Aver for comparison
+# Ask the same model to write Python, TypeScript, Aver, or AILANG for comparison
 vera-bench run --model claude-sonnet-4-20250514 --language python
 vera-bench run --model claude-sonnet-4-20250514 --language typescript
 vera-bench run --model claude-sonnet-4-20250514 --language aver
+vera-bench run --model claude-sonnet-4-20250514 --language ailang
 
 # Run canonical baselines as a reference
 vera-bench baselines
 vera-bench baselines --language typescript
 vera-bench baselines --language aver
+vera-bench baselines --language ailang
 
 # Generate a combined report
 vera-bench report results/
 
@@ -29,6 +29,7 @@
 - [x] Strengthen postconditions to catch slot-swap bugs (issue #14)
 - [ ] Improve SKILL.md coverage of where blocks (issue #15)
 - [x] Test coverage ([issue #5](https://github.com/aallan/vera-bench/issues/5), ongoing — target 90%) — CI enforces 80% floor via `--cov-fail-under=80` in [ci.yml](.github/workflows/ci.yml), current coverage shown by [![codecov](https://codecov.io/gh/aallan/vera-bench/graph/badge.svg)](https://codecov.io/gh/aallan/vera-bench)
+- [ ] Per-test subprocess-failure diagnostics — the Aver and AILANG evaluators currently `continue` on per-test failures without capturing stderr, unlike the Python/TypeScript paths. Fix with a small shared-helper refactor ([issue #72](https://github.com/aallan/vera-bench/issues/72))
 
 ## Milestone 2: Longitudinal tracking
 
 
@@ -0,0 +1,15 @@
+module benchmark/solution
+
+-- VB-T1-001: Absolute Value
+-- Compute |x| with a single if-expression. AILANG has no Nat subtype, so the
+-- result is typed as plain int rather than a non-negative integer type.
+
+-- Returns -x when x is negative, otherwise x unchanged.
+export func absolute_value(x: int) -> int =
+  if x < 0 then -x else x
+
+-- Entry point, declared with the {IO} effect annotation. Passes
+-- show(absolute_value(...)) to println once per sample input: zero, the
+-- pair 42 / -42, and the pair 1 / -1.
+export func main() -> () ! {IO} {
+  println(show(absolute_value(0)));
+  println(show(absolute_value(42)));
+  println(show(absolute_value(-42)));
+  println(show(absolute_value(1)));
+  println(show(absolute_value(-1)))
+}
@@ -0,0 +1,13 @@
+module benchmark/solution
+
+-- VB-T1-002: Clamp
+-- Restrict value to the range bounded by lo and hi.
+
+-- Returns lo when value < lo, hi when value > hi, and value otherwise.
+-- The lower bound is tested first, so if a caller passes lo > hi and
+-- value < lo, the result is lo.
+export func clamp(value: int, lo: int, hi: int) -> int =
+  if value < lo then lo
+  else if value > hi then hi
+  else value
+
+-- Entry point, declared with the {IO} effect annotation. Passes
+-- show(clamp(...)) to println once per sample input: a value inside the
+-- range, one below it, one above it, and a range where lo and hi are both 0.
+export func main() -> () ! {IO} {
+  println(show(clamp(50, 0, 100)));
+  println(show(clamp(-5, 0, 100)));
+  println(show(clamp(150, 0, 100)));
+  println(show(clamp(0, 0, 0)))
+}
@@ -0,0 +1,12 @@
+module benchmark/solution
+
+-- VB-T1-003: Signum
+-- Report the sign of an integer as -1, 0, or 1.
+
+-- Returns -1 when x < 0, 1 when x > 0, and 0 otherwise.
+export func signum(x: int) -> int =
+  if x < 0 then -1
+  else if x > 0 then 1
+  else 0
+
+-- Entry point, declared with the {IO} effect annotation. Passes
+-- show(signum(...)) to println once per sample input: a positive value,
+-- a negative value, and zero.
+export func main() -> () ! {IO} {
+  println(show(signum(42)));
+  println(show(signum(-7)));
+  println(show(signum(0)))
+}
@@ -0,0 +1,12 @@
+module benchmark/solution
+
+-- VB-T1-004: Max of Two
+-- Select the larger of two integers.
+
+-- Returns a when a > b, otherwise b (so b is returned when the two are equal).
+export func max_of_two(a: int, b: int) -> int =
+  if a > b then a else b
+
+-- Entry point, declared with the {IO} effect annotation. Passes
+-- show(max_of_two(...)) to println once per sample input: both argument
+-- orders of (3, 7), an equal pair, a pair of negatives, and a pair of zeros.
+export func main() -> () ! {IO} {
+  println(show(max_of_two(3, 7)));
+  println(show(max_of_two(7, 3)));
+  println(show(max_of_two(5, 5)));
+  println(show(max_of_two(-1, -5)));
+  println(show(max_of_two(0, 0)))
+}
@@ -0,0 +1,11 @@
+module benchmark/solution
+
+-- VB-T1-005: Min of Two
+-- Select the smaller of two integers.
+
+-- Returns a when a < b, otherwise b (so b is returned when the two are equal).
+export func min_of_two(a: int, b: int) -> int =
+  if a < b then a else b
+
+-- Entry point, declared with the {IO} effect annotation. Passes
+-- show(min_of_two(...)) to println once per sample input: both argument
+-- orders of (3, 7), an equal pair, and a pair of negatives.
+export func main() -> () ! {IO} {
+  println(show(min_of_two(3, 7)));
+  println(show(min_of_two(7, 3)));
+  println(show(min_of_two(5, 5)));
+  println(show(min_of_two(-1, -5)))
+}
@@ -0,0 +1,10 @@
+module benchmark/solution
+
+-- VB-T1-006: Is Positive
+-- Test whether an integer is strictly greater than zero.
+
+-- Returns the result of x > 0; zero itself is therefore not positive.
+export func is_positive(x: int) -> bool = x > 0
+
+-- Entry point, declared with the {IO} effect annotation. Passes
+-- show(is_positive(...)) to println once per sample input: a positive
+-- value, a negative value, zero, and 1.
+export func main() -> () ! {IO} {
+  println(show(is_positive(5)));
+  println(show(is_positive(-3)));
+  println(show(is_positive(0)));
+  println(show(is_positive(1)))
+}