roc-lang
diff --git a/‎.github/workflows/ci_zig_nix.yml‎
Lines changed: 4 additions & 0 deletions b/‎.github/workflows/ci_zig_nix.yml‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎build.zig‎
Lines changed: 177 additions & 31 deletions b/‎build.zig‎
Lines changed: 177 additions & 31 deletions
diff --git a/‎ci/benchmarks_zig/run_fx_benchmarks.sh‎
Lines changed: 73 additions & 0 deletions b/‎ci/benchmarks_zig/run_fx_benchmarks.sh‎
Lines changed: 73 additions & 0 deletions
diff --git a/‎design.md‎
Lines changed: 42 additions & 27 deletions b/‎design.md‎
Lines changed: 42 additions & 27 deletions
diff --git a/‎docs/langref/iterators.md‎
Lines changed: 1 addition & 0 deletions b/‎docs/langref/iterators.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎docs/langref/loops.md‎
Lines changed: 34 additions & 4 deletions b/‎docs/langref/loops.md‎
Lines changed: 34 additions & 4 deletions
@@ -33,6 +33,10 @@ jobs:
       - uses: cachix/install-nix-action@02a151ada4993995686f9ed4f1be7cfbb229e56f # ratchet:cachix/install-nix-action@v31
         with:
           nix_path: nixpkgs=channel:nixos-25.05
+          extra_nix_config: |
+              min-free = 1073741824
+              max-free = 5368709120
+              # When free space drops below min-free (1 GB), nix GCs until max-free (5 GB) is available. This avoids "No space left on device" on CI.
 
       - name: Build inside a nix dev shell
         uses: ./.github/actions/flaky-retry
 
@@ -228,6 +228,69 @@ preflight_benchmark() {
     return 2
 }
 
+# Determine whether `roc build <file>` produces a byte-identical executable for
+# the two binaries. A confirmed build slowdown whose output executable is
+# byte-identical is definitionally a false positive: the compiler produced the
+# same program, so the timing difference is measurement or binary-layout noise
+# (e.g. a larger compiler binary with slightly different code locality) rather
+# than real work.
+#
+# roc embeds nothing version-specific into the linked executable (the compiler
+# version only reaches the DWARF producer string in the intermediate bitcode,
+# which is stripped before linking), and its linker is deterministic, so two
+# compiler builds that do the same work emit byte-identical executables.
+#
+# Each binary builds in an isolated working directory and cache so their outputs
+# cannot clobber each other; --no-cache bypasses cache reads but still emits the
+# executable.
+#
+# Arguments:
+#   $1 - main roc binary; it is invoked from a scratch directory, so it must be
+#        an absolute path or a command resolvable via PATH
+#   $2 - PR roc binary; same requirement as $1
+#   $3 - roc source file to build (relative or absolute path)
+#   $4 - extra `roc build` arguments as one whitespace-separated string
+#        (may be empty)
+# Returns:
+#   0 only when both builds succeed, each scratch directory holds exactly one
+#   executable file, and the two files are byte-identical. Any uncertainty (an
+#   unresolvable source directory, a build failure, a missing or ambiguous
+#   executable) returns 1 so we fail safe toward the normal slowdown failure.
+build_executable_output_identical() {
+    local main_roc="$1"
+    local pr_roc="$2"
+    local fx_file="$3"
+    local roc_extra_args="$4"
+
+    # roc resolves a platform's relative path against the source file's location
+    # and writes the executable into the current directory, so we pass an
+    # absolute source path and build from a scratch directory per binary.
+    # The directory is resolved in its own assignment: an assignment's exit
+    # status is that of its last command substitution, so folding `basename`
+    # into the same assignment would hide a failed `cd`.
+    local fx_dir abs_fx
+    fx_dir="$(CDPATH= cd -- "$(dirname -- "$fx_file")" && pwd)" || return 1
+    abs_fx="$fx_dir/$(basename -- "$fx_file")"
+
+    local work
+    work=$(mktemp -d) || return 1
+    local main_dir="$work/main" pr_dir="$work/pr"
+
+    local -a extra_arg_array=()
+    if [ -n "$roc_extra_args" ]; then
+        read -r -a extra_arg_array <<< "$roc_extra_args"
+    fi
+
+    # Pessimistic default: only a fully verified comparison flips this to 0, and
+    # every path falls through to the single cleanup below.
+    local result=1
+    local main_exe="" pr_exe=""
+
+    # Guard the array expansion so an empty extra-args list does not trip
+    # `set -u` on older bash (e.g. macOS's bash 3.2).
+    if mkdir -p "$main_dir" "$pr_dir" &&
+       ( cd "$main_dir" && XDG_CACHE_HOME="$main_dir/.cache" "$main_roc" build "$abs_fx" --no-cache "${extra_arg_array[@]+"${extra_arg_array[@]}"}" >/dev/null 2>&1 ) &&
+       ( cd "$pr_dir" && XDG_CACHE_HOME="$pr_dir/.cache" "$pr_roc" build "$abs_fx" --no-cache "${extra_arg_array[@]+"${extra_arg_array[@]}"}" >/dev/null 2>&1 ); then
+        main_exe=$(find "$main_dir" -maxdepth 1 -type f -perm -u+x)
+        pr_exe=$(find "$pr_dir" -maxdepth 1 -type f -perm -u+x)
+
+        # Accept exactly one executable per directory. An empty result means
+        # the build emitted nothing; an embedded newline means several
+        # candidates, and guessing which one is "the" output could compare the
+        # wrong files.
+        case "$main_exe" in
+            '' | *$'\n'*) main_exe="" ;;
+        esac
+        case "$pr_exe" in
+            '' | *$'\n'*) pr_exe="" ;;
+        esac
+
+        if [ -n "$main_exe" ] && [ -n "$pr_exe" ] && cmp -s "$main_exe" "$pr_exe"; then
+            result=0
+        fi
+    fi
+
+    rm -rf -- "$work"
+    return "$result"
+}
+
 # Run hyperfine benchmark and return percentage change via global variable
 # Returns 0 on success, 1 on failure
 # Sets BENCH_PCT_CHANGE on success
@@ -428,6 +491,16 @@ benchmark_file() {
         local confirm_is_slower
         confirm_is_slower=$(awk "BEGIN {print ($confirm_pct_change > 4 && $confirm_abs_delta_ms > 5) ? 1 : 0}")
         if [ "$confirm_is_slower" = "1" ]; then
+            # A build slowdown whose output executable is byte-identical is a
+            # definitional false positive (the same program cannot have cost
+            # more to produce), so pass it without a human override.
+            if [ "$roc_subcommand" = "build" ] && \
+               build_executable_output_identical "$MAIN_ROC" "$PR_ROC" "$fx_file" "$roc_extra_args"; then
+                echo "  IDENTICAL OUTPUT: $display_name produces a byte-identical executable on both binaries; treating the timing difference as a false positive (measurement or binary-layout noise), not a regression."
+                echo ""
+                return 0
+            fi
+
             echo "  SLOWER EXECUTION CONFIRMED in $display_name (${pct_change}% / ${abs_delta_ms} ms then ${confirm_pct_change}% / ${confirm_abs_delta_ms} ms)"
             SLOWER_DETECTED=1
             SLOWER_FILES+=("$display_name")
 
@@ -1110,12 +1110,14 @@ that checked module. The same checked function template may therefore produce
 many Monotype bodies, and the same checked nested lambda site may produce many
 nested Monotype functions, each with a different monomorphic function type.
 
-An instantiation context owns stage-local type cells addressed by
-`(checked module id, checked type id)`. The address is the checked identity of
-the type variable/content in the current specialization. It is not a structural
-digest, source name, runtime layout, object symbol, or generated procedure id.
-Cells begin unresolved. As the specialization is lowered, explicit evidence from
-checked data constrains those cells:
+Each specialization owns an instantiation graph: union-find nodes with
+explicit row-extension links, created by instantiating checked types on first
+touch. Instantiation contexts cache nodes by `(checked module id, checked type
+id)`. The address is the checked identity of the type variable/content in the
+current specialization. It is not a structural digest, source name, runtime
+layout, object symbol, or generated procedure id. Nodes begin unresolved. As
+the specialization is lowered, explicit evidence from checked data unifies
+those nodes:
 
 - the requested root function/value type constrains the checked root type;
 - lambda and closure expected function types constrain the nested function
@@ -1222,8 +1224,8 @@ encounter the same checked type under better evidence and try to assign a
 different Monotype type. That is not a valid compiler state; it is evidence that
 the stage was not lowering from one constrained specialization graph. The
 instantiation model makes the intended data flow explicit, so the first
-constraint and every later constraint meet in the same cell before the final
-Monotype body is emitted.
+constraint and every later constraint meet in the same graph node before the
+final Monotype body is emitted.
 
 An unconstrained checked type variable that remains open after checking lowers
 to the empty tag union in Monotype. This is not a default choice. It records the
@@ -1232,19 +1234,33 @@ can still be represented as `List([ ])` because they contain no elements, and
 code that would need an actual element value must have constrained the element
 type earlier or must be unreachable at runtime.
 
-During Monotype construction, an open checked variable is represented by a
-stage-local type cell. The cell starts as the empty tag union, and it may be
-completed with a concrete type while the same Monotype body is still being
-constructed if call-site arguments, expected lambda types, numeric literals, or
-checked type relations provide concrete evidence. This is ordinary type solving
-inside one stage. Once Monotype IR is output, no open cell remains and no
-later stage may change a type.
-
-Monotype type cells are addressed by the owning checked module id and the exact
-checked type id. They are not addressed by `TypeDigest`. A digest can identify
-closed structural type content for specialization and comparison, but it cannot
-distinguish two different open checked variables with the same shape. Treating
-those variables as the same cell is a compiler bug.
+During Monotype construction, an open checked variable is an unresolved graph
+node carrying the variable's numeric and row defaults. Unification resolves it
+when call-site arguments, expected lambda types, numeric literals, or checked
+type relations provide concrete evidence; defaults apply only at
+materialization. A Monotype is a materialized view of a solved node: it is
+reserved at a stable id and its content is refilled in place when its node
+gains evidence, so every holder of the id observes the solved type. This is
+ordinary type solving inside one stage. Once Monotype IR is output, no
+unresolved node remains reachable and no later stage may change a type.
+
+A Monotype imported into another specialization's graph is a finished
+snapshot, never a refreshable view: a specialization that needs more than its
+requested type is a unification conflict, not a silent rewrite of another
+specialization's final type. Procedure template body requests therefore defer
+to the end of the requesting specialization, when its types are final and the
+specialization key is stable. Nested functions are the exception: they share
+the requester's graph, and an inferred local procedure's body pins signature
+variables the requester's remaining body relies on, so nested bodies lower at
+their request site.
+
+Instantiation graph nodes are cached by the owning checked module id and the
+exact checked type id. They are not cached by `TypeDigest`. A digest can
+identify closed structural type content for specialization and comparison, but
+it cannot distinguish two different open checked variables with the same shape.
+Treating those variables as the same node is a compiler bug. Type digests are
+alias-transparent and encode recursive back references, so structurally equal
+types digest equally regardless of alias spelling or knot-tying ids.
 
 Generated helper code for an empty tag union, such as an inspector requested
 only because a container type mentions the empty tag union, has an unreachable
@@ -2740,12 +2756,11 @@ that value kind must be added explicitly here with a checked cache rule.
 - function values
 
 Compile-time evaluation failures are owned by checking finalization because the
-module has not been output yet. User-written compile-time crashes, exhausted
-compile-time limits, invalid compile-time host interaction, and unsupported
-compile-time operations become checking diagnostics attached to the checked root
-being finalized. OOM remains OOM. A post-check invariant failure while lowering
-or interpreting a compile-time root is still a compiler bug, not a user-facing
-diagnostic.
+module has not been output yet. User-written compile-time crashes, invalid
+compile-time host interaction, and unsupported compile-time operations become
+checking diagnostics attached to the checked root being finalized. OOM remains
+OOM. A post-check invariant failure while lowering or interpreting a
+compile-time root is still a compiler bug, not a user-facing diagnostic.
 
 While storing an eval result, the builder may reserve a `ConstNodeId` before
 storing its children so repeated references to the same acyclic runtime value
 
@@ -0,0 +1 @@
+# Iterators
@@ -4,16 +4,37 @@ Loops let you run the same code multiple times, in...well, in a loop.
 
 ## `for` Loops
 
-A `for` loop iterates over each item in a list:
+A `for` loop lets you run code on each item in an [iterator](iterators). For example:
 
 ```roc
 var $sum = 0
+
+for n in 1.to(5) {
+    $sum = $sum + n
+}
+```
+
+> The `to` method returns a [range](numbers#ranges), which is an `Iter` of the number type in question. For example, [`I64.to`](builtins/I64#to) returns `Iter(I64)`, and so `n` in this example would be an `I64`.
+
+A loop body only includes statements; it does not have a final expression. The loop itself evaluates to `{}`.
+
+### Iterating over types that have `iter`
+
+`for` can also be used on types that have an `iter` method, as long as that method returns an [`Iter`](builtins/Iter). For example, [`List`](builtins/List) has [`List.iter`](builtins/List#iter), so you can do a `for` loop over a list:
+
+```roc
+var $sum = 0
+
 for n in [1, 2, 3, 4] {
     $sum = $sum + n
 }
 ```
 
-The item can be destructured inline:
+At runtime, this `[1, 2, 3, 4]` code snippet is exactly as efficient as the earlier `1.to(5)` one. In one case, `1.to(5)` will be evaluated to an `Iter` at compile time, and in the other, `[1, 2, 3, 4].iter()` will be evaluated at compile time to an identical `Iter`. By the time either program actually runs, they will have the same memory contents and will be executing the same instructions.
+
+### Pattern matching in `for`
+
+Whatever you put between `for` and `in` is treated as a [pattern](pattern-matching), meaning (for example) that the item can be destructured inline:
 
 ```roc
 var $total = 0
@@ -22,7 +43,7 @@ for (x, y) in [(1, 2), (3, 4), (5, 6)] {
 }
 ```
 
-Use `_` if you don't want to name the item:
+As usual, you can nest patterns as much as you like, and can use `_` if you don't want to name a pattern:
 
 ```roc
 var $count = 0
@@ -31,7 +52,16 @@ for _ in items {
 }
 ```
 
-A loop body only includes statements; it does not have a final expression. The loop itself evaluates to `{}`.
+Just like with [assignments](statements#assignments), the pattern you use here must be [exhaustive](pattern-matching#exhaustiveness). For example, the following would give an exhaustiveness error because the loop body couldn't know what value to use for `amount_to_add` if the item was ever `Err` at runtime:
+
+```roc
+var $count = 0
+for Ok(amount_to_add) in items {
+    $count = $count + amount_to_add
+}
+```
+
+If you can't write an exhaustive pattern-match, you can name the entire iterator item and then use [`match`](pattern-matching#match) on it inside the loop body.
 
 ## `while` Loops