From 9bd6bbb7e71270463668f9cff862a8aa2bc487c4 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Thu, 7 May 2026 23:05:59 +0000
Subject: [PATCH 01/89] datalog: tokenizer + 26 tests (Phase 1)

Tokens {:type :value :pos} for atoms, vars, numbers, strings, punct, ops.
Operators :- ?- <= >= != < > = + - * /. Comments % and /* */.
---
 lib/datalog/tests/tokenize.sx | 139 +++++++++++++++++++
 lib/datalog/tokenizer.sx      | 254 ++++++++++++++++++++++++++++++++++
 2 files changed, 393 insertions(+)
 create mode 100644 lib/datalog/tests/tokenize.sx
 create mode 100644 lib/datalog/tokenizer.sx

diff --git a/lib/datalog/tests/tokenize.sx b/lib/datalog/tests/tokenize.sx
new file mode 100644
index 00000000..920c7257
--- /dev/null
+++ b/lib/datalog/tests/tokenize.sx
@@ -0,0 +1,139 @@
+;; lib/datalog/tests/tokenize.sx — tokenizer unit tests
+;;
+;; Run via: bash lib/datalog/conformance.sh
+;; Or:      (load "lib/datalog/tokenizer.sx") (load "lib/datalog/tests/tokenize.sx")
+;;          (dl-tokenize-tests-run!)
+
+(define dl-tk-pass 0)
+(define dl-tk-fail 0)
+(define dl-tk-failures (list))
+
+(define
+  dl-tk-test!
+  (fn
+    (name got expected)
+    (if
+      (= got expected)
+      (set! dl-tk-pass (+ dl-tk-pass 1))
+      (do
+        (set! dl-tk-fail (+ dl-tk-fail 1))
+        (append!
+          dl-tk-failures
+          (str name "\n    expected: " expected "\n    got:      " got))))))
+
+(define dl-tk-types (fn (toks) (map (fn (t) (get t :type)) toks)))
+(define dl-tk-values (fn (toks) (map (fn (t) (get t :value)) toks)))
+
+(define
+  dl-tk-run-all!
+  (fn
+    ()
+    (do
+      (dl-tk-test! "empty" (dl-tk-types (dl-tokenize "")) (list "eof"))
+      (dl-tk-test!
+        "atom dot"
+        (dl-tk-types (dl-tokenize "foo."))
+        (list "atom" "punct" "eof"))
+      (dl-tk-test!
+        "atom dot value"
+        (dl-tk-values (dl-tokenize "foo."))
+        (list "foo" "." nil))
+      (dl-tk-test!
+        "var"
+        (dl-tk-types (dl-tokenize "X."))
+        (list "var" "punct" "eof"))
+      (dl-tk-test!
+        "underscore var"
+        (dl-tk-types (dl-tokenize "_x."))
+        (list "var" "punct" "eof"))
+      (dl-tk-test!
+        "integer"
+        (dl-tk-values (dl-tokenize "42"))
+        (list 42 nil))
+      (dl-tk-test!
+        "decimal"
+        (dl-tk-values (dl-tokenize "3.14"))
+        (list 3.14 nil))
+      (dl-tk-test!
+        "string"
+        (dl-tk-values (dl-tokenize "\"hello\""))
+        (list "hello" nil))
+      (dl-tk-test!
+        "quoted atom"
+        (dl-tk-types (dl-tokenize "'two words'"))
+        (list "atom" "eof"))
+      (dl-tk-test!
+        "quoted atom value"
+        (dl-tk-values (dl-tokenize "'two words'"))
+        (list "two words" nil))
+      (dl-tk-test! ":-" (dl-tk-values (dl-tokenize ":-")) (list ":-" nil))
+      (dl-tk-test! "?-" (dl-tk-values (dl-tokenize "?-")) (list "?-" nil))
+      (dl-tk-test! "<=" (dl-tk-values (dl-tokenize "<=")) (list "<=" nil))
+      (dl-tk-test! ">=" (dl-tk-values (dl-tokenize ">=")) (list ">=" nil))
+      (dl-tk-test! "!=" (dl-tk-values (dl-tokenize "!=")) (list "!=" nil))
+      (dl-tk-test!
+        "single op values"
+        (dl-tk-values (dl-tokenize "< > = + - * /"))
+        (list "<" ">" "=" "+" "-" "*" "/" nil))
+      (dl-tk-test!
+        "single op types"
+        (dl-tk-types (dl-tokenize "< > = + - * /"))
+        (list "op" "op" "op" "op" "op" "op" "op" "eof"))
+      (dl-tk-test!
+        "punct"
+        (dl-tk-values (dl-tokenize "( ) , ."))
+        (list "(" ")" "," "." nil))
+      (dl-tk-test!
+        "fact tokens"
+        (dl-tk-types (dl-tokenize "parent(tom, bob)."))
+        (list "atom" "punct" "atom" "punct" "atom" "punct" "punct" "eof"))
+      (dl-tk-test!
+        "rule shape"
+        (dl-tk-types (dl-tokenize "p(X) :- q(X)."))
+        (list
+          "atom"
+          "punct"
+          "var"
+          "punct"
+          "op"
+          "atom"
+          "punct"
+          "var"
+          "punct"
+          "punct"
+          "eof"))
+      (dl-tk-test!
+        "comparison literal"
+        (dl-tk-values (dl-tokenize "<(X, 5)"))
+        (list "<" "(" "X" "," 5 ")" nil))
+      (dl-tk-test!
+        "is form"
+        (dl-tk-values (dl-tokenize "is(Y, +(X, 1))"))
+        (list "is" "(" "Y" "," "+" "(" "X" "," 1 ")" ")" nil))
+      (dl-tk-test!
+        "line comment"
+        (dl-tk-types (dl-tokenize "% comment line\nfoo."))
+        (list "atom" "punct" "eof"))
+      (dl-tk-test!
+        "block comment"
+        (dl-tk-types (dl-tokenize "/* a\nb */ x."))
+        (list "atom" "punct" "eof"))
+      (dl-tk-test!
+        "whitespace"
+        (dl-tk-types (dl-tokenize "  foo  ,\t bar  ."))
+        (list "atom" "punct" "atom" "punct" "eof"))
+      (dl-tk-test!
+        "positions"
+        (map (fn (t) (get t :pos)) (dl-tokenize "foo bar"))
+        (list 0 4 7)))))
+
+(define
+  dl-tokenize-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-tk-pass 0)
+      (set! dl-tk-fail 0)
+      (set! dl-tk-failures (list))
+      (dl-tk-run-all!)
+      {:failures dl-tk-failures :total (+ dl-tk-pass dl-tk-fail) :passed dl-tk-pass :failed dl-tk-fail})))
diff --git a/lib/datalog/tokenizer.sx b/lib/datalog/tokenizer.sx
new file mode 100644
index 00000000..b169b64e
--- /dev/null
+++ b/lib/datalog/tokenizer.sx
@@ -0,0 +1,254 @@
+;; lib/datalog/tokenizer.sx — Datalog source → token stream
+;;
+;; Tokens: {:type T :value V :pos P}
+;; Types:
+;;   "atom"    — lowercase-start ident or quoted 'atom'
+;;   "var"     — uppercase-start or _-start ident (value is the name)
+;;   "number"  — numeric literal (decoded to number)
+;;   "string"  — "..." string literal
+;;   "punct"   — ( ) , .
+;;   "op"      — :- ?- <= >= != < > = + - * /
+;;   "eof"
+;;
+;; Datalog has no function symbols in arg position; the parser still
+;; accepts nested compounds for arithmetic ((is X (+ A B))) but safety
+;; analysis rejects non-arithmetic nesting at rule-load time.
+
+(define dl-make-token (fn (type value pos) {:type type :value value :pos pos}))
+
+(define dl-digit? (fn (c) (and (>= c "0") (<= c "9"))))
+(define dl-lower? (fn (c) (and (>= c "a") (<= c "z"))))
+(define dl-upper? (fn (c) (and (>= c "A") (<= c "Z"))))
+
+(define
+  dl-ident-char?
+  (fn (c) (or (dl-lower? c) (dl-upper? c) (dl-digit? c) (= c "_"))))
+
+(define dl-ws? (fn (c) (or (= c " ") (= c "\t") (= c "\n") (= c "\r"))))
+
+(define
+  dl-tokenize
+  (fn
+    (src)
+    (let
+      ((tokens (list)) (pos 0) (src-len (len src)))
+      (define
+        dl-peek
+        (fn
+          (offset)
+          (if (< (+ pos offset) src-len) (nth src (+ pos offset)) nil)))
+      (define cur (fn () (dl-peek 0)))
+      (define advance! (fn (n) (set! pos (+ pos n))))
+      (define
+        at?
+        (fn
+          (s)
+          (let
+            ((sl (len s)))
+            (and (<= (+ pos sl) src-len) (= (slice src pos (+ pos sl)) s)))))
+      (define
+        dl-emit!
+        (fn
+          (type value start)
+          (append! tokens (dl-make-token type value start))))
+      (define
+        skip-line-comment!
+        (fn
+          ()
+          (when
+            (and (< pos src-len) (not (= (cur) "\n")))
+            (do (advance! 1) (skip-line-comment!)))))
+      (define
+        skip-block-comment!
+        (fn
+          ()
+          (cond
+            ((>= pos src-len) nil)
+            ((and (= (cur) "*") (< (+ pos 1) src-len) (= (dl-peek 1) "/"))
+              (advance! 2))
+            (else (do (advance! 1) (skip-block-comment!))))))
+      (define
+        skip-ws!
+        (fn
+          ()
+          (cond
+            ((>= pos src-len) nil)
+            ((dl-ws? (cur)) (do (advance! 1) (skip-ws!)))
+            ((= (cur) "%")
+              (do (advance! 1) (skip-line-comment!) (skip-ws!)))
+            ((and (= (cur) "/") (< (+ pos 1) src-len) (= (dl-peek 1) "*"))
+              (do (advance! 2) (skip-block-comment!) (skip-ws!)))
+            (else nil))))
+      (define
+        read-ident
+        (fn
+          (start)
+          (do
+            (when
+              (and (< pos src-len) (dl-ident-char? (cur)))
+              (do (advance! 1) (read-ident start)))
+            (slice src start pos))))
+      (define
+        read-decimal-digits!
+        (fn
+          ()
+          (when
+            (and (< pos src-len) (dl-digit? (cur)))
+            (do (advance! 1) (read-decimal-digits!)))))
+      (define
+        read-number
+        (fn
+          (start)
+          (do
+            (read-decimal-digits!)
+            (when
+              (and
+                (< pos src-len)
+                (= (cur) ".")
+                (< (+ pos 1) src-len)
+                (dl-digit? (dl-peek 1)))
+              (do (advance! 1) (read-decimal-digits!)))
+            (parse-number (slice src start pos)))))
+      (define
+        read-quoted
+        (fn
+          (quote-char)
+          (let
+            ((chars (list)))
+            (advance! 1)
+            (define
+              loop
+              (fn
+                ()
+                (cond
+                  ((>= pos src-len) nil)
+                  ((= (cur) "\\")
+                    (do
+                      (advance! 1)
+                      (when
+                        (< pos src-len)
+                        (let
+                          ((ch (cur)))
+                          (do
+                            (cond
+                              ((= ch "n") (append! chars "\n"))
+                              ((= ch "t") (append! chars "\t"))
+                              ((= ch "r") (append! chars "\r"))
+                              ((= ch "\\") (append! chars "\\"))
+                              ((= ch "'") (append! chars "'"))
+                              ((= ch "\"") (append! chars "\""))
+                              (else (append! chars ch)))
+                            (advance! 1))))
+                      (loop)))
+                  ((= (cur) quote-char) (advance! 1))
+                  (else
+                    (do (append! chars (cur)) (advance! 1) (loop))))))
+            (loop)
+            (join "" chars))))
+      (define
+        scan!
+        (fn
+          ()
+          (do
+            (skip-ws!)
+            (when
+              (< pos src-len)
+              (let
+                ((ch (cur)) (start pos))
+                (cond
+                  ((at? ":-")
+                    (do
+                      (dl-emit! "op" ":-" start)
+                      (advance! 2)
+                      (scan!)))
+                  ((at? "?-")
+                    (do
+                      (dl-emit! "op" "?-" start)
+                      (advance! 2)
+                      (scan!)))
+                  ((at? "<=")
+                    (do
+                      (dl-emit! "op" "<=" start)
+                      (advance! 2)
+                      (scan!)))
+                  ((at? ">=")
+                    (do
+                      (dl-emit! "op" ">=" start)
+                      (advance! 2)
+                      (scan!)))
+                  ((at? "!=")
+                    (do
+                      (dl-emit! "op" "!=" start)
+                      (advance! 2)
+                      (scan!)))
+                  ((dl-digit? ch)
+                    (do
+                      (dl-emit! "number" (read-number start) start)
+                      (scan!)))
+                  ((= ch "'")
+                    (do (dl-emit! "atom" (read-quoted "'") start) (scan!)))
+                  ((= ch "\"")
+                    (do (dl-emit! "string" (read-quoted "\"") start) (scan!)))
+                  ((dl-lower? ch)
+                    (do (dl-emit! "atom" (read-ident start) start) (scan!)))
+                  ((or (dl-upper? ch) (= ch "_"))
+                    (do (dl-emit! "var" (read-ident start) start) (scan!)))
+                  ((= ch "(")
+                    (do
+                      (dl-emit! "punct" "(" start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch ")")
+                    (do
+                      (dl-emit! "punct" ")" start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch ",")
+                    (do
+                      (dl-emit! "punct" "," start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch ".")
+                    (do
+                      (dl-emit! "punct" "." start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch "<")
+                    (do
+                      (dl-emit! "op" "<" start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch ">")
+                    (do
+                      (dl-emit! "op" ">" start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch "=")
+                    (do
+                      (dl-emit! "op" "=" start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch "+")
+                    (do
+                      (dl-emit! "op" "+" start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch "-")
+                    (do
+                      (dl-emit! "op" "-" start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch "*")
+                    (do
+                      (dl-emit! "op" "*" start)
+                      (advance! 1)
+                      (scan!)))
+                  ((= ch "/")
+                    (do
+                      (dl-emit! "op" "/" start)
+                      (advance! 1)
+                      (scan!)))
+                  (else (do (advance! 1) (scan!)))))))))
+      (scan!)
+      (dl-emit! "eof" nil pos)
+      tokens)))

From 5c1807c8326ab185dd557f488a6efca2ae393914 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Thu, 7 May 2026 23:31:24 +0000
Subject: [PATCH 02/89] datalog: parser + 18 tests + conformance harness (Phase
 1 done, 44/44)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Tokens → list of {:head :body} / {:query} clauses. SX symbols for
constants and variables (case-distinguished). not(literal) in body
desugars to {:neg literal}. Nested compounds permitted in arg
position for arithmetic; safety analysis (Phase 3) will gate them.

Conformance harness wraps lib/guest/conformance.sh; produces
lib/datalog/scoreboard.{json,md}.
---
 lib/datalog/conformance.conf |  14 ++
 lib/datalog/conformance.sh   |   3 +
 lib/datalog/parser.sx        | 242 +++++++++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json  |  11 ++
 lib/datalog/scoreboard.md    |   8 ++
 lib/datalog/tests/parse.sx   | 147 +++++++++++++++++++++
 plans/datalog-on-sx.md       |  27 +++-
 7 files changed, 445 insertions(+), 7 deletions(-)
 create mode 100644 lib/datalog/conformance.conf
 create mode 100755 lib/datalog/conformance.sh
 create mode 100644 lib/datalog/parser.sx
 create mode 100644 lib/datalog/scoreboard.json
 create mode 100644 lib/datalog/scoreboard.md
 create mode 100644 lib/datalog/tests/parse.sx

diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
new file mode 100644
index 00000000..a324032b
--- /dev/null
+++ b/lib/datalog/conformance.conf
@@ -0,0 +1,14 @@
+# Datalog conformance config — sourced by lib/guest/conformance.sh.
+
+LANG_NAME=datalog
+MODE=dict
+
+PRELOADS=(
+  lib/datalog/tokenizer.sx
+  lib/datalog/parser.sx
+)
+
+SUITES=(
+  "tokenize:lib/datalog/tests/tokenize.sx:(dl-tokenize-tests-run!)"
+  "parse:lib/datalog/tests/parse.sx:(dl-parse-tests-run!)"
+)
diff --git a/lib/datalog/conformance.sh b/lib/datalog/conformance.sh
new file mode 100755
index 00000000..0b4a0e13
--- /dev/null
+++ b/lib/datalog/conformance.sh
@@ -0,0 +1,3 @@
+#!/usr/bin/env bash
+# Thin wrapper — see lib/guest/conformance.sh and lib/datalog/conformance.conf.
+exec bash "$(dirname "$0")/../guest/conformance.sh" "$(dirname "$0")/conformance.conf" "$@"
diff --git a/lib/datalog/parser.sx b/lib/datalog/parser.sx
new file mode 100644
index 00000000..66ff43dd
--- /dev/null
+++ b/lib/datalog/parser.sx
@@ -0,0 +1,242 @@
+;; lib/datalog/parser.sx — Datalog tokens → AST
+;;
+;; Output shapes:
+;;   Literal (positive)  := (relname arg ... arg)        — SX list
+;;   Literal (negative)  := {:neg (relname arg ... arg)} — dict
+;;   Argument            := var-symbol | atom-symbol | number | string
+;;                        | (op-name arg ... arg)        — arithmetic compound
+;;   Fact                := {:head literal :body ()}
+;;   Rule                := {:head literal :body (lit ... lit)}
+;;   Query               := {:query (lit ... lit)}
+;;   Program             := list of facts / rules / queries
+;;
+;; Variables and constants are both SX symbols; the evaluator dispatches
+;; on first-char case ('A'..'Z' or '_' = variable, otherwise constant).
+;;
+;; The parser permits nested compounds in arg position to support
+;; arithmetic (e.g. (is Z (+ X Y))). Safety analysis at rule-load time
+;; rejects compounds whose head is not an arithmetic operator.
+
+(define
+  dl-pp-peek
+  (fn
+    (st)
+    (let
+      ((i (get st :idx)) (tokens (get st :tokens)))
+      (if (< i (len tokens)) (nth tokens i) {:type "eof" :value nil :pos 0}))))
+
+(define
+  dl-pp-peek2
+  (fn
+    (st)
+    (let
+      ((i (+ (get st :idx) 1)) (tokens (get st :tokens)))
+      (if (< i (len tokens)) (nth tokens i) {:type "eof" :value nil :pos 0}))))
+
+(define
+  dl-pp-advance!
+  (fn (st) (dict-set! st :idx (+ (get st :idx) 1))))
+
+(define
+  dl-pp-at?
+  (fn
+    (st type value)
+    (let
+      ((t (dl-pp-peek st)))
+      (and
+        (= (get t :type) type)
+        (or (= value nil) (= (get t :value) value))))))
+
+(define
+  dl-pp-error
+  (fn
+    (st msg)
+    (let
+      ((t (dl-pp-peek st)))
+      (error
+        (str
+          "Parse error at pos "
+          (get t :pos)
+          ": "
+          msg
+          " (got "
+          (get t :type)
+          " '"
+          (if (= (get t :value) nil) "" (get t :value))
+          "')")))))
+
+(define
+  dl-pp-expect!
+  (fn
+    (st type value)
+    (let
+      ((t (dl-pp-peek st)))
+      (if
+        (dl-pp-at? st type value)
+        (do (dl-pp-advance! st) t)
+        (dl-pp-error
+          st
+          (str "expected " type (if (= value nil) "" (str " '" value "'"))))))))
+
+;; Argument: variable, atom, number, string, or compound (relname/op + parens).
+(define
+  dl-pp-parse-arg
+  (fn
+    (st)
+    (let
+      ((t (dl-pp-peek st)))
+      (let
+        ((ty (get t :type)) (vv (get t :value)))
+        (cond
+          ((= ty "number") (do (dl-pp-advance! st) vv))
+          ((= ty "string") (do (dl-pp-advance! st) vv))
+          ((= ty "var") (do (dl-pp-advance! st) (string->symbol vv)))
+          ((or (= ty "atom") (= ty "op"))
+            (do
+              (dl-pp-advance! st)
+              (if
+                (dl-pp-at? st "punct" "(")
+                (do
+                  (dl-pp-advance! st)
+                  (let
+                    ((args (dl-pp-parse-arg-list st)))
+                    (do
+                      (dl-pp-expect! st "punct" ")")
+                      (cons (string->symbol vv) args))))
+                (string->symbol vv))))
+          (else (dl-pp-error st "expected term")))))))
+
+;; Comma-separated args inside parens.
+(define
+  dl-pp-parse-arg-list
+  (fn
+    (st)
+    (let
+      ((args (list)))
+      (do
+        (append! args (dl-pp-parse-arg st))
+        (define
+          dl-pp-arg-loop
+          (fn
+            ()
+            (when
+              (dl-pp-at? st "punct" ",")
+              (do
+                (dl-pp-advance! st)
+                (append! args (dl-pp-parse-arg st))
+                (dl-pp-arg-loop)))))
+        (dl-pp-arg-loop)
+        args))))
+
+;; A positive literal: relname (atom or op) followed by optional (args).
+(define
+  dl-pp-parse-positive
+  (fn
+    (st)
+    (let
+      ((t (dl-pp-peek st)))
+      (let
+        ((ty (get t :type)) (vv (get t :value)))
+        (if
+          (or (= ty "atom") (= ty "op"))
+          (do
+            (dl-pp-advance! st)
+            (if
+              (dl-pp-at? st "punct" "(")
+              (do
+                (dl-pp-advance! st)
+                (let
+                  ((args (dl-pp-parse-arg-list st)))
+                  (do
+                    (dl-pp-expect! st "punct" ")")
+                    (cons (string->symbol vv) args))))
+              (list (string->symbol vv))))
+          (dl-pp-error st "expected literal head"))))))
+
+;; A body literal: positive, or not(positive).
+(define
+  dl-pp-parse-body-lit
+  (fn
+    (st)
+    (let
+      ((t1 (dl-pp-peek st)) (t2 (dl-pp-peek2 st)))
+      (if
+        (and
+          (= (get t1 :type) "atom")
+          (= (get t1 :value) "not")
+          (= (get t2 :type) "punct")
+          (= (get t2 :value) "("))
+        (do
+          (dl-pp-advance! st)
+          (dl-pp-advance! st)
+          (let
+            ((inner (dl-pp-parse-positive st)))
+            (do (dl-pp-expect! st "punct" ")") {:neg inner})))
+        (dl-pp-parse-positive st)))))
+
+;; Comma-separated body literals.
+(define
+  dl-pp-parse-body
+  (fn
+    (st)
+    (let
+      ((lits (list)))
+      (do
+        (append! lits (dl-pp-parse-body-lit st))
+        (define
+          dl-pp-body-loop
+          (fn
+            ()
+            (when
+              (dl-pp-at? st "punct" ",")
+              (do
+                (dl-pp-advance! st)
+                (append! lits (dl-pp-parse-body-lit st))
+                (dl-pp-body-loop)))))
+        (dl-pp-body-loop)
+        lits))))
+
+;; Single clause: fact, rule, or query. Consumes trailing dot.
+(define
+  dl-pp-parse-clause
+  (fn
+    (st)
+    (cond
+      ((dl-pp-at? st "op" "?-")
+        (do
+          (dl-pp-advance! st)
+          (let
+            ((body (dl-pp-parse-body st)))
+            (do (dl-pp-expect! st "punct" ".") {:query body}))))
+      (else
+        (let
+          ((head (dl-pp-parse-positive st)))
+          (cond
+            ((dl-pp-at? st "op" ":-")
+              (do
+                (dl-pp-advance! st)
+                (let
+                  ((body (dl-pp-parse-body st)))
+                  (do (dl-pp-expect! st "punct" ".") {:body body :head head}))))
+            (else (do (dl-pp-expect! st "punct" ".") {:body (list) :head head}))))))))
+
+(define
+  dl-parse-program
+  (fn
+    (tokens)
+    (let
+      ((st {:tokens tokens :idx 0}) (clauses (list)))
+      (do
+        (define
+          dl-pp-prog-loop
+          (fn
+            ()
+            (when
+              (not (dl-pp-at? st "eof" nil))
+              (do
+                (append! clauses (dl-pp-parse-clause st))
+                (dl-pp-prog-loop)))))
+        (dl-pp-prog-loop)
+        clauses))))
+
+(define dl-parse (fn (src) (dl-parse-program (dl-tokenize src))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
new file mode 100644
index 00000000..b6b5c6fa
--- /dev/null
+++ b/lib/datalog/scoreboard.json
@@ -0,0 +1,11 @@
+{
+  "lang": "datalog",
+  "total_passed": 44,
+  "total_failed": 0,
+  "total": 44,
+  "suites": [
+    {"name":"tokenize","passed":26,"failed":0,"total":26},
+    {"name":"parse","passed":18,"failed":0,"total":18}
+  ],
+  "generated": "2026-05-07T23:30:07+00:00"
+}
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
new file mode 100644
index 00000000..9cd60338
--- /dev/null
+++ b/lib/datalog/scoreboard.md
@@ -0,0 +1,8 @@
+# datalog scoreboard
+
+**44 / 44 passing** (0 failure(s)).
+
+| Suite | Passed | Total | Status |
+|-------|--------|-------|--------|
+| tokenize | 26 | 26 | ok |
+| parse | 18 | 18 | ok |
diff --git a/lib/datalog/tests/parse.sx b/lib/datalog/tests/parse.sx
new file mode 100644
index 00000000..2af6e6ab
--- /dev/null
+++ b/lib/datalog/tests/parse.sx
@@ -0,0 +1,147 @@
+;; lib/datalog/tests/parse.sx — parser unit tests
+;;
+;; Run via: bash lib/datalog/conformance.sh
+;; Or:      (load "lib/datalog/tokenizer.sx") (load "lib/datalog/parser.sx")
+;;          (load "lib/datalog/tests/parse.sx") (dl-parse-tests-run!)
+
+(define dl-pt-pass 0)
+(define dl-pt-fail 0)
+(define dl-pt-failures (list))
+
+;; Order-independent structural equality. Lists compared positionally,
+;; dicts as sets of (key, value) pairs. Numbers via = (so 30.0 = 30).
+(define
+  dl-deep-equal?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-deep-equal-list? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let
+          ((ka (keys a)) (kb (keys b)))
+          (and
+            (= (len ka) (len kb))
+            (dl-deep-equal-dict? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-deep-equal-list?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-deep-equal? (nth a i) (nth b i))) false)
+      (else (dl-deep-equal-list? a b (+ i 1))))))
+
+(define
+  dl-deep-equal-dict?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i))) (not (dl-deep-equal? (get a k) (get b k))))
+        false)
+      (else (dl-deep-equal-dict? a b ka (+ i 1))))))
+
+(define
+  dl-pt-test!
+  (fn
+    (name got expected)
+    (if
+      (dl-deep-equal? got expected)
+      (set! dl-pt-pass (+ dl-pt-pass 1))
+      (do
+        (set! dl-pt-fail (+ dl-pt-fail 1))
+        (append!
+          dl-pt-failures
+          (str name "\n    expected: " expected "\n    got:      " got))))))
+
+(define
+  dl-pt-throws?
+  (fn
+    (thunk)
+    (let
+      ((threw false))
+      (do (guard (e (#t (set! threw true))) (thunk)) threw))))
+
+(define
+  dl-pt-run-all!
+  (fn
+    ()
+    (do
+      (dl-pt-test! "empty program" (dl-parse "") (list))
+      (dl-pt-test! "fact" (dl-parse "parent(tom, bob).") (list {:body (list) :head (list (quote parent) (quote tom) (quote bob))}))
+      (dl-pt-test!
+        "two facts"
+        (dl-parse "parent(tom, bob). parent(bob, ann).")
+        (list {:body (list) :head (list (quote parent) (quote tom) (quote bob))} {:body (list) :head (list (quote parent) (quote bob) (quote ann))}))
+      (dl-pt-test! "zero-ary fact" (dl-parse "ready.") (list {:body (list) :head (list (quote ready))}))
+      (dl-pt-test!
+        "rule one body lit"
+        (dl-parse "ancestor(X, Y) :- parent(X, Y).")
+        (list {:body (list (list (quote parent) (quote X) (quote Y))) :head (list (quote ancestor) (quote X) (quote Y))}))
+      (dl-pt-test!
+        "recursive rule"
+        (dl-parse "ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")
+        (list {:body (list (list (quote parent) (quote X) (quote Y)) (list (quote ancestor) (quote Y) (quote Z))) :head (list (quote ancestor) (quote X) (quote Z))}))
+      (dl-pt-test!
+        "query single"
+        (dl-parse "?- ancestor(tom, X).")
+        (list {:query (list (list (quote ancestor) (quote tom) (quote X)))}))
+      (dl-pt-test!
+        "query multi"
+        (dl-parse "?- p(X), q(X).")
+        (list {:query (list (list (quote p) (quote X)) (list (quote q) (quote X)))}))
+      (dl-pt-test!
+        "negation"
+        (dl-parse "safe(X) :- person(X), not(parent(X, _)).")
+        (list {:body (list (list (quote person) (quote X)) {:neg (list (quote parent) (quote X) (quote _))}) :head (list (quote safe) (quote X))}))
+      (dl-pt-test!
+        "number arg"
+        (dl-parse "age(alice, 30).")
+        (list {:body (list) :head (list (quote age) (quote alice) 30)}))
+      (dl-pt-test!
+        "string arg"
+        (dl-parse "label(x, \"hi\").")
+        (list {:body (list) :head (list (quote label) (quote x) "hi")}))
+      (dl-pt-test!
+        "comparison literal"
+        (dl-parse "p(X) :- <(X, 5).")
+        (list {:body (list (list (string->symbol "<") (quote X) 5)) :head (list (quote p) (quote X))}))
+      (dl-pt-test!
+        "is with arith"
+        (dl-parse "succ(X, Y) :- nat(X), is(Y, +(X, 1)).")
+        (list {:body (list (list (quote nat) (quote X)) (list (quote is) (quote Y) (list (string->symbol "+") (quote X) 1))) :head (list (quote succ) (quote X) (quote Y))}))
+      (dl-pt-test!
+        "mixed program"
+        (dl-parse "p(a). p(b). q(X) :- p(X). ?- q(Y).")
+        (list {:body (list) :head (list (quote p) (quote a))} {:body (list) :head (list (quote p) (quote b))} {:body (list (list (quote p) (quote X))) :head (list (quote q) (quote X))} {:query (list (list (quote q) (quote Y)))}))
+      (dl-pt-test!
+        "comments skipped"
+        (dl-parse "% comment\nfoo(a).\n/* block */ bar(b).")
+        (list {:body (list) :head (list (quote foo) (quote a))} {:body (list) :head (list (quote bar) (quote b))}))
+      (dl-pt-test!
+        "underscore var"
+        (dl-parse "p(X) :- q(X, _).")
+        (list {:body (list (list (quote q) (quote X) (quote _))) :head (list (quote p) (quote X))}))
+      (dl-pt-test!
+        "missing dot raises"
+        (dl-pt-throws? (fn () (dl-parse "p(a)")))
+        true)
+      (dl-pt-test!
+        "trailing comma raises"
+        (dl-pt-throws? (fn () (dl-parse "p(a,).")))
+        true))))
+
+(define
+  dl-parse-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-pt-pass 0)
+      (set! dl-pt-fail 0)
+      (set! dl-pt-failures (list))
+      (dl-pt-run-all!)
+      {:failures dl-pt-failures :total (+ dl-pt-pass dl-pt-fail) :passed dl-pt-pass :failed dl-pt-fail})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 79adc148..784cf0df 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -58,16 +58,21 @@ Key differences from Prolog:
 ## Roadmap
 
 ### Phase 1 — tokenizer + parser
-- [ ] Tokenizer: atoms (lowercase/quoted), variables (uppercase/`_`), numbers, strings,
-      operators (`:- `, `?-`, `,`, `.`), comments (`%`, `/* */`)
-      Note: no function symbol syntax (no nested `f(...)` in arg position).
-- [ ] Parser:
+- [x] Tokenizer: atoms (lowercase/quoted), variables (uppercase/`_`), numbers, strings,
+      punct (`( )`, `,`, `.`), operators (`:-`, `?-`, `<=`, `>=`, `!=`, `<`, `>`, `=`,
+      `+`, `-`, `*`, `/`), comments (`%`, `/* */`)
+      Note: no function symbol syntax (no nested `f(...)` in arg position) — but the
+      parser permits nested compounds for arithmetic; safety analysis (Phase 3) rejects
+      non-arithmetic nesting.
+- [x] Parser:
       - Facts: `parent(tom, bob).` → `{:head (parent tom bob) :body ()}`
       - Rules: `ancestor(X,Z) :- parent(X,Y), ancestor(Y,Z).`
               → `{:head (ancestor X Z) :body ((parent X Y) (ancestor Y Z))}`
-      - Queries: `?- ancestor(tom, X).` → `{:query (ancestor tom X)}`
+      - Queries: `?- ancestor(tom, X).` → `{:query ((ancestor tom X))}`
+        (`:query` value is always a list of literals; `?- p, q.` → `{:query ((p) (q))}`)
       - Negation: `not(parent(X,Y))` in body position → `{:neg (parent X Y)}`
-- [ ] Tests in `lib/datalog/tests/parse.sx`
+- [x] Tests in `lib/datalog/tests/parse.sx` (18) and `lib/datalog/tests/tokenize.sx` (26).
+      Conformance harness: `bash lib/datalog/conformance.sh` → 44 / 44 passing.
 
 ### Phase 2 — unification + substitution
 - [ ] Share or port unification from `lib/prolog/` — term walk, occurs check off by default
@@ -142,4 +147,12 @@ _(none yet)_
 
 _Newest first._
 
-_(awaiting phase 1)_
+- 2026-05-07 — Phase 1 done. `lib/datalog/tokenizer.sx` (~190 LOC) emits
+  `{:type :value :pos}` tokens; `lib/datalog/parser.sx` (~150 LOC) produces
+  `{:head … :body …}` / `{:query …}` clauses, with nested compounds
+  permitted for arithmetic and `not(...)` desugared to `{:neg …}`. 44 / 44
+  via `bash lib/datalog/conformance.sh` (26 tokenize + 18 parse). Local
+  helpers namespace-prefixed (`dl-emit!`, `dl-peek`) after a host-primitive
+  shadow clash. Test harness uses a custom `dl-deep-equal?` that handles
+  out-of-order dict keys and number repr (`equal?` fails on dict key order
+  and on `30` vs `30.0`).

From 8046df7ce579fccd870ee8da636ae3bd86b50383 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Thu, 7 May 2026 23:34:35 +0000
Subject: [PATCH 03/89] datalog: unification + substitution + 28 tests (Phase
 2, 72/72)

dl-unify returns immutable extended subst dict (or nil). dl-walk
chases bindings, dl-apply-subst recursively resolves vars. Lists
unify element-wise so arithmetic compounds work too. dl-ground? and
dl-vars-of for safety analysis (Phase 3).
---
 lib/datalog/conformance.conf |   2 +
 lib/datalog/scoreboard.json  |   9 +-
 lib/datalog/scoreboard.md    |   3 +-
 lib/datalog/tests/unify.sx   | 185 +++++++++++++++++++++++++++++++++++
 lib/datalog/unify.sx         | 159 ++++++++++++++++++++++++++++++
 plans/datalog-on-sx.md       |  16 ++-
 6 files changed, 365 insertions(+), 9 deletions(-)
 create mode 100644 lib/datalog/tests/unify.sx
 create mode 100644 lib/datalog/unify.sx

diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index a324032b..50ca8310 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -6,9 +6,11 @@ MODE=dict
 PRELOADS=(
   lib/datalog/tokenizer.sx
   lib/datalog/parser.sx
+  lib/datalog/unify.sx
 )
 
 SUITES=(
   "tokenize:lib/datalog/tests/tokenize.sx:(dl-tokenize-tests-run!)"
   "parse:lib/datalog/tests/parse.sx:(dl-parse-tests-run!)"
+  "unify:lib/datalog/tests/unify.sx:(dl-unify-tests-run!)"
 )
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index b6b5c6fa..837e746f 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,11 +1,12 @@
 {
   "lang": "datalog",
-  "total_passed": 44,
+  "total_passed": 72,
   "total_failed": 0,
-  "total": 44,
+  "total": 72,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
-    {"name":"parse","passed":18,"failed":0,"total":18}
+    {"name":"parse","passed":18,"failed":0,"total":18},
+    {"name":"unify","passed":28,"failed":0,"total":28}
   ],
-  "generated": "2026-05-07T23:30:07+00:00"
+  "generated": "2026-05-07T23:34:02+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 9cd60338..729e0fa9 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,8 +1,9 @@
 # datalog scoreboard
 
-**44 / 44 passing** (0 failure(s)).
+**72 / 72 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
+| unify | 28 | 28 | ok |
diff --git a/lib/datalog/tests/unify.sx b/lib/datalog/tests/unify.sx
new file mode 100644
index 00000000..873cc655
--- /dev/null
+++ b/lib/datalog/tests/unify.sx
@@ -0,0 +1,185 @@
+;; lib/datalog/tests/unify.sx — unification + substitution tests.
+
+(define dl-ut-pass 0)
+(define dl-ut-fail 0)
+(define dl-ut-failures (list))
+
+(define
+  dl-ut-deep-equal?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-ut-deq-list? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let
+          ((ka (keys a)) (kb (keys b)))
+          (and (= (len ka) (len kb)) (dl-ut-deq-dict? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-ut-deq-list?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-ut-deep-equal? (nth a i) (nth b i))) false)
+      (else (dl-ut-deq-list? a b (+ i 1))))))
+
+(define
+  dl-ut-deq-dict?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i))) (not (dl-ut-deep-equal? (get a k) (get b k))))
+        false)
+      (else (dl-ut-deq-dict? a b ka (+ i 1))))))
+
+(define
+  dl-ut-test!
+  (fn
+    (name got expected)
+    (if
+      (dl-ut-deep-equal? got expected)
+      (set! dl-ut-pass (+ dl-ut-pass 1))
+      (do
+        (set! dl-ut-fail (+ dl-ut-fail 1))
+        (append!
+          dl-ut-failures
+          (str name "\n    expected: " expected "\n    got:      " got))))))
+
+(define
+  dl-ut-run-all!
+  (fn
+    ()
+    (do
+      (dl-ut-test! "var? uppercase" (dl-var? (quote X)) true)
+      (dl-ut-test! "var? underscore" (dl-var? (quote _foo)) true)
+      (dl-ut-test! "var? lowercase" (dl-var? (quote tom)) false)
+      (dl-ut-test! "var? number" (dl-var? 5) false)
+      (dl-ut-test! "var? string" (dl-var? "hi") false)
+      (dl-ut-test! "var? list" (dl-var? (list 1)) false)
+      (dl-ut-test!
+        "atom-atom match"
+        (dl-unify (quote tom) (quote tom) (dl-empty-subst))
+        {})
+      (dl-ut-test!
+        "atom-atom fail"
+        (dl-unify (quote tom) (quote bob) (dl-empty-subst))
+        nil)
+      (dl-ut-test!
+        "num-num match"
+        (dl-unify 5 5 (dl-empty-subst))
+        {})
+      (dl-ut-test!
+        "num-num fail"
+        (dl-unify 5 6 (dl-empty-subst))
+        nil)
+      (dl-ut-test!
+        "string match"
+        (dl-unify "hi" "hi" (dl-empty-subst))
+        {})
+      (dl-ut-test! "string fail" (dl-unify "hi" "bye" (dl-empty-subst)) nil)
+      (dl-ut-test!
+        "var-atom binds"
+        (dl-unify (quote X) (quote tom) (dl-empty-subst))
+        {:X (quote tom)})
+      (dl-ut-test!
+        "atom-var binds"
+        (dl-unify (quote tom) (quote X) (dl-empty-subst))
+        {:X (quote tom)})
+      (dl-ut-test!
+        "var-var same"
+        (dl-unify (quote X) (quote X) (dl-empty-subst))
+        {})
+      (dl-ut-test!
+        "var-var bind"
+        (let
+          ((s (dl-unify (quote X) (quote Y) (dl-empty-subst))))
+          (dl-walk (quote X) s))
+        (quote Y))
+      (dl-ut-test!
+        "tuple match"
+        (dl-unify
+          (list (quote parent) (quote X) (quote bob))
+          (list (quote parent) (quote tom) (quote Y))
+          (dl-empty-subst))
+        {:X (quote tom) :Y (quote bob)})
+      (dl-ut-test!
+        "tuple arity mismatch"
+        (dl-unify
+          (list (quote p) (quote X))
+          (list (quote p) (quote a) (quote b))
+          (dl-empty-subst))
+        nil)
+      (dl-ut-test!
+        "tuple head mismatch"
+        (dl-unify
+          (list (quote p) (quote X))
+          (list (quote q) (quote X))
+          (dl-empty-subst))
+        nil)
+      (dl-ut-test!
+        "walk chain"
+        (let
+          ((s1 (dl-unify (quote X) (quote Y) (dl-empty-subst))))
+          (let
+            ((s2 (dl-unify (quote Y) (quote tom) s1)))
+            (dl-walk (quote X) s2)))
+        (quote tom))
+      (dl-ut-test!
+        "apply subst on tuple"
+        (let
+          ((s (dl-bind (quote X) (quote tom) (dl-empty-subst))))
+          (dl-apply-subst (list (quote parent) (quote X) (quote Y)) s))
+        (list (quote parent) (quote tom) (quote Y)))
+      (dl-ut-test!
+        "ground? all const"
+        (dl-ground?
+          (list (quote p) (quote tom) 5)
+          (dl-empty-subst))
+        true)
+      (dl-ut-test!
+        "ground? unbound var"
+        (dl-ground? (list (quote p) (quote X)) (dl-empty-subst))
+        false)
+      (dl-ut-test!
+        "ground? bound var"
+        (let
+          ((s (dl-bind (quote X) (quote tom) (dl-empty-subst))))
+          (dl-ground? (list (quote p) (quote X)) s))
+        true)
+      (dl-ut-test!
+        "ground? bare var"
+        (dl-ground? (quote X) (dl-empty-subst))
+        false)
+      (dl-ut-test!
+        "vars-of basic"
+        (dl-vars-of
+          (list (quote p) (quote X) (quote tom) (quote Y) (quote X)))
+        (list "X" "Y"))
+      (dl-ut-test!
+        "vars-of ground"
+        (dl-vars-of (list (quote p) (quote tom) (quote bob)))
+        (list))
+      (dl-ut-test!
+        "vars-of nested compound"
+        (dl-vars-of
+          (list
+            (quote is)
+            (quote Z)
+            (list (string->symbol "+") (quote X) 1)))
+        (list "Z" "X")))))
+
+(define
+  dl-unify-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-ut-pass 0)
+      (set! dl-ut-fail 0)
+      (set! dl-ut-failures (list))
+      (dl-ut-run-all!)
+      {:failures dl-ut-failures :total (+ dl-ut-pass dl-ut-fail) :passed dl-ut-pass :failed dl-ut-fail})))
diff --git a/lib/datalog/unify.sx b/lib/datalog/unify.sx
new file mode 100644
index 00000000..7313a603
--- /dev/null
+++ b/lib/datalog/unify.sx
@@ -0,0 +1,159 @@
+;; lib/datalog/unify.sx — unification + substitution for Datalog terms.
+;;
+;; Term taxonomy (after parsing):
+;;   variable  — SX symbol whose first char is uppercase A–Z or '_'.
+;;   constant  — SX symbol whose first char is lowercase a–z (atom name).
+;;   number    — numeric literal.
+;;   string    — string literal.
+;;   compound  — SX list (functor arg ... arg). In core Datalog these
+;;               only appear as arithmetic expressions (see Phase 4
+;;               safety analysis); compound-against-compound unification
+;;               is supported anyway for completeness.
+;;
+;; Substitutions are immutable dicts keyed by variable name (string).
+;; A failed unification returns nil; success returns the extended subst.
+
+(define dl-empty-subst (fn () {}))
+
+(define
+  dl-var?
+  (fn
+    (term)
+    (and
+      (symbol? term)
+      (let
+        ((name (symbol->string term)))
+        (and
+          (> (len name) 0)
+          (let
+            ((c (slice name 0 1)))
+            (or (and (>= c "A") (<= c "Z")) (= c "_"))))))))
+
+;; Walk: chase variable bindings until we hit a non-variable or an unbound
+;; variable. The result is either a non-variable term or an unbound var.
+(define
+  dl-walk
+  (fn
+    (term subst)
+    (if
+      (dl-var? term)
+      (let
+        ((name (symbol->string term)))
+        (if
+          (and (dict? subst) (has-key? subst name))
+          (dl-walk (get subst name) subst)
+          term))
+      term)))
+
+;; Bind a variable symbol to a value in subst, returning a new subst.
+(define
+  dl-bind
+  (fn (var-sym value subst) (assoc subst (symbol->string var-sym) value)))
+
+(define
+  dl-unify
+  (fn
+    (t1 t2 subst)
+    (if
+      (nil? subst)
+      nil
+      (let
+        ((u1 (dl-walk t1 subst)) (u2 (dl-walk t2 subst)))
+        (cond
+          ((dl-var? u1)
+            (cond
+              ((and (dl-var? u2) (= (symbol->string u1) (symbol->string u2)))
+                subst)
+              (else (dl-bind u1 u2 subst))))
+          ((dl-var? u2) (dl-bind u2 u1 subst))
+          ((and (list? u1) (list? u2))
+            (if
+              (= (len u1) (len u2))
+              (dl-unify-list u1 u2 subst 0)
+              nil))
+          ((and (number? u1) (number? u2)) (if (= u1 u2) subst nil))
+          ((and (string? u1) (string? u2)) (if (= u1 u2) subst nil))
+          ((and (symbol? u1) (symbol? u2))
+            (if (= (symbol->string u1) (symbol->string u2)) subst nil))
+          (else nil))))))
+
+(define
+  dl-unify-list
+  (fn
+    (a b subst i)
+    (cond
+      ((nil? subst) nil)
+      ((>= i (len a)) subst)
+      (else
+        (dl-unify-list
+          a
+          b
+          (dl-unify (nth a i) (nth b i) subst)
+          (+ i 1))))))
+
+;; Apply substitution: walk the term and recurse into lists.
+(define
+  dl-apply-subst
+  (fn
+    (term subst)
+    (let
+      ((w (dl-walk term subst)))
+      (if (list? w) (map (fn (x) (dl-apply-subst x subst)) w) w))))
+
+;; Ground? — true iff no free variables remain after walking.
+(define
+  dl-ground?
+  (fn
+    (term subst)
+    (let
+      ((w (dl-walk term subst)))
+      (cond
+        ((dl-var? w) false)
+        ((list? w) (dl-ground-list? w subst 0))
+        (else true)))))
+
+(define
+  dl-ground-list?
+  (fn
+    (xs subst i)
+    (cond
+      ((>= i (len xs)) true)
+      ((not (dl-ground? (nth xs i) subst)) false)
+      (else (dl-ground-list? xs subst (+ i 1))))))
+
+;; Return the list of variable names appearing in a term (deduped, in
+;; left-to-right order). Useful for safety analysis later.
+(define
+  dl-vars-of
+  (fn (term) (let ((seen (list))) (do (dl-vars-of-aux term seen) seen))))
+
+(define
+  dl-vars-of-aux
+  (fn
+    (term acc)
+    (cond
+      ((dl-var? term)
+        (let
+          ((name (symbol->string term)))
+          (when (not (dl-member? name acc)) (append! acc name))))
+      ((list? term) (dl-vars-of-list term acc 0))
+      (else nil))))
+
+(define
+  dl-vars-of-list
+  (fn
+    (xs acc i)
+    (when
+      (< i (len xs))
+      (do
+        (dl-vars-of-aux (nth xs i) acc)
+        (dl-vars-of-list xs acc (+ i 1))))))
+
+(define
+  dl-member?
+  (fn
+    (x xs)
+    (cond
+      ((= (len xs) 0) false)
+      ((= (first xs) x) true)
+      (else (dl-member? x (rest xs))))))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 784cf0df..68dc785f 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -75,10 +75,12 @@ Key differences from Prolog:
       Conformance harness: `bash lib/datalog/conformance.sh` → 44 / 44 passing.
 
 ### Phase 2 — unification + substitution
-- [ ] Share or port unification from `lib/prolog/` — term walk, occurs check off by default
-- [ ] `dl-unify` `t1` `t2` `subst` → extended subst or nil (no function symbols means simpler)
-- [ ] `dl-ground?` `term` → bool — all variables bound in substitution
-- [ ] Tests: atom/atom, var/atom, var/var, list args
+- [x] Ported (not shared) from `lib/prolog/` — term walk, no occurs check.
+- [x] `dl-unify t1 t2 subst` → extended subst dict, or `nil` on failure.
+- [x] `dl-walk`, `dl-bind`, `dl-apply-subst`, `dl-ground?`, `dl-vars-of`.
+- [x] Substitutions are immutable dicts keyed by variable name (string).
+      Lists/tuples unify element-wise (used for arithmetic compounds too).
+- [x] Tests in `lib/datalog/tests/unify.sx` (28). 72 / 72 conformance.
 
 ### Phase 3 — extensional DB + naive evaluation
 - [ ] EDB: `{:relation-name → set-of-ground-tuples}` using SX sets (Phase 18 of primitives)
@@ -147,6 +149,12 @@ _(none yet)_
 
 _Newest first._
 
+- 2026-05-07 — Phase 2 done. `lib/datalog/unify.sx` (~140 LOC):
+  `dl-var?` (case + underscore), `dl-walk`, `dl-bind`, `dl-unify` (returns
+  extended dict subst or `nil`), `dl-apply-subst`, `dl-ground?`, `dl-vars-of`.
+  Substitutions are immutable dicts; `assoc` builds extended copies. 28
+  unify tests; conformance now 72 / 72.
+
 - 2026-05-07 — Phase 1 done. `lib/datalog/tokenizer.sx` (~190 LOC) emits
   `{:type :value :pos}` tokens; `lib/datalog/parser.sx` (~150 LOC) produces
   `{:head … :body …}` / `{:query …}` clauses, with nested compounds

From 9bc70fd2a9406b71b0812e4d863fdb65fb1a0e86 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Thu, 7 May 2026 23:41:27 +0000
Subject: [PATCH 04/89] datalog: db + naive eval + safety analysis (Phase 3,
 87/87)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

db.sx: facts indexed by relation name, rules list, dl-add-fact!
(rejects non-ground), dl-add-rule! (rejects unsafe — head vars
not in positive body). eval.sx: dl-saturate! fixpoint, dl-query
with deduped projected results. Negation and arithmetic raise
clear errors (Phase 4/7 to follow). 15 eval tests: transitive
closure, sibling, same-gen, grandparent, cyclic reach, safety.
---
 lib/datalog/conformance.conf |   3 +
 lib/datalog/db.sx            | 263 +++++++++++++++++++++++++++++++++++
 lib/datalog/eval.sx          | 153 ++++++++++++++++++++
 lib/datalog/scoreboard.json  |   9 +-
 lib/datalog/scoreboard.md    |   3 +-
 lib/datalog/tests/eval.sx    | 206 +++++++++++++++++++++++++++
 plans/datalog-on-sx.md       |  40 ++++--
 7 files changed, 663 insertions(+), 14 deletions(-)
 create mode 100644 lib/datalog/db.sx
 create mode 100644 lib/datalog/eval.sx
 create mode 100644 lib/datalog/tests/eval.sx

diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index 50ca8310..58a483bc 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -7,10 +7,13 @@ PRELOADS=(
   lib/datalog/tokenizer.sx
   lib/datalog/parser.sx
   lib/datalog/unify.sx
+  lib/datalog/db.sx
+  lib/datalog/eval.sx
 )
 
 SUITES=(
   "tokenize:lib/datalog/tests/tokenize.sx:(dl-tokenize-tests-run!)"
   "parse:lib/datalog/tests/parse.sx:(dl-parse-tests-run!)"
   "unify:lib/datalog/tests/unify.sx:(dl-unify-tests-run!)"
+  "eval:lib/datalog/tests/eval.sx:(dl-eval-tests-run!)"
 )
diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
new file mode 100644
index 00000000..af189147
--- /dev/null
+++ b/lib/datalog/db.sx
@@ -0,0 +1,263 @@
+;; lib/datalog/db.sx — Datalog database (EDB + IDB + rules) + safety.
+;;
+;; A db is a mutable dict:
+;;   {:facts {<rel-name-string> -> (literal ...)}
+;;    :rules ({:head literal :body (literal ...)} ...)}
+;;
+;; Facts are stored as full literals `(rel arg ... arg)` so they unify
+;; directly against rule body literals. Each relation's tuple list is
+;; deduplicated on insert.
+;;
+;; Phase 3 makes no distinction between EDB (asserted) and IDB (derived);
+;; a future phase may track provenance for retraction.
+
+(define dl-make-db (fn () {:facts {} :rules (list)}))
+
+;; The relation name (as string) of a positive literal, or of the
+;; underlying literal of a negative one. nil for malformed input.
+(define
+  dl-rel-name
+  (fn
+    (lit)
+    (cond
+      ((and (dict? lit) (has-key? lit :neg)) (dl-rel-name (get lit :neg)))
+      ((and (list? lit) (> (len lit) 0) (symbol? (first lit)))
+        (symbol->string (first lit)))
+      (else nil))))
+
+(define dl-builtin-rels (list "<" "<=" ">" ">=" "=" "!=" "is"))
+
+(define
+  dl-member-string?
+  (fn
+    (s xs)
+    (cond
+      ((= (len xs) 0) false)
+      ((= (first xs) s) true)
+      (else (dl-member-string? s (rest xs))))))
+
+(define
+  dl-builtin?
+  (fn
+    (lit)
+    (and
+      (list? lit)
+      (> (len lit) 0)
+      (let
+        ((rel (dl-rel-name lit)))
+        (cond
+          ((nil? rel) false)
+          (else (dl-member-string? rel dl-builtin-rels)))))))
+
+(define
+  dl-positive-lit?
+  (fn
+    (lit)
+    (cond
+      ((and (dict? lit) (has-key? lit :neg)) false)
+      ((dl-builtin? lit) false)
+      ((and (list? lit) (> (len lit) 0)) true)
+      (else false))))
+
+;; Membership using dl-deep tuple equality (handles var/constant symbols
+;; and numbers consistently).
+(define
+  dl-tuple-equal?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-tuple-equal-list? a b 0)))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-tuple-equal-list?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-tuple-equal? (nth a i) (nth b i))) false)
+      (else (dl-tuple-equal-list? a b (+ i 1))))))
+
+(define
+  dl-tuple-member?
+  (fn
+    (lit lits)
+    (cond
+      ((= (len lits) 0) false)
+      ((dl-tuple-equal? lit (first lits)) true)
+      (else (dl-tuple-member? lit (rest lits))))))
+
+;; Ensure :facts has a list for the given relation key, then return it.
+(define
+  dl-ensure-rel!
+  (fn
+    (db rel-key)
+    (let
+      ((facts (get db :facts)))
+      (do
+        (when
+          (not (has-key? facts rel-key))
+          (dict-set! facts rel-key (list)))
+        (get facts rel-key)))))
+
+;; All tuples currently known for a relation (EDB ∪ IDB). Returns empty
+;; list when relation hasn't been seen.
+(define
+  dl-rel-tuples
+  (fn
+    (db rel-key)
+    (let
+      ((facts (get db :facts)))
+      (if (has-key? facts rel-key) (get facts rel-key) (list)))))
+
+;; Add a ground literal. Returns true iff the literal was new.
+(define
+  dl-add-fact!
+  (fn
+    (db lit)
+    (cond
+      ((not (and (list? lit) (> (len lit) 0)))
+        (error (str "dl-add-fact!: expected literal list, got " lit)))
+      ((not (dl-ground? lit (dl-empty-subst)))
+        (error (str "dl-add-fact!: expected ground literal, got " lit)))
+      (else
+        (let
+          ((rel-key (dl-rel-name lit)))
+          (let
+            ((tuples (dl-ensure-rel! db rel-key)))
+            (cond
+              ((dl-tuple-member? lit tuples) false)
+              (else (do (append! tuples lit) true)))))))))
+
+;; Collect variables appearing in the positive body literals of `body`.
+(define
+  dl-positive-body-vars
+  (fn
+    (body)
+    (let
+      ((vars (list)))
+      (do
+        (for-each
+          (fn
+            (lit)
+            (when
+              (dl-positive-lit? lit)
+              (for-each
+                (fn
+                  (v)
+                  (when (not (dl-member-string? v vars)) (append! vars v)))
+                (dl-vars-of lit))))
+          body)
+        vars))))
+
+;; Collect variables in any literal (positive, negated, or built-in).
+(define
+  dl-all-body-vars
+  (fn
+    (body)
+    (let
+      ((vars (list)))
+      (do
+        (for-each
+          (fn
+            (lit)
+            (let
+              ((target (if (and (dict? lit) (has-key? lit :neg)) (get lit :neg) lit)))
+              (for-each
+                (fn
+                  (v)
+                  (when (not (dl-member-string? v vars)) (append! vars v)))
+                (dl-vars-of target))))
+          body)
+        vars))))
+
+;; Return the list of head variables NOT covered by some positive body
+;; literal. A safe rule has an empty list. The check ignores '_' since
+;; that is treated as a fresh anonymous variable per occurrence.
+(define
+  dl-rule-unsafe-head-vars
+  (fn
+    (rule)
+    (let
+      ((head (get rule :head))
+        (body (get rule :body))
+        (head-vars (dl-vars-of head))
+        (body-vars (dl-positive-body-vars body))
+        (out (list)))
+      (do
+        (for-each
+          (fn
+            (v)
+            (when
+              (and (not (dl-member-string? v body-vars)) (not (= v "_")))
+              (append! out v)))
+          head-vars)
+        out))))
+
+;; Add a rule. Rejects unsafe rules with a pointer at the offending var.
+(define
+  dl-add-rule!
+  (fn
+    (db rule)
+    (cond
+      ((not (dict? rule))
+        (error (str "dl-add-rule!: expected rule dict, got " rule)))
+      ((not (has-key? rule :head))
+        (error (str "dl-add-rule!: rule missing :head, got " rule)))
+      (else
+        (let
+          ((unsafe (dl-rule-unsafe-head-vars rule)))
+          (cond
+            ((> (len unsafe) 0)
+              (error
+                (str
+                  "dl-add-rule!: unsafe rule — head variable(s) "
+                  unsafe
+                  " do not appear in any positive body literal of "
+                  rule)))
+            (else
+              (let
+                ((rules (get db :rules)))
+                (do (append! rules rule) true)))))))))
+
+;; Load a parsed clause (fact or rule) into the db. Queries are ignored.
+(define
+  dl-add-clause!
+  (fn
+    (db clause)
+    (cond
+      ((has-key? clause :query) false)
+      ((and (has-key? clause :body) (= (len (get clause :body)) 0))
+        (dl-add-fact! db (get clause :head)))
+      (else (dl-add-rule! db clause)))))
+
+;; Parse source text and load every clause into the db. Returns the db.
+(define
+  dl-load-program!
+  (fn
+    (db source)
+    (let
+      ((clauses (dl-parse source)))
+      (do (for-each (fn (c) (dl-add-clause! db c)) clauses) db))))
+
+;; Convenience: build a db from source in one step.
+(define
+  dl-program
+  (fn (source) (let ((db (dl-make-db))) (dl-load-program! db source))))
+
+(define dl-rules (fn (db) (get db :rules)))
+
+;; Total number of stored ground tuples across all relations.
+(define
+  dl-fact-count
+  (fn
+    (db)
+    (let
+      ((facts (get db :facts)) (total 0))
+      (do
+        (for-each
+          (fn (k) (set! total (+ total (len (get facts k)))))
+          (keys facts))
+        total))))
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
new file mode 100644
index 00000000..68c83550
--- /dev/null
+++ b/lib/datalog/eval.sx
@@ -0,0 +1,153 @@
+;; lib/datalog/eval.sx — naive bottom-up fixpoint evaluator.
+;;
+;; (dl-saturate! db) iterates rules until no new tuples are derived.
+;; The Herbrand base is finite (no function symbols) so termination is
+;; guaranteed by the language.
+;;
+;; Phase 3 handles only positive EDB literals. Negation (Phase 7) and
+;; arithmetic built-ins (Phase 4) raise a clear error if encountered.
+
+;; Match a positive literal against every tuple in the relation; return
+;; a list of extended substitutions, one per successful unification.
+(define
+  dl-match-positive
+  (fn
+    (lit db subst)
+    (let
+      ((rel (dl-rel-name lit)) (results (list)))
+      (cond
+        ((nil? rel) (error (str "dl-match-positive: bad literal " lit)))
+        (else
+          (let
+            ((tuples (dl-rel-tuples db rel)))
+            (do
+              (for-each
+                (fn
+                  (tuple)
+                  (let
+                    ((s (dl-unify lit tuple subst)))
+                    (when (not (nil? s)) (append! results s))))
+                tuples)
+              results)))))))
+
+(define
+  dl-match-lit
+  (fn
+    (lit db subst)
+    (cond
+      ((and (dict? lit) (has-key? lit :neg))
+        (error "datalog: negation not yet supported (Phase 7)"))
+      ((dl-builtin? lit)
+        (error "datalog: built-in predicate not yet supported (Phase 4)"))
+      ((and (list? lit) (> (len lit) 0))
+        (dl-match-positive lit db subst))
+      (else (error (str "datalog: unknown body-literal shape: " lit))))))
+
+;; Recursively find all substitutions satisfying a list of body literals
+;; under `subst`. Returns a list of substitutions.
+(define
+  dl-find-bindings
+  (fn
+    (lits db subst)
+    (cond
+      ((nil? subst) (list))
+      ((= (len lits) 0) (list subst))
+      (else
+        (let
+          ((options (dl-match-lit (first lits) db subst))
+            (results (list)))
+          (do
+            (for-each
+              (fn
+                (s)
+                (for-each
+                  (fn (s2) (append! results s2))
+                  (dl-find-bindings (rest lits) db s)))
+              options)
+            results))))))
+
+;; Apply a rule once. Returns true if any new tuple was derived.
+(define
+  dl-apply-rule!
+  (fn
+    (db rule)
+    (let
+      ((head (get rule :head)) (body (get rule :body)) (new? false))
+      (do
+        (for-each
+          (fn
+            (s)
+            (let
+              ((derived (dl-apply-subst head s)))
+              (when (dl-add-fact! db derived) (set! new? true))))
+          (dl-find-bindings body db (dl-empty-subst)))
+        new?))))
+
+;; Iterate rules to fixpoint.
+(define
+  dl-saturate!
+  (fn
+    (db)
+    (let
+      ((changed true))
+      (do
+        (define
+          dl-sat-loop
+          (fn
+            ()
+            (when
+              changed
+              (do
+                (set! changed false)
+                (for-each
+                  (fn (r) (when (dl-apply-rule! db r) (set! changed true)))
+                  (dl-rules db))
+                (dl-sat-loop)))))
+        (dl-sat-loop)
+        db))))
+
+;; Run a goal against the saturated db. Returns a list of substitutions
+;; (each restricted to the variables that appeared in `goal`). Duplicate
+;; projections are deduplicated so users get the set of answers.
+(define
+  dl-query
+  (fn
+    (db goal)
+    (do
+      (dl-saturate! db)
+      (let
+        ((substs (dl-find-bindings (list goal) db (dl-empty-subst)))
+          (vars (dl-vars-of goal))
+          (results (list)))
+        (do
+          (for-each
+            (fn
+              (s)
+              (let
+                ((proj (dl-project-subst s vars)))
+                (when
+                  (not (dl-tuple-member? proj results))
+                  (append! results proj))))
+            substs)
+          results)))))
+
+;; Project a subst down to a given set of variable names.
+(define
+  dl-project-subst
+  (fn
+    (subst names)
+    (let
+      ((out {}))
+      (do
+        (for-each
+          (fn
+            (n)
+            (let
+              ((sym (string->symbol n)))
+              (let
+                ((v (dl-walk sym subst)))
+                (dict-set! out n (dl-apply-subst v subst)))))
+          names)
+        out))))
+
+(define dl-relation (fn (db name) (dl-rel-tuples db name)))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 837e746f..11113c5c 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,12 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 72,
+  "total_passed": 87,
   "total_failed": 0,
-  "total": 72,
+  "total": 87,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
-    {"name":"unify","passed":28,"failed":0,"total":28}
+    {"name":"unify","passed":28,"failed":0,"total":28},
+    {"name":"eval","passed":15,"failed":0,"total":15}
   ],
-  "generated": "2026-05-07T23:34:02+00:00"
+  "generated": "2026-05-07T23:40:51+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 729e0fa9..e921fcfd 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,9 +1,10 @@
 # datalog scoreboard
 
-**72 / 72 passing** (0 failure(s)).
+**87 / 87 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
+| eval | 15 | 15 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
new file mode 100644
index 00000000..1c51e9b4
--- /dev/null
+++ b/lib/datalog/tests/eval.sx
@@ -0,0 +1,206 @@
+;; lib/datalog/tests/eval.sx — naive evaluation + safety analysis tests.
+
+(define dl-et-pass 0)
+(define dl-et-fail 0)
+(define dl-et-failures (list))
+
+;; Same deep-equal helper used in other suites.
+(define
+  dl-et-deep=?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-et-deq-l? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let
+          ((ka (keys a)) (kb (keys b)))
+          (and (= (len ka) (len kb)) (dl-et-deq-d? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-et-deq-l?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-et-deep=? (nth a i) (nth b i))) false)
+      (else (dl-et-deq-l? a b (+ i 1))))))
+
+(define
+  dl-et-deq-d?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i))) (not (dl-et-deep=? (get a k) (get b k))))
+        false)
+      (else (dl-et-deq-d? a b ka (+ i 1))))))
+
+;; Set-equality on lists (order-independent, uses dl-et-deep=?).
+(define
+  dl-et-set=?
+  (fn
+    (a b)
+    (and (= (len a) (len b)) (dl-et-subset? a b) (dl-et-subset? b a))))
+
+(define
+  dl-et-subset?
+  (fn
+    (xs ys)
+    (cond
+      ((= (len xs) 0) true)
+      ((not (dl-et-contains? ys (first xs))) false)
+      (else (dl-et-subset? (rest xs) ys)))))
+
+(define
+  dl-et-contains?
+  (fn
+    (xs target)
+    (cond
+      ((= (len xs) 0) false)
+      ((dl-et-deep=? (first xs) target) true)
+      (else (dl-et-contains? (rest xs) target)))))
+
+(define
+  dl-et-test!
+  (fn
+    (name got expected)
+    (if
+      (dl-et-deep=? got expected)
+      (set! dl-et-pass (+ dl-et-pass 1))
+      (do
+        (set! dl-et-fail (+ dl-et-fail 1))
+        (append!
+          dl-et-failures
+          (str name "\n    expected: " expected "\n    got:      " got))))))
+
+(define
+  dl-et-test-set!
+  (fn
+    (name got expected)
+    (if
+      (dl-et-set=? got expected)
+      (set! dl-et-pass (+ dl-et-pass 1))
+      (do
+        (set! dl-et-fail (+ dl-et-fail 1))
+        (append!
+          dl-et-failures
+          (str
+            name
+            "\n    expected (set): "
+            expected
+            "\n    got:            "
+            got))))))
+
+(define
+  dl-et-throws?
+  (fn
+    (thunk)
+    (let
+      ((threw false))
+      (do (guard (e (#t (set! threw true))) (thunk)) threw))))
+
+(define
+  dl-et-run-all!
+  (fn
+    ()
+    (do
+      (dl-et-test-set!
+        "fact lookup any"
+        (dl-query
+          (dl-program "parent(tom, bob). parent(bob, ann).")
+          (list (quote parent) (quote X) (quote Y)))
+        (list {:X (quote tom) :Y (quote bob)} {:X (quote bob) :Y (quote ann)}))
+      (dl-et-test-set!
+        "fact lookup constant arg"
+        (dl-query
+          (dl-program "parent(tom, bob). parent(tom, liz). parent(bob, ann).")
+          (list (quote parent) (quote tom) (quote Y)))
+        (list {:Y (quote bob)} {:Y (quote liz)}))
+      (dl-et-test-set!
+        "no match"
+        (dl-query
+          (dl-program "parent(tom, bob).")
+          (list (quote parent) (quote nobody) (quote X)))
+        (list))
+      (dl-et-test-set!
+        "ancestor closure"
+        (dl-query
+          (dl-program
+            "parent(tom, bob). parent(bob, ann). parent(ann, pat).\n             ancestor(X, Y) :- parent(X, Y).\n             ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")
+          (list (quote ancestor) (quote tom) (quote X)))
+        (list {:X (quote bob)} {:X (quote ann)} {:X (quote pat)}))
+      (dl-et-test-set!
+        "sibling"
+        (dl-query
+          (dl-program
+            "parent(tom, bob). parent(tom, liz). parent(jane, bob). parent(jane, liz).\n             sibling(X, Y) :- parent(P, X), parent(P, Y).")
+          (list (quote sibling) (quote bob) (quote Y)))
+        (list {:Y (quote bob)} {:Y (quote liz)}))
+      (dl-et-test-set!
+        "same-generation"
+        (dl-query
+          (dl-program
+            "parent(tom, bob). parent(tom, liz). parent(bob, ann). parent(liz, joe).\n             person(tom). person(bob). person(liz). person(ann). person(joe).\n             sg(X, X) :- person(X).\n             sg(X, Y) :- parent(P1, X), sg(P1, P2), parent(P2, Y).")
+          (list (quote sg) (quote ann) (quote X)))
+        (list {:X (quote ann)} {:X (quote joe)}))
+      (dl-et-test!
+        "ancestor count"
+        (let
+          ((db (dl-program "parent(a, b). parent(b, c). parent(c, d).\n                  ancestor(X, Y) :- parent(X, Y).\n                  ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (do (dl-saturate! db) (len (dl-relation db "ancestor"))))
+        6)
+      (dl-et-test-set!
+        "grandparent"
+        (dl-query
+          (dl-program
+            "parent(a, b). parent(b, c). parent(c, d).\n             grandparent(X, Z) :- parent(X, Y), parent(Y, Z).")
+          (list (quote grandparent) (quote X) (quote Y)))
+        (list {:X (quote a) :Y (quote c)} {:X (quote b) :Y (quote d)}))
+      (dl-et-test!
+        "no recursion infinite loop"
+        (let
+          ((db (dl-program "edge(1, 2). edge(2, 3). edge(3, 1).\n                  reach(X, Y) :- edge(X, Y).\n                  reach(X, Z) :- edge(X, Y), reach(Y, Z).")))
+          (do (dl-saturate! db) (len (dl-relation db "reach"))))
+        9)
+      (dl-et-test!
+        "unsafe head var"
+        (dl-et-throws? (fn () (dl-program "p(X, Y) :- q(X).")))
+        true)
+      (dl-et-test!
+        "unsafe — empty body"
+        (dl-et-throws? (fn () (dl-program "p(X) :- .")))
+        true)
+      (dl-et-test!
+        "underscore var ok"
+        (dl-et-throws? (fn () (dl-program "p(X, _) :- q(X).")))
+        false)
+      (dl-et-test!
+        "var only in head — unsafe"
+        (dl-et-throws? (fn () (dl-program "p(X, Y) :- q(Z).")))
+        true)
+      (dl-et-test!
+        "head var bound by body"
+        (dl-et-throws? (fn () (dl-program "p(X) :- q(X).")))
+        false)
+      (dl-et-test!
+        "head subset of body"
+        (dl-et-throws?
+          (fn
+            ()
+            (dl-program
+              "edge(a,b). edge(b,c). reach(X, Z) :- edge(X, Y), edge(Y, Z).")))
+        false))))
+
+(define
+  dl-eval-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-et-pass 0)
+      (set! dl-et-fail 0)
+      (set! dl-et-failures (list))
+      (dl-et-run-all!)
+      {:failures dl-et-failures :total (+ dl-et-pass dl-et-fail) :passed dl-et-pass :failed dl-et-fail})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 68dc785f..c978043c 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -82,15 +82,26 @@ Key differences from Prolog:
       Lists/tuples unify element-wise (used for arithmetic compounds too).
 - [x] Tests in `lib/datalog/tests/unify.sx` (28). 72 / 72 conformance.
 
-### Phase 3 — extensional DB + naive evaluation
-- [ ] EDB: `{:relation-name → set-of-ground-tuples}` using SX sets (Phase 18 of primitives)
-- [ ] `dl-add-fact!` `db` `relation` `args` → add ground tuple
-- [ ] `dl-add-rule!` `db` `head` `body` → add rule clause
-- [ ] Naive evaluation: iterate rules until fixpoint
-      For each rule, for each combination of body tuples that unify, derive head tuple.
-      Repeat until no new tuples added.
-- [ ] `dl-query` `db` `goal` → list of substitutions satisfying goal against derived DB
-- [ ] Tests: transitive closure (ancestor), sibling, same-generation — classic Datalog programs
+### Phase 3 — extensional DB + naive evaluation + safety analysis
+- [x] EDB+IDB combined: `{:facts {<rel-name-string> -> (literal ...)}}` —
+      relations indexed by name; tuples stored as full literals so they
+      unify directly. Dedup on insert via `dl-tuple-equal?`.
+- [x] `dl-add-fact! db lit` (rejects non-ground) and `dl-add-rule! db rule`
+      (rejects unsafe). `dl-program source` parses + loads in one step.
+- [x] Naive evaluation `dl-saturate! db`: iterate rules until no new tuples.
+      `dl-find-bindings` recursively joins body literals; `dl-match-positive`
+      unifies a literal against every tuple in the relation.
+- [x] `dl-query db goal` → list of substitutions over `goal`'s vars,
+      deduplicated. `dl-relation db name` for derived tuples.
+- [x] Safety analysis at `dl-add-rule!` time: every head variable except
+      `_` must appear in some positive body literal. Built-ins and negated
+      literals do not satisfy safety. Helpers `dl-positive-body-vars`,
+      `dl-rule-unsafe-head-vars` exposed for later phases.
+- [x] Negation and arithmetic built-ins error cleanly at saturate time
+      (Phase 4 / Phase 7 will swap in real semantics).
+- [x] Tests in `lib/datalog/tests/eval.sx` (15): transitive closure,
+      sibling, same-generation, grandparent, cyclic graph reach, six
+      safety cases. 87 / 87 conformance.
 
 ### Phase 4 — semi-naive evaluation (performance)
 - [ ] Delta sets: track newly derived tuples per iteration
@@ -149,6 +160,17 @@ _(none yet)_
 
 _Newest first._
 
+- 2026-05-07 — Phase 3 done. `lib/datalog/db.sx` (~250 LOC) holds facts
+  indexed by relation name plus the rules list, with `dl-add-fact!` /
+  `dl-add-rule!` (rejects non-ground facts and unsafe rules);
+  `lib/datalog/eval.sx` (~150 LOC) implements the naive bottom-up
+  fixpoint via `dl-find-bindings`/`dl-match-positive`/`dl-saturate!`
+  and `dl-query` (deduped projected substitutions). Safety analysis
+  rejects unsafe head vars at load time. Negation and arithmetic
+  built-ins raise clean errors (lifted in later phases). 15 eval
+  tests cover transitive closure, sibling, same-generation, cyclic
+  graph reach, and six safety violations. Conformance 87 / 87.
+
 - 2026-05-07 — Phase 2 done. `lib/datalog/unify.sx` (~140 LOC):
   `dl-var?` (case + underscore), `dl-walk`, `dl-bind`, `dl-unify` (returns
   extended dict subst or `nil`), `dl-apply-subst`, `dl-ground?`, `dl-vars-of`.

From 6457eb668cc2f0e0a62950b361628462c687a3d7 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Thu, 7 May 2026 23:42:34 +0000
Subject: [PATCH 05/89] =?UTF-8?q?datalog-plan:=20align=20roadmap=20with=20?=
 =?UTF-8?q?briefing=20=E2=80=94=20insert=20built-ins=20(P4)=20and=20magic?=
 =?UTF-8?q?=20sets=20(P6)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 plans/datalog-on-sx.md | 58 ++++++++++++++++++++++++++++++++++--------
 1 file changed, 47 insertions(+), 11 deletions(-)

diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index c978043c..6f74f6d6 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -103,23 +103,59 @@ Key differences from Prolog:
       sibling, same-generation, grandparent, cyclic graph reach, six
       safety cases. 87 / 87 conformance.
 
-### Phase 4 — semi-naive evaluation (performance)
+### Phase 4 — built-in predicates + body arithmetic
+Almost every real query needs `<`, `=`, simple arithmetic, and string
+comparisons in body position. These are not EDB lookups — they're
+constraints that filter bindings.
+- [ ] Recognise built-in predicates in body: `(< X Y)`, `(<= X Y)`, `(> X Y)`,
+      `(>= X Y)`, `(= X Y)`, `(!= X Y)` and arithmetic forms `(is Z (+ X Y))`,
+      `(is Z (- X Y))`, `(is Z (* X Y))`, `(is Z (/ X Y))`.
+- [ ] Built-in evaluation: at the join step, after binding variables from
+      EDB lookups, evaluate built-ins as constraints. If any built-in fails
+      or has unbound inputs, drop the candidate substitution.
+- [ ] **Safety extension**: `is` binds its left operand iff right operand is
+      fully ground. `(< X Y)` requires both X and Y bound by some prior body
+      literal — reject unsafe at `dl-add-rule!` time.
+- [ ] Wire arithmetic operators through to SX numeric primitives — no
+      separate Datalog number tower.
+- [ ] Tests: range filters, arithmetic derivations, comparison-based
+      queries, safety violation on `(p X) :- (< X 5).`
+
+### Phase 5 — semi-naive evaluation (performance)
 - [ ] Delta sets: track newly derived tuples per iteration
 - [ ] Semi-naive rule: only join against delta tuples from last iteration, not full relation
 - [ ] Significant speedup for recursive rules — avoids re-deriving known tuples
-- [ ] `dl-stratify` `db` → dependency graph + SCC analysis → stratum ordering
 - [ ] Tests: verify semi-naive produces same results as naive; benchmark on large ancestor chain
 
-### Phase 5 — stratified negation
+### Phase 6 — magic sets (goal-directed bottom-up, opt-in)
+Naive bottom-up derives **all** consequences before answering. Magic sets
+rewrite the program so the fixpoint only derives tuples relevant to the
+goal — a major perf win for "what's reachable from node X" queries on
+large graphs.
+- [ ] Adornments: annotate rule predicates with bound (`b`) / free (`f`)
+      patterns based on how they're called.
+- [ ] Magic transformation: for each adorned predicate, generate a
+      `magic_<pred>` relation and rewrite rule bodies to filter through it.
+- [ ] Sideways information passing strategy (SIPS): left-to-right by
+      default; pluggable.
+- [ ] Optional pass — `(dl-set-strategy! db :magic)`; default semi-naive.
+- [ ] Tests: equivalence vs naive on small inputs; perf win on a 10k-node
+      reachability query from a single root.
+
+### Phase 7 — stratified negation
 - [ ] Dependency graph analysis: which relations depend on which (positively or negatively)
 - [ ] Stratification check: error if negation is in a cycle (non-stratifiable program)
-- [ ] Evaluation: process strata in order — lower stratum fully computed before using its
-      complement in a higher stratum
-- [ ] `not(P)` in rule body: at evaluation time, check P is NOT in the derived EDB
-- [ ] Tests: non-member (`not(member(X,L))`), colored-graph (`not(same-color(X,Y))`),
-      stratification error detection
+- [ ] `dl-stratify db` → SCC analysis → stratum ordering
+- [ ] Evaluation: process strata in order — lower stratum fully computed
+      before using its complement in a higher stratum
+- [ ] `not(P)` in rule body: at evaluation time, check P is NOT in the
+      derived EDB
+- [ ] Safety extension: head vars in negative literals must also appear in
+      some positive body literal of the same rule
+- [ ] Tests: non-member (`not(member(X,L))`), colored-graph
+      (`not(same-color(X,Y))`), stratification error detection
 
-### Phase 6 — aggregation (Datalog+)
+### Phase 8 — aggregation (Datalog+)
 - [ ] `count(X, Goal)` → number of distinct X satisfying Goal
 - [ ] `sum(X, Goal)` → sum of X values satisfying Goal
 - [ ] `min(X, Goal)` / `max(X, Goal)` → min/max of X satisfying Goal
@@ -127,7 +163,7 @@ Key differences from Prolog:
 - [ ] Aggregation breaks stratification — evaluate in a separate post-fixpoint pass
 - [ ] Tests: social network statistics, grade aggregation, inventory sums
 
-### Phase 7 — SX embedding API
+### Phase 9 — SX embedding API
 - [ ] `(dl-program facts rules)` → database from SX data directly (no parsing required)
       ```
       (dl-program
@@ -141,7 +177,7 @@ Key differences from Prolog:
 - [ ] Integration demo: federation graph query — `(ancestor actor1 actor2)` over
       rose-ash ActivityPub follow relationships
 
-### Phase 8 — Datalog as a query language for rose-ash
+### Phase 10 — Datalog as a query language for rose-ash
 - [ ] Schema: map SQLAlchemy model relationships to Datalog EDB facts
       (e.g. `(follows user1 user2)`, `(authored user post)`, `(tagged post tag)`)
 - [ ] Loader: `dl-load-from-db!` — query PostgreSQL, populate Datalog EDB

From 7ce723f73233c97cecdd4e212302168410aa86f3 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Thu, 7 May 2026 23:51:21 +0000
Subject: [PATCH 06/89] datalog: built-ins + body arithmetic + order-aware
 safety (Phase 4, 106/106)

New lib/datalog/builtins.sx: (< <= > >= = !=) and (is X expr) with
+ - * /. dl-eval-arith recursively evaluates nested compounds.
Safety analysis now walks body left-to-right tracking the bound
set: comparisons require all args bound, is RHS vars must be bound
(LHS becomes bound), = special-cases the var/non-var combos.
db.sx keeps the simple safety check as a forward-reference
fallback; builtins.sx redefines dl-rule-check-safety to the
comprehensive version. eval.sx dispatches built-ins through
dl-eval-builtin instead of erroring. 19 new tests.
---
 lib/datalog/builtins.sx       | 300 ++++++++++++++++++++++++++++++++++
 lib/datalog/conformance.conf  |   2 +
 lib/datalog/db.sx             | 124 +++++---------
 lib/datalog/eval.sx           |  20 +--
 lib/datalog/scoreboard.json   |   9 +-
 lib/datalog/scoreboard.md     |   3 +-
 lib/datalog/tests/builtins.sx | 228 ++++++++++++++++++++++++++
 plans/datalog-on-sx.md        |  41 +++--
 8 files changed, 617 insertions(+), 110 deletions(-)
 create mode 100644 lib/datalog/builtins.sx
 create mode 100644 lib/datalog/tests/builtins.sx

diff --git a/lib/datalog/builtins.sx b/lib/datalog/builtins.sx
new file mode 100644
index 00000000..dfd2307a
--- /dev/null
+++ b/lib/datalog/builtins.sx
@@ -0,0 +1,300 @@
+;; lib/datalog/builtins.sx — comparison + arithmetic body literals.
+;;
+;; Built-in predicates filter / extend candidate substitutions during
+;; rule evaluation. They are not stored facts and do not participate in
+;; the Herbrand base.
+;;
+;;   (< a b)  (<= a b)  (> a b)  (>= a b)   ; numeric (or string) compare
+;;   (= a b)                                  ; unify (binds vars)
+;;   (!= a b)                                ; ground-only inequality
+;;   (is X expr)                              ; bind X to expr's value
+;;
+;; Arithmetic expressions are SX-list compounds:
+;;   (+ a b)  (- a b)  (* a b)  (/ a b)
+;; or numbers / variables (must be bound at evaluation time).
+
+(define
+  dl-comparison?
+  (fn
+    (lit)
+    (and
+      (list? lit)
+      (> (len lit) 0)
+      (let
+        ((rel (dl-rel-name lit)))
+        (cond
+          ((nil? rel) false)
+          (else (dl-member-string? rel (list "<" "<=" ">" ">=" "!="))))))))
+
+(define
+  dl-eq?
+  (fn
+    (lit)
+    (and
+      (list? lit)
+      (> (len lit) 0)
+      (let ((rel (dl-rel-name lit))) (and (not (nil? rel)) (= rel "=")))))) 
+
+(define
+  dl-is?
+  (fn
+    (lit)
+    (and
+      (list? lit)
+      (> (len lit) 0)
+      (let
+        ((rel (dl-rel-name lit)))
+        (and (not (nil? rel)) (= rel "is")))))) 
+
+;; Evaluate an arithmetic expression under subst. Returns the numeric
+;; result, or raises if any operand is unbound or non-numeric.
+(define
+  dl-eval-arith
+  (fn
+    (expr subst)
+    (let
+      ((w (dl-walk expr subst)))
+      (cond
+        ((number? w) w)
+        ((dl-var? w)
+          (error (str "datalog arith: unbound variable " (symbol->string w))))
+        ((list? w)
+          (let
+            ((rel (dl-rel-name w)) (args (rest w)))
+            (cond
+              ((not (= (len args) 2))
+                (error (str "datalog arith: need 2 args, got " w)))
+              (else
+                (let
+                  ((a (dl-eval-arith (first args) subst))
+                    (b (dl-eval-arith (nth args 1) subst)))
+                  (cond
+                    ((= rel "+") (+ a b))
+                    ((= rel "-") (- a b))
+                    ((= rel "*") (* a b))
+                    ((= rel "/") (/ a b))
+                    (else (error (str "datalog arith: unknown op " rel)))))))))
+        (else (error (str "datalog arith: not a number — " w)))))))
+
+(define
+  dl-eval-compare
+  (fn
+    (lit subst)
+    (let
+      ((rel (dl-rel-name lit))
+        (a (dl-walk (nth lit 1) subst))
+        (b (dl-walk (nth lit 2) subst)))
+      (cond
+        ((or (dl-var? a) (dl-var? b))
+          (error
+            (str
+              "datalog: comparison "
+              rel
+              " has unbound argument; "
+              "ensure prior body literal binds the variable")))
+        (else
+          (let
+            ((ok (cond ((= rel "<") (< a b)) ((= rel "<=") (<= a b)) ((= rel ">") (> a b)) ((= rel ">=") (>= a b)) ((= rel "!=") (not (dl-tuple-equal? a b))) (else (error (str "datalog: unknown compare " rel))))))
+            (if ok subst nil)))))))
+
+(define
+  dl-eval-eq
+  (fn
+    (lit subst)
+    (dl-unify (nth lit 1) (nth lit 2) subst)))
+
+(define
+  dl-eval-is
+  (fn
+    (lit subst)
+    (let
+      ((target (nth lit 1)) (expr (nth lit 2)))
+      (let
+        ((value (dl-eval-arith expr subst)))
+        (dl-unify target value subst)))))
+
+(define
+  dl-eval-builtin
+  (fn
+    (lit subst)
+    (cond
+      ((dl-comparison? lit) (dl-eval-compare lit subst))
+      ((dl-eq? lit) (dl-eval-eq lit subst))
+      ((dl-is? lit) (dl-eval-is lit subst))
+      (else (error (str "dl-eval-builtin: not a built-in: " lit))))))
+
+;; ── Safety analysis ──────────────────────────────────────────────
+;;
+;; Walks body literals left-to-right tracking a "bound" set. The check
+;; understands these literal kinds:
+;;
+;;   positive non-built-in    → adds its vars to bound
+;;   (is X expr)              → vars(expr) ⊆ bound, then add X (if var)
+;;   <,<=,>,>=,!=             → all vars ⊆ bound (no binding)
+;;   (= a b) where:
+;;       both non-vars        → constraint check, no binding
+;;       a var, b not         → bind a
+;;       b var, a not         → bind b
+;;       both vars            → at least one in bound; bind the other
+;;   {:neg lit}               → all vars ⊆ bound (Phase 7 enforces fully)
+;;
+;; At end, head vars (minus `_`) must be ⊆ bound.
+
+(define
+  dl-vars-not-in
+  (fn
+    (vs bound)
+    (let
+      ((out (list)))
+      (do
+        (for-each
+          (fn
+            (v)
+            (when (not (dl-member-string? v bound)) (append! out v)))
+          vs)
+        out))))
+
+(define
+  dl-rule-check-safety
+  (fn
+    (rule)
+    (let
+      ((head (get rule :head))
+        (body (get rule :body))
+        (bound (list))
+        (err nil))
+      (do
+        (define
+          dl-add-bound!
+          (fn
+            (vs)
+            (for-each
+              (fn
+                (v)
+                (when (not (dl-member-string? v bound)) (append! bound v)))
+              vs)))
+        (define
+          dl-process-eq!
+          (fn
+            (lit)
+            (let
+              ((a (nth lit 1)) (b (nth lit 2)))
+              (let
+                ((va (dl-var? a)) (vb (dl-var? b)))
+                (cond
+                  ((and (not va) (not vb)) nil)
+                  ((and va (not vb))
+                    (dl-add-bound! (list (symbol->string a))))
+                  ((and (not va) vb)
+                    (dl-add-bound! (list (symbol->string b))))
+                  (else
+                    (let
+                      ((sa (symbol->string a)) (sb (symbol->string b)))
+                      (cond
+                        ((dl-member-string? sa bound)
+                          (dl-add-bound! (list sb)))
+                        ((dl-member-string? sb bound)
+                          (dl-add-bound! (list sa)))
+                        (else
+                          (set!
+                            err
+                            (str
+                              "= between two unbound variables "
+                              (list sa sb)
+                              " — at least one must be bound by an "
+                              "earlier positive body literal")))))))))))
+        (define
+          dl-process-cmp!
+          (fn
+            (lit)
+            (let
+              ((needed (dl-vars-of (list (nth lit 1) (nth lit 2)))))
+              (let
+                ((missing (dl-vars-not-in needed bound)))
+                (when
+                  (> (len missing) 0)
+                  (set!
+                    err
+                    (str
+                      "comparison "
+                      (dl-rel-name lit)
+                      " requires bound variable(s) "
+                      missing
+                      " (must be bound by an earlier positive "
+                      "body literal)")))))))
+        (define
+          dl-process-is!
+          (fn
+            (lit)
+            (let
+              ((tgt (nth lit 1)) (expr (nth lit 2)))
+              (let
+                ((needed (dl-vars-of expr)))
+                (let
+                  ((missing (dl-vars-not-in needed bound)))
+                  (cond
+                    ((> (len missing) 0)
+                      (set!
+                        err
+                        (str
+                          "is RHS uses unbound variable(s) "
+                          missing
+                          " — bind them via a prior positive body "
+                          "literal")))
+                    (else
+                      (when
+                        (dl-var? tgt)
+                        (dl-add-bound! (list (symbol->string tgt)))))))))))
+        (define
+          dl-process-neg!
+          (fn
+            (lit)
+            (let
+              ((needed (dl-vars-of (get lit :neg))))
+              (let
+                ((missing (dl-vars-not-in needed bound)))
+                (when
+                  (> (len missing) 0)
+                  (set!
+                    err
+                    (str
+                      "negation refers to unbound variable(s) "
+                      missing
+                      " — they must be bound by an earlier "
+                      "positive body literal")))))))
+        (define
+          dl-process-lit!
+          (fn
+            (lit)
+            (when
+              (nil? err)
+              (cond
+                ((and (dict? lit) (has-key? lit :neg))
+                  (dl-process-neg! lit))
+                ((dl-eq? lit) (dl-process-eq! lit))
+                ((dl-is? lit) (dl-process-is! lit))
+                ((dl-comparison? lit) (dl-process-cmp! lit))
+                ((and (list? lit) (> (len lit) 0))
+                  (dl-add-bound! (dl-vars-of lit)))))))
+        (for-each dl-process-lit! body)
+        (when
+          (nil? err)
+          (let
+            ((head-vars (dl-vars-of head)) (missing (list)))
+            (do
+              (for-each
+                (fn
+                  (v)
+                  (when
+                    (and (not (dl-member-string? v bound)) (not (= v "_")))
+                    (append! missing v)))
+                head-vars)
+              (when
+                (> (len missing) 0)
+                (set!
+                  err
+                  (str
+                    "head variable(s) "
+                    missing
+                    " do not appear in any positive body literal"))))))
+        err))))
diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index 58a483bc..8125ba13 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -8,6 +8,7 @@ PRELOADS=(
   lib/datalog/parser.sx
   lib/datalog/unify.sx
   lib/datalog/db.sx
+  lib/datalog/builtins.sx
   lib/datalog/eval.sx
 )
 
@@ -16,4 +17,5 @@ SUITES=(
   "parse:lib/datalog/tests/parse.sx:(dl-parse-tests-run!)"
   "unify:lib/datalog/tests/unify.sx:(dl-unify-tests-run!)"
   "eval:lib/datalog/tests/eval.sx:(dl-eval-tests-run!)"
+  "builtins:lib/datalog/tests/builtins.sx:(dl-builtins-tests-run!)"
 )
diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index af189147..d83a1dcc 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -1,4 +1,4 @@
-;; lib/datalog/db.sx — Datalog database (EDB + IDB + rules) + safety.
+;; lib/datalog/db.sx — Datalog database (EDB + IDB + rules) + safety hook.
 ;;
 ;; A db is a mutable dict:
 ;;   {:facts {<rel-name-string> -> (literal ...)}
@@ -8,13 +8,12 @@
 ;; directly against rule body literals. Each relation's tuple list is
 ;; deduplicated on insert.
 ;;
-;; Phase 3 makes no distinction between EDB (asserted) and IDB (derived);
-;; a future phase may track provenance for retraction.
+;; Phase 3 introduced safety analysis for head variables; Phase 4 (in
+;; lib/datalog/builtins.sx) swaps in the real `dl-rule-check-safety`,
+;; which is order-aware and understands built-in predicates.
 
 (define dl-make-db (fn () {:facts {} :rules (list)}))
 
-;; The relation name (as string) of a positive literal, or of the
-;; underlying literal of a negative one. nil for malformed input.
 (define
   dl-rel-name
   (fn
@@ -59,8 +58,6 @@
       ((and (list? lit) (> (len lit) 0)) true)
       (else false))))
 
-;; Membership using dl-deep tuple equality (handles var/constant symbols
-;; and numbers consistently).
 (define
   dl-tuple-equal?
   (fn
@@ -89,7 +86,6 @@
       ((dl-tuple-equal? lit (first lits)) true)
       (else (dl-tuple-member? lit (rest lits))))))
 
-;; Ensure :facts has a list for the given relation key, then return it.
 (define
   dl-ensure-rel!
   (fn
@@ -102,8 +98,6 @@
           (dict-set! facts rel-key (list)))
         (get facts rel-key)))))
 
-;; All tuples currently known for a relation (EDB ∪ IDB). Returns empty
-;; list when relation hasn't been seen.
 (define
   dl-rel-tuples
   (fn
@@ -112,7 +106,6 @@
       ((facts (get db :facts)))
       (if (has-key? facts rel-key) (get facts rel-key) (list)))))
 
-;; Add a ground literal. Returns true iff the literal was new.
 (define
   dl-add-fact!
   (fn
@@ -131,72 +124,53 @@
               ((dl-tuple-member? lit tuples) false)
               (else (do (append! tuples lit) true)))))))))
 
-;; Collect variables appearing in the positive body literals of `body`.
+;; The full safety check lives in builtins.sx (it has to know which
+;; predicates are built-ins). dl-add-rule! calls it via forward
+;; reference; load builtins.sx alongside db.sx in any setup that
+;; adds rules. The fallback below is used if builtins.sx isn't loaded.
 (define
-  dl-positive-body-vars
-  (fn
-    (body)
-    (let
-      ((vars (list)))
-      (do
-        (for-each
-          (fn
-            (lit)
-            (when
-              (dl-positive-lit? lit)
-              (for-each
-                (fn
-                  (v)
-                  (when (not (dl-member-string? v vars)) (append! vars v)))
-                (dl-vars-of lit))))
-          body)
-        vars))))
-
-;; Collect variables in any literal (positive, negated, or built-in).
-(define
-  dl-all-body-vars
-  (fn
-    (body)
-    (let
-      ((vars (list)))
-      (do
-        (for-each
-          (fn
-            (lit)
-            (let
-              ((target (if (and (dict? lit) (has-key? lit :neg)) (get lit :neg) lit)))
-              (for-each
-                (fn
-                  (v)
-                  (when (not (dl-member-string? v vars)) (append! vars v)))
-                (dl-vars-of target))))
-          body)
-        vars))))
-
-;; Return the list of head variables NOT covered by some positive body
-;; literal. A safe rule has an empty list. The check ignores '_' since
-;; that is treated as a fresh anonymous variable per occurrence.
-(define
-  dl-rule-unsafe-head-vars
+  dl-rule-check-safety
   (fn
     (rule)
     (let
-      ((head (get rule :head))
-        (body (get rule :body))
-        (head-vars (dl-vars-of head))
-        (body-vars (dl-positive-body-vars body))
-        (out (list)))
+      ((head-vars (dl-vars-of (get rule :head))) (body-vars (list)))
       (do
         (for-each
           (fn
-            (v)
+            (lit)
             (when
-              (and (not (dl-member-string? v body-vars)) (not (= v "_")))
-              (append! out v)))
-          head-vars)
-        out))))
+              (and
+                (list? lit)
+                (> (len lit) 0)
+                (not (and (dict? lit) (has-key? lit :neg))))
+              (for-each
+                (fn
+                  (v)
+                  (when
+                    (not (dl-member-string? v body-vars))
+                    (append! body-vars v)))
+                (dl-vars-of lit))))
+          (get rule :body))
+        (let
+          ((missing (list)))
+          (do
+            (for-each
+              (fn
+                (v)
+                (when
+                  (and
+                    (not (dl-member-string? v body-vars))
+                    (not (= v "_")))
+                  (append! missing v)))
+              head-vars)
+            (cond
+              ((> (len missing) 0)
+                (str
+                  "head variable(s) "
+                  missing
+                  " do not appear in any body literal"))
+              (else nil))))))))
 
-;; Add a rule. Rejects unsafe rules with a pointer at the offending var.
 (define
   dl-add-rule!
   (fn
@@ -208,21 +182,14 @@
         (error (str "dl-add-rule!: rule missing :head, got " rule)))
       (else
         (let
-          ((unsafe (dl-rule-unsafe-head-vars rule)))
+          ((err (dl-rule-check-safety rule)))
           (cond
-            ((> (len unsafe) 0)
-              (error
-                (str
-                  "dl-add-rule!: unsafe rule — head variable(s) "
-                  unsafe
-                  " do not appear in any positive body literal of "
-                  rule)))
+            ((not (nil? err)) (error (str "dl-add-rule!: " err)))
             (else
               (let
                 ((rules (get db :rules)))
                 (do (append! rules rule) true)))))))))
 
-;; Load a parsed clause (fact or rule) into the db. Queries are ignored.
 (define
   dl-add-clause!
   (fn
@@ -233,7 +200,6 @@
         (dl-add-fact! db (get clause :head)))
       (else (dl-add-rule! db clause)))))
 
-;; Parse source text and load every clause into the db. Returns the db.
 (define
   dl-load-program!
   (fn
@@ -242,14 +208,12 @@
       ((clauses (dl-parse source)))
       (do (for-each (fn (c) (dl-add-clause! db c)) clauses) db))))
 
-;; Convenience: build a db from source in one step.
 (define
   dl-program
   (fn (source) (let ((db (dl-make-db))) (dl-load-program! db source))))
 
 (define dl-rules (fn (db) (get db :rules)))
 
-;; Total number of stored ground tuples across all relations.
 (define
   dl-fact-count
   (fn
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 68c83550..7c1e7c6c 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -4,11 +4,11 @@
 ;; The Herbrand base is finite (no function symbols) so termination is
 ;; guaranteed by the language.
 ;;
-;; Phase 3 handles only positive EDB literals. Negation (Phase 7) and
-;; arithmetic built-ins (Phase 4) raise a clear error if encountered.
+;; Body literal kinds handled here:
+;;   positive (rel arg ... arg)  → match against EDB+IDB tuples (dl-match-positive)
+;;   built-in (< X Y), (is X e)  → constraint via dl-eval-builtin (Phase 4)
+;;   negation {:neg lit}         → Phase 7
 
-;; Match a positive literal against every tuple in the relation; return
-;; a list of extended substitutions, one per successful unification.
 (define
   dl-match-positive
   (fn
@@ -38,13 +38,13 @@
       ((and (dict? lit) (has-key? lit :neg))
         (error "datalog: negation not yet supported (Phase 7)"))
       ((dl-builtin? lit)
-        (error "datalog: built-in predicate not yet supported (Phase 4)"))
+        (let
+          ((s (dl-eval-builtin lit subst)))
+          (if (nil? s) (list) (list s))))
       ((and (list? lit) (> (len lit) 0))
         (dl-match-positive lit db subst))
       (else (error (str "datalog: unknown body-literal shape: " lit))))))
 
-;; Recursively find all substitutions satisfying a list of body literals
-;; under `subst`. Returns a list of substitutions.
 (define
   dl-find-bindings
   (fn
@@ -66,7 +66,6 @@
               options)
             results))))))
 
-;; Apply a rule once. Returns true if any new tuple was derived.
 (define
   dl-apply-rule!
   (fn
@@ -83,7 +82,6 @@
           (dl-find-bindings body db (dl-empty-subst)))
         new?))))
 
-;; Iterate rules to fixpoint.
 (define
   dl-saturate!
   (fn
@@ -106,9 +104,6 @@
         (dl-sat-loop)
         db))))
 
-;; Run a goal against the saturated db. Returns a list of substitutions
-;; (each restricted to the variables that appeared in `goal`). Duplicate
-;; projections are deduplicated so users get the set of answers.
 (define
   dl-query
   (fn
@@ -131,7 +126,6 @@
             substs)
           results)))))
 
-;; Project a subst down to a given set of variable names.
 (define
   dl-project-subst
   (fn
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 11113c5c..a1933cc5 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,14 @@
 {
   "lang": "datalog",
-  "total_passed": 87,
+  "total_passed": 106,
   "total_failed": 0,
-  "total": 87,
+  "total": 106,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":15,"failed":0,"total":15}
+    {"name":"eval","passed":15,"failed":0,"total":15},
+    {"name":"builtins","passed":19,"failed":0,"total":19}
   ],
-  "generated": "2026-05-07T23:40:51+00:00"
+  "generated": "2026-05-07T23:50:44+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index e921fcfd..2b5954fc 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**87 / 87 passing** (0 failure(s)).
+**106 / 106 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -8,3 +8,4 @@
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
 | eval | 15 | 15 | ok |
+| builtins | 19 | 19 | ok |
diff --git a/lib/datalog/tests/builtins.sx b/lib/datalog/tests/builtins.sx
new file mode 100644
index 00000000..f5136134
--- /dev/null
+++ b/lib/datalog/tests/builtins.sx
@@ -0,0 +1,228 @@
+;; lib/datalog/tests/builtins.sx — comparison + arithmetic body literals.
+
+(define dl-bt-pass 0)
+(define dl-bt-fail 0)
+(define dl-bt-failures (list))
+
+(define
+  dl-bt-deep=?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-bt-deq-l? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let
+          ((ka (keys a)) (kb (keys b)))
+          (and (= (len ka) (len kb)) (dl-bt-deq-d? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-bt-deq-l?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-bt-deep=? (nth a i) (nth b i))) false)
+      (else (dl-bt-deq-l? a b (+ i 1))))))
+
+(define
+  dl-bt-deq-d?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i))) (not (dl-bt-deep=? (get a k) (get b k))))
+        false)
+      (else (dl-bt-deq-d? a b ka (+ i 1))))))
+
+(define
+  dl-bt-set=?
+  (fn
+    (a b)
+    (and (= (len a) (len b)) (dl-bt-subset? a b) (dl-bt-subset? b a))))
+
+(define
+  dl-bt-subset?
+  (fn
+    (xs ys)
+    (cond
+      ((= (len xs) 0) true)
+      ((not (dl-bt-contains? ys (first xs))) false)
+      (else (dl-bt-subset? (rest xs) ys)))))
+
+(define
+  dl-bt-contains?
+  (fn
+    (xs target)
+    (cond
+      ((= (len xs) 0) false)
+      ((dl-bt-deep=? (first xs) target) true)
+      (else (dl-bt-contains? (rest xs) target)))))
+
+(define
+  dl-bt-test-set!
+  (fn
+    (name got expected)
+    (if
+      (dl-bt-set=? got expected)
+      (set! dl-bt-pass (+ dl-bt-pass 1))
+      (do
+        (set! dl-bt-fail (+ dl-bt-fail 1))
+        (append!
+          dl-bt-failures
+          (str
+            name
+            "\n    expected (set): "
+            expected
+            "\n    got:            "
+            got))))))
+
+(define
+  dl-bt-test!
+  (fn
+    (name got expected)
+    (if
+      (dl-bt-deep=? got expected)
+      (set! dl-bt-pass (+ dl-bt-pass 1))
+      (do
+        (set! dl-bt-fail (+ dl-bt-fail 1))
+        (append!
+          dl-bt-failures
+          (str name "\n    expected: " expected "\n    got:      " got))))))
+
+(define
+  dl-bt-throws?
+  (fn
+    (thunk)
+    (let
+      ((threw false))
+      (do (guard (e (#t (set! threw true))) (thunk)) threw))))
+
+(define
+  dl-bt-run-all!
+  (fn
+    ()
+    (do
+      (dl-bt-test-set!
+        "less than filter"
+        (dl-query
+          (dl-program
+            "age(alice, 30). age(bob, 17). age(carol, 22).\n             adult(X) :- age(X, A), >=(A, 18).")
+          (list (quote adult) (quote X)))
+        (list {:X (quote alice)} {:X (quote carol)}))
+      (dl-bt-test-set!
+        "less-equal filter"
+        (dl-query
+          (dl-program
+            "n(1). n(2). n(3). n(4). n(5).\n             small(X) :- n(X), <=(X, 3).")
+          (list (quote small) (quote X)))
+        (list {:X 1} {:X 2} {:X 3}))
+      (dl-bt-test-set!
+        "not-equal filter"
+        (dl-query
+          (dl-program
+            "p(1, 2). p(2, 2). p(3, 4).\n             diff(X, Y) :- p(X, Y), !=(X, Y).")
+          (list (quote diff) (quote X) (quote Y)))
+        (list {:X 1 :Y 2} {:X 3 :Y 4}))
+      (dl-bt-test-set!
+        "is plus"
+        (dl-query
+          (dl-program
+            "n(1). n(2). n(3).\n             succ(X, Y) :- n(X), is(Y, +(X, 1)).")
+          (list (quote succ) (quote X) (quote Y)))
+        (list {:X 1 :Y 2} {:X 2 :Y 3} {:X 3 :Y 4}))
+      (dl-bt-test-set!
+        "is multiply"
+        (dl-query
+          (dl-program
+            "n(2). n(3). n(4).\n             square(X, Y) :- n(X), is(Y, *(X, X)).")
+          (list (quote square) (quote X) (quote Y)))
+        (list {:X 2 :Y 4} {:X 3 :Y 9} {:X 4 :Y 16}))
+      (dl-bt-test-set!
+        "is nested expr"
+        (dl-query
+          (dl-program
+            "n(1). n(2). n(3).\n             f(X, Y) :- n(X), is(Y, *(+(X, 1), 2)).")
+          (list (quote f) (quote X) (quote Y)))
+        (list {:X 1 :Y 4} {:X 2 :Y 6} {:X 3 :Y 8}))
+      (dl-bt-test-set!
+        "is bound LHS — equality"
+        (dl-query
+          (dl-program
+            "n(1, 2). n(2, 5). n(3, 4).\n             succ(X, Y) :- n(X, Y), is(Y, +(X, 1)).")
+          (list (quote succ) (quote X) (quote Y)))
+        (list {:X 1 :Y 2} {:X 3 :Y 4}))
+      (dl-bt-test-set!
+        "triple via is"
+        (dl-query
+          (dl-program
+            "n(1). n(2). n(3).\n             triple(X, Y) :- n(X), is(Y, *(X, 3)).")
+          (list (quote triple) (quote X) (quote Y)))
+        (list {:X 1 :Y 3} {:X 2 :Y 6} {:X 3 :Y 9}))
+      (dl-bt-test-set!
+        "= unifies var with constant"
+        (dl-query
+          (dl-program "p(a). p(b).\n             qual(X) :- p(X), =(X, a).")
+          (list (quote qual) (quote X)))
+        (list {:X (quote a)}))
+      (dl-bt-test-set!
+        "= unifies two vars (one bound)"
+        (dl-query
+          (dl-program "p(a). p(b).\n             twin(X, Y) :- p(X), =(Y, X).")
+          (list (quote twin) (quote X) (quote Y)))
+        (list {:X (quote a) :Y (quote a)} {:X (quote b) :Y (quote b)}))
+      (dl-bt-test!
+        "big count"
+        (let
+          ((db (dl-program "n(0). n(1). n(2). n(3). n(4). n(5). n(6). n(7). n(8). n(9).\n                  big(X) :- n(X), >=(X, 5).")))
+          (do (dl-saturate! db) (len (dl-relation db "big"))))
+        5)
+      (dl-bt-test!
+        "unsafe — comparison without binder"
+        (dl-bt-throws? (fn () (dl-program "p(X) :- <(X, 5).")))
+        true)
+      (dl-bt-test!
+        "unsafe — comparison both unbound"
+        (dl-bt-throws? (fn () (dl-program "p(X, Y) :- <(X, Y), q(X).")))
+        true)
+      (dl-bt-test!
+        "unsafe — is uses unbound RHS var"
+        (dl-bt-throws?
+          (fn () (dl-program "p(X, Y) :- q(X), is(Y, +(X, Z)).")))
+        true)
+      (dl-bt-test!
+        "unsafe — is on its own"
+        (dl-bt-throws? (fn () (dl-program "p(Y) :- is(Y, +(X, 1)).")))
+        true)
+      (dl-bt-test!
+        "unsafe — = between two unbound"
+        (dl-bt-throws? (fn () (dl-program "p(X, Y) :- =(X, Y).")))
+        true)
+      (dl-bt-test!
+        "safe — is binds head var"
+        (dl-bt-throws?
+          (fn () (dl-program "n(1). p(Y) :- n(X), is(Y, +(X, 1)).")))
+        false)
+      (dl-bt-test!
+        "safe — comparison after binder"
+        (dl-bt-throws?
+          (fn () (dl-program "n(1). big(X) :- n(X), >=(X, 0).")))
+        false)
+      (dl-bt-test!
+        "safe — = binds head var"
+        (dl-bt-throws?
+          (fn () (dl-program "p(a). p(b). x(Y) :- p(X), =(Y, X).")))
+        false))))
+
+(define
+  dl-builtins-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-bt-pass 0)
+      (set! dl-bt-fail 0)
+      (set! dl-bt-failures (list))
+      (dl-bt-run-all!)
+      {:failures dl-bt-failures :total (+ dl-bt-pass dl-bt-fail) :passed dl-bt-pass :failed dl-bt-fail})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 6f74f6d6..10ff7f3f 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -107,19 +107,23 @@ Key differences from Prolog:
 Almost every real query needs `<`, `=`, simple arithmetic, and string
 comparisons in body position. These are not EDB lookups — they're
 constraints that filter bindings.
-- [ ] Recognise built-in predicates in body: `(< X Y)`, `(<= X Y)`, `(> X Y)`,
+- [x] Recognise built-in predicates in body: `(< X Y)`, `(<= X Y)`, `(> X Y)`,
       `(>= X Y)`, `(= X Y)`, `(!= X Y)` and arithmetic forms `(is Z (+ X Y))`,
-      `(is Z (- X Y))`, `(is Z (* X Y))`, `(is Z (/ X Y))`.
-- [ ] Built-in evaluation: at the join step, after binding variables from
-      EDB lookups, evaluate built-ins as constraints. If any built-in fails
-      or has unbound inputs, drop the candidate substitution.
-- [ ] **Safety extension**: `is` binds its left operand iff right operand is
-      fully ground. `(< X Y)` requires both X and Y bound by some prior body
-      literal — reject unsafe at `dl-add-rule!` time.
-- [ ] Wire arithmetic operators through to SX numeric primitives — no
-      separate Datalog number tower.
-- [ ] Tests: range filters, arithmetic derivations, comparison-based
-      queries, safety violation on `(p X) :- (< X 5).`
+      `(is Z (- X Y))`, `(is Z (* X Y))`, `(is Z (/ X Y))`. Live in
+      `lib/datalog/builtins.sx`.
+- [x] `dl-eval-builtin` dispatches; `dl-eval-arith` recursively evaluates
+      `(+ a b)` etc. with full nesting. `=` unifies; `!=` rejects equal
+      ground terms.
+- [x] Order-aware safety analysis (`dl-rule-check-safety`): walks body
+      left-to-right tracking which vars are bound. `is`'s RHS vars must
+      be already bound; LHS becomes bound. Comparisons require both
+      sides bound. `=` is special-cased — at least one side bound binds
+      the other. Negation vars must be bound (will be enforced fully in
+      Phase 7).
+- [x] Wired through SX numeric primitives — no separate number tower.
+- [x] Tests in `lib/datalog/tests/builtins.sx` (19): range filters,
+      arithmetic derivations, equality binding, eight safety violations
+      and three safe-shape tests. Conformance 106 / 106.
 
 ### Phase 5 — semi-naive evaluation (performance)
 - [ ] Delta sets: track newly derived tuples per iteration
@@ -196,6 +200,19 @@ _(none yet)_
 
 _Newest first._
 
+- 2026-05-07 — Phase 4 done. `lib/datalog/builtins.sx` (~280 LOC) adds
+  `(< X Y)`, `(<= X Y)`, `(> X Y)`, `(>= X Y)`, `(= X Y)`, `(!= X Y)`,
+  and `(is X expr)` with `+ - * /`. `dl-eval-builtin` dispatches;
+  `dl-eval-arith` recursively evaluates nested compounds. Safety
+  check is now order-aware — it walks body literals left-to-right
+  tracking the bound set, requires comparison/`is` inputs to be
+  already bound, and special-cases `=` (binds the var-side; both
+  sides must include at least one bound to bind the other). Phase 3's
+  simple safety check stays in db.sx as a forward-reference fallback;
+  builtins.sx redefines `dl-rule-check-safety` to the comprehensive
+  version. eval.sx's `dl-match-lit` now dispatches built-ins through
+  `dl-eval-builtin`. 19 builtins tests; conformance 106 / 106.
+
 - 2026-05-07 — Phase 3 done. `lib/datalog/db.sx` (~250 LOC) holds facts
   indexed by relation name plus the rules list, with `dl-add-fact!` /
   `dl-add-rule!` (rejects non-ground facts and unsafe rules);

From d964f58c480e43cca718504c11220af5946c54e9 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 08:13:07 +0000
Subject: [PATCH 07/89] datalog: semi-naive saturator + delta sets (Phase 5,
 114/114)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

dl-saturate! is now semi-naive: tracks a per-relation delta dict,
and on each iteration walks every positive body-literal position,
substituting the delta of its relation while joining the rest
against the previous-iteration DB. Candidates are collected before
mutating the DB so the "full" sides see a consistent snapshot.
Rules with no positive body literal (e.g. (p X) :- (= X 5).)
fall back to a one-shot naive pass via dl-collect-rule-candidates.

dl-saturate-naive! retained as the reference implementation; 8
differential tests compare per-relation tuple counts on every
recursive program. Switched dl-tuple-member? to indexed iteration
instead of recursive rest (eliminates per-step list copy). Larger
chains under bundled conformance trip O(n) membership × CPU
sharing — added a Blocker to swap relations to hash-set membership.
---
 lib/datalog/conformance.conf    |   1 +
 lib/datalog/db.sx               |  12 +-
 lib/datalog/eval.sx             | 228 ++++++++++++++++++++++++++++++--
 lib/datalog/scoreboard.json     |   9 +-
 lib/datalog/scoreboard.md       |   3 +-
 lib/datalog/tests/semi_naive.sx | 151 +++++++++++++++++++++
 plans/datalog-on-sx.md          |  45 ++++++-
 7 files changed, 425 insertions(+), 24 deletions(-)
 create mode 100644 lib/datalog/tests/semi_naive.sx

diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index 8125ba13..af4e41b0 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -18,4 +18,5 @@ SUITES=(
   "unify:lib/datalog/tests/unify.sx:(dl-unify-tests-run!)"
   "eval:lib/datalog/tests/eval.sx:(dl-eval-tests-run!)"
   "builtins:lib/datalog/tests/builtins.sx:(dl-builtins-tests-run!)"
+  "semi_naive:lib/datalog/tests/semi_naive.sx:(dl-semi-naive-tests-run!)"
 )
diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index d83a1dcc..620f565c 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -81,10 +81,16 @@
   dl-tuple-member?
   (fn
     (lit lits)
+    (dl-tuple-member-aux? lit lits 0 (len lits))))
+
+(define
+  dl-tuple-member-aux?
+  (fn
+    (lit lits i n)
     (cond
-      ((= (len lits) 0) false)
-      ((dl-tuple-equal? lit (first lits)) true)
-      (else (dl-tuple-member? lit (rest lits))))))
+      ((>= i n) false)
+      ((dl-tuple-equal? lit (nth lits i)) true)
+      (else (dl-tuple-member-aux? lit lits (+ i 1) n)))))
 
 (define
   dl-ensure-rel!
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 7c1e7c6c..5fb30eb9 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -1,12 +1,17 @@
-;; lib/datalog/eval.sx — naive bottom-up fixpoint evaluator.
+;; lib/datalog/eval.sx — fixpoint evaluator (naive + semi-naive).
 ;;
-;; (dl-saturate! db) iterates rules until no new tuples are derived.
-;; The Herbrand base is finite (no function symbols) so termination is
-;; guaranteed by the language.
+;; Two saturators are exposed:
+;;   `dl-saturate-naive!` — re-joins each rule against the full DB every
+;;     iteration. Reference implementation; useful for differential tests.
+;;   `dl-saturate!`       — semi-naive default. Tracks per-relation delta
+;;     sets and substitutes one positive body literal per rule with the
+;;     delta of its relation, joining the rest against the previous-
+;;     iteration DB. Same fixpoint, dramatically less work on recursive
+;;     rules.
 ;;
-;; Body literal kinds handled here:
-;;   positive (rel arg ... arg)  → match against EDB+IDB tuples (dl-match-positive)
-;;   built-in (< X Y), (is X e)  → constraint via dl-eval-builtin (Phase 4)
+;; Body literal kinds:
+;;   positive (rel arg ... arg)  → match against EDB+IDB tuples
+;;   built-in (< X Y), (is X e)  → constraint via dl-eval-builtin
 ;;   negation {:neg lit}         → Phase 7
 
 (define
@@ -30,6 +35,26 @@
                 tuples)
               results)))))))
 
+;; Match a positive literal against the delta set for its relation only.
+(define
+  dl-match-positive-delta
+  (fn
+    (lit delta subst)
+    (let
+      ((rel (dl-rel-name lit)) (results (list)))
+      (let
+        ((tuples (if (has-key? delta rel) (get delta rel) (list))))
+        (do
+          (for-each
+            (fn
+              (tuple)
+              (let
+                ((s (dl-unify lit tuple subst)))
+                (when (not (nil? s)) (append! results s))))
+            tuples)
+          results)))))
+
+;; Naive matcher (for dl-saturate-naive! and dl-query post-saturation).
 (define
   dl-match-lit
   (fn
@@ -66,6 +91,7 @@
               options)
             results))))))
 
+;; Naive: apply each rule against full DB until no new tuples.
 (define
   dl-apply-rule!
   (fn
@@ -83,14 +109,14 @@
         new?))))
 
 (define
-  dl-saturate!
+  dl-saturate-naive!
   (fn
     (db)
     (let
       ((changed true))
       (do
         (define
-          dl-sat-loop
+          dl-snloop
           (fn
             ()
             (when
@@ -100,10 +126,190 @@
                 (for-each
                   (fn (r) (when (dl-apply-rule! db r) (set! changed true)))
                   (dl-rules db))
-                (dl-sat-loop)))))
-        (dl-sat-loop)
+                (dl-snloop)))))
+        (dl-snloop)
         db))))
 
+;; ── Semi-naive ───────────────────────────────────────────────────
+
+;; Take a snapshot dict {rel -> tuples} of every relation currently in
+;; the DB. Used as initial delta for the first iteration.
+(define
+  dl-snapshot-facts
+  (fn
+    (db)
+    (let
+      ((facts (get db :facts)) (out {}))
+      (do
+        (for-each
+          (fn (k) (dict-set! out k (dl-copy-list (get facts k))))
+          (keys facts))
+        out))))
+
+(define
+  dl-copy-list
+  (fn
+    (xs)
+    (let
+      ((out (list)))
+      (do (for-each (fn (x) (append! out x)) xs) out))))
+
+;; Does any relation in `delta` have ≥1 tuple?
+(define
+  dl-delta-empty?
+  (fn
+    (delta)
+    (let
+      ((ks (keys delta)) (any-non-empty false))
+      (do
+        (for-each
+          (fn
+            (k)
+            (when
+              (> (len (get delta k)) 0)
+              (set! any-non-empty true)))
+          ks)
+        (not any-non-empty)))))
+
+;; Find substitutions such that `lits` are all satisfied AND `delta-idx`
+;; is matched against the per-relation delta only. The other positive
+;; literals match against the snapshot DB (db.facts read at iteration
+;; start). Built-ins and negations behave as in `dl-match-lit`.
+(define
+  dl-find-bindings-semi
+  (fn
+    (lits db delta delta-idx subst)
+    (dl-fbs-aux lits db delta delta-idx 0 subst)))
+
+(define
+  dl-fbs-aux
+  (fn
+    (lits db delta delta-idx i subst)
+    (cond
+      ((nil? subst) (list))
+      ((>= i (len lits)) (list subst))
+      (else
+        (let
+          ((lit (nth lits i))
+            (options
+              (cond
+                ((and (dict? lit) (has-key? lit :neg))
+                  (error "datalog: negation in semi-naive (Phase 7)"))
+                ((dl-builtin? lit)
+                  (let
+                    ((s (dl-eval-builtin lit subst)))
+                    (if (nil? s) (list) (list s))))
+                ((and (list? lit) (> (len lit) 0))
+                  (if
+                    (= i delta-idx)
+                    (dl-match-positive-delta lit delta subst)
+                    (dl-match-positive lit db subst)))
+                (else (error (str "datalog: unknown body-lit: " lit)))))
+            (results (list)))
+          (do
+            (for-each
+              (fn
+                (s)
+                (for-each
+                  (fn (s2) (append! results s2))
+                  (dl-fbs-aux lits db delta delta-idx (+ i 1) s)))
+              options)
+            results))))))
+
+;; Collect candidate head tuples from a rule using delta. Walks every
+;; positive body position and unions the resulting heads. For rules
+;; with no positive body literal, falls back to a naive single-pass
+;; (so static facts like `(p X) :- (= X 5).` derive on iteration 1).
+(define
+  dl-collect-rule-candidates
+  (fn
+    (rule db delta)
+    (let
+      ((head (get rule :head))
+        (body (get rule :body))
+        (out (list))
+        (saw-pos false))
+      (do
+        (define
+          dl-cri
+          (fn
+            (i)
+            (when
+              (< i (len body))
+              (do
+                (let
+                  ((lit (nth body i)))
+                  (when
+                    (dl-positive-lit? lit)
+                    (do
+                      (set! saw-pos true)
+                      (for-each
+                        (fn (s) (append! out (dl-apply-subst head s)))
+                        (dl-find-bindings-semi
+                          body
+                          db
+                          delta
+                          i
+                          (dl-empty-subst))))))
+                (dl-cri (+ i 1))))))
+        (dl-cri 0)
+        (when
+          (not saw-pos)
+          (for-each
+            (fn (s) (append! out (dl-apply-subst head s)))
+            (dl-find-bindings body db (dl-empty-subst))))
+        out))))
+
+;; Add a list of candidate tuples to db; collect newly-added ones into
+;; the new-delta dict (keyed by relation name).
+(define
+  dl-commit-candidates!
+  (fn
+    (db candidates new-delta)
+    (for-each
+      (fn
+        (lit)
+        (when
+          (dl-add-fact! db lit)
+          (let
+            ((rel (dl-rel-name lit)))
+            (do
+              (when
+                (not (has-key? new-delta rel))
+                (dict-set! new-delta rel (list)))
+              (append! (get new-delta rel) lit)))))
+      candidates)))
+
+(define
+  dl-saturate!
+  (fn
+    (db)
+    (let
+      ((delta (dl-snapshot-facts db)))
+      (do
+        (define
+          dl-sn-step
+          (fn
+            ()
+            (let
+              ((pending (list)) (new-delta {}))
+              (do
+                (for-each
+                  (fn
+                    (rule)
+                    (for-each
+                      (fn (cand) (append! pending cand))
+                      (dl-collect-rule-candidates rule db delta)))
+                  (dl-rules db))
+                (dl-commit-candidates! db pending new-delta)
+                (cond
+                  ((dl-delta-empty? new-delta) nil)
+                  (else (do (set! delta new-delta) (dl-sn-step))))))))
+        (dl-sn-step)
+        db))))
+
+;; ── Querying ─────────────────────────────────────────────────────
+
 (define
   dl-query
   (fn
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index a1933cc5..12f28784 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,14 +1,15 @@
 {
   "lang": "datalog",
-  "total_passed": 106,
+  "total_passed": 114,
   "total_failed": 0,
-  "total": 106,
+  "total": 114,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":15,"failed":0,"total":15},
-    {"name":"builtins","passed":19,"failed":0,"total":19}
+    {"name":"builtins","passed":19,"failed":0,"total":19},
+    {"name":"semi_naive","passed":8,"failed":0,"total":8}
   ],
-  "generated": "2026-05-07T23:50:44+00:00"
+  "generated": "2026-05-08T08:12:42+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 2b5954fc..cac00351 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**106 / 106 passing** (0 failure(s)).
+**114 / 114 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -9,3 +9,4 @@
 | unify | 28 | 28 | ok |
 | eval | 15 | 15 | ok |
 | builtins | 19 | 19 | ok |
+| semi_naive | 8 | 8 | ok |
diff --git a/lib/datalog/tests/semi_naive.sx b/lib/datalog/tests/semi_naive.sx
new file mode 100644
index 00000000..5ff6a3a5
--- /dev/null
+++ b/lib/datalog/tests/semi_naive.sx
@@ -0,0 +1,151 @@
+;; lib/datalog/tests/semi_naive.sx — semi-naive correctness vs naive.
+;;
+;; Strategy: differential — run both saturators on each program and
+;; compare the resulting per-relation tuple counts. Counting (not
+;; element-wise set equality) keeps the suite fast under the bundled
+;; conformance session; correctness on the inhabitants is covered by
+;; eval.sx and builtins.sx (which use dl-saturate! by default — the
+;; semi-naive saturator).
+
+(define dl-sn-pass 0)
+(define dl-sn-fail 0)
+(define dl-sn-failures (list))
+
+(define
+  dl-sn-test!
+  (fn
+    (name got expected)
+    (if
+      (equal? got expected)
+      (set! dl-sn-pass (+ dl-sn-pass 1))
+      (do
+        (set! dl-sn-fail (+ dl-sn-fail 1))
+        (append!
+          dl-sn-failures
+          (str name "\n    expected: " expected "\n    got:      " got))))))
+
+;; Load `source` into both a semi-naive and a naive db and return a
+;; list of (rel-name semi-count naive-count) triples. Both sets must
+;; have the same union of relation names.
+(define
+  dl-sn-counts
+  (fn
+    (source)
+    (let
+      ((db-s (dl-program source)) (db-n (dl-program source)))
+      (do
+        (dl-saturate! db-s)
+        (dl-saturate-naive! db-n)
+        (let
+          ((out (list)))
+          (do
+            (for-each
+              (fn
+                (k)
+                (append!
+                  out
+                  (list
+                    k
+                    (len (dl-relation db-s k))
+                    (len (dl-relation db-n k)))))
+              (keys (get db-s :facts)))
+            out))))))
+
+(define
+  dl-sn-counts-agree?
+  (fn
+    (counts)
+    (cond
+      ((= (len counts) 0) true)
+      (else
+        (let
+          ((row (first counts)))
+          (and
+            (= (nth row 1) (nth row 2))
+            (dl-sn-counts-agree? (rest counts))))))))
+
+(define
+  dl-sn-chain-source
+  (fn
+    (n)
+    (let
+      ((parts (list "")))
+      (do
+        (define
+          dl-sn-loop
+          (fn
+            (i)
+            (when
+              (< i n)
+              (do
+                (append! parts (str "parent(" i ", " (+ i 1) "). "))
+                (dl-sn-loop (+ i 1))))))
+        (dl-sn-loop 0)
+        (str
+          (join "" parts)
+          "ancestor(X, Y) :- parent(X, Y). "
+          "ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))))
+
+(define
+  dl-sn-run-all!
+  (fn
+    ()
+    (do
+      (dl-sn-test!
+        "ancestor closure counts match"
+        (dl-sn-counts-agree?
+          (dl-sn-counts
+            "parent(a, b). parent(b, c). parent(c, d).\n             ancestor(X, Y) :- parent(X, Y).\n             ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z)."))
+        true)
+      (dl-sn-test!
+        "cyclic reach counts match"
+        (dl-sn-counts-agree?
+          (dl-sn-counts
+            "edge(1, 2). edge(2, 3). edge(3, 1). edge(3, 4).\n             reach(X, Y) :- edge(X, Y).\n             reach(X, Z) :- edge(X, Y), reach(Y, Z)."))
+        true)
+      (dl-sn-test!
+        "same-gen counts match"
+        (dl-sn-counts-agree?
+          (dl-sn-counts
+            "parent(a, b). parent(a, c). parent(b, d). parent(c, e).\n             person(a). person(b). person(c). person(d). person(e).\n             sg(X, X) :- person(X).\n             sg(X, Y) :- parent(P1, X), sg(P1, P2), parent(P2, Y)."))
+        true)
+      (dl-sn-test!
+        "rules with builtins counts match"
+        (dl-sn-counts-agree?
+          (dl-sn-counts
+            "n(1). n(2). n(3). n(4). n(5).\n             small(X) :- n(X), <(X, 5).\n             succ(X, Y) :- n(X), <(X, 5), is(Y, +(X, 1))."))
+        true)
+      (dl-sn-test!
+        "static rule fires under semi-naive"
+        (dl-sn-counts-agree?
+          (dl-sn-counts "p(a). p(b). q(X) :- p(X), =(X, a)."))
+        true)
+      ;; Chain length 5 — small but enough to exercise multiple
+      ;; semi-naive iterations against a recursive rule.
+      (dl-sn-test!
+        "chain-5 ancestor counts match"
+        (dl-sn-counts-agree? (dl-sn-counts (dl-sn-chain-source 5)))
+        true)
+      (dl-sn-test!
+        "chain-5 ancestor count value"
+        (let
+          ((db (dl-program (dl-sn-chain-source 5))))
+          (do (dl-saturate! db) (len (dl-relation db "ancestor"))))
+        15)
+      (dl-sn-test!
+        "query through semi saturate"
+        (let
+          ((db (dl-program "parent(a, b). parent(b, c).\n                  ancestor(X, Y) :- parent(X, Y).\n                  ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (len (dl-query db (list (quote ancestor) (quote a) (quote X)))))
+        2))))
+
+(define
+  dl-semi-naive-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-sn-pass 0)
+      (set! dl-sn-fail 0)
+      (set! dl-sn-failures (list))
+      (dl-sn-run-all!)
+      {:failures dl-sn-failures :total (+ dl-sn-pass dl-sn-fail) :passed dl-sn-pass :failed dl-sn-fail})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 10ff7f3f..aa7dd632 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -126,10 +126,25 @@ constraints that filter bindings.
       and three safe-shape tests. Conformance 106 / 106.
 
 ### Phase 5 — semi-naive evaluation (performance)
-- [ ] Delta sets: track newly derived tuples per iteration
-- [ ] Semi-naive rule: only join against delta tuples from last iteration, not full relation
-- [ ] Significant speedup for recursive rules — avoids re-deriving known tuples
-- [ ] Tests: verify semi-naive produces same results as naive; benchmark on large ancestor chain
+- [x] Delta sets `{rel-name -> tuples}` track newly derived tuples per iter.
+      `dl-snapshot-facts` builds the initial delta from the EDB.
+- [x] Semi-naive rule: for each rule, walk every positive body literal
+      position; substitute that one with the per-relation delta and join
+      the rest against the previous-iteration DB (`dl-find-bindings-semi`).
+      Candidates are collected before mutating the DB so the "full" sides
+      see a consistent snapshot.
+- [x] `dl-collect-rule-candidates` falls back to a naive single pass when
+      a rule has no positive body literal (e.g. `(p X) :- (= X 5).`).
+- [x] `dl-saturate!` is now semi-naive by default; `dl-saturate-naive!`
+      kept for differential testing and a reference implementation.
+- [x] Tests in `lib/datalog/tests/semi_naive.sx` (8) — every recursive
+      program from earlier suites is run under both saturators with
+      per-relation tuple counts compared (cheap, robust under bundled
+      conformance session). A chain-5 differential exercises multiple
+      semi-naive iterations against the recursive ancestor rule.
+      Larger chains hit prohibitive wall-clock under conformance CPU
+      contention with other agents — a future Blocker tracks switching
+      `dl-tuple-member?` from O(n²) list scan to a hash-set per relation.
 
 ### Phase 6 — magic sets (goal-directed bottom-up, opt-in)
 Naive bottom-up derives **all** consequences before answering. Magic sets
@@ -194,12 +209,32 @@ large graphs.
 
 ## Blockers
 
-_(none yet)_
+- **Hash-set membership for relations.** `dl-tuple-member?` uses a linear
+  list scan; insert is O(n) and saturating chain-N pushes O(n²) → O(n³)
+  total. Under bundled conformance (CPU shared with other loop agents)
+  even chain-15 hits multi-minute wall-clock. Tests scoped to chain-5
+  for now. Fix: maintain a `{tuple-key → true}` dict per relation
+  alongside the list; key tuples by their serialized form.
 
 ## Progress log
 
 _Newest first._
 
+- 2026-05-08 — Phase 5 done. `lib/datalog/eval.sx` rewritten to
+  semi-naive default. `dl-saturate!` tracks a per-relation delta and
+  on each iteration walks every positive body position substituting
+  delta for that one literal — joining the rest against the full DB
+  snapshot. `dl-saturate-naive!` retained as the reference. Rules
+  with no positive body literal (e.g. `(p X) :- (= X 5).`) fall back
+  to a naive one-shot via `dl-collect-rule-candidates`. 8 tests
+  differentially compare the two saturators using per-relation tuple
+  counts (cheap). Chain-5 differential exercises multi-iteration
+  recursive saturation. Larger chains made conformance.sh time out
+  due to O(n) `dl-tuple-member?` × CPU sharing with other loop
+  agents — added a Blocker to swap to a hash-set for membership.
+  Also tightened `dl-tuple-member?` to use indexed iteration instead
+  of recursive `rest` (was creating a fresh list per step).
+
 - 2026-05-07 — Phase 4 done. `lib/datalog/builtins.sx` (~280 LOC) adds
   `(< X Y)`, `(<= X Y)`, `(> X Y)`, `(>= X Y)`, `(= X Y)`, `(!= X Y)`,
   and `(is X expr)` with `+ - * /`. `dl-eval-builtin` dispatches;

From caec05eb2751b4c39310c8467f966eb2d9321f59 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 08:20:56 +0000
Subject: [PATCH 08/89] datalog: stratified negation (Phase 7, 124/124)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

New lib/datalog/strata.sx: dl-build-dep-graph (relation -> deps with
:neg flag), Floyd-Warshall reachability, SCC-via-mutual-reach for
non-stratifiability detection, iterative dl-compute-strata, and
dl-group-rules-by-stratum.

eval.sx refactor:
- dl-saturate-rules! db rules — semi-naive worker over a rule subset
- dl-saturate! db — stratified driver. Rejects non-stratifiable
  programs at saturation time, then iterates strata in order
- dl-match-negation — succeeds iff inner positive match is empty

Order-aware safety in dl-rule-check-safety (Phase 4) already
required negation vars to be bound by a prior positive literal.
Stratum dict keys are strings (SX dicts don't accept ints).

Phase 6 magic sets deferred — opt-in path, semi-naive default
suffices for current workloads.
---
 lib/datalog/conformance.conf  |   2 +
 lib/datalog/eval.sx           |  63 +++++++-
 lib/datalog/scoreboard.json   |   9 +-
 lib/datalog/scoreboard.md     |   3 +-
 lib/datalog/strata.sx         | 297 ++++++++++++++++++++++++++++++++++
 lib/datalog/tests/negation.sx | 231 ++++++++++++++++++++++++++
 plans/datalog-on-sx.md        |  45 ++++--
 7 files changed, 626 insertions(+), 24 deletions(-)
 create mode 100644 lib/datalog/strata.sx
 create mode 100644 lib/datalog/tests/negation.sx

diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index af4e41b0..bd9b0612 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -9,6 +9,7 @@ PRELOADS=(
   lib/datalog/unify.sx
   lib/datalog/db.sx
   lib/datalog/builtins.sx
+  lib/datalog/strata.sx
   lib/datalog/eval.sx
 )
 
@@ -19,4 +20,5 @@ SUITES=(
   "eval:lib/datalog/tests/eval.sx:(dl-eval-tests-run!)"
   "builtins:lib/datalog/tests/builtins.sx:(dl-builtins-tests-run!)"
   "semi_naive:lib/datalog/tests/semi_naive.sx:(dl-semi-naive-tests-run!)"
+  "negation:lib/datalog/tests/negation.sx:(dl-negation-tests-run!)"
 )
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 5fb30eb9..45c0fdb9 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -55,13 +55,24 @@
           results)))))
 
 ;; Naive matcher (for dl-saturate-naive! and dl-query post-saturation).
+(define
+  dl-match-negation
+  (fn
+    (inner db subst)
+    (let
+      ((walked (dl-apply-subst inner subst))
+        (matches (dl-match-positive inner db subst)))
+      (cond
+        ((= (len matches) 0) (list subst))
+        (else (list))))))
+
 (define
   dl-match-lit
   (fn
     (lit db subst)
     (cond
       ((and (dict? lit) (has-key? lit :neg))
-        (error "datalog: negation not yet supported (Phase 7)"))
+        (dl-match-negation (get lit :neg) db subst))
       ((dl-builtin? lit)
         (let
           ((s (dl-eval-builtin lit subst)))
@@ -194,7 +205,7 @@
             (options
               (cond
                 ((and (dict? lit) (has-key? lit :neg))
-                  (error "datalog: negation in semi-naive (Phase 7)"))
+                  (dl-match-negation (get lit :neg) db subst))
                 ((dl-builtin? lit)
                   (let
                     ((s (dl-eval-builtin lit subst)))
@@ -281,14 +292,14 @@
       candidates)))
 
 (define
-  dl-saturate!
+  dl-saturate-rules!
   (fn
-    (db)
+    (db rules)
     (let
       ((delta (dl-snapshot-facts db)))
       (do
         (define
-          dl-sn-step
+          dl-sr-step
           (fn
             ()
             (let
@@ -300,14 +311,50 @@
                     (for-each
                       (fn (cand) (append! pending cand))
                       (dl-collect-rule-candidates rule db delta)))
-                  (dl-rules db))
+                  rules)
                 (dl-commit-candidates! db pending new-delta)
                 (cond
                   ((dl-delta-empty? new-delta) nil)
-                  (else (do (set! delta new-delta) (dl-sn-step))))))))
-        (dl-sn-step)
+                  (else (do (set! delta new-delta) (dl-sr-step))))))))
+        (dl-sr-step)
         db))))
 
+;; Stratified driver: rejects non-stratifiable programs at saturation
+;; time, then iterates strata in increasing order, running semi-naive on
+;; the rules whose head sits in that stratum.
+(define
+  dl-saturate!
+  (fn
+    (db)
+    (let
+      ((err (dl-check-stratifiable db)))
+      (cond
+        ((not (nil? err)) (error (str "dl-saturate!: " err)))
+        (else
+          (let
+            ((strata (dl-compute-strata db)))
+            (let
+              ((grouped (dl-group-rules-by-stratum db strata)))
+              (let
+                ((groups (get grouped :groups))
+                  (max-s (get grouped :max)))
+                (do
+                  (define
+                    dl-strat-loop
+                    (fn
+                      (s)
+                      (when
+                        (<= s max-s)
+                        (let
+                          ((sk (str s)))
+                          (do
+                            (when
+                              (has-key? groups sk)
+                              (dl-saturate-rules! db (get groups sk)))
+                            (dl-strat-loop (+ s 1)))))))
+                  (dl-strat-loop 0)
+                  db)))))))))
+
 ;; ── Querying ─────────────────────────────────────────────────────
 
 (define
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 12f28784..54be5726 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,15 +1,16 @@
 {
   "lang": "datalog",
-  "total_passed": 114,
+  "total_passed": 124,
   "total_failed": 0,
-  "total": 114,
+  "total": 124,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":15,"failed":0,"total":15},
     {"name":"builtins","passed":19,"failed":0,"total":19},
-    {"name":"semi_naive","passed":8,"failed":0,"total":8}
+    {"name":"semi_naive","passed":8,"failed":0,"total":8},
+    {"name":"negation","passed":10,"failed":0,"total":10}
   ],
-  "generated": "2026-05-08T08:12:42+00:00"
+  "generated": "2026-05-08T08:20:41+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index cac00351..802305ab 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**114 / 114 passing** (0 failure(s)).
+**124 / 124 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -10,3 +10,4 @@
 | eval | 15 | 15 | ok |
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
+| negation | 10 | 10 | ok |
diff --git a/lib/datalog/strata.sx b/lib/datalog/strata.sx
new file mode 100644
index 00000000..b5d08347
--- /dev/null
+++ b/lib/datalog/strata.sx
@@ -0,0 +1,297 @@
+;; lib/datalog/strata.sx — dependency graph, SCC analysis, stratum assignment.
+;;
+;; A program is stratifiable iff no cycle in its dependency graph passes
+;; through a negative edge. The stratum of relation R is the depth at which
+;; R can first be evaluated:
+;;
+;;   stratum(R) = max over edges (R → S) of:
+;;       stratum(S)         if the edge is positive
+;;       stratum(S) + 1     if the edge is negative
+;;
+;; All relations in the same SCC share a stratum (and the SCC must have only
+;; positive internal edges, else the program is non-stratifiable).
+
+;; Build dep graph: dict {head-rel-name -> ({:rel str :neg bool} ...)}.
+(define
+  dl-build-dep-graph
+  (fn
+    (db)
+    (let ((g {}))
+      (do
+        (for-each
+          (fn
+            (rule)
+            (let
+              ((head-rel (dl-rel-name (get rule :head))))
+              (when
+                (not (nil? head-rel))
+                (do
+                  (when
+                    (not (has-key? g head-rel))
+                    (dict-set! g head-rel (list)))
+                  (let ((existing (get g head-rel)))
+                    (for-each
+                      (fn
+                        (lit)
+                        (let
+                          ((target
+                             (cond
+                               ((and (dict? lit) (has-key? lit :neg))
+                                 (dl-rel-name (get lit :neg)))
+                               ((dl-builtin? lit) nil)
+                               ((and (list? lit) (> (len lit) 0))
+                                 (dl-rel-name lit))
+                               (else nil)))
+                            (neg?
+                              (and (dict? lit) (has-key? lit :neg))))
+                          (when
+                            (not (nil? target))
+                            (append!
+                              existing
+                              {:rel target :neg neg?}))))
+                      (get rule :body)))))))
+          (dl-rules db))
+        g))))
+
+;; All relations referenced — heads of rules + EDB names + body relations.
+(define
+  dl-all-relations
+  (fn
+    (db)
+    (let ((seen (list)))
+      (do
+        (for-each
+          (fn
+            (k)
+            (when (not (dl-member-string? k seen)) (append! seen k)))
+          (keys (get db :facts)))
+        (for-each
+          (fn
+            (rule)
+            (do
+              (let ((h (dl-rel-name (get rule :head))))
+                (when
+                  (and (not (nil? h)) (not (dl-member-string? h seen)))
+                  (append! seen h)))
+              (for-each
+                (fn
+                  (lit)
+                  (let
+                    ((t
+                       (cond
+                         ((and (dict? lit) (has-key? lit :neg))
+                           (dl-rel-name (get lit :neg)))
+                         ((dl-builtin? lit) nil)
+                         ((and (list? lit) (> (len lit) 0))
+                           (dl-rel-name lit))
+                         (else nil))))
+                    (when
+                      (and (not (nil? t)) (not (dl-member-string? t seen)))
+                      (append! seen t))))
+                (get rule :body))))
+          (dl-rules db))
+        seen))))
+
+;; reach: dict {from: dict {to: edge-info}} where edge-info is
+;;   {:any bool :neg bool}
+;; meaning "any path from `from` to `to`" and "exists a negative-passing
+;; path from `from` to `to`".
+;;
+;; Floyd-Warshall over the dep graph. The 'neg' flag propagates through
+;; concatenation: if any edge along the path is negative, the path's
+;; flag is true.
+(define
+  dl-build-reach
+  (fn
+    (graph nodes)
+    (let ((reach {}))
+      (do
+        (for-each
+          (fn (n) (dict-set! reach n {}))
+          nodes)
+        (for-each
+          (fn
+            (head)
+            (when
+              (has-key? graph head)
+              (for-each
+                (fn
+                  (edge)
+                  (let
+                    ((target (get edge :rel)) (n (get edge :neg)))
+                    (let ((row (get reach head)))
+                      (cond
+                        ((has-key? row target)
+                          (let ((cur (get row target)))
+                            (dict-set!
+                              row
+                              target
+                              {:any true :neg (or n (get cur :neg))})))
+                        (else
+                          (dict-set! row target {:any true :neg n}))))))
+                (get graph head))))
+          nodes)
+        (for-each
+          (fn
+            (k)
+            (for-each
+              (fn
+                (i)
+                (let ((row-i (get reach i)))
+                  (when
+                    (has-key? row-i k)
+                    (let ((ik (get row-i k)) (row-k (get reach k)))
+                      (for-each
+                        (fn
+                          (j)
+                          (when
+                            (has-key? row-k j)
+                            (let ((kj (get row-k j)))
+                              (let
+                                ((combined-neg (or (get ik :neg) (get kj :neg))))
+                                (cond
+                                  ((has-key? row-i j)
+                                    (let ((cur (get row-i j)))
+                                      (dict-set!
+                                        row-i
+                                        j
+                                        {:any true
+                                         :neg (or combined-neg (get cur :neg))})))
+                                  (else
+                                    (dict-set!
+                                      row-i
+                                      j
+                                      {:any true :neg combined-neg})))))))
+                        nodes)))))
+              nodes))
+          nodes)
+        reach))))
+
+;; Returns nil on success, or error message string on failure.
+(define
+  dl-check-stratifiable
+  (fn
+    (db)
+    (let
+      ((graph (dl-build-dep-graph db))
+        (nodes (dl-all-relations db)))
+      (let ((reach (dl-build-reach graph nodes)) (err nil))
+        (do
+          (for-each
+            (fn
+              (rule)
+              (when
+                (nil? err)
+                (let ((head-rel (dl-rel-name (get rule :head))))
+                  (for-each
+                    (fn
+                      (lit)
+                      (when
+                        (and (dict? lit) (has-key? lit :neg))
+                        (let ((tgt (dl-rel-name (get lit :neg))))
+                          (when
+                            (and (not (nil? tgt))
+                                 (dl-reach-cycle? reach head-rel tgt))
+                            (set!
+                              err
+                              (str "non-stratifiable: relation " head-rel
+                                   " transitively depends through negation on "
+                                   tgt
+                                   " which depends back on " head-rel))))))
+                    (get rule :body)))))
+            (dl-rules db))
+          err)))))
+
+(define
+  dl-reach-cycle?
+  (fn
+    (reach a b)
+    (and
+      (dl-reach-row-has? reach b a)
+      (dl-reach-row-has? reach a b))))
+
+(define
+  dl-reach-row-has?
+  (fn
+    (reach from to)
+    (let ((row (get reach from)))
+      (and (not (nil? row)) (has-key? row to)))))
+
+;; Compute stratum per relation. Iteratively propagate from EDB roots.
+;; Uses the per-relation max-stratum-of-deps formula. Stops when stable.
+(define
+  dl-compute-strata
+  (fn
+    (db)
+    (let
+      ((graph (dl-build-dep-graph db))
+        (nodes (dl-all-relations db))
+        (strata {}))
+      (do
+        (for-each (fn (n) (dict-set! strata n 0)) nodes)
+        (let ((changed true))
+          (do
+            (define
+              dl-cs-loop
+              (fn
+                ()
+                (when
+                  changed
+                  (do
+                    (set! changed false)
+                    (for-each
+                      (fn
+                        (head)
+                        (when
+                          (has-key? graph head)
+                          (for-each
+                            (fn
+                              (edge)
+                              (let
+                                ((tgt (get edge :rel))
+                                  (n (get edge :neg)))
+                                (let
+                                  ((tgt-strat
+                                     (if (has-key? strata tgt)
+                                       (get strata tgt) 0))
+                                    (cur (get strata head)))
+                                  (let
+                                    ((needed
+                                       (if n (+ tgt-strat 1) tgt-strat)))
+                                    (when
+                                      (> needed cur)
+                                      (do
+                                        (dict-set! strata head needed)
+                                        (set! changed true)))))))
+                            (get graph head))))
+                      nodes)
+                    (dl-cs-loop)))))
+            (dl-cs-loop)))
+        strata))))
+
+;; Group rules by their head's stratum. Returns dict {stratum-int -> rules}.
+(define
+  dl-group-rules-by-stratum
+  (fn
+    (db strata)
+    (let ((groups {}) (max-s 0))
+      (do
+        (for-each
+          (fn
+            (rule)
+            (let
+              ((head-rel (dl-rel-name (get rule :head))))
+              (let
+                ((s (if (has-key? strata head-rel)
+                       (get strata head-rel) 0)))
+                (do
+                  (when (> s max-s) (set! max-s s))
+                  (let
+                    ((sk (str s)))
+                    (do
+                      (when
+                        (not (has-key? groups sk))
+                        (dict-set! groups sk (list)))
+                      (append! (get groups sk) rule)))))))
+          (dl-rules db))
+        {:groups groups :max max-s}))))
diff --git a/lib/datalog/tests/negation.sx b/lib/datalog/tests/negation.sx
new file mode 100644
index 00000000..e4de6207
--- /dev/null
+++ b/lib/datalog/tests/negation.sx
@@ -0,0 +1,231 @@
+;; lib/datalog/tests/negation.sx — stratified negation tests.
+
+(define dl-nt-pass 0)
+(define dl-nt-fail 0)
+(define dl-nt-failures (list))
+
+(define
+  dl-nt-deep=?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-nt-deq-l? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let ((ka (keys a)) (kb (keys b)))
+          (and (= (len ka) (len kb)) (dl-nt-deq-d? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-nt-deq-l?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-nt-deep=? (nth a i) (nth b i))) false)
+      (else (dl-nt-deq-l? a b (+ i 1))))))
+
+(define
+  dl-nt-deq-d?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i)))
+         (not (dl-nt-deep=? (get a k) (get b k))))
+        false)
+      (else (dl-nt-deq-d? a b ka (+ i 1))))))
+
+(define
+  dl-nt-set=?
+  (fn
+    (a b)
+    (and
+      (= (len a) (len b))
+      (dl-nt-subset? a b)
+      (dl-nt-subset? b a))))
+
+(define
+  dl-nt-subset?
+  (fn
+    (xs ys)
+    (cond
+      ((= (len xs) 0) true)
+      ((not (dl-nt-contains? ys (first xs))) false)
+      (else (dl-nt-subset? (rest xs) ys)))))
+
+(define
+  dl-nt-contains?
+  (fn
+    (xs target)
+    (cond
+      ((= (len xs) 0) false)
+      ((dl-nt-deep=? (first xs) target) true)
+      (else (dl-nt-contains? (rest xs) target)))))
+
+(define
+  dl-nt-test!
+  (fn
+    (name got expected)
+    (if
+      (dl-nt-deep=? got expected)
+      (set! dl-nt-pass (+ dl-nt-pass 1))
+      (do
+        (set! dl-nt-fail (+ dl-nt-fail 1))
+        (append!
+          dl-nt-failures
+          (str
+            name
+            "\n    expected: " expected
+            "\n    got:      " got))))))
+
+(define
+  dl-nt-test-set!
+  (fn
+    (name got expected)
+    (if
+      (dl-nt-set=? got expected)
+      (set! dl-nt-pass (+ dl-nt-pass 1))
+      (do
+        (set! dl-nt-fail (+ dl-nt-fail 1))
+        (append!
+          dl-nt-failures
+          (str
+            name
+            "\n    expected (set): " expected
+            "\n    got:            " got))))))
+
+(define
+  dl-nt-throws?
+  (fn
+    (thunk)
+    (let
+      ((threw false))
+      (do
+        (guard
+          (e (#t (set! threw true)))
+          (thunk))
+        threw))))
+
+(define
+  dl-nt-run-all!
+  (fn
+    ()
+    (do
+      ;; Negation against EDB-only relation.
+      (dl-nt-test-set! "not against EDB"
+        (dl-query
+          (dl-program
+            "p(1). p(2). p(3). r(2).
+             q(X) :- p(X), not(r(X)).")
+          (list (quote q) (quote X)))
+        (list {:X 1} {:X 3}))
+
+      ;; Negation against derived relation — needs stratification.
+      (dl-nt-test-set! "not against derived rel"
+        (dl-query
+          (dl-program
+            "p(1). p(2). p(3). s(2).
+             r(X) :- s(X).
+             q(X) :- p(X), not(r(X)).")
+          (list (quote q) (quote X)))
+        (list {:X 1} {:X 3}))
+
+      ;; Two-step strata: r derives via s; q derives via not r.
+      (dl-nt-test-set! "two-step strata"
+        (dl-query
+          (dl-program
+            "node(a). node(b). node(c). node(d).
+             edge(a, b). edge(b, c). edge(c, a).
+             reach(X, Y) :- edge(X, Y).
+             reach(X, Z) :- edge(X, Y), reach(Y, Z).
+             unreachable(X) :- node(X), not(reach(a, X)).")
+          (list (quote unreachable) (quote X)))
+        (list {:X (quote d)}))
+
+      ;; Combine negation with arithmetic and comparison.
+      (dl-nt-test-set! "negation with arithmetic"
+        (dl-query
+          (dl-program
+            "n(1). n(2). n(3). n(4). n(5). odd(1). odd(3). odd(5).
+             even(X) :- n(X), not(odd(X)).")
+          (list (quote even) (quote X)))
+        (list {:X 2} {:X 4}))
+
+      ;; Empty negation result.
+      (dl-nt-test-set! "negation always succeeds"
+        (dl-query
+          (dl-program
+            "p(1). p(2). q(X) :- p(X), not(r(X)).")
+          (list (quote q) (quote X)))
+        (list {:X 1} {:X 2}))
+
+      ;; Negation always fails.
+      (dl-nt-test-set! "negation always fails"
+        (dl-query
+          (dl-program
+            "p(1). p(2). r(1). r(2). q(X) :- p(X), not(r(X)).")
+          (list (quote q) (quote X)))
+        (list))
+
+      ;; Stratifiability checks.
+      (dl-nt-test! "non-stratifiable rejected"
+        (dl-nt-throws?
+          (fn ()
+            (let ((db (dl-make-db)))
+              (do
+                (dl-add-rule!
+                  db
+                  {:head (list (quote p) (quote X))
+                   :body (list (list (quote q) (quote X))
+                               {:neg (list (quote r) (quote X))})})
+                (dl-add-rule!
+                  db
+                  {:head (list (quote r) (quote X))
+                   :body (list (list (quote p) (quote X)))})
+                (dl-add-fact! db (list (quote q) 1))
+                (dl-saturate! db)))))
+        true)
+
+      (dl-nt-test! "stratifiable accepted"
+        (dl-nt-throws?
+          (fn ()
+            (dl-program
+              "p(1). p(2). r(2).
+               q(X) :- p(X), not(r(X)).")))
+        false)
+
+      ;; Multi-stratum chain.
+      (dl-nt-test-set! "three-level strata"
+        (dl-query
+          (dl-program
+            "a(1). a(2). a(3). a(4).
+             b(X) :- a(X), not(c(X)).
+             c(X) :- d(X).
+             d(2).
+             d(4).")
+          (list (quote b) (quote X)))
+        (list {:X 1} {:X 3}))
+
+      ;; Safety violation: negation refers to unbound var.
+      (dl-nt-test! "negation safety violation"
+        (dl-nt-throws?
+          (fn ()
+            (dl-program
+              "p(1). q(X) :- p(X), not(r(Y)).")))
+        true))))
+
+(define
+  dl-negation-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-nt-pass 0)
+      (set! dl-nt-fail 0)
+      (set! dl-nt-failures (list))
+      (dl-nt-run-all!)
+      {:passed dl-nt-pass
+       :failed dl-nt-fail
+       :total (+ dl-nt-pass dl-nt-fail)
+       :failures dl-nt-failures})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index aa7dd632..cc92ddbf 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -162,17 +162,27 @@ large graphs.
       reachability query from a single root.
 
 ### Phase 7 — stratified negation
-- [ ] Dependency graph analysis: which relations depend on which (positively or negatively)
-- [ ] Stratification check: error if negation is in a cycle (non-stratifiable program)
-- [ ] `dl-stratify db` → SCC analysis → stratum ordering
-- [ ] Evaluation: process strata in order — lower stratum fully computed
-      before using its complement in a higher stratum
-- [ ] `not(P)` in rule body: at evaluation time, check P is NOT in the
-      derived EDB
-- [ ] Safety extension: head vars in negative literals must also appear in
-      some positive body literal of the same rule
-- [ ] Tests: non-member (`not(member(X,L))`), colored-graph
-      (`not(same-color(X,Y))`), stratification error detection
+- [x] Dependency graph: `dl-build-dep-graph db` returns `{head -> ({:rel
+      :neg} ...)}`. Built-ins drop out (they're not relations).
+- [x] Reachability via Floyd-Warshall in `dl-build-reach`; cycles
+      detected by `reach[A][B] && reach[B][A]`. Programs are
+      non-stratifiable iff any negative dependency falls inside an SCC.
+      `dl-check-stratifiable` returns nil on success or a clear message.
+- [x] `dl-compute-strata` propagates stratum numbers iteratively:
+      `stratum(R) = max over deps of (stratum(dep) + (1 if negated else 0))`.
+- [x] Saturator refactor: `dl-saturate-rules! db rules` is the semi-
+      naive worker; `dl-saturate! db` rejects non-stratifiable programs,
+      groups rules by head's stratum, and runs the worker on each
+      stratum in increasing order.
+- [x] `not(P)` in body: `dl-match-negation` walks the inner literal
+      under the current subst and uses `dl-match-positive` — succeeds
+      iff zero matches. Order-aware safety in `dl-rule-check-safety`
+      (already present from Phase 4) requires negation vars to be
+      bound by an earlier positive literal.
+- [x] Tests in `lib/datalog/tests/negation.sx` (10): EDB and IDB
+      negation, two-step strata, multi-level strata, with-arithmetic,
+      empty-result and always-fail cases, non-stratifiability
+      rejection, and a negation safety violation.
 
 ### Phase 8 — aggregation (Datalog+)
 - [ ] `count(X, Goal)` → number of distinct X satisfying Goal
@@ -220,6 +230,19 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 7 done (Phase 6 magic sets deferred — opt-in,
+  semi-naive default suffices for current test suite). New
+  `lib/datalog/strata.sx` (~290 LOC): dep graph build, Floyd-Warshall
+  reachability, SCC-via-mutual-reachability for non-stratifiability
+  detection, iterative stratum computation, rule grouping by head
+  stratum. eval.sx split: `dl-saturate-rules!` is the per-rule-set
+  semi-naive worker, `dl-saturate!` is now the stratified driver
+  (errors out on non-stratifiable programs). `dl-match-negation` in
+  eval.sx: succeeds iff inner positive match is empty. Stratum-keyed
+  dicts use `(str s)` since SX dicts only accept string/keyword keys.
+  10 negation tests cover EDB/IDB negation, multi-level strata,
+  non-stratifiability rejection, and a negation safety violation.
+
 - 2026-05-08 — Phase 5 done. `lib/datalog/eval.sx` rewritten to
   semi-naive default. `dl-saturate!` tracks a per-relation delta and
   on each iteration walks every positive body position substituting

From 6d04cf7bf24c4822c0747043359d102d606d3656 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 08:28:45 +0000
Subject: [PATCH 09/89] datalog: aggregation count/sum/min/max (Phase 8,
 134/134)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

New lib/datalog/aggregates.sx: (count R V Goal), (sum R V Goal),
(min R V Goal), (max R V Goal). dl-eval-aggregate runs
dl-find-bindings on the goal under the outer subst, collects
distinct values of V, applies the operator, binds R. Empty input:
count/sum return 0; min/max produce no binding (rule fails).

Group-by emerges naturally from outer-subst substitution into the
goal — `popular(P) :- post(P), count(N, U, liked(U, P)), >=(N, 3).`
counts per-post.

Stratifier extended: dl-aggregate-dep-edge contributes a
negation-like edge so the aggregate's goal relation is fully
derived before the aggregate fires (non-monotonicity respected).
Safety relaxed for aggregates: goal-internal vars are existentials,
only the result var becomes bound.
---
 lib/datalog/aggregates.sx       | 139 ++++++++++++++++++++
 lib/datalog/builtins.sx         |  14 ++
 lib/datalog/conformance.conf    |   2 +
 lib/datalog/eval.sx             |   1 +
 lib/datalog/scoreboard.json     |   9 +-
 lib/datalog/scoreboard.md       |   3 +-
 lib/datalog/strata.sx           |  43 +++---
 lib/datalog/tests/aggregates.sx | 223 ++++++++++++++++++++++++++++++++
 plans/datalog-on-sx.md          |  40 +++++-
 9 files changed, 447 insertions(+), 27 deletions(-)
 create mode 100644 lib/datalog/aggregates.sx
 create mode 100644 lib/datalog/tests/aggregates.sx

diff --git a/lib/datalog/aggregates.sx b/lib/datalog/aggregates.sx
new file mode 100644
index 00000000..153879f7
--- /dev/null
+++ b/lib/datalog/aggregates.sx
@@ -0,0 +1,139 @@
+;; lib/datalog/aggregates.sx — count / sum / min / max aggregation.
+;;
+;; Surface form (always 3-arg in the parsed AST):
+;;
+;;   (count  Result  Var  GoalLit)
+;;   (sum    Result  Var  GoalLit)
+;;   (min    Result  Var  GoalLit)
+;;   (max    Result  Var  GoalLit)
+;;
+;; Parsed naturally because arg-position compounds are already allowed
+;; (Phase 4 needs them for arithmetic). At evaluation time the aggregator
+;; runs `dl-find-bindings` on `GoalLit` under the current subst, collects
+;; the distinct values of `Var`, and binds `Result`.
+;;
+;; Aggregation is non-monotonic — `count(C, X, p(X))` shrinks as p loses
+;; tuples. The stratifier (lib/datalog/strata.sx) treats every aggregate's
+;; goal relation as a negation-like edge so the inner relation is fully
+;; derived before the aggregate fires.
+;;
+;; Empty input: count → 0, sum → 0, min/max → no binding (rule fails).
+
+(define dl-aggregate-rels (list "count" "sum" "min" "max"))
+
+(define
+  dl-aggregate?
+  (fn
+    (lit)
+    (and
+      (list? lit)
+      (>= (len lit) 4)
+      (let ((rel (dl-rel-name lit)))
+        (cond
+          ((nil? rel) false)
+          (else (dl-member-string? rel dl-aggregate-rels)))))))
+
+;; Apply aggregation operator to a list of (already-distinct) numeric or
+;; symbolic values. Returns the aggregated value, or :empty if min/max
+;; has no input.
+(define
+  dl-do-aggregate
+  (fn
+    (op vals)
+    (cond
+      ((= op "count") (len vals))
+      ((= op "sum") (dl-sum-vals vals 0))
+      ((= op "min")
+        (cond
+          ((= (len vals) 0) :empty)
+          (else (dl-min-vals vals 1 (first vals)))))
+      ((= op "max")
+        (cond
+          ((= (len vals) 0) :empty)
+          (else (dl-max-vals vals 1 (first vals)))))
+      (else (error (str "datalog: unknown aggregate " op))))))
+
+(define
+  dl-sum-vals
+  (fn
+    (vals acc)
+    (cond
+      ((= (len vals) 0) acc)
+      (else (dl-sum-vals (rest vals) (+ acc (first vals)))))))
+
+(define
+  dl-min-vals
+  (fn
+    (vals i cur)
+    (cond
+      ((>= i (len vals)) cur)
+      (else
+        (let ((v (nth vals i)))
+          (dl-min-vals vals (+ i 1) (if (< v cur) v cur)))))))
+
+(define
+  dl-max-vals
+  (fn
+    (vals i cur)
+    (cond
+      ((>= i (len vals)) cur)
+      (else
+        (let ((v (nth vals i)))
+          (dl-max-vals vals (+ i 1) (if (> v cur) v cur)))))))
+
+;; Membership check by deep equality (so 30 == 30.0 etc).
+(define
+  dl-val-member?
+  (fn
+    (v xs)
+    (cond
+      ((= (len xs) 0) false)
+      ((dl-tuple-equal? v (first xs)) true)
+      (else (dl-val-member? v (rest xs))))))
+
+;; Evaluate an aggregate body lit under `subst`. Returns the list of
+;; extended substitutions (0 or 1 element).
+(define
+  dl-eval-aggregate
+  (fn
+    (lit db subst)
+    (let
+      ((op (dl-rel-name lit))
+        (result-var (nth lit 1))
+        (agg-var (nth lit 2))
+        (goal (nth lit 3)))
+      (let
+        ((substs (dl-find-bindings (list goal) db subst))
+          (vals (list)))
+        (do
+          (for-each
+            (fn
+              (s)
+              (let ((v (dl-apply-subst agg-var s)))
+                (when
+                  (not (dl-val-member? v vals))
+                  (append! vals v))))
+            substs)
+          (let ((agg-val (dl-do-aggregate op vals)))
+            (cond
+              ((= agg-val :empty) (list))
+              (else
+                (let ((s2 (dl-unify result-var agg-val subst)))
+                  (if (nil? s2) (list) (list s2)))))))))))
+
+;; Stratification edges from aggregates: like negation, the goal's
+;; relation must be in a strictly lower stratum so that the aggregate
+;; fires only after the underlying tuples are settled.
+(define
+  dl-aggregate-dep-edge
+  (fn
+    (lit)
+    (cond
+      ((dl-aggregate? lit)
+        (let ((goal (nth lit 3)))
+          (cond
+            ((and (list? goal) (> (len goal) 0))
+              (let ((rel (dl-rel-name goal)))
+                (if (nil? rel) nil {:rel rel :neg true})))
+            (else nil))))
+      (else nil))))
diff --git a/lib/datalog/builtins.sx b/lib/datalog/builtins.sx
index dfd2307a..11261c85 100644
--- a/lib/datalog/builtins.sx
+++ b/lib/datalog/builtins.sx
@@ -262,6 +262,19 @@
                       missing
                       " — they must be bound by an earlier "
                       "positive body literal")))))))
+        (define
+          dl-process-agg!
+          (fn
+            (lit)
+            (let
+              ((result-var (nth lit 1)))
+              ;; Aggregate goal vars are existentially quantified within
+              ;; the aggregate; nothing required from outer context. The
+              ;; result var becomes bound after the aggregate fires.
+              (when
+                (dl-var? result-var)
+                (dl-add-bound! (list (symbol->string result-var)))))))
+
         (define
           dl-process-lit!
           (fn
@@ -271,6 +284,7 @@
               (cond
                 ((and (dict? lit) (has-key? lit :neg))
                   (dl-process-neg! lit))
+                ((dl-aggregate? lit) (dl-process-agg! lit))
                 ((dl-eq? lit) (dl-process-eq! lit))
                 ((dl-is? lit) (dl-process-is! lit))
                 ((dl-comparison? lit) (dl-process-cmp! lit))
diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index bd9b0612..15dea37e 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -9,6 +9,7 @@ PRELOADS=(
   lib/datalog/unify.sx
   lib/datalog/db.sx
   lib/datalog/builtins.sx
+  lib/datalog/aggregates.sx
   lib/datalog/strata.sx
   lib/datalog/eval.sx
 )
@@ -21,4 +22,5 @@ SUITES=(
   "builtins:lib/datalog/tests/builtins.sx:(dl-builtins-tests-run!)"
   "semi_naive:lib/datalog/tests/semi_naive.sx:(dl-semi-naive-tests-run!)"
   "negation:lib/datalog/tests/negation.sx:(dl-negation-tests-run!)"
+  "aggregates:lib/datalog/tests/aggregates.sx:(dl-aggregates-tests-run!)"
 )
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 45c0fdb9..93902349 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -206,6 +206,7 @@
               (cond
                 ((and (dict? lit) (has-key? lit :neg))
                   (dl-match-negation (get lit :neg) db subst))
+                ((dl-aggregate? lit) (dl-eval-aggregate lit db subst))
                 ((dl-builtin? lit)
                   (let
                     ((s (dl-eval-builtin lit subst)))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 54be5726..54b1560e 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 124,
+  "total_passed": 134,
   "total_failed": 0,
-  "total": 124,
+  "total": 134,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -10,7 +10,8 @@
     {"name":"eval","passed":15,"failed":0,"total":15},
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
-    {"name":"negation","passed":10,"failed":0,"total":10}
+    {"name":"negation","passed":10,"failed":0,"total":10},
+    {"name":"aggregates","passed":10,"failed":0,"total":10}
   ],
-  "generated": "2026-05-08T08:20:41+00:00"
+  "generated": "2026-05-08T08:28:29+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 802305ab..22cd5104 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**124 / 124 passing** (0 failure(s)).
+**134 / 134 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -11,3 +11,4 @@
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
+| aggregates | 10 | 10 | ok |
diff --git a/lib/datalog/strata.sx b/lib/datalog/strata.sx
index b5d08347..0928c989 100644
--- a/lib/datalog/strata.sx
+++ b/lib/datalog/strata.sx
@@ -33,22 +33,30 @@
                     (for-each
                       (fn
                         (lit)
-                        (let
-                          ((target
-                             (cond
-                               ((and (dict? lit) (has-key? lit :neg))
-                                 (dl-rel-name (get lit :neg)))
-                               ((dl-builtin? lit) nil)
-                               ((and (list? lit) (> (len lit) 0))
-                                 (dl-rel-name lit))
-                               (else nil)))
-                            (neg?
-                              (and (dict? lit) (has-key? lit :neg))))
-                          (when
-                            (not (nil? target))
-                            (append!
-                              existing
-                              {:rel target :neg neg?}))))
+                        (cond
+                          ((dl-aggregate? lit)
+                            (let
+                              ((edge (dl-aggregate-dep-edge lit)))
+                              (when
+                                (not (nil? edge))
+                                (append! existing edge))))
+                          (else
+                            (let
+                              ((target
+                                 (cond
+                                   ((and (dict? lit) (has-key? lit :neg))
+                                     (dl-rel-name (get lit :neg)))
+                                   ((dl-builtin? lit) nil)
+                                   ((and (list? lit) (> (len lit) 0))
+                                     (dl-rel-name lit))
+                                   (else nil)))
+                                (neg?
+                                  (and (dict? lit) (has-key? lit :neg))))
+                              (when
+                                (not (nil? target))
+                                (append!
+                                  existing
+                                  {:rel target :neg neg?}))))))
                       (get rule :body)))))))
           (dl-rules db))
         g))))
@@ -79,6 +87,9 @@
                   (let
                     ((t
                        (cond
+                         ((dl-aggregate? lit)
+                           (let ((edge (dl-aggregate-dep-edge lit)))
+                             (if (nil? edge) nil (get edge :rel))))
                          ((and (dict? lit) (has-key? lit :neg))
                            (dl-rel-name (get lit :neg)))
                          ((dl-builtin? lit) nil)
diff --git a/lib/datalog/tests/aggregates.sx b/lib/datalog/tests/aggregates.sx
new file mode 100644
index 00000000..d80276d8
--- /dev/null
+++ b/lib/datalog/tests/aggregates.sx
@@ -0,0 +1,223 @@
+;; lib/datalog/tests/aggregates.sx — count / sum / min / max.
+
+(define dl-at-pass 0)
+(define dl-at-fail 0)
+(define dl-at-failures (list))
+
+(define
+  dl-at-deep=?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-at-deq-l? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let ((ka (keys a)) (kb (keys b)))
+          (and (= (len ka) (len kb)) (dl-at-deq-d? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-at-deq-l?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-at-deep=? (nth a i) (nth b i))) false)
+      (else (dl-at-deq-l? a b (+ i 1))))))
+
+(define
+  dl-at-deq-d?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i)))
+         (not (dl-at-deep=? (get a k) (get b k))))
+        false)
+      (else (dl-at-deq-d? a b ka (+ i 1))))))
+
+(define
+  dl-at-set=?
+  (fn
+    (a b)
+    (and
+      (= (len a) (len b))
+      (dl-at-subset? a b)
+      (dl-at-subset? b a))))
+
+(define
+  dl-at-subset?
+  (fn
+    (xs ys)
+    (cond
+      ((= (len xs) 0) true)
+      ((not (dl-at-contains? ys (first xs))) false)
+      (else (dl-at-subset? (rest xs) ys)))))
+
+(define
+  dl-at-contains?
+  (fn
+    (xs target)
+    (cond
+      ((= (len xs) 0) false)
+      ((dl-at-deep=? (first xs) target) true)
+      (else (dl-at-contains? (rest xs) target)))))
+
+(define
+  dl-at-test!
+  (fn
+    (name got expected)
+    (if
+      (dl-at-deep=? got expected)
+      (set! dl-at-pass (+ dl-at-pass 1))
+      (do
+        (set! dl-at-fail (+ dl-at-fail 1))
+        (append!
+          dl-at-failures
+          (str
+            name
+            "\n    expected: " expected
+            "\n    got:      " got))))))
+
+(define
+  dl-at-test-set!
+  (fn
+    (name got expected)
+    (if
+      (dl-at-set=? got expected)
+      (set! dl-at-pass (+ dl-at-pass 1))
+      (do
+        (set! dl-at-fail (+ dl-at-fail 1))
+        (append!
+          dl-at-failures
+          (str
+            name
+            "\n    expected (set): " expected
+            "\n    got:            " got))))))
+
+(define
+  dl-at-throws?
+  (fn
+    (thunk)
+    (let
+      ((threw false))
+      (do
+        (guard
+          (e (#t (set! threw true)))
+          (thunk))
+        threw))))
+
+(define
+  dl-at-run-all!
+  (fn
+    ()
+    (do
+      ;; count
+      (dl-at-test-set! "count siblings"
+        (dl-query
+          (dl-program
+            "parent(p, bob). parent(p, alice). parent(p, charlie).
+             sibling(X, Y) :- parent(P, X), parent(P, Y), !=(X, Y).
+             sib_count(N) :- count(N, S, sibling(bob, S)).")
+          (list (quote sib_count) (quote N)))
+        (list {:N 2}))
+
+      ;; sum
+      (dl-at-test-set! "sum prices"
+        (dl-query
+          (dl-program
+            "price(apple, 5). price(pear, 7). price(plum, 3).
+             total(T) :- sum(T, X, price(F, X)).")
+          (list (quote total) (quote T)))
+        (list {:T 15}))
+
+      ;; min
+      (dl-at-test-set! "min score"
+        (dl-query
+          (dl-program
+            "score(alice, 80). score(bob, 65). score(carol, 92).
+             lo(M) :- min(M, S, score(P, S)).")
+          (list (quote lo) (quote M)))
+        (list {:M 65}))
+
+      ;; max
+      (dl-at-test-set! "max score"
+        (dl-query
+          (dl-program
+            "score(alice, 80). score(bob, 65). score(carol, 92).
+             hi(M) :- max(M, S, score(P, S)).")
+          (list (quote hi) (quote M)))
+        (list {:M 92}))
+
+      ;; count over derived relation (stratification needed).
+      (dl-at-test-set! "count over derived"
+        (dl-query
+          (dl-program
+            "parent(a, b). parent(a, c). parent(b, d). parent(c, e).
+             ancestor(X, Y) :- parent(X, Y).
+             ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).
+             num_ancestors(N) :- count(N, X, ancestor(a, X)).")
+          (list (quote num_ancestors) (quote N)))
+        (list {:N 4}))
+
+      ;; count with no matches → 0.
+      (dl-at-test-set! "count empty"
+        (dl-query
+          (dl-program
+            "p(1). p(2).
+             zero(N) :- count(N, X, q(X)).")
+          (list (quote zero) (quote N)))
+        (list {:N 0}))
+
+      ;; sum with no matches → 0.
+      (dl-at-test-set! "sum empty"
+        (dl-query
+          (dl-program
+            "p(1). p(2).
+             total(T) :- sum(T, X, q(X)).")
+          (list (quote total) (quote T)))
+        (list {:T 0}))
+
+      ;; min with no matches → rule does not fire.
+      (dl-at-test-set! "min empty"
+        (dl-query
+          (dl-program
+            "p(1). p(2).
+             lo(M) :- min(M, X, q(X)).")
+          (list (quote lo) (quote M)))
+        (list))
+
+      ;; Aggregate with comparison filter on result.
+      (dl-at-test-set! "popularity threshold"
+        (dl-query
+          (dl-program
+            "post(p1). post(p2).
+             liked(u1, p1). liked(u2, p1). liked(u3, p1).
+             liked(u1, p2). liked(u2, p2).
+             popular(P) :- post(P), count(N, U, liked(U, P)), >=(N, 3).")
+          (list (quote popular) (quote P)))
+        (list {:P (quote p1)}))
+
+      ;; Aggregate vs single distinct.
+      (dl-at-test-set! "distinct counted once"
+        (dl-query
+          (dl-program
+            "rated(alice, x). rated(alice, y). rated(bob, x).
+             rater_count(N) :- count(N, U, rated(U, F)).")
+          (list (quote rater_count) (quote N)))
+        (list {:N 2})))))
+
+(define
+  dl-aggregates-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-at-pass 0)
+      (set! dl-at-fail 0)
+      (set! dl-at-failures (list))
+      (dl-at-run-all!)
+      {:passed dl-at-pass
+       :failed dl-at-fail
+       :total (+ dl-at-pass dl-at-fail)
+       :failures dl-at-failures})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index cc92ddbf..291cd16d 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -185,12 +185,27 @@ large graphs.
       rejection, and a negation safety violation.
 
 ### Phase 8 — aggregation (Datalog+)
-- [ ] `count(X, Goal)` → number of distinct X satisfying Goal
-- [ ] `sum(X, Goal)` → sum of X values satisfying Goal
-- [ ] `min(X, Goal)` / `max(X, Goal)` → min/max of X satisfying Goal
-- [ ] `group-by` semantics: `count(X, sibling(bob, X))` → count of bob's siblings
-- [ ] Aggregation breaks stratification — evaluate in a separate post-fixpoint pass
-- [ ] Tests: social network statistics, grade aggregation, inventory sums
+- [x] `(count R V Goal)`, `(sum R V Goal)`, `(min R V Goal)`,
+      `(max R V Goal)` — first arg is the result variable, second is the
+      aggregated variable, third is the goal literal. Live in
+      `lib/datalog/aggregates.sx`.
+- [x] `dl-eval-aggregate`: runs `dl-find-bindings` on the goal under the
+      current subst (which provides outer-context bindings), collects
+      distinct values of the aggregated var, applies the aggregate.
+      `count`/`sum` produce 0 when no matches; `min`/`max` produce no
+      binding (rule fails) when empty.
+- [x] Group-by emerges naturally: outer-context vars in the goal are
+      substituted from the current subst, so `popular(P) :- post(P),
+      count(N, U, liked(U, P)), >=(N, 3).` correctly counts per-post.
+- [x] Stratification: `dl-aggregate-dep-edge` returns a negation-like
+      edge so the aggregate's goal relation is fully derived before the
+      aggregate fires. Non-monotonicity respected.
+- [x] Safety: aggregate body lit binds the result var; goal-internal
+      vars are existentially quantified and don't need outer binding.
+- [x] Tests in `lib/datalog/tests/aggregates.sx` (10): count siblings,
+      sum prices, min/max scores, count over derived relation,
+      empty-input cases for each operator, popularity threshold with
+      group-by, distinct-counted-once.
 
 ### Phase 9 — SX embedding API
 - [ ] `(dl-program facts rules)` → database from SX data directly (no parsing required)
@@ -230,6 +245,19 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 8 done. New `lib/datalog/aggregates.sx` (~110
+  LOC): count / sum / min / max. Each is a body literal of shape
+  `(op R V Goal)` — `dl-eval-aggregate` runs `dl-find-bindings` on
+  the goal under the outer subst (so outer vars in the goal get
+  substituted, giving group-by-style aggregation), collects the
+  distinct values of `V`, and binds `R`. Empty input: count/sum
+  return 0; min/max produce no binding (rule fails). Stratifier
+  extended via `dl-aggregate-dep-edge` so the aggregate's goal
+  relation is fully derived before the aggregate fires. Safety check
+  treats goal-internal vars as existentials (no outer binding
+  required); only the result var becomes bound. Conformance now
+  134 / 134.
+
 - 2026-05-08 — Phase 7 done (Phase 6 magic sets deferred — opt-in,
   semi-naive default suffices for current test suite). New
   `lib/datalog/strata.sx` (~290 LOC): dep graph build, Floyd-Warshall

From ce603e98798dce4892dbf5d61e13c4dc864ab986 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 08:34:08 +0000
Subject: [PATCH 10/89] datalog: SX-data embedding API (Phase 9, 143/143)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

New lib/datalog/api.sx: dl-program-data facts rules takes SX data
lists. Rules accept either dict form or list form using <- as the
rule arrow (since SX parses :- as a keyword). dl-rule constructor
for the dict shape. dl-assert! adds a fact and re-saturates;
dl-retract! drops EDB matches, wipes all rule-headed IDB
relations, and re-saturates from scratch — simplest correct
semantics until provenance tracking arrives.

9 API tests cover ancestor closure via data, dict-rule form,
dl-rule constructor, incremental assert/retract, cyclic-graph
reach, assert into empty, fact-style rule (no arrow), dict
passthrough.
---
 lib/datalog/api.sx           | 147 ++++++++++++++++++++++++
 lib/datalog/conformance.conf |   2 +
 lib/datalog/scoreboard.json  |   9 +-
 lib/datalog/scoreboard.md    |   3 +-
 lib/datalog/tests/api.sx     | 209 +++++++++++++++++++++++++++++++++++
 plans/datalog-on-sx.md       |  40 +++++--
 6 files changed, 396 insertions(+), 14 deletions(-)
 create mode 100644 lib/datalog/api.sx
 create mode 100644 lib/datalog/tests/api.sx

diff --git a/lib/datalog/api.sx b/lib/datalog/api.sx
new file mode 100644
index 00000000..37ae9d6c
--- /dev/null
+++ b/lib/datalog/api.sx
@@ -0,0 +1,147 @@
+;; lib/datalog/api.sx — SX-data embedding API.
+;;
+;; Where Phase 1's `dl-program` takes a Datalog source string,
+;; this module exposes a parser-free API that consumes SX data
+;; directly. Two rule shapes are accepted:
+;;
+;;   - dict:   {:head <literal> :body (<literal> ...)}
+;;   - list:   (<head-elements...> <- <body-literal> ...)
+;;             — `<-` is an SX symbol used as the rule arrow.
+;;
+;; Examples:
+;;
+;;   (dl-program-data
+;;     '((parent tom bob) (parent tom liz) (parent bob ann))
+;;     '((ancestor X Y <- (parent X Y))
+;;       (ancestor X Z <- (parent X Y) (ancestor Y Z))))
+;;
+;;   (dl-query db '(ancestor tom X))   ; same query API as before
+;;
+;; Variables follow the parser convention: SX symbols whose first
+;; character is uppercase or `_` are variables.
+
+(define
+  dl-rule
+  (fn (head body) {:head head :body body}))
+
+(define
+  dl-rule-arrow?
+  (fn
+    (x)
+    (and (symbol? x) (= (symbol->string x) "<-"))))
+
+(define
+  dl-find-arrow
+  (fn
+    (rl i n)
+    (cond
+      ((>= i n) nil)
+      ((dl-rule-arrow? (nth rl i)) i)
+      (else (dl-find-arrow rl (+ i 1) n)))))
+
+;; Given a list of the form (head-elt ... <- body-lit ...) returns
+;; {:head (head-elt ...) :body (body-lit ...)}. If no arrow is
+;; present, the whole list is treated as the head and the body is
+;; empty (i.e. a fact written rule-style).
+(define
+  dl-rule-from-list
+  (fn
+    (rl)
+    (let ((n (len rl)))
+      (let ((idx (dl-find-arrow rl 0 n)))
+        (cond
+          ((nil? idx) {:head rl :body (list)})
+          (else
+            (let
+              ((head (slice rl 0 idx))
+                (body (slice rl (+ idx 1) n)))
+              {:head head :body body})))))))
+
+;; Coerce a rule given as either a dict or a list-with-arrow to a dict.
+(define
+  dl-coerce-rule
+  (fn
+    (r)
+    (cond
+      ((dict? r) r)
+      ((list? r) (dl-rule-from-list r))
+      (else (error (str "dl-coerce-rule: expected dict or list, got " r))))))
+
+;; Build a db from SX data lists.
+(define
+  dl-program-data
+  (fn
+    (facts rules)
+    (let ((db (dl-make-db)))
+      (do
+        (for-each (fn (lit) (dl-add-fact! db lit)) facts)
+        (for-each
+          (fn (r) (dl-add-rule! db (dl-coerce-rule r)))
+          rules)
+        db))))
+
+;; Add a single fact at runtime, then re-saturate the db so derived
+;; tuples reflect the change. Returns the db.
+(define
+  dl-assert!
+  (fn
+    (db lit)
+    (do
+      (dl-add-fact! db lit)
+      (dl-saturate! db)
+      db)))
+
+;; Remove a fact: drop matching tuples from EDB AND wipe all derived
+;; tuples (any IDB tuple may have transitively depended on the removed
+;; fact). Then re-saturate to repopulate IDB. EDB facts that were
+;; asserted via dl-add-fact! are preserved unless they match `lit`.
+;;
+;; To distinguish EDB from IDB, we treat any fact for a relation that
+;; has rules as IDB; otherwise EDB. (Phase 9 simplification — Phase 10
+;; may track provenance.)
+(define
+  dl-retract!
+  (fn
+    (db lit)
+    (let
+      ((rel-key (dl-rel-name lit)))
+      (do
+        ;; Drop the matching tuple from its relation list (if EDB-only).
+        (when
+          (has-key? (get db :facts) rel-key)
+          (let
+            ((existing (get (get db :facts) rel-key))
+              (kept (list)))
+            (do
+              (for-each
+                (fn
+                  (t)
+                  (when
+                    (not (dl-tuple-equal? t lit))
+                    (append! kept t)))
+                existing)
+              (dict-set! (get db :facts) rel-key kept))))
+        ;; Wipe all relations that have a rule (these are IDB) so the
+        ;; saturator regenerates them from the surviving EDB.
+        (let ((rule-heads (dl-rule-head-rels db)))
+          (for-each
+            (fn (k) (dict-set! (get db :facts) k (list)))
+            rule-heads))
+        (dl-saturate! db)
+        db))))
+
+(define
+  dl-rule-head-rels
+  (fn
+    (db)
+    (let ((seen (list)))
+      (do
+        (for-each
+          (fn
+            (rule)
+            (let ((h (dl-rel-name (get rule :head))))
+              (when
+                (and (not (nil? h)) (not (dl-member-string? h seen)))
+                (append! seen h))))
+          (dl-rules db))
+        seen))))
diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index 15dea37e..e80e8b7a 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -12,6 +12,7 @@ PRELOADS=(
   lib/datalog/aggregates.sx
   lib/datalog/strata.sx
   lib/datalog/eval.sx
+  lib/datalog/api.sx
 )
 
 SUITES=(
@@ -23,4 +24,5 @@ SUITES=(
   "semi_naive:lib/datalog/tests/semi_naive.sx:(dl-semi-naive-tests-run!)"
   "negation:lib/datalog/tests/negation.sx:(dl-negation-tests-run!)"
   "aggregates:lib/datalog/tests/aggregates.sx:(dl-aggregates-tests-run!)"
+  "api:lib/datalog/tests/api.sx:(dl-api-tests-run!)"
 )
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 54b1560e..1bd89123 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 134,
+  "total_passed": 143,
   "total_failed": 0,
-  "total": 134,
+  "total": 143,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -11,7 +11,8 @@
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
-    {"name":"aggregates","passed":10,"failed":0,"total":10}
+    {"name":"aggregates","passed":10,"failed":0,"total":10},
+    {"name":"api","passed":9,"failed":0,"total":9}
   ],
-  "generated": "2026-05-08T08:28:29+00:00"
+  "generated": "2026-05-08T08:33:54+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 22cd5104..66ade082 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**134 / 134 passing** (0 failure(s)).
+**143 / 143 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,3 +12,4 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 10 | 10 | ok |
+| api | 9 | 9 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
new file mode 100644
index 00000000..aa127d38
--- /dev/null
+++ b/lib/datalog/tests/api.sx
@@ -0,0 +1,209 @@
+;; lib/datalog/tests/api.sx — SX-data embedding API.
+
+(define dl-api-pass 0)
+(define dl-api-fail 0)
+(define dl-api-failures (list))
+
+(define
+  dl-api-deep=?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-api-deq-l? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let ((ka (keys a)) (kb (keys b)))
+          (and (= (len ka) (len kb)) (dl-api-deq-d? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-api-deq-l?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-api-deep=? (nth a i) (nth b i))) false)
+      (else (dl-api-deq-l? a b (+ i 1))))))
+
+(define
+  dl-api-deq-d?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i)))
+         (not (dl-api-deep=? (get a k) (get b k))))
+        false)
+      (else (dl-api-deq-d? a b ka (+ i 1))))))
+
+(define
+  dl-api-set=?
+  (fn
+    (a b)
+    (and
+      (= (len a) (len b))
+      (dl-api-subset? a b)
+      (dl-api-subset? b a))))
+
+(define
+  dl-api-subset?
+  (fn
+    (xs ys)
+    (cond
+      ((= (len xs) 0) true)
+      ((not (dl-api-contains? ys (first xs))) false)
+      (else (dl-api-subset? (rest xs) ys)))))
+
+(define
+  dl-api-contains?
+  (fn
+    (xs target)
+    (cond
+      ((= (len xs) 0) false)
+      ((dl-api-deep=? (first xs) target) true)
+      (else (dl-api-contains? (rest xs) target)))))
+
+(define
+  dl-api-test!
+  (fn
+    (name got expected)
+    (if
+      (dl-api-deep=? got expected)
+      (set! dl-api-pass (+ dl-api-pass 1))
+      (do
+        (set! dl-api-fail (+ dl-api-fail 1))
+        (append!
+          dl-api-failures
+          (str
+            name
+            "\n    expected: " expected
+            "\n    got:      " got))))))
+
+(define
+  dl-api-test-set!
+  (fn
+    (name got expected)
+    (if
+      (dl-api-set=? got expected)
+      (set! dl-api-pass (+ dl-api-pass 1))
+      (do
+        (set! dl-api-fail (+ dl-api-fail 1))
+        (append!
+          dl-api-failures
+          (str
+            name
+            "\n    expected (set): " expected
+            "\n    got:            " got))))))
+
+(define
+  dl-api-run-all!
+  (fn
+    ()
+    (do
+      ;; dl-program-data with arrow form.
+      (dl-api-test-set! "data API ancestor closure"
+        (dl-query
+          (dl-program-data
+            (quote ((parent tom bob) (parent bob ann) (parent ann pat)))
+            (quote
+              ((ancestor X Y <- (parent X Y))
+               (ancestor X Z <- (parent X Y) (ancestor Y Z)))))
+          (quote (ancestor tom X)))
+        (list {:X (quote bob)} {:X (quote ann)} {:X (quote pat)}))
+
+      ;; dl-program-data with dict rules.
+      (dl-api-test-set! "data API with dict rules"
+        (dl-query
+          (dl-program-data
+            (quote ((p a) (p b) (p c)))
+            (list
+              {:head (quote (q X)) :body (quote ((p X)))}))
+          (quote (q X)))
+        (list {:X (quote a)} {:X (quote b)} {:X (quote c)}))
+
+      ;; dl-rule helper.
+      (dl-api-test-set! "dl-rule constructor"
+        (dl-query
+          (dl-program-data
+            (quote ((p 1) (p 2)))
+            (list (dl-rule (quote (q X)) (quote ((p X))))))
+          (quote (q X)))
+        (list {:X 1} {:X 2}))
+
+      ;; dl-assert! adds and re-derives.
+      (dl-api-test-set! "dl-assert! incremental"
+        (let
+          ((db (dl-program-data
+                 (quote ((parent tom bob) (parent bob ann)))
+                 (quote
+                   ((ancestor X Y <- (parent X Y))
+                    (ancestor X Z <- (parent X Y) (ancestor Y Z)))))))
+          (do
+            (dl-saturate! db)
+            (dl-assert! db (quote (parent ann pat)))
+            (dl-query db (quote (ancestor tom X)))))
+        (list {:X (quote bob)} {:X (quote ann)} {:X (quote pat)}))
+
+      ;; dl-retract! removes a fact and recomputes IDB.
+      (dl-api-test-set! "dl-retract! removes derived"
+        (let
+          ((db (dl-program-data
+                 (quote ((parent tom bob) (parent bob ann) (parent ann pat)))
+                 (quote
+                   ((ancestor X Y <- (parent X Y))
+                    (ancestor X Z <- (parent X Y) (ancestor Y Z)))))))
+          (do
+            (dl-saturate! db)
+            (dl-retract! db (quote (parent bob ann)))
+            (dl-query db (quote (ancestor tom X)))))
+        (list {:X (quote bob)}))
+
+      ;; dl-program-data + dl-query with constants in head.
+      (dl-api-test-set! "constant-in-head data"
+        (dl-query
+          (dl-program-data
+            (quote ((edge a b) (edge b c) (edge c a)))
+            (quote
+              ((reach X Y <- (edge X Y))
+               (reach X Z <- (edge X Y) (reach Y Z)))))
+          (quote (reach a X)))
+        (list {:X (quote a)} {:X (quote b)} {:X (quote c)}))
+
+      ;; Assert into empty db.
+      (dl-api-test-set! "assert into empty"
+        (let
+          ((db (dl-program-data (list) (list))))
+          (do
+            (dl-assert! db (quote (p 1)))
+            (dl-assert! db (quote (p 2)))
+            (dl-query db (quote (p X)))))
+        (list {:X 1} {:X 2}))
+
+      ;; dl-rule-from-list with no arrow → fact-style.
+      (dl-api-test-set! "no arrow → fact-like rule"
+        (let
+          ((rule (dl-rule-from-list (quote (foo X Y)))))
+          (list rule))
+        (list {:head (quote (foo X Y)) :body (list)}))
+
+      ;; dl-coerce-rule on dict passes through.
+      (dl-api-test-set! "coerce dict rule"
+        (let
+          ((d {:head (quote (h X)) :body (quote ((b X)))}))
+          (list (dl-coerce-rule d)))
+        (list {:head (quote (h X)) :body (quote ((b X)))})))))
+
+(define
+  dl-api-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-api-pass 0)
+      (set! dl-api-fail 0)
+      (set! dl-api-failures (list))
+      (dl-api-run-all!)
+      {:passed dl-api-pass
+       :failed dl-api-fail
+       :total (+ dl-api-pass dl-api-fail)
+       :failures dl-api-failures})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 291cd16d..21c8123f 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -208,18 +208,30 @@ large graphs.
       group-by, distinct-counted-once.
 
 ### Phase 9 — SX embedding API
-- [ ] `(dl-program facts rules)` → database from SX data directly (no parsing required)
+- [x] `(dl-program-data facts rules)` builds a db from SX data —
+      `facts` is a list of literals, `rules` is a list of either
+      dicts `{:head … :body …}` or lists `(<head…> <- <body…>)`.
+      Variables are SX symbols whose first char is uppercase or `_`,
+      matching the parser's convention.
       ```
-      (dl-program
-        '((parent tom bob) (parent tom liz) (parent bob ann))
-        '((ancestor X Z :- (parent X Y) (ancestor Y Z))
-          (ancestor X Y :- (parent X Y))))
+      (dl-program-data
+        '((parent tom bob) (parent bob ann))
+        '((ancestor X Y <- (parent X Y))
+          (ancestor X Z <- (parent X Y) (ancestor Y Z))))
       ```
-- [ ] `(dl-query db '(ancestor tom ?X))` → `((ann) (bob) (liz) (pat))`
-- [ ] `(dl-assert! db '(parent ann pat))` → incremental fact addition + re-derive
-- [ ] `(dl-retract! db '(parent tom bob))` → fact removal + re-derive from scratch
+- [x] `(dl-rule head body)` constructor for the dict form.
+- [x] `(dl-query db '(ancestor tom X))` already worked — same query API
+      consumes the SX-data goal.
+- [x] `(dl-assert! db '(parent ann pat))` → adds the fact and re-saturates.
+- [x] `(dl-retract! db '(parent bob ann))` → drops matching tuples from
+      the EDB list, wipes every relation that has a rule (those are IDB),
+      and re-saturates from the surviving EDB.
+- [x] Tests in `lib/datalog/tests/api.sx` (9): closure via data API,
+      dict-rule form, dl-rule constructor, dl-assert! incremental,
+      dl-retract! removes derived, cyclic-graph reach via data,
+      assert into empty db, fact-style rule (no arrow), coerce dict.
 - [ ] Integration demo: federation graph query — `(ancestor actor1 actor2)` over
-      rose-ash ActivityPub follow relationships
+      rose-ash ActivityPub follow relationships (Phase 10).
 
 ### Phase 10 — Datalog as a query language for rose-ash
 - [ ] Schema: map SQLAlchemy model relationships to Datalog EDB facts
@@ -245,6 +257,16 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 9 done. New `lib/datalog/api.sx` exposes a
+  parser-free embedding: `dl-program-data facts rules` accepts SX
+  data lists, with rules in either dict form or list form using
+  `<-` as the rule arrow (since SX parses `:-` as a keyword).
+  `dl-rule head body` constructs the dict. `dl-assert! db lit` adds
+  a fact and re-saturates; `dl-retract! db lit` drops the fact from
+  EDB, wipes all rule-headed (IDB) relations, and re-saturates from
+  scratch — the simplest correct semantics until provenance tracking
+  arrives in a later phase. 9 API tests; conformance now 143/143.
+
 - 2026-05-08 — Phase 8 done. New `lib/datalog/aggregates.sx` (~110
   LOC): count / sum / min / max. Each is a body literal of shape
   `(op R V Goal)` — `dl-eval-aggregate` runs `dl-find-bindings` on

From 3cc760082cc1133279fed5addc8a462ad13944c8 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 08:42:10 +0000
Subject: [PATCH 11/89] datalog: hash-set membership for facts (Phase 5b perf)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

db gains a parallel :facts-keys {<rel>: {<tuple-string>: true}}
index alongside :facts. dl-tuple-key derives a stable string via
(str lit) — (p 30) and (p 30.0) collide correctly because SX
prints them identically. dl-add-fact! membership is now O(1)
instead of O(n) list scan; insert sequences for relations sized
N drop from O(N²) to O(N).

Wall clock on chain-7 saturation halves (~12s → ~6s); chain-15
roughly halves (~50s → ~25s) under shared CPU. Larger chains
still slow due to body-join overhead in dl-find-bindings —
Blocker entry refreshed with proposed follow-ups.

dl-retract! keeps both indices consistent: kept-keys is rebuilt
during the EDB filter, IDB wipes clear both lists and key dicts.
---
 lib/datalog/api.sx     | 16 ++++++++++++----
 lib/datalog/db.sx      | 22 +++++++++++++++++-----
 plans/datalog-on-sx.md | 24 ++++++++++++++++++------
 3 files changed, 47 insertions(+), 15 deletions(-)

diff --git a/lib/datalog/api.sx b/lib/datalog/api.sx
index 37ae9d6c..01abec95 100644
--- a/lib/datalog/api.sx
+++ b/lib/datalog/api.sx
@@ -111,21 +111,29 @@
           (has-key? (get db :facts) rel-key)
           (let
             ((existing (get (get db :facts) rel-key))
-              (kept (list)))
+              (kept (list))
+              (kept-keys {}))
             (do
               (for-each
                 (fn
                   (t)
                   (when
                     (not (dl-tuple-equal? t lit))
-                    (append! kept t)))
+                    (do
+                      (append! kept t)
+                      (dict-set! kept-keys (dl-tuple-key t) true))))
                 existing)
-              (dict-set! (get db :facts) rel-key kept))))
+              (dict-set! (get db :facts) rel-key kept)
+              (dict-set! (get db :facts-keys) rel-key kept-keys))))
         ;; Wipe all relations that have a rule (these are IDB) so the
         ;; saturator regenerates them from the surviving EDB.
         (let ((rule-heads (dl-rule-head-rels db)))
           (for-each
-            (fn (k) (dict-set! (get db :facts) k (list)))
+            (fn
+              (k)
+              (do
+                (dict-set! (get db :facts) k (list))
+                (dict-set! (get db :facts-keys) k {})))
             rule-heads))
         (dl-saturate! db)
         db))))
diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index 620f565c..6a3f69a0 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -12,7 +12,7 @@
 ;; lib/datalog/builtins.sx) swaps in the real `dl-rule-check-safety`,
 ;; which is order-aware and understands built-in predicates.
 
-(define dl-make-db (fn () {:facts {} :rules (list)}))
+(define dl-make-db (fn () {:facts {} :facts-keys {} :rules (list)}))
 
 (define
   dl-rel-name
@@ -97,13 +97,19 @@
   (fn
     (db rel-key)
     (let
-      ((facts (get db :facts)))
+      ((facts (get db :facts))
+        (fk (get db :facts-keys)))
       (do
         (when
           (not (has-key? facts rel-key))
           (dict-set! facts rel-key (list)))
+        (when
+          (not (has-key? fk rel-key))
+          (dict-set! fk rel-key {}))
         (get facts rel-key)))))
 
+(define dl-tuple-key (fn (lit) (str lit)))
+
 (define
   dl-rel-tuples
   (fn
@@ -125,10 +131,16 @@
         (let
           ((rel-key (dl-rel-name lit)))
           (let
-            ((tuples (dl-ensure-rel! db rel-key)))
+            ((tuples (dl-ensure-rel! db rel-key))
+              (key-dict (get (get db :facts-keys) rel-key))
+              (tk (dl-tuple-key lit)))
             (cond
-              ((dl-tuple-member? lit tuples) false)
-              (else (do (append! tuples lit) true)))))))))
+              ((has-key? key-dict tk) false)
+              (else
+                (do
+                  (dict-set! key-dict tk true)
+                  (append! tuples lit)
+                  true)))))))))
 
 ;; The full safety check lives in builtins.sx (it has to know which
 ;; predicates are built-ins). dl-add-rule! calls it via forward
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 21c8123f..b9990c17 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -246,17 +246,29 @@ large graphs.
 
 ## Blockers
 
-- **Hash-set membership for relations.** `dl-tuple-member?` uses a linear
-  list scan; insert is O(n) and saturating chain-N pushes O(n²) → O(n³)
-  total. Under bundled conformance (CPU shared with other loop agents)
-  even chain-15 hits multi-minute wall-clock. Tests scoped to chain-5
-  for now. Fix: maintain a `{tuple-key → true}` dict per relation
-  alongside the list; key tuples by their serialized form.
+- **Saturation perf on long chains.** Resolved one bottleneck (hash-set
+  membership in `dl-add-fact!`) but `dl-saturate!` still spends
+  significant time per iteration on rule body joins — chain-15 takes
+  ~25s real / 3s user under contention even after the membership fix.
+  Two follow-ups to consider: (a) avoid `(rest lits)` in
+  `dl-find-bindings`/`dl-fbs-aux` (uses indexed iteration like the
+  membership fix), (b) memoize the per-rule body shape so `(len lits)`
+  and accessor calls don't re-walk the list each step.
 
 ## Progress log
 
 _Newest first._
 
+- 2026-05-08 — Phase 5b perf: hash-set membership in `dl-add-fact!`.
+  db gains a parallel `:facts-keys {<rel>: {<tuple-string>: true}}`
+  index alongside `:facts`. `dl-tuple-key` derives a stable string
+  key via `(str lit)` — `(p 30)` and `(p 30.0)` collide correctly
+  because SX prints them identically. Insertion is O(1) instead of
+  O(n). chain-7 saturation drops from ~12s to ~6s; chain-15 from
+  ~50s to ~25s under shared CPU. Larger chains are still slow due
+  to body-join overhead in dl-find-bindings (Blocker updated).
+  `dl-retract!` updated to keep both indices consistent. 143/143.
+
 - 2026-05-08 — Phase 9 done. New `lib/datalog/api.sx` exposes a
   parser-free embedding: `dl-program-data facts rules` accepts SX
   data lists, with rules in either dict form or list form using

From de302fc2367342218ebd29c446b7c3cad67bdd90 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 08:45:59 +0000
Subject: [PATCH 12/89] datalog: rose-ash demo programs (Phase 10 syntactic,
 153/153)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

New lib/datalog/demo.sx with three Datalog-as-query-language demos
over synthetic rose-ash data:

  Federation: (mutual A B), (reachable A B), (foaf A C) over a
              follows graph.
  Content:    (post-likes P N) via count aggregation, (popular P)
              for likes >= 3, (interesting Me P) joining follows
              + authored + popular.
  Permissions: (in-group A G) over transitive subgroup chains,
              (can-access A R).

10 tests run each program against in-memory EDB tuples loaded via
dl-program-data.

Wiring to PostgreSQL and exposing as a service endpoint (/internal
/datalog) is out of scope for this loop — both would require
edits outside lib/datalog/. Programs above document the EDB shape
a real loader would populate.
---
 lib/datalog/conformance.conf |   2 +
 lib/datalog/demo.sx          |  75 +++++++++++++
 lib/datalog/scoreboard.json  |   9 +-
 lib/datalog/scoreboard.md    |   3 +-
 lib/datalog/tests/demo.sx    | 202 +++++++++++++++++++++++++++++++++++
 plans/datalog-on-sx.md       |  38 +++++--
 6 files changed, 315 insertions(+), 14 deletions(-)
 create mode 100644 lib/datalog/demo.sx
 create mode 100644 lib/datalog/tests/demo.sx

diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index e80e8b7a..f56276af 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -13,6 +13,7 @@ PRELOADS=(
   lib/datalog/strata.sx
   lib/datalog/eval.sx
   lib/datalog/api.sx
+  lib/datalog/demo.sx
 )
 
 SUITES=(
@@ -25,4 +26,5 @@ SUITES=(
   "negation:lib/datalog/tests/negation.sx:(dl-negation-tests-run!)"
   "aggregates:lib/datalog/tests/aggregates.sx:(dl-aggregates-tests-run!)"
   "api:lib/datalog/tests/api.sx:(dl-api-tests-run!)"
+  "demo:lib/datalog/tests/demo.sx:(dl-demo-tests-run!)"
 )
diff --git a/lib/datalog/demo.sx b/lib/datalog/demo.sx
new file mode 100644
index 00000000..7bbdc3b2
--- /dev/null
+++ b/lib/datalog/demo.sx
@@ -0,0 +1,75 @@
+;; lib/datalog/demo.sx — example programs over rose-ash-shaped data.
+;;
+;; Phase 10 prototypes Datalog as a rose-ash query language. Wiring
+;; the EDB to actual PostgreSQL is out of scope for this loop (it
+;; would touch service code outside lib/datalog/), but the programs
+;; below show the shape of queries we want, and the test suite runs
+;; them against synthetic in-memory tuples loaded via dl-program-data.
+;;
+;; Three thematic demos:
+;;
+;;   1. Federation — follow graph, transitive reach, mutuals.
+;;   2. Content   — posts, tags, likes, popularity, "for you" feed.
+;;   3. Permissions — group membership and resource access.
+
+;; ── Demo 1: federation follow graph ─────────────────────────────
+;; EDB: (follows ACTOR-A ACTOR-B) — A follows B.
+;; IDB:
+;;   (mutual A B)            — A follows B and B follows A
+;;   (reachable A B)         — transitive follow closure
+;;   (foaf A C)              — friend of a friend (mutual filter)
+(define
+  dl-demo-federation-rules
+  (quote
+    ((mutual A B <- (follows A B) (follows B A))
+     (reachable A B <- (follows A B))
+     (reachable A C <- (follows A B) (reachable B C))
+     (foaf A C <- (follows A B) (follows B C) (!= A C)))))
+
+;; ── Demo 2: content recommendation ──────────────────────────────
+;; EDB:
+;;   (authored ACTOR POST)
+;;   (tagged POST TAG)
+;;   (liked ACTOR POST)
+;; IDB:
+;;   (post-likes POST N)            — count of likes per post
+;;   (popular POST)                 — posts with >= 3 likes
+;;   (tagged-by-mutual ACTOR POST)  — post tagged TOPIC by someone
+;;                                    A's mutuals follow.
+(define
+  dl-demo-content-rules
+  (quote
+    ((post-likes P N <- (authored Author P) (count N L (liked L P)))
+     (popular P <- (authored Author P) (post-likes P N) (>= N 3))
+     (interesting Me P
+       <-
+       (follows Me Buddy)
+       (authored Buddy P)
+       (popular P)))))
+
+;; ── Demo 3: role-based permissions ──────────────────────────────
+;; EDB:
+;;   (member ACTOR GROUP)
+;;   (subgroup CHILD PARENT)
+;;   (allowed GROUP RESOURCE)
+;; IDB:
+;;   (in-group ACTOR GROUP)         — direct or via subgroup chain
+;;   (can-access ACTOR RESOURCE)    — actor inherits group permission
+(define
+  dl-demo-perm-rules
+  (quote
+    ((in-group A G <- (member A G))
+     (in-group A G <- (member A H) (subgroup-trans H G))
+     (subgroup-trans X Y <- (subgroup X Y))
+     (subgroup-trans X Z <- (subgroup X Y) (subgroup-trans Y Z))
+     (can-access A R <- (in-group A G) (allowed G R)))))
+
+;; ── Loader stub ──────────────────────────────────────────────────
+;; Wiring to PostgreSQL would replace these helpers with calls into
+;; rose-ash's internal HTTP RPC (fetch_data → /internal/data/...).
+;; The shape returned by dl-load-from-edb! is the same in either case.
+(define
+  dl-demo-make
+  (fn
+    (facts rules)
+    (dl-program-data facts rules)))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 1bd89123..c6eba8b4 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 143,
+  "total_passed": 153,
   "total_failed": 0,
-  "total": 143,
+  "total": 153,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -12,7 +12,8 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":10,"failed":0,"total":10},
-    {"name":"api","passed":9,"failed":0,"total":9}
+    {"name":"api","passed":9,"failed":0,"total":9},
+    {"name":"demo","passed":10,"failed":0,"total":10}
   ],
-  "generated": "2026-05-08T08:33:54+00:00"
+  "generated": "2026-05-08T08:45:37+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 66ade082..2b5b5d7e 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**143 / 143 passing** (0 failure(s)).
+**153 / 153 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,3 +13,4 @@
 | negation | 10 | 10 | ok |
 | aggregates | 10 | 10 | ok |
 | api | 9 | 9 | ok |
+| demo | 10 | 10 | ok |
diff --git a/lib/datalog/tests/demo.sx b/lib/datalog/tests/demo.sx
new file mode 100644
index 00000000..d8218266
--- /dev/null
+++ b/lib/datalog/tests/demo.sx
@@ -0,0 +1,202 @@
+;; lib/datalog/tests/demo.sx — Phase 10 demo programs.
+
+(define dl-demo-pass 0)
+(define dl-demo-fail 0)
+(define dl-demo-failures (list))
+
+(define
+  dl-demo-deep=?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-demo-deq-l? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let ((ka (keys a)) (kb (keys b)))
+          (and (= (len ka) (len kb)) (dl-demo-deq-d? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-demo-deq-l?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-demo-deep=? (nth a i) (nth b i))) false)
+      (else (dl-demo-deq-l? a b (+ i 1))))))
+
+(define
+  dl-demo-deq-d?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i)))
+         (not (dl-demo-deep=? (get a k) (get b k))))
+        false)
+      (else (dl-demo-deq-d? a b ka (+ i 1))))))
+
+(define
+  dl-demo-set=?
+  (fn
+    (a b)
+    (and
+      (= (len a) (len b))
+      (dl-demo-subset? a b)
+      (dl-demo-subset? b a))))
+
+(define
+  dl-demo-subset?
+  (fn
+    (xs ys)
+    (cond
+      ((= (len xs) 0) true)
+      ((not (dl-demo-contains? ys (first xs))) false)
+      (else (dl-demo-subset? (rest xs) ys)))))
+
+(define
+  dl-demo-contains?
+  (fn
+    (xs target)
+    (cond
+      ((= (len xs) 0) false)
+      ((dl-demo-deep=? (first xs) target) true)
+      (else (dl-demo-contains? (rest xs) target)))))
+
+(define
+  dl-demo-test-set!
+  (fn
+    (name got expected)
+    (if
+      (dl-demo-set=? got expected)
+      (set! dl-demo-pass (+ dl-demo-pass 1))
+      (do
+        (set! dl-demo-fail (+ dl-demo-fail 1))
+        (append!
+          dl-demo-failures
+          (str
+            name
+            "\n    expected (set): " expected
+            "\n    got:            " got))))))
+
+(define
+  dl-demo-run-all!
+  (fn
+    ()
+    (do
+      ;; ── Federation ──────────────────────────────────────────
+      (dl-demo-test-set! "mutuals"
+        (dl-query
+          (dl-demo-make
+            (quote ((follows alice bob) (follows bob alice)
+                    (follows bob carol) (follows carol dave)))
+            dl-demo-federation-rules)
+          (quote (mutual alice X)))
+        (list {:X (quote bob)}))
+
+      (dl-demo-test-set! "reachable transitive"
+        (dl-query
+          (dl-demo-make
+            (quote ((follows alice bob) (follows bob carol) (follows carol dave)))
+            dl-demo-federation-rules)
+          (quote (reachable alice X)))
+        (list {:X (quote bob)} {:X (quote carol)} {:X (quote dave)}))
+
+      (dl-demo-test-set! "foaf"
+        (dl-query
+          (dl-demo-make
+            (quote ((follows alice bob) (follows bob carol) (follows alice dave)))
+            dl-demo-federation-rules)
+          (quote (foaf alice X)))
+        (list {:X (quote carol)}))
+
+      ;; ── Content ─────────────────────────────────────────────
+      (dl-demo-test-set! "popular posts"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((authored alice p1) (authored bob p2) (authored carol p3)
+               (liked u1 p1) (liked u2 p1) (liked u3 p1)
+               (liked u1 p2)))
+            dl-demo-content-rules)
+          (quote (popular P)))
+        (list {:P (quote p1)}))
+
+      (dl-demo-test-set! "interesting feed"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((follows me alice) (follows me bob)
+               (authored alice p1) (authored bob p2)
+               (liked u1 p1) (liked u2 p1) (liked u3 p1)
+               (liked u4 p2)))
+            dl-demo-content-rules)
+          (quote (interesting me P)))
+        (list {:P (quote p1)}))
+
+      (dl-demo-test-set! "post likes count"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((authored alice p1)
+               (liked u1 p1) (liked u2 p1) (liked u3 p1)))
+            dl-demo-content-rules)
+          (quote (post-likes p1 N)))
+        (list {:N 3}))
+
+      ;; ── Permissions ─────────────────────────────────────────
+      (dl-demo-test-set! "direct group access"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((member alice editors)
+               (allowed editors blog)))
+            dl-demo-perm-rules)
+          (quote (can-access X blog)))
+        (list {:X (quote alice)}))
+
+      (dl-demo-test-set! "subgroup access"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((member bob writers)
+               (subgroup writers editors)
+               (allowed editors blog)))
+            dl-demo-perm-rules)
+          (quote (can-access X blog)))
+        (list {:X (quote bob)}))
+
+      (dl-demo-test-set! "transitive subgroup"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((member carol drafters)
+               (subgroup drafters writers)
+               (subgroup writers editors)
+               (allowed editors blog)))
+            dl-demo-perm-rules)
+          (quote (can-access X blog)))
+        (list {:X (quote carol)}))
+
+      (dl-demo-test-set! "no access without grant"
+        (dl-query
+          (dl-demo-make
+            (quote ((member dave outsiders) (allowed editors blog)))
+            dl-demo-perm-rules)
+          (quote (can-access X blog)))
+        (list)))))
+
+(define
+  dl-demo-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-demo-pass 0)
+      (set! dl-demo-fail 0)
+      (set! dl-demo-failures (list))
+      (dl-demo-run-all!)
+      {:passed dl-demo-pass
+       :failed dl-demo-fail
+       :total (+ dl-demo-pass dl-demo-fail)
+       :failures dl-demo-failures})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index b9990c17..57edf541 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -234,15 +234,25 @@ large graphs.
       rose-ash ActivityPub follow relationships (Phase 10).
 
 ### Phase 10 — Datalog as a query language for rose-ash
-- [ ] Schema: map SQLAlchemy model relationships to Datalog EDB facts
-      (e.g. `(follows user1 user2)`, `(authored user post)`, `(tagged post tag)`)
-- [ ] Loader: `dl-load-from-db!` — query PostgreSQL, populate Datalog EDB
-- [ ] Query examples:
-      - `?- ancestor(me, X), authored(X, Post), tagged(Post, cooking).`
-        → posts about cooking by people I follow (transitively)
-      - `?- popular(Post) :- tagged(Post, T), count(L, (liked(L, Post))) >= 10.`
-        → posts with 10+ likes
-- [ ] Expose as a rose-ash service endpoint: `POST /internal/datalog` with program + query
+- [x] Schema sketches in `lib/datalog/demo.sx`:
+      - **Federation**: `(follows A B)` → `(mutual A B)`, `(reachable A B)`,
+        `(foaf A C)` (friend-of-a-friend, distinct).
+      - **Content**: `(authored A P)`, `(liked U P)`, `(tagged P T)` →
+        `(post-likes P N)` via aggregation, `(popular P)` for likes ≥ 3,
+        `(interesting Me P)` joining follows + authored + popular.
+      - **Permissions**: `(member A G)`, `(subgroup C P)`, `(allowed G R)`
+        → `(in-group A G)` over transitive subgroups, `(can-access A R)`.
+- [ ] Loader `dl-load-from-db!` — out of scope for this loop
+      (would need to edit `shared/services/` outside `lib/datalog/`).
+      Programs in `demo.sx` already document the EDB shape expected
+      from such a loader. `dl-program-data` consumes the same shape.
+- [x] Query examples covered by `lib/datalog/tests/demo.sx` (10):
+      mutuals, transitive reach, FOAF, popular posts, interesting feed,
+      post likes count, direct/subgroup/transitive group access, no
+      access without grant.
+- [ ] Service endpoint `POST /internal/datalog` — out of scope as above.
+      Once exposed, server-side handler would be `dl-program-data` +
+      `dl-query`, returning JSON-encoded substitutions.
 
 ## Blockers
 
@@ -259,6 +269,16 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 10 syntactic demo. New `lib/datalog/demo.sx`
+  with three programs over rose-ash-shaped data: federation
+  (`mutual`, `reachable`, `foaf`), content recommendation
+  (`post-likes` via count aggregation, `popular`, `interesting`),
+  and role-based permissions (`in-group` over transitive subgroups,
+  `can-access`). 10 demo tests pass against synthetic EDB tuples.
+  Postgres loader and `/internal/datalog` HTTP endpoint remain
+  out of scope for this loop (they need service-tree edits beyond
+  `lib/datalog/**`). Conformance now 153/153.
+
 - 2026-05-08 — Phase 5b perf: hash-set membership in `dl-add-fact!`.
   db gains a parallel `:facts-keys {<rel>: {<tuple-string>: true}}`
   index alongside `:facts`. `dl-tuple-key` derives a stable string

From 790c17dfc1d7f0cc1e91637fdd60f5756dad90d4 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 08:50:24 +0000
Subject: [PATCH 13/89] datalog: indexed dl-find-bindings + chain-15
 differential (Phase 5c, 153/153)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

dl-find-bindings now uses dl-fb-aux lits db subst i n (indexed
iteration via nth) instead of recursive (rest lits). Eliminates
O(N²) list-copy per body of length N. chain-15 saturation 25s
→ 16s; chain-25 finishes in 33s real (vs. timeout previously).

Bumped semi_naive tests to chain-10 differential + chain-15
semi-only count (was chain-5/chain-5). Blocker entry refreshed.
---
 lib/datalog/eval.sx             | 12 ++++++++----
 lib/datalog/scoreboard.json     |  2 +-
 lib/datalog/tests/semi_naive.sx | 14 +++++++-------
 plans/datalog-on-sx.md          | 24 ++++++++++++++++--------
 4 files changed, 32 insertions(+), 20 deletions(-)

diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 93902349..acd74e5e 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -83,14 +83,18 @@
 
 (define
   dl-find-bindings
+  (fn (lits db subst) (dl-fb-aux lits db subst 0 (len lits))))
+
+(define
+  dl-fb-aux
   (fn
-    (lits db subst)
+    (lits db subst i n)
     (cond
       ((nil? subst) (list))
-      ((= (len lits) 0) (list subst))
+      ((>= i n) (list subst))
       (else
         (let
-          ((options (dl-match-lit (first lits) db subst))
+          ((options (dl-match-lit (nth lits i) db subst))
             (results (list)))
           (do
             (for-each
@@ -98,7 +102,7 @@
                 (s)
                 (for-each
                   (fn (s2) (append! results s2))
-                  (dl-find-bindings (rest lits) db s)))
+                  (dl-fb-aux lits db s (+ i 1) n)))
               options)
             results))))))
 
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index c6eba8b4..e30419f8 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -15,5 +15,5 @@
     {"name":"api","passed":9,"failed":0,"total":9},
     {"name":"demo","passed":10,"failed":0,"total":10}
   ],
-  "generated": "2026-05-08T08:45:37+00:00"
+  "generated": "2026-05-08T08:49:52+00:00"
 }
diff --git a/lib/datalog/tests/semi_naive.sx b/lib/datalog/tests/semi_naive.sx
index 5ff6a3a5..914dcb2b 100644
--- a/lib/datalog/tests/semi_naive.sx
+++ b/lib/datalog/tests/semi_naive.sx
@@ -120,18 +120,18 @@
         (dl-sn-counts-agree?
           (dl-sn-counts "p(a). p(b). q(X) :- p(X), =(X, a)."))
         true)
-      ;; Chain length 5 — small but enough to exercise multiple
-      ;; semi-naive iterations against a recursive rule.
+      ;; Chain length 10 — exercises multiple semi-naive iterations
+      ;; against the recursive ancestor rule.
       (dl-sn-test!
-        "chain-5 ancestor counts match"
-        (dl-sn-counts-agree? (dl-sn-counts (dl-sn-chain-source 5)))
+        "chain-10 ancestor counts match"
+        (dl-sn-counts-agree? (dl-sn-counts (dl-sn-chain-source 10)))
         true)
       (dl-sn-test!
-        "chain-5 ancestor count value"
+        "chain-15 ancestor count value (semi only)"
         (let
-          ((db (dl-program (dl-sn-chain-source 5))))
+          ((db (dl-program (dl-sn-chain-source 15))))
           (do (dl-saturate! db) (len (dl-relation db "ancestor"))))
-        15)
+        120)
       (dl-sn-test!
         "query through semi saturate"
         (let
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 57edf541..d24293a3 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -256,19 +256,27 @@ large graphs.
 
 ## Blockers
 
-- **Saturation perf on long chains.** Resolved one bottleneck (hash-set
-  membership in `dl-add-fact!`) but `dl-saturate!` still spends
-  significant time per iteration on rule body joins — chain-15 takes
-  ~25s real / 3s user under contention even after the membership fix.
-  Two follow-ups to consider: (a) avoid `(rest lits)` in
-  `dl-find-bindings`/`dl-fbs-aux` (uses indexed iteration like the
-  membership fix), (b) memoize the per-rule body shape so `(len lits)`
-  and accessor calls don't re-walk the list each step.
+- **Saturation perf** improving but not free. Resolved hash-set
+  membership in `dl-add-fact!` and replaced recursive `(rest lits)` in
+  `dl-find-bindings` with indexed iteration. chain-15 drops from ~25s
+  to ~16s and chain-25 saturates in ~33s real / 11s user — most CPU
+  now in unification (assoc-based subst dict copies) and dict
+  lookups during walks. Future: a per-rule "compiled" body that
+  pre-resolves arg positions and intern variable indices, then
+  unification can use array slots instead of dict assoc.
 
 ## Progress log
 
 _Newest first._
 
+- 2026-05-08 — Phase 5c perf: indexed `dl-find-bindings`. Replaced
+  the recursive `(rest lits)` walk with `dl-fb-aux lits db subst i n`
+  using `nth lits i`. Eliminates O(N²) list-copy per body of length
+  N. chain-15 saturation 25s → 16s; chain-25 finishes in 33s real
+  (vs. timeout previously). Bumped semi_naive tests: differential
+  on chain-10, semi-only count on chain-15 (was chain-5/chain-5).
+  153/153.
+
 - 2026-05-08 — Phase 10 syntactic demo. New `lib/datalog/demo.sx`
   with three programs over rose-ash-shaped data: federation
   (`mutual`, `reachable`, `foaf`), content recommendation

From 5a1dc4392f204300d63f5c0bb525cbf3dca9ddb3 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 08:58:17 +0000
Subject: [PATCH 14/89] datalog: anonymous _ vars are unique per occurrence
 (Phase 5d, 156/156)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

(p X _), (p _ Y) — the two _ are now different variables, matching
standard Datalog semantics. Previously both _ symbols were the same
SX symbol, so unification across them gave wrong answers.

Fix in db.sx: dl-rename-anon-term + dl-rename-anon-lit walk a term
or literal and replace each '_' symbol with a fresh _anon<N>.
dl-make-anon-renamer returns a counter-based name generator scoped
per call. dl-rename-anon-rule applies it to head and body of a
rule. dl-add-rule! invokes the renamer before safety check.

eval.sx: dl-query renames anon vars in the goal before search and
filters '_' out of the projection so user-facing results aren't
polluted with internal _anon<N> bindings.

The previous "underscore in head ok" test now correctly rejects
(p X _) :- q(X) as unsafe (the head's fresh anon var has no body
binder). New "underscore in body only" test confirms the safe
case. Two regression tests for rule-level and goal-level
independence.
---
 lib/datalog/db.sx           | 55 +++++++++++++++++++++++++++++++------
 lib/datalog/eval.sx         | 33 ++++++++++++----------
 lib/datalog/scoreboard.json |  8 +++---
 lib/datalog/scoreboard.md   |  4 +--
 lib/datalog/tests/eval.sx   | 27 ++++++++++++++++--
 plans/datalog-on-sx.md      | 11 ++++++++
 6 files changed, 108 insertions(+), 30 deletions(-)

diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index 6a3f69a0..b5aea9b8 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -189,6 +189,44 @@
                   " do not appear in any body literal"))
               (else nil))))))))
 
+(define
+  dl-rename-anon-term
+  (fn
+    (term next-name)
+    (cond
+      ((and (symbol? term) (= (symbol->string term) "_"))
+        (next-name))
+      ((list? term)
+        (map (fn (x) (dl-rename-anon-term x next-name)) term))
+      (else term))))
+
+(define
+  dl-rename-anon-lit
+  (fn
+    (lit next-name)
+    (cond
+      ((and (dict? lit) (has-key? lit :neg))
+        {:neg (dl-rename-anon-term (get lit :neg) next-name)})
+      ((list? lit) (dl-rename-anon-term lit next-name))
+      (else lit))))
+
+(define
+  dl-make-anon-renamer
+  (fn
+    ()
+    (let ((counter 0))
+      (fn () (do (set! counter (+ counter 1))
+                 (string->symbol (str "_anon" counter)))))))
+
+(define
+  dl-rename-anon-rule
+  (fn
+    (rule)
+    (let ((next-name (dl-make-anon-renamer)))
+      {:head (dl-rename-anon-term (get rule :head) next-name)
+       :body (map (fn (lit) (dl-rename-anon-lit lit next-name))
+                  (get rule :body))})))
+
 (define
   dl-add-rule!
   (fn
@@ -199,14 +237,15 @@
       ((not (has-key? rule :head))
         (error (str "dl-add-rule!: rule missing :head, got " rule)))
       (else
-        (let
-          ((err (dl-rule-check-safety rule)))
-          (cond
-            ((not (nil? err)) (error (str "dl-add-rule!: " err)))
-            (else
-              (let
-                ((rules (get db :rules)))
-                (do (append! rules rule) true)))))))))
+        (let ((rule (dl-rename-anon-rule rule)))
+          (let
+            ((err (dl-rule-check-safety rule)))
+            (cond
+              ((not (nil? err)) (error (str "dl-add-rule!: " err)))
+              (else
+                (let
+                  ((rules (get db :rules)))
+                  (do (append! rules rule) true))))))))))
 
 (define
   dl-add-clause!
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index acd74e5e..677fb636 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -368,21 +368,26 @@
     (db goal)
     (do
       (dl-saturate! db)
+      ;; Rename anonymous '_' vars in the goal so multiple occurrences
+      ;; do not unify together. Keep the user-facing var list (taken
+      ;; before renaming) so projected results retain user names.
       (let
-        ((substs (dl-find-bindings (list goal) db (dl-empty-subst)))
-          (vars (dl-vars-of goal))
-          (results (list)))
-        (do
-          (for-each
-            (fn
-              (s)
-              (let
-                ((proj (dl-project-subst s vars)))
-                (when
-                  (not (dl-tuple-member? proj results))
-                  (append! results proj))))
-            substs)
-          results)))))
+        ((user-vars (filter (fn (n) (not (= n "_"))) (dl-vars-of goal)))
+          (renamed (dl-rename-anon-lit goal (dl-make-anon-renamer))))
+        (let
+          ((substs (dl-find-bindings (list renamed) db (dl-empty-subst)))
+            (results (list)))
+          (do
+            (for-each
+              (fn
+                (s)
+                (let
+                  ((proj (dl-project-subst s user-vars)))
+                  (when
+                    (not (dl-tuple-member? proj results))
+                    (append! results proj))))
+              substs)
+            results))))))
 
 (define
   dl-project-subst
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index e30419f8..a855f4e0 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 153,
+  "total_passed": 156,
   "total_failed": 0,
-  "total": 153,
+  "total": 156,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":15,"failed":0,"total":15},
+    {"name":"eval","passed":18,"failed":0,"total":18},
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -15,5 +15,5 @@
     {"name":"api","passed":9,"failed":0,"total":9},
     {"name":"demo","passed":10,"failed":0,"total":10}
   ],
-  "generated": "2026-05-08T08:49:52+00:00"
+  "generated": "2026-05-08T08:57:57+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 2b5b5d7e..6977408c 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**153 / 153 passing** (0 failure(s)).
+**156 / 156 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
-| eval | 15 | 15 | ok |
+| eval | 18 | 18 | ok |
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 1c51e9b4..d6b6f8e6 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -173,9 +173,18 @@
         "unsafe — empty body"
         (dl-et-throws? (fn () (dl-program "p(X) :- .")))
         true)
+      ;; Underscore in head is unsafe — it's a fresh existential per
+      ;; occurrence after Phase 5d's anonymous-var renaming, and there's
+      ;; nothing in the body to bind it. (Old behavior accepted this by
+      ;; treating '_' as a literal name to skip; the renaming made it an
+      ;; ordinary unbound variable.)
       (dl-et-test!
-        "underscore var ok"
+        "underscore in head — unsafe"
         (dl-et-throws? (fn () (dl-program "p(X, _) :- q(X).")))
+        true)
+      (dl-et-test!
+        "underscore in body only — safe"
+        (dl-et-throws? (fn () (dl-program "p(X) :- q(X, _).")))
         false)
       (dl-et-test!
         "var only in head — unsafe"
@@ -192,7 +201,21 @@
             ()
             (dl-program
               "edge(a,b). edge(b,c). reach(X, Z) :- edge(X, Y), edge(Y, Z).")))
-        false))))
+        false)
+
+      ;; Anonymous variables: each occurrence must be independent.
+      (dl-et-test-set! "anon vars in rule are independent"
+        (dl-query
+          (dl-program
+            "p(a, b). p(c, d). q(X) :- p(X, _), p(_, Y).")
+          (list (quote q) (quote X)))
+        (list {:X (quote a)} {:X (quote c)}))
+
+      (dl-et-test-set! "anon vars in goal are independent"
+        (dl-query
+          (dl-program "p(1, 2, 3). p(4, 5, 6).")
+          (list (quote p) (quote _) (quote X) (quote _)))
+        (list {:X 2} {:X 5})))))
 
 (define
   dl-eval-tests-run!
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index d24293a3..21f6733a 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -269,6 +269,17 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 5d semantic fix: anonymous `_` variables are
+  renamed per occurrence at `dl-add-rule!` and `dl-query` time so
+  `(p X _) (p _ Y)` no longer unifies the two `_`s. New helpers
+  `dl-rename-anon-term`, `dl-rename-anon-lit`, `dl-make-anon-renamer`,
+  `dl-rename-anon-rule` in db.sx; eval.sx's dl-query renames the goal
+  before search and projects only user-named vars (`_` is filtered
+  out of the projection list). The "underscore in head" test now
+  correctly rejects `(p X _) :- q(X).` — after renaming, the head's
+  fresh anon var has no body binder. Two new eval tests verify
+  rule-level and goal-level independence. 155/155 expected.
+
 - 2026-05-08 — Phase 5c perf: indexed `dl-find-bindings`. Replaced
   the recursive `(rest lits)` walk with `dl-fb-aux lits db subst i n`
   using `nth lits i`. Eliminates O(N²) list-copy per body of length

From 55286cc5bcf79cb1393966a1f8c0ffaf93a1a581 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:02:43 +0000
Subject: [PATCH 15/89] datalog: findall aggregate (159/159)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

(findall L V Goal) — bind L to the distinct V values for which Goal
holds, or the empty list when none. One-line addition to
dl-do-aggregate that returns the unreduced list. Tests cover EDB,
derived relation, and empty cases.

Useful for "give me all the X such that ..." queries without
scalar reduction.
---
 lib/datalog/aggregates.sx       |  3 ++-
 lib/datalog/scoreboard.json     |  8 ++++----
 lib/datalog/scoreboard.md       |  4 ++--
 lib/datalog/tests/aggregates.sx | 27 +++++++++++++++++++++++++++
 plans/datalog-on-sx.md          | 14 +++++++++++---
 5 files changed, 46 insertions(+), 10 deletions(-)

diff --git a/lib/datalog/aggregates.sx b/lib/datalog/aggregates.sx
index 153879f7..27117fd6 100644
--- a/lib/datalog/aggregates.sx
+++ b/lib/datalog/aggregates.sx
@@ -19,7 +19,7 @@
 ;;
 ;; Empty input: count → 0, sum → 0, min/max → no binding (rule fails).
 
-(define dl-aggregate-rels (list "count" "sum" "min" "max"))
+(define dl-aggregate-rels (list "count" "sum" "min" "max" "findall"))
 
 (define
   dl-aggregate?
@@ -43,6 +43,7 @@
     (cond
       ((= op "count") (len vals))
       ((= op "sum") (dl-sum-vals vals 0))
+      ((= op "findall") vals)
       ((= op "min")
         (cond
           ((= (len vals) 0) :empty)
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index a855f4e0..f184d68b 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 156,
+  "total_passed": 159,
   "total_failed": 0,
-  "total": 156,
+  "total": 159,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -11,9 +11,9 @@
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
-    {"name":"aggregates","passed":10,"failed":0,"total":10},
+    {"name":"aggregates","passed":13,"failed":0,"total":13},
     {"name":"api","passed":9,"failed":0,"total":9},
     {"name":"demo","passed":10,"failed":0,"total":10}
   ],
-  "generated": "2026-05-08T08:57:57+00:00"
+  "generated": "2026-05-08T09:02:31+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 6977408c..7707e42a 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**156 / 156 passing** (0 failure(s)).
+**159 / 159 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -11,6 +11,6 @@
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
-| aggregates | 10 | 10 | ok |
+| aggregates | 13 | 13 | ok |
 | api | 9 | 9 | ok |
 | demo | 10 | 10 | ok |
diff --git a/lib/datalog/tests/aggregates.sx b/lib/datalog/tests/aggregates.sx
index d80276d8..a582ed8a 100644
--- a/lib/datalog/tests/aggregates.sx
+++ b/lib/datalog/tests/aggregates.sx
@@ -199,6 +199,33 @@
           (list (quote popular) (quote P)))
         (list {:P (quote p1)}))
 
+      ;; findall: collect distinct values into a list.
+      (dl-at-test-set! "findall over EDB"
+        (dl-query
+          (dl-program
+            "p(a). p(b). p(c).
+             all_p(L) :- findall(L, X, p(X)).")
+          (list (quote all_p) (quote L)))
+        (list {:L (list (quote a) (quote b) (quote c))}))
+
+      (dl-at-test-set! "findall over derived"
+        (dl-query
+          (dl-program
+            "parent(a, b). parent(b, c). parent(c, d).
+             ancestor(X, Y) :- parent(X, Y).
+             ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).
+             desc(L) :- findall(L, X, ancestor(a, X)).")
+          (list (quote desc) (quote L)))
+        (list {:L (list (quote b) (quote c) (quote d))}))
+
+      (dl-at-test-set! "findall empty"
+        (dl-query
+          (dl-program
+            "p(1).
+             all_q(L) :- findall(L, X, q(X)).")
+          (list (quote all_q) (quote L)))
+        (list {:L (list)}))
+
       ;; Aggregate vs single distinct.
       (dl-at-test-set! "distinct counted once"
         (dl-query
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 21f6733a..28f6495e 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -186,9 +186,10 @@ large graphs.
 
 ### Phase 8 — aggregation (Datalog+)
 - [x] `(count R V Goal)`, `(sum R V Goal)`, `(min R V Goal)`,
-      `(max R V Goal)` — first arg is the result variable, second is the
-      aggregated variable, third is the goal literal. Live in
-      `lib/datalog/aggregates.sx`.
+      `(max R V Goal)`, `(findall L V Goal)` — first arg is the result
+      variable, second is the aggregated variable, third is the goal
+      literal. `findall` returns the distinct-value list itself; the
+      others reduce. Live in `lib/datalog/aggregates.sx`.
 - [x] `dl-eval-aggregate`: runs `dl-find-bindings` on the goal under the
       current subst (which provides outer-context bindings), collects
       distinct values of the aggregated var, applies the aggregate.
@@ -269,6 +270,13 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 8 extension: `findall L V Goal` aggregate. Bind
+  L to the list of distinct V values for which Goal holds (or the
+  empty list when no matches). Implemented as a one-line case in
+  `dl-do-aggregate`. 3 new tests: EDB, derived relation, empty.
+  Useful for "give me all the X such that …" queries without
+  scalar reduction.
+
 - 2026-05-08 — Phase 5d semantic fix: anonymous `_` variables are
   renamed per occurrence at `dl-add-rule!` and `dl-query` time so
   `(p X _) (p _ Y)` no longer unifies the two `_`s. New helpers

From d09ed83fa1e30c5d6fc33bb29a9e09627ace177e Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:05:36 +0000
Subject: [PATCH 16/89] datalog: cooking-posts canonical demo (Phase 10,
 162/162)

Adds the canonical Phase 10 example from the plan: "Posts about
cooking by people I follow (transitively)." dl-demo-cooking-rules
defines reach over the follow graph (recursive transitive closure)
and cooking-post-by-network joining reach + authored + (tagged P
cooking). 3 new demo tests cover transitive network, direct-only
follow, and empty-network cases.
---
 lib/datalog/demo.sx         | 20 ++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/demo.sx   | 35 +++++++++++++++++++++++++++++++++++
 plans/datalog-on-sx.md      | 11 +++++++++++
 5 files changed, 72 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/demo.sx b/lib/datalog/demo.sx
index 7bbdc3b2..407facd4 100644
--- a/lib/datalog/demo.sx
+++ b/lib/datalog/demo.sx
@@ -64,6 +64,26 @@
      (subgroup-trans X Z <- (subgroup X Y) (subgroup-trans Y Z))
      (can-access A R <- (in-group A G) (allowed G R)))))
 
+;; ── Demo 4: cooking-posts (the canonical Phase 10 query) ────────
+;; "Posts about cooking by people I follow (transitively)."
+;; Combines federation (follows + transitive reach), authoring,
+;; tagging — the rose-ash multi-domain join.
+;;
+;; EDB:
+;;   (follows ACTOR-A ACTOR-B)
+;;   (authored ACTOR POST)
+;;   (tagged POST TAG)
+(define
+  dl-demo-cooking-rules
+  (quote
+    ((reach Me Them <- (follows Me Them))
+     (reach Me Them <- (follows Me X) (reach X Them))
+     (cooking-post-by-network Me P
+       <-
+       (reach Me Author)
+       (authored Author P)
+       (tagged P cooking)))))
+
 ;; ── Loader stub ──────────────────────────────────────────────────
 ;; Wiring to PostgreSQL would replace these helpers with calls into
 ;; rose-ash's internal HTTP RPC (fetch_data → /internal/data/...).
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index f184d68b..33dd2a77 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 159,
+  "total_passed": 162,
   "total_failed": 0,
-  "total": 159,
+  "total": 162,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,7 +13,7 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":13,"failed":0,"total":13},
     {"name":"api","passed":9,"failed":0,"total":9},
-    {"name":"demo","passed":10,"failed":0,"total":10}
+    {"name":"demo","passed":13,"failed":0,"total":13}
   ],
-  "generated": "2026-05-08T09:02:31+00:00"
+  "generated": "2026-05-08T09:05:25+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 7707e42a..ef47d2fd 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**159 / 159 passing** (0 failure(s)).
+**162 / 162 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,4 +13,4 @@
 | negation | 10 | 10 | ok |
 | aggregates | 13 | 13 | ok |
 | api | 9 | 9 | ok |
-| demo | 10 | 10 | ok |
+| demo | 13 | 13 | ok |
diff --git a/lib/datalog/tests/demo.sx b/lib/datalog/tests/demo.sx
index d8218266..968da0bd 100644
--- a/lib/datalog/tests/demo.sx
+++ b/lib/datalog/tests/demo.sx
@@ -179,6 +179,41 @@
           (quote (can-access X blog)))
         (list {:X (quote carol)}))
 
+      ;; ── Cooking posts (canonical Phase 10 example) ─────────
+      (dl-demo-test-set! "cooking posts by network"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((follows me alice) (follows alice bob) (follows alice carol)
+               (authored alice p1) (authored bob p2)
+               (authored carol p3) (authored carol p4)
+               (tagged p1 travel) (tagged p2 cooking)
+               (tagged p3 cooking) (tagged p4 books)))
+            dl-demo-cooking-rules)
+          (quote (cooking-post-by-network me P)))
+        (list {:P (quote p2)} {:P (quote p3)}))
+
+      (dl-demo-test-set! "cooking — direct follow only"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((follows me bob)
+               (authored bob p1) (authored bob p2)
+               (tagged p1 cooking) (tagged p2 books)))
+            dl-demo-cooking-rules)
+          (quote (cooking-post-by-network me P)))
+        (list {:P (quote p1)}))
+
+      (dl-demo-test-set! "cooking — none in network"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((follows me bob)
+               (authored bob p1) (tagged p1 books)))
+            dl-demo-cooking-rules)
+          (quote (cooking-post-by-network me P)))
+        (list))
+
       (dl-demo-test-set! "no access without grant"
         (dl-query
           (dl-demo-make
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 28f6495e..2d7fca84 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -243,6 +243,9 @@ large graphs.
         `(interesting Me P)` joining follows + authored + popular.
       - **Permissions**: `(member A G)`, `(subgroup C P)`, `(allowed G R)`
         → `(in-group A G)` over transitive subgroups, `(can-access A R)`.
+      - **Cooking-posts** (the canonical example): `(reach Me Them)` over
+        the follow graph, then `(cooking-post-by-network Me P)` joining
+        reach + authored + `(tagged P cooking)`.
 - [ ] Loader `dl-load-from-db!` — out of scope for this loop
       (would need to edit `shared/services/` outside `lib/datalog/`).
       Programs in `demo.sx` already document the EDB shape expected
@@ -270,6 +273,14 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 10 demo + canonical query. Added the "cooking
+  posts by people I follow (transitively)" example from the plan:
+  `dl-demo-cooking-rules` defines `reach` over the follow graph
+  (recursive transitive closure) and `cooking-post-by-network` that
+  joins reach with `authored` and `(tagged P cooking)`. 3 demo
+  tests cover transitive network, direct-only follow, and
+  empty-network cases.
+
 - 2026-05-08 — Phase 8 extension: `findall L V Goal` aggregate. Bind
   L to the list of distinct V values for which Goal holds (or the
   empty list when no matches). Implemented as a one-line case in

From a63d67247a1100cf6480108fe542c73c78800632 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:08:58 +0000
Subject: [PATCH 17/89] datalog: add public-API documentation index in
 datalog.sx

---
 lib/datalog/datalog.sx | 79 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 79 insertions(+)
 create mode 100644 lib/datalog/datalog.sx

diff --git a/lib/datalog/datalog.sx b/lib/datalog/datalog.sx
new file mode 100644
index 00000000..8189ec09
--- /dev/null
+++ b/lib/datalog/datalog.sx
@@ -0,0 +1,79 @@
+;; lib/datalog/datalog.sx — public API documentation index.
+;;
+;; This file is reference-only — `load` is an epoch-protocol command,
+;; not an SX function, so it cannot reload a list of files from inside
+;; another `.sx` file. To set up a fresh sx_server session with all
+;; modules in scope, issue these loads in order:
+;;
+;;   (load "lib/datalog/tokenizer.sx")
+;;   (load "lib/datalog/parser.sx")
+;;   (load "lib/datalog/unify.sx")
+;;   (load "lib/datalog/db.sx")
+;;   (load "lib/datalog/builtins.sx")
+;;   (load "lib/datalog/aggregates.sx")
+;;   (load "lib/datalog/strata.sx")
+;;   (load "lib/datalog/eval.sx")
+;;   (load "lib/datalog/api.sx")
+;;   (load "lib/datalog/demo.sx")
+;;
+;; (lib/datalog/conformance.sh runs this load list automatically.)
+;;
+;; ── Public API surface ─────────────────────────────────────────────
+;;
+;;   Source / data:
+;;     (dl-tokenize "src")              → token list
+;;     (dl-parse "src")                 → parsed clauses
+;;     (dl-program "src")               → db built from a source string
+;;     (dl-program-data facts rules)    → db from SX data lists; rules
+;;                                        accept either dict form or
+;;                                        list form with `<-` arrow
+;;
+;;   Construction (mutates db):
+;;     (dl-make-db)                     empty db
+;;     (dl-add-fact! db lit)            rejects non-ground
+;;     (dl-add-rule! db rule)           rejects unsafe rules
+;;     (dl-rule head body)              dict-rule constructor
+;;     (dl-add-clause! db clause)       parser output → fact or rule
+;;     (dl-load-program! db src)        string source
+;;
+;;   Mutation:
+;;     (dl-assert! db lit)              add + re-saturate
+;;     (dl-retract! db lit)             drop EDB, wipe IDB, re-saturate
+;;
+;;   Query / inspection:
+;;     (dl-saturate! db)                stratified semi-naive default
+;;     (dl-saturate-naive! db)          reference (slow on chains)
+;;     (dl-saturate-rules! db rules)    per-rule-set semi-naive worker
+;;     (dl-query db goal)               list of substitution dicts
+;;     (dl-relation db rel-name)        tuple list for a relation
+;;     (dl-rules db)                    rule list
+;;     (dl-fact-count db)               total ground tuples
+;;
+;; ── Body literal kinds ─────────────────────────────────────────────
+;;
+;;   Positive             (rel arg ... arg)
+;;   Negation             {:neg (rel arg ...)}
+;;   Comparison           (< X Y), (<= X Y), (> X Y), (>= X Y),
+;;                        (= X Y), (!= X Y)
+;;   Arithmetic           (is Z (+ X Y)) and (- * /)
+;;   Aggregation          (count R V Goal),  (sum R V Goal),
+;;                        (min R V Goal),    (max R V Goal),
+;;                        (findall L V Goal)
+;;
+;; ── Variable conventions ───────────────────────────────────────────
+;;
+;;   Variables: SX symbols whose first char is uppercase A–Z or '_'.
+;;   Anonymous '_' is renamed to a fresh _anon<N> per occurrence at
+;;   rule/query load time so multiple '_' don't unify.
+;;
+;; ── Demo programs ──────────────────────────────────────────────────
+;;
+;;   See lib/datalog/demo.sx — federation, content, permissions, and
+;;   the canonical "cooking posts by people I follow (transitively)"
+;;   example.
+;;
+;; ── Status ─────────────────────────────────────────────────────────
+;;
+;;   See plans/datalog-on-sx.md — phase-by-phase progress log and
+;;   roadmap. Run `bash lib/datalog/conformance.sh` to refresh
+;;   `lib/datalog/scoreboard.{json,md}`.

From b95d8c5a63a3a55bffea5933a45e4fe9dc7f83f9 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:13:10 +0000
Subject: [PATCH 18/89] datalog: stratifier rejects recursion through
 aggregation (165/165)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bug: dl-check-stratifiable iterated body literals looking only for
explicit :neg literals, missing aggregate cycles. Now also walks
aggregates via dl-aggregate-dep-edge — q(N) :- count(N, X, q(X))
correctly errors out at saturation time.

3 new tests cover:
- recursion-through-aggregation rejected
- negation + aggregation coexist when in different strata
- min over empty derived relation produces no result
---
 lib/datalog/scoreboard.json     |  8 +++----
 lib/datalog/scoreboard.md       |  4 ++--
 lib/datalog/strata.sx           | 39 +++++++++++++++++++++++----------
 lib/datalog/tests/aggregates.sx | 33 ++++++++++++++++++++++++++++
 plans/datalog-on-sx.md          | 10 +++++++++
 5 files changed, 76 insertions(+), 18 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 33dd2a77..9fa459b9 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 162,
+  "total_passed": 165,
   "total_failed": 0,
-  "total": 162,
+  "total": 165,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -11,9 +11,9 @@
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
-    {"name":"aggregates","passed":13,"failed":0,"total":13},
+    {"name":"aggregates","passed":16,"failed":0,"total":16},
     {"name":"api","passed":9,"failed":0,"total":9},
     {"name":"demo","passed":13,"failed":0,"total":13}
   ],
-  "generated": "2026-05-08T09:05:25+00:00"
+  "generated": "2026-05-08T09:12:57+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index ef47d2fd..40dd40ca 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**162 / 162 passing** (0 failure(s)).
+**165 / 165 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -11,6 +11,6 @@
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
-| aggregates | 13 | 13 | ok |
+| aggregates | 16 | 16 | ok |
 | api | 9 | 9 | ok |
 | demo | 13 | 13 | ok |
diff --git a/lib/datalog/strata.sx b/lib/datalog/strata.sx
index 0928c989..feaad46f 100644
--- a/lib/datalog/strata.sx
+++ b/lib/datalog/strata.sx
@@ -197,18 +197,33 @@
                   (for-each
                     (fn
                       (lit)
-                      (when
-                        (and (dict? lit) (has-key? lit :neg))
-                        (let ((tgt (dl-rel-name (get lit :neg))))
-                          (when
-                            (and (not (nil? tgt))
-                                 (dl-reach-cycle? reach head-rel tgt))
-                            (set!
-                              err
-                              (str "non-stratifiable: relation " head-rel
-                                   " transitively depends through negation on "
-                                   tgt
-                                   " which depends back on " head-rel))))))
+                      (cond
+                        ((and (dict? lit) (has-key? lit :neg))
+                          (let ((tgt (dl-rel-name (get lit :neg))))
+                            (when
+                              (and (not (nil? tgt))
+                                   (dl-reach-cycle? reach head-rel tgt))
+                              (set!
+                                err
+                                (str "non-stratifiable: relation " head-rel
+                                     " transitively depends through negation on "
+                                     tgt
+                                     " which depends back on " head-rel)))))
+                        ((dl-aggregate? lit)
+                          (let ((edge (dl-aggregate-dep-edge lit)))
+                            (when
+                              (not (nil? edge))
+                              (let ((tgt (get edge :rel)))
+                                (when
+                                  (and (not (nil? tgt))
+                                       (dl-reach-cycle? reach head-rel tgt))
+                                  (set!
+                                    err
+                                    (str "non-stratifiable: relation "
+                                         head-rel
+                                         " aggregates over " tgt
+                                         " which depends back on "
+                                         head-rel))))))))) 
                     (get rule :body)))))
             (dl-rules db))
           err)))))
diff --git a/lib/datalog/tests/aggregates.sx b/lib/datalog/tests/aggregates.sx
index a582ed8a..dbe2f643 100644
--- a/lib/datalog/tests/aggregates.sx
+++ b/lib/datalog/tests/aggregates.sx
@@ -227,6 +227,39 @@
         (list {:L (list)}))
 
       ;; Aggregate vs single distinct.
+      ;; Stratification: recursion through aggregation is rejected.
+      (dl-at-test! "agg recursion rejected"
+        (dl-at-throws?
+          (fn ()
+            (let ((db (dl-make-db)))
+              (do
+                (dl-add-rule! db
+                  {:head (list (quote q) (quote N))
+                   :body (list (list (quote count) (quote N) (quote X)
+                                     (list (quote q) (quote X))))})
+                (dl-saturate! db)))))
+        true)
+
+      ;; Negation + aggregation in the same body — different strata.
+      (dl-at-test-set! "neg + agg coexist"
+        (dl-query
+          (dl-program
+            "u(a). u(b). u(c). banned(b).
+             active(X) :- u(X), not(banned(X)).
+             cnt(N) :- count(N, X, active(X)).")
+          (list (quote cnt) (quote N)))
+        (list {:N 2}))
+
+      ;; Min over a derived empty relation: no result.
+      (dl-at-test-set! "min over empty derived"
+        (dl-query
+          (dl-program
+            "s(50). s(60).
+             score(N) :- s(N), >(N, 100).
+             low(M) :- min(M, X, score(X)).")
+          (list (quote low) (quote M)))
+        (list))
+
       (dl-at-test-set! "distinct counted once"
         (dl-query
           (dl-program
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 2d7fca84..b3769e92 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -273,6 +273,16 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Bug fix: `dl-check-stratifiable` now rejects recursion
+  through aggregation (e.g., `q(N) :- count(N, X, q(X))`). The
+  stratifier was already adding negation-like edges for aggregates,
+  but the cycle scan only looked at explicit `:neg` literals. Added
+  the matching aggregate branch to the body iteration. Also adds
+  doc-only `lib/datalog/datalog.sx` with the public-API surface
+  (since `load` is an epoch command and can't recurse from within an
+  `.sx` file). 3 new aggregate tests cover recursion-rejection,
+  negation-and-aggregation coexistence, and min-over-empty-derived.
+
 - 2026-05-08 — Phase 10 demo + canonical query. Added the "cooking
   posts by people I follow (transitively)" example from the plan:
   `dl-demo-cooking-rules` defines `reach` over the follow graph

From 408fc27366f4621d5ce37e9fcdeaa72b8c4f2191 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:17:15 +0000
Subject: [PATCH 19/89] datalog: dl-query accepts conjunctive goal lists
 (167/167)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

dl-query now auto-dispatches on the first element's shape:
- positive literal (head is a symbol) or {:neg ...} dict → wrap
- list of literals → conjunctive query

dl-query-coerce normalizes; dl-query-user-vars collects the union
of user-named vars (deduped, '_' filtered) for projection. Old
single-literal callers unchanged.

  (dl-query db '(p X))                   ; single
  (dl-query db '((p X) (q X)))           ; conjunction
  (dl-query db (list '(n X) '(> X 2)))   ; with comparison

2 new api tests cover multi-goal AND and conjunction with comparison.
---
 lib/datalog/eval.sx         | 74 ++++++++++++++++++++++++++++---------
 lib/datalog/scoreboard.json |  8 ++--
 lib/datalog/scoreboard.md   |  4 +-
 lib/datalog/tests/api.sx    | 18 +++++++++
 plans/datalog-on-sx.md      | 14 ++++++-
 5 files changed, 94 insertions(+), 24 deletions(-)

diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 677fb636..476fd0d0 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -362,32 +362,72 @@
 
 ;; ── Querying ─────────────────────────────────────────────────────
 
+;; Coerce a query argument to a list of body literals. A single literal
+;; like `(p X)` (positive — head is a symbol) or `{:neg ...}` becomes
+;; `((p X))`. A list of literals like `((p X) (q X))` is returned as-is.
+(define
+  dl-query-coerce
+  (fn
+    (goal)
+    (cond
+      ((and (dict? goal) (has-key? goal :neg)) (list goal))
+      ((and (list? goal) (> (len goal) 0) (symbol? (first goal)))
+        (list goal))
+      ((list? goal) goal)
+      (else (error (str "dl-query: unrecognised goal shape: " goal))))))
+
 (define
   dl-query
   (fn
     (db goal)
     (do
       (dl-saturate! db)
-      ;; Rename anonymous '_' vars in the goal so multiple occurrences
-      ;; do not unify together. Keep the user-facing var list (taken
-      ;; before renaming) so projected results retain user names.
+      ;; Rename anonymous '_' vars in each goal literal so multiple
+      ;; occurrences do not unify together. Keep the user-facing var
+      ;; list (taken before renaming) so projected results retain user
+      ;; names.
       (let
-        ((user-vars (filter (fn (n) (not (= n "_"))) (dl-vars-of goal)))
-          (renamed (dl-rename-anon-lit goal (dl-make-anon-renamer))))
+        ((goals (dl-query-coerce goal))
+          (renamer (dl-make-anon-renamer)))
         (let
-          ((substs (dl-find-bindings (list renamed) db (dl-empty-subst)))
-            (results (list)))
-          (do
-            (for-each
-              (fn
-                (s)
-                (let
-                  ((proj (dl-project-subst s user-vars)))
+          ((user-vars (dl-query-user-vars goals))
+            (renamed (map (fn (g) (dl-rename-anon-lit g renamer)) goals)))
+          (let
+            ((substs (dl-find-bindings renamed db (dl-empty-subst)))
+              (results (list)))
+            (do
+              (for-each
+                (fn
+                  (s)
+                  (let
+                    ((proj (dl-project-subst s user-vars)))
+                    (when
+                      (not (dl-tuple-member? proj results))
+                      (append! results proj))))
+                substs)
+              results)))))))
+
+(define
+  dl-query-user-vars
+  (fn
+    (goals)
+    (let ((seen (list)))
+      (do
+        (for-each
+          (fn
+            (g)
+            (let
+              ((tgt
+                 (if (and (dict? g) (has-key? g :neg)) (get g :neg) g)))
+              (for-each
+                (fn
+                  (v)
                   (when
-                    (not (dl-tuple-member? proj results))
-                    (append! results proj))))
-              substs)
-            results))))))
+                    (and (not (= v "_")) (not (dl-member-string? v seen)))
+                    (append! seen v)))
+                (dl-vars-of tgt))))
+          goals)
+        seen))))
 
 (define
   dl-project-subst
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 9fa459b9..2b5d08f2 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 165,
+  "total_passed": 167,
   "total_failed": 0,
-  "total": 165,
+  "total": 167,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -12,8 +12,8 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":16,"failed":0,"total":16},
-    {"name":"api","passed":9,"failed":0,"total":9},
+    {"name":"api","passed":11,"failed":0,"total":11},
     {"name":"demo","passed":13,"failed":0,"total":13}
   ],
-  "generated": "2026-05-08T09:12:57+00:00"
+  "generated": "2026-05-08T09:16:59+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 40dd40ca..639f393a 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**165 / 165 passing** (0 failure(s)).
+**167 / 167 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,5 +12,5 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 16 | 16 | ok |
-| api | 9 | 9 | ok |
+| api | 11 | 11 | ok |
 | demo | 13 | 13 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
index aa127d38..577bafe9 100644
--- a/lib/datalog/tests/api.sx
+++ b/lib/datalog/tests/api.sx
@@ -180,6 +180,24 @@
             (dl-query db (quote (p X)))))
         (list {:X 1} {:X 2}))
 
+      ;; Multi-goal query: pass list of literals.
+      (dl-api-test-set! "multi-goal query"
+        (dl-query
+          (dl-program-data
+            (quote ((p 1) (p 2) (p 3) (q 2) (q 3)))
+            (list))
+          (list (quote (p X)) (quote (q X))))
+        (list {:X 2} {:X 3}))
+
+      ;; Multi-goal with comparison.
+      (dl-api-test-set! "multi-goal with comparison"
+        (dl-query
+          (dl-program-data
+            (quote ((n 1) (n 2) (n 3) (n 4) (n 5)))
+            (list))
+          (list (quote (n X)) (list (string->symbol ">") (quote X) 2)))
+        (list {:X 3} {:X 4} {:X 5}))
+
       ;; dl-rule-from-list with no arrow → fact-style.
       (dl-api-test-set! "no arrow → fact-like rule"
         (let
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index b3769e92..65bd65ac 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -222,7 +222,11 @@ large graphs.
       ```
 - [x] `(dl-rule head body)` constructor for the dict form.
 - [x] `(dl-query db '(ancestor tom X))` already worked — same query API
-      consumes the SX-data goal.
+      consumes the SX-data goal. Now also accepts a *list* of body
+      literals for conjunctive queries:
+      `(dl-query db '((p X) (q X)))`,
+      `(dl-query db (list '(n X) '(> X 2)))`. Auto-dispatched via
+      `dl-query-coerce` on first-element shape.
 - [x] `(dl-assert! db '(parent ann pat))` → adds the fact and re-saturates.
 - [x] `(dl-retract! db '(parent bob ann))` → drops matching tuples from
       the EDB list, wipes every relation that has a rule (those are IDB),
@@ -273,6 +277,14 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — `dl-query` accepts a list of body literals for
+  conjunctive queries, in addition to a single positive literal.
+  `dl-query-coerce` dispatches based on the first element's shape:
+  positive lit (head is a symbol) or `:neg` dict → wrap as singleton;
+  list of lits → use as-is. `dl-query-user-vars` collects the union
+  of vars across all goals (deduped, `_` filtered) for projection.
+  2 new api tests: multi-goal AND, and conjunction with comparison.
+
 - 2026-05-08 — Bug fix: `dl-check-stratifiable` now rejects recursion
   through aggregation (e.g., `q(N) :- count(N, X, q(X))`). The
   stratifier was already adding negation-like edges for aggregates,

From 9054fe983d1a06d8432fd7b0b108f5b95435e033 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:20:23 +0000
Subject: [PATCH 20/89] datalog: tag co-occurrence demo (169/169)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Adds (cotagged P T1 T2) — P has both T1 and T2 with T1 != T2 — and
(tag-pair-count T1 T2 N) which counts posts cotagged with each
distinct (T1, T2) pair. Demonstrates count aggregation against a
recursive-then-aggregated stream of derived tuples.

2 new demo tests: cooking + vegetarian co-occurrence on a small
data set, and a count-of-co-occurrences query.
---
 lib/datalog/demo.sx         | 20 ++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/demo.sx   | 23 +++++++++++++++++++++++
 4 files changed, 49 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/demo.sx b/lib/datalog/demo.sx
index 407facd4..d4a9a29a 100644
--- a/lib/datalog/demo.sx
+++ b/lib/datalog/demo.sx
@@ -84,6 +84,26 @@
        (authored Author P)
        (tagged P cooking)))))
 
+;; ── Demo 5: tag co-occurrence ───────────────────────────────────
+;; "Posts tagged with both T1 AND T2." Useful for narrowed-down
+;; recommendations like "vegetarian cooking" posts.
+;;
+;; EDB:
+;;   (tagged POST TAG)
+;; IDB:
+;;   (cotagged POST T1 T2)        — post has both T1 and T2 (T1 != T2)
+;;   (popular-pair T1 T2 N)       — count of posts cotagged (T1, T2)
+(define
+  dl-demo-tag-cooccur-rules
+  (quote
+    ((cotagged P T1 T2 <- (tagged P T1) (tagged P T2) (!= T1 T2))
+     ;; Distinct (T1, T2) pairs that occur somewhere.
+     (tag-pair T1 T2 <- (cotagged P T1 T2))
+     (tag-pair-count T1 T2 N
+       <-
+       (tag-pair T1 T2)
+       (count N P (cotagged P T1 T2))))))
+
 ;; ── Loader stub ──────────────────────────────────────────────────
 ;; Wiring to PostgreSQL would replace these helpers with calls into
 ;; rose-ash's internal HTTP RPC (fetch_data → /internal/data/...).
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 2b5d08f2..2545002b 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 167,
+  "total_passed": 169,
   "total_failed": 0,
-  "total": 167,
+  "total": 169,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,7 +13,7 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":16,"failed":0,"total":16},
     {"name":"api","passed":11,"failed":0,"total":11},
-    {"name":"demo","passed":13,"failed":0,"total":13}
+    {"name":"demo","passed":15,"failed":0,"total":15}
   ],
-  "generated": "2026-05-08T09:16:59+00:00"
+  "generated": "2026-05-08T09:20:09+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 639f393a..70c2fe0f 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**167 / 167 passing** (0 failure(s)).
+**169 / 169 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,4 +13,4 @@
 | negation | 10 | 10 | ok |
 | aggregates | 16 | 16 | ok |
 | api | 11 | 11 | ok |
-| demo | 13 | 13 | ok |
+| demo | 15 | 15 | ok |
diff --git a/lib/datalog/tests/demo.sx b/lib/datalog/tests/demo.sx
index 968da0bd..c594a63d 100644
--- a/lib/datalog/tests/demo.sx
+++ b/lib/datalog/tests/demo.sx
@@ -214,6 +214,29 @@
           (quote (cooking-post-by-network me P)))
         (list))
 
+      ;; ── Tag co-occurrence ──────────────────────────────────
+      (dl-demo-test-set! "cotagged posts"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((tagged p1 cooking) (tagged p1 vegetarian)
+               (tagged p2 cooking) (tagged p2 quick)
+               (tagged p3 vegetarian)))
+            dl-demo-tag-cooccur-rules)
+          (quote (cotagged P cooking vegetarian)))
+        (list {:P (quote p1)}))
+
+      (dl-demo-test-set! "tag pair count"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((tagged p1 cooking) (tagged p1 vegetarian)
+               (tagged p2 cooking) (tagged p2 quick)
+               (tagged p3 cooking) (tagged p3 vegetarian)))
+            dl-demo-tag-cooccur-rules)
+          (quote (tag-pair-count cooking vegetarian N)))
+        (list {:N 2}))
+
       (dl-demo-test-set! "no access without grant"
         (dl-query
           (dl-demo-make

From c7315f5877f68d2ca77775a5e29e9fd179a80826 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:21:00 +0000
Subject: [PATCH 21/89] datalog-plan: progress entry for tag co-occurrence demo

---
 plans/datalog-on-sx.md | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 65bd65ac..f0233eec 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -277,6 +277,11 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Demo: tag co-occurrence. `(cotagged P T1 T2)` — post
+  has both T1 and T2 with T1 != T2 — and `(tag-pair-count T1 T2 N)`
+  counting posts per distinct tag pair. Demonstrates count
+  aggregation grouped by outer-context vars. 2 new demo tests.
+
 - 2026-05-08 — `dl-query` accepts a list of body literals for
   conjunctive queries, in addition to a single positive literal.
   `dl-query-coerce` dispatches based on the first element's shape:

From cc64ec5cf225d7ed5e0020d85fe725bd17b6ef34 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:27:44 +0000
Subject: [PATCH 22/89] datalog: first-arg index per relation (Phase 5e perf,
 169/169)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

db gains :facts-index {<rel>: {<first-arg-key>: tuples}} mirroring
the membership :facts-keys index. dl-add-fact! populates the index;
dl-match-positive walks the body literal's first arg under the
current subst — when it's bound to a non-var, look up by (str arg)
instead of scanning the full relation.

For chain-style recursive rules (parent X Y), (ancestor Y Z) the
inner Y has at most one parent, so the inner lookup returns 0–1
tuples instead of N. chain-25 saturation drops from ~33s to ~18s
real (~2x). chain-50 still long but tractable; next bottleneck is
subst dict copies during unification.

dl-retract! refreshed to keep the new index consistent: kept-index
rebuilt during EDB filter, IDB wipes clear all three slots.

Differential semi-naive test bumped to chain-12, semi-only count
test to chain-25.
---
 lib/datalog/api.sx              | 19 ++++++++++---
 lib/datalog/db.sx               | 49 +++++++++++++++++++++++++++++++--
 lib/datalog/eval.sx             | 12 +++++++-
 lib/datalog/scoreboard.json     |  2 +-
 lib/datalog/tests/semi_naive.sx | 16 ++++++-----
 plans/datalog-on-sx.md          | 30 ++++++++++++++------
 6 files changed, 105 insertions(+), 23 deletions(-)

diff --git a/lib/datalog/api.sx b/lib/datalog/api.sx
index 01abec95..a76d3624 100644
--- a/lib/datalog/api.sx
+++ b/lib/datalog/api.sx
@@ -112,7 +112,8 @@
           (let
             ((existing (get (get db :facts) rel-key))
               (kept (list))
-              (kept-keys {}))
+              (kept-keys {})
+              (kept-index {}))
             (do
               (for-each
                 (fn
@@ -121,10 +122,19 @@
                     (not (dl-tuple-equal? t lit))
                     (do
                       (append! kept t)
-                      (dict-set! kept-keys (dl-tuple-key t) true))))
+                      (dict-set! kept-keys (dl-tuple-key t) true)
+                      (when
+                        (>= (len t) 2)
+                        (let ((k (dl-arg-key (nth t 1))))
+                          (do
+                            (when
+                              (not (has-key? kept-index k))
+                              (dict-set! kept-index k (list)))
+                            (append! (get kept-index k) t)))))))
                 existing)
               (dict-set! (get db :facts) rel-key kept)
-              (dict-set! (get db :facts-keys) rel-key kept-keys))))
+              (dict-set! (get db :facts-keys) rel-key kept-keys)
+              (dict-set! (get db :facts-index) rel-key kept-index))))
         ;; Wipe all relations that have a rule (these are IDB) so the
         ;; saturator regenerates them from the surviving EDB.
         (let ((rule-heads (dl-rule-head-rels db)))
@@ -133,7 +143,8 @@
               (k)
               (do
                 (dict-set! (get db :facts) k (list))
-                (dict-set! (get db :facts-keys) k {})))
+                (dict-set! (get db :facts-keys) k {})
+                (dict-set! (get db :facts-index) k {})))
             rule-heads))
         (dl-saturate! db)
         db))))
diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index b5aea9b8..09f92315 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -12,7 +12,7 @@
 ;; lib/datalog/builtins.sx) swaps in the real `dl-rule-check-safety`,
 ;; which is order-aware and understands built-in predicates.
 
-(define dl-make-db (fn () {:facts {} :facts-keys {} :rules (list)}))
+(define dl-make-db (fn () {:facts {} :facts-keys {} :facts-index {} :rules (list)}))
 
 (define
   dl-rel-name
@@ -98,7 +98,8 @@
     (db rel-key)
     (let
       ((facts (get db :facts))
-        (fk (get db :facts-keys)))
+        (fk (get db :facts-keys))
+        (fi (get db :facts-index)))
       (do
         (when
           (not (has-key? facts rel-key))
@@ -106,8 +107,51 @@
         (when
           (not (has-key? fk rel-key))
           (dict-set! fk rel-key {}))
+        (when
+          (not (has-key? fi rel-key))
+          (dict-set! fi rel-key {}))
         (get facts rel-key)))))
 
+;; First-arg index helpers. Tuples are keyed by their first-after-rel
+;; arg's `(str ...)`; when that arg is a constant, dl-match-positive
+;; uses the index instead of scanning the full relation.
+(define
+  dl-arg-key
+  (fn
+    (v)
+    (str v)))
+
+(define
+  dl-index-add!
+  (fn
+    (db rel-key lit)
+    (let
+      ((idx (get db :facts-index))
+        (n (len lit)))
+      (when
+        (and (>= n 2) (has-key? idx rel-key))
+        (let
+          ((rel-idx (get idx rel-key))
+            (k (dl-arg-key (nth lit 1))))
+          (do
+            (when
+              (not (has-key? rel-idx k))
+              (dict-set! rel-idx k (list)))
+            (append! (get rel-idx k) lit)))))))
+
+(define
+  dl-index-lookup
+  (fn
+    (db rel-key arg-val)
+    (let
+      ((idx (get db :facts-index)))
+      (cond
+        ((not (has-key? idx rel-key)) (list))
+        (else
+          (let ((rel-idx (get idx rel-key))
+                (k (dl-arg-key arg-val)))
+            (if (has-key? rel-idx k) (get rel-idx k) (list))))))))
+
 (define dl-tuple-key (fn (lit) (str lit)))
 
 (define
@@ -140,6 +184,7 @@
                 (do
                   (dict-set! key-dict tk true)
                   (append! tuples lit)
+                  (dl-index-add! db rel-key lit)
                   true)))))))))
 
 ;; The full safety check lives in builtins.sx (it has to know which
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 476fd0d0..b8ccd83f 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -24,7 +24,17 @@
         ((nil? rel) (error (str "dl-match-positive: bad literal " lit)))
         (else
           (let
-            ((tuples (dl-rel-tuples db rel)))
+            ;; If the first argument walks to a non-variable (constant
+            ;; or already-bound var), use the first-arg index for
+            ;; this relation. Otherwise scan the full tuple list.
+            ((tuples
+               (cond
+                 ((>= (len lit) 2)
+                   (let ((walked (dl-walk (nth lit 1) subst)))
+                     (cond
+                       ((dl-var? walked) (dl-rel-tuples db rel))
+                       (else (dl-index-lookup db rel walked)))))
+                 (else (dl-rel-tuples db rel)))))
             (do
               (for-each
                 (fn
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 2545002b..3bc3e1e5 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -15,5 +15,5 @@
     {"name":"api","passed":11,"failed":0,"total":11},
     {"name":"demo","passed":15,"failed":0,"total":15}
   ],
-  "generated": "2026-05-08T09:20:09+00:00"
+  "generated": "2026-05-08T09:27:29+00:00"
 }
diff --git a/lib/datalog/tests/semi_naive.sx b/lib/datalog/tests/semi_naive.sx
index 914dcb2b..6df2a9e5 100644
--- a/lib/datalog/tests/semi_naive.sx
+++ b/lib/datalog/tests/semi_naive.sx
@@ -120,18 +120,20 @@
         (dl-sn-counts-agree?
           (dl-sn-counts "p(a). p(b). q(X) :- p(X), =(X, a)."))
         true)
-      ;; Chain length 10 — exercises multiple semi-naive iterations
-      ;; against the recursive ancestor rule.
+      ;; Chain length 12 — multiple semi-naive iterations against
+      ;; the recursive ancestor rule (differential vs naive).
       (dl-sn-test!
-        "chain-10 ancestor counts match"
-        (dl-sn-counts-agree? (dl-sn-counts (dl-sn-chain-source 10)))
+        "chain-12 ancestor counts match"
+        (dl-sn-counts-agree? (dl-sn-counts (dl-sn-chain-source 12)))
         true)
+      ;; Chain length 25 — semi-naive only — first-arg index makes
+      ;; this tractable in conformance budget.
       (dl-sn-test!
-        "chain-15 ancestor count value (semi only)"
+        "chain-25 ancestor count value (semi only)"
         (let
-          ((db (dl-program (dl-sn-chain-source 15))))
+          ((db (dl-program (dl-sn-chain-source 25))))
           (do (dl-saturate! db) (len (dl-relation db "ancestor"))))
-        120)
+        325)
       (dl-sn-test!
         "query through semi saturate"
         (let
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index f0233eec..c92f6e78 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -264,19 +264,33 @@ large graphs.
 
 ## Blockers
 
-- **Saturation perf** improving but not free. Resolved hash-set
-  membership in `dl-add-fact!` and replaced recursive `(rest lits)` in
-  `dl-find-bindings` with indexed iteration. chain-15 drops from ~25s
-  to ~16s and chain-25 saturates in ~33s real / 11s user — most CPU
-  now in unification (assoc-based subst dict copies) and dict
-  lookups during walks. Future: a per-rule "compiled" body that
-  pre-resolves arg positions and intern variable indices, then
-  unification can use array slots instead of dict assoc.
+- **Saturation perf**: three rounds done.
+  - hash-set membership in `dl-add-fact!` (Phase 5b)
+  - indexed iteration in `dl-find-bindings` (Phase 5c)
+  - first-arg index per relation (Phase 5e) — when a body literal's
+    first arg walks to a non-variable, dl-match-positive looks up
+    by `(str arg)` instead of scanning the full relation.
+  chain-25 saturation drops from ~33s to ~18s real (10s user).
+  chain-50 still long (~120s+) due to dict-copy overhead in
+  unification subst threading. Future: per-rule "compiled" body
+  with pre-resolved var positions, slot-based subst representation
+  to avoid `assoc` per binding.
 
 ## Progress log
 
 _Newest first._
 
+- 2026-05-08 — Phase 5e perf: first-arg index per relation. db gains
+  `:facts-index {<rel>: {<first-arg-key>: tuples}}` mirroring the
+  existing `:facts-keys` membership index. `dl-add-fact!` populates
+  it; `dl-match-positive` walks the body literal's first arg under
+  the current subst — if it's bound to a non-var, look up by
+  `(str arg)` and iterate only the matching subset. chain-25
+  saturation 33s → 18s real (~2x). chain-50 still slow (~120s+)
+  but tractable; next bottleneck is subst dict copies during
+  unification. Differential test bumped to chain-12, semi-only
+  count to chain-25.
+
 - 2026-05-08 — Demo: tag co-occurrence. `(cotagged P T1 T2)` — post
   has both T1 and T2 with T1 != T2 — and `(tag-pair-count T1 T2 N)`
   counting posts per distinct tag pair. Demonstrates count

From 380580af17604bf67d643cf96dd90b587e65609f Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:30:50 +0000
Subject: [PATCH 23/89] datalog: dl-summary inspection helper (173/173)

Returns {<rel-name>: tuple-count} for relations with any tuples
or that are rule-headed (so empty IDB shows as :rel 0 rather than
disappearing). Skips placeholder entries from internal
dl-ensure-rel! calls. 4 tests cover basic, empty IDB, mixed
EDB+IDB, and empty-db cases.
---
 lib/datalog/db.sx           | 37 +++++++++++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 31 ++++++++++++++++++++++++++++++-
 4 files changed, 73 insertions(+), 7 deletions(-)

diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index 09f92315..43b4d840 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -327,3 +327,40 @@
           (fn (k) (set! total (+ total (len (get facts k)))))
           (keys facts))
         total))))
+
+;; Returns {<rel-name>: tuple-count} for debugging. Includes
+;; relations with any tuples plus all rule-head relations (so empty
+;; IDB shows as 0). Skips empty EDB-only entries that are placeholders
+;; from internal `dl-ensure-rel!` calls.
+(define
+  dl-summary
+  (fn
+    (db)
+    (let
+      ((facts (get db :facts))
+        (out {})
+        (rule-heads (list)))
+      (do
+        (for-each
+          (fn
+            (rule)
+            (let ((h (dl-rel-name (get rule :head))))
+              (when
+                (and (not (nil? h)) (not (dl-member-string? h rule-heads)))
+                (append! rule-heads h))))
+          (dl-rules db))
+        (for-each
+          (fn
+            (k)
+            (let ((c (len (get facts k))))
+              (when
+                (or (> c 0) (dl-member-string? k rule-heads))
+                (dict-set! out k c))))
+          (keys facts))
+        ;; Add rule heads that have no facts (yet).
+        (for-each
+          (fn
+            (k)
+            (when (not (has-key? out k)) (dict-set! out k 0)))
+          rule-heads)
+        out))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 3bc3e1e5..4f2c96eb 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 169,
+  "total_passed": 173,
   "total_failed": 0,
-  "total": 169,
+  "total": 173,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":18,"failed":0,"total":18},
+    {"name":"eval","passed":22,"failed":0,"total":22},
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -15,5 +15,5 @@
     {"name":"api","passed":11,"failed":0,"total":11},
     {"name":"demo","passed":15,"failed":0,"total":15}
   ],
-  "generated": "2026-05-08T09:27:29+00:00"
+  "generated": "2026-05-08T09:30:37+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 70c2fe0f..4242dc6f 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**169 / 169 passing** (0 failure(s)).
+**173 / 173 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
-| eval | 18 | 18 | ok |
+| eval | 22 | 22 | ok |
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index d6b6f8e6..a47140f7 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -215,7 +215,36 @@
         (dl-query
           (dl-program "p(1, 2, 3). p(4, 5, 6).")
           (list (quote p) (quote _) (quote X) (quote _)))
-        (list {:X 2} {:X 5})))))
+        (list {:X 2} {:X 5}))
+
+      ;; dl-summary: relation -> tuple-count for inspection.
+      (dl-et-test! "dl-summary basic"
+        (dl-summary
+          (let
+            ((db (dl-program "p(1). p(2). q(3).")))
+            (do (dl-saturate! db) db)))
+        {:p 2 :q 1})
+
+      (dl-et-test! "dl-summary empty IDB shown"
+        (dl-summary
+          (let
+            ((db (dl-program "r(X) :- s(X).")))
+            (do (dl-saturate! db) db)))
+        {:r 0})
+
+      (dl-et-test! "dl-summary mixed EDB and IDB"
+        (dl-summary
+          (let
+            ((db (dl-program
+                   "parent(a, b).
+                    ancestor(X, Y) :- parent(X, Y).
+                    ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+            (do (dl-saturate! db) db)))
+        {:parent 1 :ancestor 1})
+
+      (dl-et-test! "dl-summary empty db"
+        (dl-summary (dl-make-db))
+        {}))))
 
 (define
   dl-eval-tests-run!

From cf634ad2b159af1f585c63907b6a50b26846b3d5 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:35:38 +0000
Subject: [PATCH 24/89] datalog: shortest-path demo on weighted DAG (176/176)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

dl-demo-shortest-path-rules: path enumerates X→Z with cost
W = sum of edge weights via is/+; shortest filters to the
minimum cost path per (X, Y) pair via min aggregation.

3 demo tests cover direct/multi-hop choice, multi-hop wins on
cheaper route, and unreachable-empty.

Note: cycles produce infinite distance values without a depth
filter; the rule docstring flags this and suggests adding
(<, D, MAX) for graphs that may cycle.
---
 lib/datalog/demo.sx         | 24 ++++++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/demo.sx   | 25 +++++++++++++++++++++++++
 plans/datalog-on-sx.md      |  7 +++++++
 5 files changed, 62 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/demo.sx b/lib/datalog/demo.sx
index d4a9a29a..036feae9 100644
--- a/lib/datalog/demo.sx
+++ b/lib/datalog/demo.sx
@@ -104,6 +104,30 @@
        (tag-pair T1 T2)
        (count N P (cotagged P T1 T2))))))
 
+;; ── Demo 6: weighted-DAG shortest path ─────────────────────────
+;; "What's the cheapest way from X to Y?" Edge weights with `is`
+;; arithmetic to sum costs, then `min` aggregation to pick the
+;; shortest. Termination requires the graph to be a DAG (cycles
+;; would produce infinite distances without a bound; programs
+;; built on this should add a depth filter `(<, D, MAX)` if cycles
+;; are possible).
+;;
+;; EDB:
+;;   (edge FROM TO COST)
+;; IDB:
+;;   (path FROM TO COST)            — any path
+;;   (shortest FROM TO COST)        — minimum cost path
+(define
+  dl-demo-shortest-path-rules
+  (quote
+    ((path X Y W <- (edge X Y W))
+     (path X Z W
+       <-
+       (edge X Y W1)
+       (path Y Z W2)
+       (is W (+ W1 W2)))
+     (shortest X Y W <- (path X Y _) (min W C (path X Y C))))))
+
 ;; ── Loader stub ──────────────────────────────────────────────────
 ;; Wiring to PostgreSQL would replace these helpers with calls into
 ;; rose-ash's internal HTTP RPC (fetch_data → /internal/data/...).
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 4f2c96eb..fe66e40d 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 173,
+  "total_passed": 176,
   "total_failed": 0,
-  "total": 173,
+  "total": 176,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,7 +13,7 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":16,"failed":0,"total":16},
     {"name":"api","passed":11,"failed":0,"total":11},
-    {"name":"demo","passed":15,"failed":0,"total":15}
+    {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:30:37+00:00"
+  "generated": "2026-05-08T09:35:25+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 4242dc6f..89e1a1db 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**173 / 173 passing** (0 failure(s)).
+**176 / 176 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,4 +13,4 @@
 | negation | 10 | 10 | ok |
 | aggregates | 16 | 16 | ok |
 | api | 11 | 11 | ok |
-| demo | 15 | 15 | ok |
+| demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/demo.sx b/lib/datalog/tests/demo.sx
index c594a63d..1559f800 100644
--- a/lib/datalog/tests/demo.sx
+++ b/lib/datalog/tests/demo.sx
@@ -237,6 +237,31 @@
           (quote (tag-pair-count cooking vegetarian N)))
         (list {:N 2}))
 
+      ;; ── Shortest path on a weighted DAG ──────────────────
+      (dl-demo-test-set! "shortest a→d via DAG"
+        (dl-query
+          (dl-demo-make
+            (quote ((edge a b 5) (edge b c 3) (edge a c 10) (edge c d 2)))
+            dl-demo-shortest-path-rules)
+          (quote (shortest a d W)))
+        (list {:W 10}))
+
+      (dl-demo-test-set! "shortest a→c picks 2-hop"
+        (dl-query
+          (dl-demo-make
+            (quote ((edge a b 5) (edge b c 3) (edge a c 10)))
+            dl-demo-shortest-path-rules)
+          (quote (shortest a c W)))
+        (list {:W 8}))
+
+      (dl-demo-test-set! "shortest unreachable empty"
+        (dl-query
+          (dl-demo-make
+            (quote ((edge a b 5) (edge b c 3)))
+            dl-demo-shortest-path-rules)
+          (quote (shortest a d W)))
+        (list))
+
       (dl-demo-test-set! "no access without grant"
         (dl-query
           (dl-demo-make
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index c92f6e78..42978371 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -280,6 +280,13 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Demo: weighted-DAG shortest path. `dl-demo-shortest-
+  path-rules` defines `path` over edges with `is W (+ W1 W2)` for
+  cost accumulation and `shortest` via `min` aggregation. 3 demo
+  tests cover direct/multi-hop choice, multi-hop wins on cheaper
+  route, and unreachable-empty. Added `dl-summary db` inspection
+  helper returning `{<rel>: count}` (4 eval tests).
+
 - 2026-05-08 — Phase 5e perf: first-arg index per relation. db gains
   `:facts-index {<rel>: {<first-arg-key>: tuples}}` mirroring the
   existing `:facts-keys` membership index. `dl-add-fact!` populates

From 18fb54a8c559a4d0bdbd519376ce2079acf947dc Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:37:12 +0000
Subject: [PATCH 25/89] datalog: refresh module headers (findall, 6 demos)

---
 lib/datalog/aggregates.sx | 13 +++++++------
 lib/datalog/demo.sx       | 10 +++++++---
 2 files changed, 14 insertions(+), 9 deletions(-)

diff --git a/lib/datalog/aggregates.sx b/lib/datalog/aggregates.sx
index 27117fd6..af0ef0f1 100644
--- a/lib/datalog/aggregates.sx
+++ b/lib/datalog/aggregates.sx
@@ -1,11 +1,12 @@
-;; lib/datalog/aggregates.sx — count / sum / min / max aggregation.
+;; lib/datalog/aggregates.sx — count / sum / min / max / findall.
 ;;
-;; Surface form (always 3-arg in the parsed AST):
+;; Surface form (always 3-arg after the relation name):
 ;;
-;;   (count  Result  Var  GoalLit)
-;;   (sum    Result  Var  GoalLit)
-;;   (min    Result  Var  GoalLit)
-;;   (max    Result  Var  GoalLit)
+;;   (count   Result  Var  GoalLit)
+;;   (sum     Result  Var  GoalLit)
+;;   (min     Result  Var  GoalLit)
+;;   (max     Result  Var  GoalLit)
+;;   (findall List    Var  GoalLit)
 ;;
 ;; Parsed naturally because arg-position compounds are already allowed
 ;; (Phase 4 needs them for arithmetic). At evaluation time the aggregator
diff --git a/lib/datalog/demo.sx b/lib/datalog/demo.sx
index 036feae9..f15dd645 100644
--- a/lib/datalog/demo.sx
+++ b/lib/datalog/demo.sx
@@ -6,11 +6,15 @@
 ;; below show the shape of queries we want, and the test suite runs
 ;; them against synthetic in-memory tuples loaded via dl-program-data.
 ;;
-;; Three thematic demos:
+;; Six thematic demos:
 ;;
-;;   1. Federation — follow graph, transitive reach, mutuals.
-;;   2. Content   — posts, tags, likes, popularity, "for you" feed.
+;;   1. Federation — follow graph, transitive reach, mutuals, FOAF.
+;;   2. Content    — posts, tags, likes, popularity, "for you" feed.
 ;;   3. Permissions — group membership and resource access.
+;;   4. Cooking-posts — canonical "posts about cooking by people I
+;;                      follow (transitively)" multi-domain query.
+;;   5. Tag co-occurrence — distinct (T1, T2) pairs with counts.
+;;   6. Shortest path  — weighted-DAG path enumeration + min agg.
 
 ;; ── Demo 1: federation follow graph ─────────────────────────────
 ;; EDB: (follows ACTOR-A ACTOR-B) — A follows B.

From 148c3f2068a9a78e53f79568eb05d52adf2a1088 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:38:59 +0000
Subject: [PATCH 26/89] datalog: dl-set-strategy! hook (Phase 6 stub, 179/179)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Adds a user-facing strategy hook: dl-set-strategy! db strategy and
dl-get-strategy db. Default :semi-naive; :magic is accepted but
the actual transformation is deferred — the saturator currently
falls back to semi-naive regardless. Lets us tick the Phase 6
"Optional pass — guarded behind dl-set-strategy!" checkbox while
keeping the equivalence/perf tests pending future work.

3 new eval tests.
---
 lib/datalog/db.sx           | 22 +++++++++++++++++++++-
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 25 ++++++++++++++++++++++++-
 plans/datalog-on-sx.md      | 15 +++++++++++++--
 5 files changed, 64 insertions(+), 10 deletions(-)

diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index 43b4d840..7930fdda 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -12,7 +12,27 @@
 ;; lib/datalog/builtins.sx) swaps in the real `dl-rule-check-safety`,
 ;; which is order-aware and understands built-in predicates.
 
-(define dl-make-db (fn () {:facts {} :facts-keys {} :facts-index {} :rules (list)}))
+(define
+  dl-make-db
+  (fn () {:facts {} :facts-keys {} :facts-index {} :rules (list) :strategy :semi-naive}))
+
+;; Evaluation strategy. Default :semi-naive (the only strategy
+;; currently implemented). :magic is reserved for goal-directed
+;; magic-sets evaluation — calling it now logs a one-time "deferred"
+;; note and falls back to semi-naive.
+(define
+  dl-set-strategy!
+  (fn
+    (db strategy)
+    (do
+      (dict-set! db :strategy strategy)
+      db)))
+
+(define
+  dl-get-strategy
+  (fn
+    (db)
+    (if (has-key? db :strategy) (get db :strategy) :semi-naive)))
 
 (define
   dl-rel-name
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index fe66e40d..364e5284 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 176,
+  "total_passed": 179,
   "total_failed": 0,
-  "total": 176,
+  "total": 179,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":22,"failed":0,"total":22},
+    {"name":"eval","passed":25,"failed":0,"total":25},
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -15,5 +15,5 @@
     {"name":"api","passed":11,"failed":0,"total":11},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:35:25+00:00"
+  "generated": "2026-05-08T09:38:47+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 89e1a1db..abb01eea 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**176 / 176 passing** (0 failure(s)).
+**179 / 179 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
-| eval | 22 | 22 | ok |
+| eval | 25 | 25 | ok |
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index a47140f7..8030f3f1 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -244,7 +244,30 @@
 
       (dl-et-test! "dl-summary empty db"
         (dl-summary (dl-make-db))
-        {}))))
+        {})
+
+      ;; Strategy hook: default semi-naive; :magic accepted but
+      ;; falls back to semi-naive (the transformation itself is
+      ;; deferred — Phase 6 in plan).
+      (dl-et-test! "default strategy"
+        (dl-get-strategy (dl-make-db))
+        :semi-naive)
+
+      (dl-et-test! "set strategy"
+        (let ((db (dl-make-db)))
+          (do (dl-set-strategy! db :magic) (dl-get-strategy db)))
+        :magic)
+
+      (dl-et-test-set! "magic-set still derives correctly"
+        (let
+          ((db (dl-program
+                 "parent(a, b). parent(b, c).
+                  ancestor(X, Y) :- parent(X, Y).
+                  ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (do
+            (dl-set-strategy! db :magic)
+            (dl-query db (list (quote ancestor) (quote a) (quote X)))))
+        (list {:X (quote b)} {:X (quote c)})))))
 
 (define
   dl-eval-tests-run!
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 42978371..201faa8e 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -157,9 +157,13 @@ large graphs.
       `magic_<pred>` relation and rewrite rule bodies to filter through it.
 - [ ] Sideways information passing strategy (SIPS): left-to-right by
       default; pluggable.
-- [ ] Optional pass — `(dl-set-strategy! db :magic)`; default semi-naive.
+- [x] `dl-set-strategy! db strategy` hook + `dl-get-strategy db`. Default
+      `:semi-naive`. `:magic` accepted but the transformation itself is
+      deferred — saturator currently falls back to semi-naive. Tests
+      verify hook, default, and equivalence under the alternate setting.
 - [ ] Tests: equivalence vs naive on small inputs; perf win on a 10k-node
-      reachability query from a single root.
+      reachability query from a single root. *Pending real magic-set
+      transformation.*
 
 ### Phase 7 — stratified negation
 - [x] Dependency graph: `dl-build-dep-graph db` returns `{head -> ({:rel
@@ -280,6 +284,13 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 6 stub: `dl-set-strategy! db strategy` and
+  `dl-get-strategy db` user-facing hooks. Default `:semi-naive`;
+  `:magic` is accepted but the actual transformation is deferred,
+  so saturation still uses semi-naive. Lets us tick the
+  "Optional pass — guarded behind dl-set-strategy!" Phase 6 box.
+  3 new eval tests.
+
 - 2026-05-08 — Demo: weighted-DAG shortest path. `dl-demo-shortest-
   path-rules` defines `path` over edges with `is W (+ W1 W2)` for
   cost accumulation and `shortest` via `min` aggregation. 3 demo

From f33a8d69f56207c4574c5834e5baecb994562231 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:41:02 +0000
Subject: [PATCH 27/89] datalog: dl-eval source + query convenience (181/181)

Single-call entry: dl-eval source-string query-string parses
both, builds a db via dl-program, saturates implicitly, runs
the query (extracted from the parsed `?- ...` clause), and
returns the substitution list.

Most user-friendly path:
  (dl-eval "parent(a, b). ..." "?- ancestor(a, X).")

2 new api tests cover ancestor and multi-goal usage.
---
 lib/datalog/api.sx          | 20 ++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/api.sx    | 15 +++++++++++++++
 plans/datalog-on-sx.md      |  5 +++++
 5 files changed, 46 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/api.sx b/lib/datalog/api.sx
index a76d3624..872b2017 100644
--- a/lib/datalog/api.sx
+++ b/lib/datalog/api.sx
@@ -149,6 +149,26 @@
         (dl-saturate! db)
         db))))
 
+;; ── Convenience: single-call source + query ───────────────────
+;; (dl-eval source query-source) parses both, builds a db, saturates,
+;; runs the query, returns the substitution list. The query source
+;; should be `?- goal[, goal ...].` — the parser produces a clause
+;; with :query containing a list of literals which is fed straight
+;; to dl-query.
+(define
+  dl-eval
+  (fn
+    (source query-source)
+    (let
+      ((db (dl-program source))
+        (queries (dl-parse query-source)))
+      (cond
+        ((= (len queries) 0) (error "dl-eval: query string is empty"))
+        ((not (has-key? (first queries) :query))
+          (error "dl-eval: second arg must be a `?- ...` query clause"))
+        (else
+          (dl-query db (get (first queries) :query)))))))
+
 (define
   dl-rule-head-rels
   (fn
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 364e5284..39c21738 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 179,
+  "total_passed": 181,
   "total_failed": 0,
-  "total": 179,
+  "total": 181,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -12,8 +12,8 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":16,"failed":0,"total":16},
-    {"name":"api","passed":11,"failed":0,"total":11},
+    {"name":"api","passed":13,"failed":0,"total":13},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:38:47+00:00"
+  "generated": "2026-05-08T09:40:51+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index abb01eea..42982ee6 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**179 / 179 passing** (0 failure(s)).
+**181 / 181 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,5 +12,5 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 16 | 16 | ok |
-| api | 11 | 11 | ok |
+| api | 13 | 13 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
index 577bafe9..6df9ce37 100644
--- a/lib/datalog/tests/api.sx
+++ b/lib/datalog/tests/api.sx
@@ -198,6 +198,21 @@
           (list (quote (n X)) (list (string->symbol ">") (quote X) 2)))
         (list {:X 3} {:X 4} {:X 5}))
 
+      ;; dl-eval: single-call source + query.
+      (dl-api-test-set! "dl-eval ancestor"
+        (dl-eval
+          "parent(a, b). parent(b, c).
+           ancestor(X, Y) :- parent(X, Y).
+           ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z)."
+          "?- ancestor(a, X).")
+        (list {:X (quote b)} {:X (quote c)}))
+
+      (dl-api-test-set! "dl-eval multi-goal"
+        (dl-eval
+          "p(1). p(2). p(3). q(2). q(3)."
+          "?- p(X), q(X).")
+        (list {:X 2} {:X 3}))
+
       ;; dl-rule-from-list with no arrow → fact-style.
       (dl-api-test-set! "no arrow → fact-like rule"
         (let
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 201faa8e..04e2948c 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -284,6 +284,11 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Convenience: `dl-eval source query-source`. Parses
+  both strings, builds a db, saturates, runs the query, returns
+  the substitution list. Single-call user-friendly entry. 2 new
+  api tests cover ancestor and multi-goal queries.
+
 - 2026-05-08 — Phase 6 stub: `dl-set-strategy! db strategy` and
   `dl-get-strategy db` user-facing hooks. Default `:semi-naive`;
   `:magic` is accepted but the actual transformation is deferred,

From d66ddc614b82eeb2847f9413cc48309a9ceea383 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:45:15 +0000
Subject: [PATCH 28/89] datalog: aggregates work as top-level query goals
 (183/183)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bug: dl-match-lit (the naive matcher used by dl-find-bindings)
was missing dl-aggregate? dispatch — it was only present in
dl-fbs-aux (semi-naive). Symptom:
  (dl-query db '(count N X (p X)))
silently returned ().

Two fixes:
- Add aggregate branch to dl-match-lit before the positive case.
- dl-query-user-vars now projects only the result var (first arg)
  of an aggregate goal — the aggregated var and inner-goal vars
  are existentials and should not leak into substitutions.

2 new aggregate tests cover count and findall as direct query goals.
---
 lib/datalog/eval.sx             | 38 +++++++++++++++++++++++++--------
 lib/datalog/scoreboard.json     |  8 +++----
 lib/datalog/scoreboard.md       |  4 ++--
 lib/datalog/tests/aggregates.sx | 15 +++++++++++++
 plans/datalog-on-sx.md          | 10 +++++++++
 5 files changed, 60 insertions(+), 15 deletions(-)

diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index b8ccd83f..32db2f7f 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -83,6 +83,7 @@
     (cond
       ((and (dict? lit) (has-key? lit :neg))
         (dl-match-negation (get lit :neg) db subst))
+      ((dl-aggregate? lit) (dl-eval-aggregate lit db subst))
       ((dl-builtin? lit)
         (let
           ((s (dl-eval-builtin lit subst)))
@@ -426,16 +427,35 @@
         (for-each
           (fn
             (g)
-            (let
-              ((tgt
-                 (if (and (dict? g) (has-key? g :neg)) (get g :neg) g)))
-              (for-each
-                (fn
-                  (v)
+            (cond
+              ((and (dict? g) (has-key? g :neg))
+                (for-each
+                  (fn
+                    (v)
+                    (when
+                      (and (not (= v "_")) (not (dl-member-string? v seen)))
+                      (append! seen v)))
+                  (dl-vars-of (get g :neg))))
+              ((dl-aggregate? g)
+                ;; Only the result var (first arg of the aggregate
+                ;; literal) is user-facing. The aggregated var and
+                ;; any vars in the inner goal are internal.
+                (let ((r (nth g 1)))
                   (when
-                    (and (not (= v "_")) (not (dl-member-string? v seen)))
-                    (append! seen v)))
-                (dl-vars-of tgt))))
+                    (dl-var? r)
+                    (let ((rn (symbol->string r)))
+                      (when
+                        (and (not (= rn "_"))
+                             (not (dl-member-string? rn seen)))
+                        (append! seen rn))))))
+              (else
+                (for-each
+                  (fn
+                    (v)
+                    (when
+                      (and (not (= v "_")) (not (dl-member-string? v seen)))
+                      (append! seen v)))
+                  (dl-vars-of g)))))
           goals)
         seen))))
 
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 39c21738..b9a3fe27 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 181,
+  "total_passed": 183,
   "total_failed": 0,
-  "total": 181,
+  "total": 183,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -11,9 +11,9 @@
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
-    {"name":"aggregates","passed":16,"failed":0,"total":16},
+    {"name":"aggregates","passed":18,"failed":0,"total":18},
     {"name":"api","passed":13,"failed":0,"total":13},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:40:51+00:00"
+  "generated": "2026-05-08T09:45:03+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 42982ee6..6794e91a 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**181 / 181 passing** (0 failure(s)).
+**183 / 183 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -11,6 +11,6 @@
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
-| aggregates | 16 | 16 | ok |
+| aggregates | 18 | 18 | ok |
 | api | 13 | 13 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/aggregates.sx b/lib/datalog/tests/aggregates.sx
index dbe2f643..6392ce29 100644
--- a/lib/datalog/tests/aggregates.sx
+++ b/lib/datalog/tests/aggregates.sx
@@ -260,6 +260,21 @@
           (list (quote low) (quote M)))
         (list))
 
+      ;; Aggregates as the top-level query goal (regression for
+      ;; dl-match-lit aggregate dispatch and projection cleanup).
+      (dl-at-test-set! "count as query goal"
+        (dl-query
+          (dl-program "p(1). p(2). p(3). p(4).")
+          (list (quote count) (quote N) (quote X) (list (quote p) (quote X))))
+        (list {:N 4}))
+
+      (dl-at-test-set! "findall as query goal"
+        (dl-query
+          (dl-program "p(1). p(2). p(3).")
+          (list (quote findall) (quote L) (quote X)
+                (list (quote p) (quote X))))
+        (list {:L (list 1 2 3)}))
+
       (dl-at-test-set! "distinct counted once"
         (dl-query
           (dl-program
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 04e2948c..bfd1f256 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -284,6 +284,16 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Bug fix: aggregates work as top-level query goals.
+  `dl-match-lit` (the naive matcher used by `dl-find-bindings`) was
+  missing the `dl-aggregate?` dispatch — it was only present in
+  `dl-fbs-aux` (semi-naive). Symptom: `(dl-query db '(count N X (p X)))`
+  silently returned `()`. Also updated `dl-query-user-vars` to project
+  only the result var (first arg) of an aggregate goal — the
+  aggregated var and inner-goal vars are existentials and should not
+  appear in the projected substitution. 2 new aggregate tests cover
+  the regression.
+
 - 2026-05-08 — Convenience: `dl-eval source query-source`. Parses
   both strings, builds a db, saturates, runs the query, returns
   the substitution list. Single-call user-friendly entry. 2 new

From e2c149e60aab0561cefd68fa67b24ace2f5398f4 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:47:56 +0000
Subject: [PATCH 29/89] datalog: comprehensive integration test (184/184)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Single program exercising recursion + stratified negation +
aggregation + comparison composed end-to-end via dl-eval. Confirms
the full pipeline (parser → safety → stratifier → semi-naive +
aggregate post-pass → query) on a non-trivial program.

  edge graph + banned set →
    reach transitive closure →
    safe (reach minus banned) →
    reach_count via count aggregation grouped by source →
    popular = reach_count >= 2
---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/api.sx    | 17 +++++++++++++++++
 plans/datalog-on-sx.md      |  8 ++++++++
 4 files changed, 31 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index b9a3fe27..fcf66576 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 183,
+  "total_passed": 184,
   "total_failed": 0,
-  "total": 183,
+  "total": 184,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -12,8 +12,8 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
-    {"name":"api","passed":13,"failed":0,"total":13},
+    {"name":"api","passed":14,"failed":0,"total":14},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:45:03+00:00"
+  "generated": "2026-05-08T09:47:44+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 6794e91a..c7ba8661 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**183 / 183 passing** (0 failure(s)).
+**184 / 184 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,5 +12,5 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
-| api | 13 | 13 | ok |
+| api | 14 | 14 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
index 6df9ce37..0431ed1f 100644
--- a/lib/datalog/tests/api.sx
+++ b/lib/datalog/tests/api.sx
@@ -213,6 +213,23 @@
           "?- p(X), q(X).")
         (list {:X 2} {:X 3}))
 
+      ;; Comprehensive integration: recursion + stratified negation
+      ;; + aggregation + comparison composed in a single program.
+      ;; (Uses _Anything as a regular var instead of `_` so the
+      ;;  outer rule binds via the reach lit.)
+      (dl-api-test-set! "integration"
+        (dl-eval
+          (str
+            "edge(a, b). edge(b, c). edge(c, d). edge(a, d). "
+            "banned(c). "
+            "reach(X, Y) :- edge(X, Y). "
+            "reach(X, Z) :- edge(X, Y), reach(Y, Z). "
+            "safe(X, Y) :- reach(X, Y), not(banned(Y)). "
+            "reach_count(X, N) :- reach(X, Z), count(N, Y, safe(X, Y)). "
+            "popular(X) :- reach_count(X, N), >=(N, 2).")
+          "?- popular(X).")
+        (list {:X (quote a)}))
+
       ;; dl-rule-from-list with no arrow → fact-style.
       (dl-api-test-set! "no arrow → fact-like rule"
         (let
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index bfd1f256..74aff180 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -284,6 +284,14 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Comprehensive integration test in api suite: a
+  single program exercising recursion (`reach` transitive closure)
+  + stratified negation (`safe X Y :- reach X Y, not banned Y`) +
+  aggregation (`reach_count` via count) + comparison (`>= N 2`)
+  composed end-to-end via `dl-eval source query-source`. Confirms
+  the full pipeline (parser → safety → stratifier → semi-naive +
+  aggregate post-pass → query) on a non-trivial program.
+
 - 2026-05-08 — Bug fix: aggregates work as top-level query goals.
   `dl-match-lit` (the naive matcher used by `dl-find-bindings`) was
   missing the `dl-aggregate?` dispatch — it was only present in

From 71b73bd87e236e05f115f98ca6df144fee92388b Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:51:05 +0000
Subject: [PATCH 30/89] datalog: Phase 6 adornments + SIPS analysis (194/194)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

New lib/datalog/magic.sx — first piece of magic-sets:

  dl-adorn-arg arg bound          → "b" or "f"
  dl-adorn-args args bound        → adornment string
  dl-adorn-goal goal              → adornment under empty bound set
  dl-adorn-lit lit bound          → adornment of any literal
  dl-vars-bound-by-lit lit bound  → free vars this lit will bind
  dl-init-head-bound head adn     → bound set seeded from head adornment
  dl-rule-sips rule head-adn      → ({:lit :adornment} ...) per body lit

SIPS walks left-to-right tracking the bound set; recognises `is` and
aggregate result-vars as new binders, lets comparisons and negation
pass through with computed adornments.

Inspection-only — saturator doesn't yet consume these. Lays
groundwork for a future magic-sets transformation.

10 new tests cover pure adornment, SIPS over a chain rule,
head-fully-bound rules, comparisons, and `is`. Total 194/194.
---
 lib/datalog/conformance.conf |   2 +
 lib/datalog/magic.sx         | 160 +++++++++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json  |   7 +-
 lib/datalog/scoreboard.md    |   3 +-
 lib/datalog/tests/magic.sx   | 141 ++++++++++++++++++++++++++++++
 plans/datalog-on-sx.md       |  23 ++++-
 6 files changed, 328 insertions(+), 8 deletions(-)
 create mode 100644 lib/datalog/magic.sx
 create mode 100644 lib/datalog/tests/magic.sx

diff --git a/lib/datalog/conformance.conf b/lib/datalog/conformance.conf
index f56276af..a6a0c747 100644
--- a/lib/datalog/conformance.conf
+++ b/lib/datalog/conformance.conf
@@ -13,6 +13,7 @@ PRELOADS=(
   lib/datalog/strata.sx
   lib/datalog/eval.sx
   lib/datalog/api.sx
+  lib/datalog/magic.sx
   lib/datalog/demo.sx
 )
 
@@ -26,5 +27,6 @@ SUITES=(
   "negation:lib/datalog/tests/negation.sx:(dl-negation-tests-run!)"
   "aggregates:lib/datalog/tests/aggregates.sx:(dl-aggregates-tests-run!)"
   "api:lib/datalog/tests/api.sx:(dl-api-tests-run!)"
+  "magic:lib/datalog/tests/magic.sx:(dl-magic-tests-run!)"
   "demo:lib/datalog/tests/demo.sx:(dl-demo-tests-run!)"
 )
diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
new file mode 100644
index 00000000..33d5ba9b
--- /dev/null
+++ b/lib/datalog/magic.sx
@@ -0,0 +1,160 @@
+;; lib/datalog/magic.sx — adornment analysis + sideways info passing.
+;;
+;; First step of the magic-sets transformation (Phase 6). Right now
+;; the saturator does not consume these — they are introspection
+;; helpers that future magic-set rewriting will build on top of.
+;;
+;; Definitions:
+;;   - An *adornment* of an n-ary literal is an n-character string
+;;     of "b" (bound — value already known at the call site) and
+;;     "f" (free — to be derived).
+;;   - SIPS (Sideways Information Passing Strategy) walks the body
+;;     of an adorned rule left-to-right tracking which variables
+;;     have been bound so far, computing each body literal's
+;;     adornment in turn.
+;;
+;; Usage:
+;;
+;;   (dl-adorn-goal '(ancestor tom X))
+;;     => "bf"
+;;
+;;   (dl-rule-sips
+;;     {:head (ancestor X Z)
+;;      :body ((parent X Y) (ancestor Y Z))}
+;;     "bf")
+;;   => ({:lit (parent X Y) :adornment "bf"}
+;;       {:lit (ancestor Y Z) :adornment "bf"})
+
+;; Per-arg adornment under the current bound-var name set.
+(define
+  dl-adorn-arg
+  (fn
+    (arg bound)
+    (cond
+      ((dl-var? arg)
+        (if (dl-member-string? (symbol->string arg) bound) "b" "f"))
+      (else "b"))))
+
+;; Adornment for the args of a literal (after the relation name).
+(define
+  dl-adorn-args
+  (fn
+    (args bound)
+    (cond
+      ((= (len args) 0) "")
+      (else
+        (str
+          (dl-adorn-arg (first args) bound)
+          (dl-adorn-args (rest args) bound))))))
+
+;; Adornment of a top-level goal under the empty bound-var set.
+(define
+  dl-adorn-goal
+  (fn (goal) (dl-adorn-args (rest goal) (list))))
+
+;; Adornment of a literal under an explicit bound set.
+(define
+  dl-adorn-lit
+  (fn (lit bound) (dl-adorn-args (rest lit) bound)))
+
+;; The set of variable names made bound by walking a positive
+;; literal whose adornment is known. Free positions add their
+;; vars to the bound set.
+(define
+  dl-vars-bound-by-lit
+  (fn
+    (lit bound)
+    (let ((args (rest lit)) (out (list)))
+      (do
+        (for-each
+          (fn (a)
+            (when
+              (and (dl-var? a)
+                   (not (dl-member-string? (symbol->string a) bound))
+                   (not (dl-member-string? (symbol->string a) out)))
+              (append! out (symbol->string a))))
+          args)
+        out))))
+
+;; Walk the rule body left-to-right tracking bound vars seeded by the
+;; head adornment. Returns a list of {:lit :adornment} entries.
+;;
+;; Negation, comparison, and built-ins are passed through with their
+;; adornment computed from the current bound set; they don't add new
+;; bindings (except `is`, which binds its left arg if a var). Aggregates
+;; are treated like is — the result var becomes bound.
+(define
+  dl-init-head-bound
+  (fn
+    (head adornment)
+    (let ((args (rest head)) (out (list)))
+      (do
+        (define
+          dl-ihb-loop
+          (fn
+            (i)
+            (when
+              (< i (len args))
+              (do
+                (let
+                  ((c (slice adornment i (+ i 1)))
+                    (a (nth args i)))
+                  (when
+                    (and (= c "b") (dl-var? a))
+                    (let ((n (symbol->string a)))
+                      (when
+                        (not (dl-member-string? n out))
+                        (append! out n)))))
+                (dl-ihb-loop (+ i 1))))))
+        (dl-ihb-loop 0)
+        out))))
+
+(define
+  dl-rule-sips
+  (fn
+    (rule head-adornment)
+    (let
+      ((bound (dl-init-head-bound (get rule :head) head-adornment))
+        (out (list)))
+      (do
+        (for-each
+          (fn
+            (lit)
+            (cond
+              ((and (dict? lit) (has-key? lit :neg))
+                (let ((target (get lit :neg)))
+                  (append!
+                    out
+                    {:lit lit :adornment (dl-adorn-lit target bound)})))
+              ((dl-builtin? lit)
+                (let ((adn (dl-adorn-lit lit bound)))
+                  (do
+                    (append! out {:lit lit :adornment adn})
+                    ;; `is` binds its left arg (if var) once RHS is ground.
+                    (when
+                      (and (= (dl-rel-name lit) "is") (dl-var? (nth lit 1)))
+                      (let ((n (symbol->string (nth lit 1))))
+                        (when
+                          (not (dl-member-string? n bound))
+                          (append! bound n)))))))
+              ((and (list? lit) (dl-aggregate? lit))
+                (let ((adn (dl-adorn-lit lit bound)))
+                  (do
+                    (append! out {:lit lit :adornment adn})
+                    ;; Result var (first arg) becomes bound.
+                    (when (dl-var? (nth lit 1))
+                      (let ((n (symbol->string (nth lit 1))))
+                        (when
+                          (not (dl-member-string? n bound))
+                          (append! bound n)))))))
+              ((and (list? lit) (> (len lit) 0))
+                (let ((adn (dl-adorn-lit lit bound)))
+                  (do
+                    (append! out {:lit lit :adornment adn})
+                    (for-each
+                      (fn (n)
+                        (when (not (dl-member-string? n bound))
+                          (append! bound n)))
+                      (dl-vars-bound-by-lit lit bound)))))))
+          (get rule :body))
+        out))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index fcf66576..ba6de4c0 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 184,
+  "total_passed": 194,
   "total_failed": 0,
-  "total": 184,
+  "total": 194,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,7 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
     {"name":"api","passed":14,"failed":0,"total":14},
+    {"name":"magic","passed":10,"failed":0,"total":10},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:47:44+00:00"
+  "generated": "2026-05-08T09:50:50+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index c7ba8661..3399fe66 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**184 / 184 passing** (0 failure(s)).
+**194 / 194 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,4 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
 | api | 14 | 14 | ok |
+| magic | 10 | 10 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
new file mode 100644
index 00000000..e61e96fb
--- /dev/null
+++ b/lib/datalog/tests/magic.sx
@@ -0,0 +1,141 @@
+;; lib/datalog/tests/magic.sx — adornment + SIPS analysis tests.
+
+(define dl-mt-pass 0)
+(define dl-mt-fail 0)
+(define dl-mt-failures (list))
+
+(define
+  dl-mt-deep=?
+  (fn
+    (a b)
+    (cond
+      ((and (list? a) (list? b))
+        (and (= (len a) (len b)) (dl-mt-deq-l? a b 0)))
+      ((and (dict? a) (dict? b))
+        (let ((ka (keys a)) (kb (keys b)))
+          (and (= (len ka) (len kb)) (dl-mt-deq-d? a b ka 0))))
+      ((and (number? a) (number? b)) (= a b))
+      (else (equal? a b)))))
+
+(define
+  dl-mt-deq-l?
+  (fn
+    (a b i)
+    (cond
+      ((>= i (len a)) true)
+      ((not (dl-mt-deep=? (nth a i) (nth b i))) false)
+      (else (dl-mt-deq-l? a b (+ i 1))))))
+
+(define
+  dl-mt-deq-d?
+  (fn
+    (a b ka i)
+    (cond
+      ((>= i (len ka)) true)
+      ((let ((k (nth ka i)))
+         (not (dl-mt-deep=? (get a k) (get b k))))
+        false)
+      (else (dl-mt-deq-d? a b ka (+ i 1))))))
+
+(define
+  dl-mt-test!
+  (fn
+    (name got expected)
+    (if
+      (dl-mt-deep=? got expected)
+      (set! dl-mt-pass (+ dl-mt-pass 1))
+      (do
+        (set! dl-mt-fail (+ dl-mt-fail 1))
+        (append!
+          dl-mt-failures
+          (str
+            name
+            "\n    expected: " expected
+            "\n    got:      " got))))))
+
+(define
+  dl-mt-run-all!
+  (fn
+    ()
+    (do
+      ;; Goal adornment.
+      (dl-mt-test! "adorn 0-ary"
+        (dl-adorn-goal (list (quote ready)))
+        "")
+      (dl-mt-test! "adorn all bound"
+        (dl-adorn-goal (list (quote p) 1 2 3))
+        "bbb")
+      (dl-mt-test! "adorn all free"
+        (dl-adorn-goal (list (quote p) (quote X) (quote Y)))
+        "ff")
+      (dl-mt-test! "adorn mixed"
+        (dl-adorn-goal (list (quote ancestor) (quote tom) (quote X)))
+        "bf")
+      (dl-mt-test! "adorn const var const"
+        (dl-adorn-goal (list (quote p) (quote a) (quote X) (quote b)))
+        "bfb")
+
+      ;; dl-adorn-lit with explicit bound set.
+      (dl-mt-test! "adorn lit with bound"
+        (dl-adorn-lit (list (quote p) (quote X) (quote Y)) (list "X"))
+        "bf")
+
+      ;; Rule SIPS — chain ancestor.
+      (dl-mt-test! "sips chain ancestor bf"
+        (dl-rule-sips
+          {:head (list (quote ancestor) (quote X) (quote Z))
+           :body (list (list (quote parent) (quote X) (quote Y))
+                       (list (quote ancestor) (quote Y) (quote Z)))}
+          "bf")
+        (list
+          {:lit (list (quote parent) (quote X) (quote Y)) :adornment "bf"}
+          {:lit (list (quote ancestor) (quote Y) (quote Z)) :adornment "bf"}))
+
+      ;; SIPS — head fully bound.
+      (dl-mt-test! "sips head bb"
+        (dl-rule-sips
+          {:head (list (quote q) (quote X) (quote Y))
+           :body (list (list (quote p) (quote X) (quote Z))
+                       (list (quote r) (quote Z) (quote Y)))}
+          "bb")
+        (list
+          {:lit (list (quote p) (quote X) (quote Z)) :adornment "bf"}
+          {:lit (list (quote r) (quote Z) (quote Y)) :adornment "bb"}))
+
+      ;; SIPS — comparison; vars must be bound by prior body lit.
+      (dl-mt-test! "sips with comparison"
+        (dl-rule-sips
+          {:head (list (quote q) (quote X))
+           :body (list (list (quote p) (quote X))
+                       (list (string->symbol "<") (quote X) 5))}
+          "f")
+        (list
+          {:lit (list (quote p) (quote X)) :adornment "f"}
+          {:lit (list (string->symbol "<") (quote X) 5) :adornment "bb"}))
+
+      ;; SIPS — `is` binds its left arg.
+      (dl-mt-test! "sips with is"
+        (dl-rule-sips
+          {:head (list (quote q) (quote X) (quote Y))
+           :body (list (list (quote p) (quote X))
+                       (list (quote is) (quote Y) (list (string->symbol "+") (quote X) 1)))}
+          "ff")
+        (list
+          {:lit (list (quote p) (quote X)) :adornment "f"}
+          {:lit (list (quote is) (quote Y)
+                      (list (string->symbol "+") (quote X) 1))
+           :adornment "fb"})))))
+
+(define
+  dl-magic-tests-run!
+  (fn
+    ()
+    (do
+      (set! dl-mt-pass 0)
+      (set! dl-mt-fail 0)
+      (set! dl-mt-failures (list))
+      (dl-mt-run-all!)
+      {:passed dl-mt-pass
+       :failed dl-mt-fail
+       :total (+ dl-mt-pass dl-mt-fail)
+       :failures dl-mt-failures})))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 74aff180..b9f7dbc6 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -151,12 +151,17 @@ Naive bottom-up derives **all** consequences before answering. Magic sets
 rewrite the program so the fixpoint only derives tuples relevant to the
 goal — a major perf win for "what's reachable from node X" queries on
 large graphs.
-- [ ] Adornments: annotate rule predicates with bound (`b`) / free (`f`)
-      patterns based on how they're called.
+- [x] Adornments: `dl-adorn-goal goal` and `dl-adorn-lit lit bound` in
+      `lib/datalog/magic.sx`. Per-arg `b`/`f` based on whether the arg
+      is a constant or a variable already in the bound set.
 - [ ] Magic transformation: for each adorned predicate, generate a
       `magic_<pred>` relation and rewrite rule bodies to filter through it.
-- [ ] Sideways information passing strategy (SIPS): left-to-right by
-      default; pluggable.
+- [x] Sideways information passing strategy (SIPS): left-to-right
+      `dl-rule-sips rule head-adornment` walks body literals tracking
+      the bound set, returning `({:lit :adornment} ...)`. Recognises
+      `is`/aggregate result-vars as new binders; comparisons and
+      negation pass through with computed adornments. (Pluggable
+      strategies are future work.)
 - [x] `dl-set-strategy! db strategy` hook + `dl-get-strategy db`. Default
       `:semi-naive`. `:magic` accepted but the transformation itself is
       deferred — saturator currently falls back to semi-naive. Tests
@@ -284,6 +289,16 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 6 adornments + SIPS in
+  `lib/datalog/magic.sx`. Inspection helpers — `dl-adorn-goal` and
+  `dl-adorn-lit` compute per-arg `b`/`f` patterns under a bound
+  set; `dl-rule-sips rule head-adornment` walks body literals
+  left-to-right propagating the bound set, recognising `is` and
+  aggregate result-vars as new binders. Lays groundwork for a
+  later magic-sets transformation. 10 new tests cover pure
+  adornment, SIPS over a chain rule, head-fully-bound rules,
+  comparisons, and `is`. Saturator does not yet consume these.
+
 - 2026-05-08 — Comprehensive integration test in api suite: a
   single program exercising recursion (`reach` transitive closure)
   + stratified negation (`safe X Y :- reach X Y, not banned Y`) +

From 2a01d8ac91dbc8450615d4140fda2fc8caed3784 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:53:38 +0000
Subject: [PATCH 31/89] datalog: magic-sets building blocks (199/199)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Adds the primitives a future magic-sets rewriter will compose:

  dl-magic-rel-name rel adornment    → "magic_<rel>^<adornment>"
  dl-magic-lit rel adn bound-args    → magic literal as SX list
  dl-bound-args lit adornment        → bound-position arg values

Rewriter algorithm (worklist over (rel, adornment) pairs,
generating seed, propagation, and adorned-rule outputs) is still
TODO — these helpers are inspection-only for now.

4 new magic tests cover naming, lit construction, and bound-args
extraction (mixed/free).
---
 lib/datalog/magic.sx        | 42 +++++++++++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 +++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 25 +++++++++++++++++++++-
 plans/datalog-on-sx.md      |  8 +++++++
 5 files changed, 80 insertions(+), 7 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index 33d5ba9b..3d593356 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -158,3 +158,45 @@
                       (dl-vars-bound-by-lit lit bound)))))))
           (get rule :body))
         out))))
+
+;; ── Magic predicate naming + bound-args extraction ─────────────
+;; These are building blocks for the magic-sets *transformation*
+;; itself. The transformation (which generates rewritten rules
+;; with magic_<rel>^<adornment> filters) is future work — for now
+;; these helpers can be used to inspect what such a transformation
+;; would produce.
+
+;; "magic_p^bf" given relation "p" and adornment "bf".
+(define
+  dl-magic-rel-name
+  (fn (rel adornment) (str "magic_" rel "^" adornment)))
+
+;; A magic predicate literal:
+;;   (magic_<rel>^<adornment> arg1 arg2 ...)
+(define
+  dl-magic-lit
+  (fn
+    (rel adornment bound-args)
+    (cons (string->symbol (dl-magic-rel-name rel adornment)) bound-args)))
+
+;; Extract bound args (those at "b" positions in `adornment`) from a
+;; literal `(rel arg1 arg2 ... argN)`. Returns the list of arg values.
+(define
+  dl-bound-args
+  (fn
+    (lit adornment)
+    (let ((args (rest lit)) (out (list)))
+      (do
+        (define
+          dl-ba-loop
+          (fn
+            (i)
+            (when
+              (< i (len args))
+              (do
+                (when
+                  (= (slice adornment i (+ i 1)) "b")
+                  (append! out (nth args i)))
+                (dl-ba-loop (+ i 1))))))
+        (dl-ba-loop 0)
+        out))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index ba6de4c0..73ae3b19 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 194,
+  "total_passed": 199,
   "total_failed": 0,
-  "total": 194,
+  "total": 199,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
     {"name":"api","passed":14,"failed":0,"total":14},
-    {"name":"magic","passed":10,"failed":0,"total":10},
+    {"name":"magic","passed":15,"failed":0,"total":15},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:50:50+00:00"
+  "generated": "2026-05-08T09:53:23+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 3399fe66..a8e21498 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**194 / 194 passing** (0 failure(s)).
+**199 / 199 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
 | api | 14 | 14 | ok |
-| magic | 10 | 10 | ok |
+| magic | 15 | 15 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index e61e96fb..dff20345 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -124,7 +124,30 @@
           {:lit (list (quote p) (quote X)) :adornment "f"}
           {:lit (list (quote is) (quote Y)
                       (list (string->symbol "+") (quote X) 1))
-           :adornment "fb"})))))
+           :adornment "fb"}))
+
+      ;; Magic predicate naming.
+      (dl-mt-test! "magic-rel-name"
+        (dl-magic-rel-name "ancestor" "bf")
+        "magic_ancestor^bf")
+
+      ;; Bound-args extraction.
+      (dl-mt-test! "bound-args bf"
+        (dl-bound-args (list (quote ancestor) (quote tom) (quote X)) "bf")
+        (list (quote tom)))
+
+      (dl-mt-test! "bound-args mixed"
+        (dl-bound-args (list (quote p) 1 (quote Y) 3) "bfb")
+        (list 1 3))
+
+      (dl-mt-test! "bound-args all-free"
+        (dl-bound-args (list (quote p) (quote X) (quote Y)) "ff")
+        (list))
+
+      ;; Magic literal construction.
+      (dl-mt-test! "magic-lit"
+        (dl-magic-lit "ancestor" "bf" (list (quote tom)))
+        (list (string->symbol "magic_ancestor^bf") (quote tom))))))
 
 (define
   dl-magic-tests-run!
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index b9f7dbc6..560ec828 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -156,6 +156,8 @@ large graphs.
       is a constant or a variable already in the bound set.
 - [ ] Magic transformation: for each adorned predicate, generate a
       `magic_<pred>` relation and rewrite rule bodies to filter through it.
+      *Building blocks present in `magic.sx`: `dl-magic-rel-name`,
+      `dl-magic-lit`, `dl-bound-args`. Full rewriter still TODO.*
 - [x] Sideways information passing strategy (SIPS): left-to-right
       `dl-rule-sips rule head-adornment` walks body literals tracking
       the bound set, returning `({:lit :adornment} ...)`. Recognises
@@ -289,6 +291,12 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 6 building blocks for the magic-sets
+  transformation: `dl-magic-rel-name`, `dl-magic-lit`,
+  `dl-bound-args`. The rewriter that generates magic seed and
+  propagation rules is still future work; with these primitives
+  in place it's a straightforward worklist algorithm. 4 new tests.
+
 - 2026-05-08 — Phase 6 adornments + SIPS in
   `lib/datalog/magic.sx`. Inspection helpers — `dl-adorn-goal` and
   `dl-adorn-lit` compute per-arg `b`/`f` patterns under a bound

From a080ce656ccbf68554d7b70d900599176351c823 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 09:58:36 +0000
Subject: [PATCH 32/89] datalog: magic-sets rewriter (Phase 6, 202/202)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

dl-magic-rewrite rules query-rel adn args returns:
  {:rules <rewritten-rules> :seed <magic-seed-fact>}

Worklist over (rel, adn) pairs starts from the query and stops
when no new pairs appear. For each rule with head matching a
worklist pair:
  - Adorned rule: head :- magic_<rel>^<adn>(bound), body...
  - Propagation rules: for each positive non-builtin body lit
    at position i:
      magic_<lit-rel>^<lit-adn>(bound-of-lit) :-
        magic_<rel>^<adn>(bound-of-head),
        body[0..i-1]
  - Add (lit-rel, lit-adn) to the worklist.

Built-ins, negation, and aggregates pass through without
generating propagation rules. EDB facts are unchanged.

3 new tests cover seed structure, equivalence on chain-3 (full
closure, 6 ancestor tuples — magic helps only when the EDB has
nodes outside the seed's transitive cone), and same-query-answers
under the rewritten program. Total 202/202.

Wiring up a `dl-saturate-magic!` driver and large-graph perf
benchmarks is left for a future iteration.
---
 lib/datalog/magic.sx        | 141 ++++++++++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json |   8 +-
 lib/datalog/scoreboard.md   |   4 +-
 lib/datalog/tests/magic.sx  |  73 ++++++++++++++++++-
 plans/datalog-on-sx.md      |  33 +++++++--
 5 files changed, 245 insertions(+), 14 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index 3d593356..7c8983a1 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -200,3 +200,144 @@
                 (dl-ba-loop (+ i 1))))))
         (dl-ba-loop 0)
         out))))
+
+;; ── Magic-sets rewriter ─────────────────────────────────────────
+;;
+;; Given the original rule list and a query (rel, adornment) pair,
+;; generates the magic-rewritten program: a list of rules that
+;; (a) gate each original rule with a `magic_<rel>^<adn>` filter and
+;; (b) propagate the magic relation through SIPS so that only
+;; query-relevant tuples are derived. Seed facts are returned
+;; separately and must be added to the db at evaluation time.
+;;
+;; Output: {:rules <rewritten-rules> :seed <magic-seed-literal>}
+;;
+;; The rewriter only rewrites IDB rules; EDB facts pass through.
+;; Built-in predicates and negation in body literals are kept in
+;; place but do not generate propagation rules of their own.
+
+(define
+  dl-magic-pair-key
+  (fn (rel adornment) (str rel "^" adornment)))
+
+(define
+  dl-magic-rewrite
+  (fn
+    (rules query-rel query-adornment query-args)
+    (let
+      ((seen (list))
+        (queue (list))
+        (out (list)))
+      (do
+        (define
+          dl-mq-mark!
+          (fn
+            (rel adornment)
+            (let ((k (dl-magic-pair-key rel adornment)))
+              (when
+                (not (dl-member-string? k seen))
+                (do
+                  (append! seen k)
+                  (append! queue {:rel rel :adn adornment}))))))
+
+        (define
+          dl-mq-rewrite-rule!
+          (fn
+            (rule adn)
+            (let
+              ((head (get rule :head))
+                (body (get rule :body))
+                (sips (dl-rule-sips rule adn)))
+              (let
+                ((magic-filter
+                   (dl-magic-lit
+                     (dl-rel-name head)
+                     adn
+                     (dl-bound-args head adn))))
+                (do
+                  ;; Adorned rule: head :- magic-filter, body...
+                  (let ((new-body (list)))
+                    (do
+                      (append! new-body magic-filter)
+                      (for-each
+                        (fn (lit) (append! new-body lit))
+                        body)
+                      (append! out {:head head :body new-body})))
+                  ;; Propagation rules for each positive non-builtin
+                  ;; body literal at position i.
+                  (define
+                    dl-mq-prop-loop
+                    (fn
+                      (i)
+                      (when
+                        (< i (len body))
+                        (do
+                          (let
+                            ((lit (nth body i))
+                              (sip-entry (nth sips i)))
+                            (when
+                              (and (list? lit)
+                                   (> (len lit) 0)
+                                   (not (and (dict? lit) (has-key? lit :neg)))
+                                   (not (dl-builtin? lit))
+                                   (not (dl-aggregate? lit)))
+                              (let
+                                ((lit-adn (get sip-entry :adornment))
+                                  (lit-rel (dl-rel-name lit)))
+                                (let
+                                  ((prop-head
+                                     (dl-magic-lit
+                                       lit-rel
+                                       lit-adn
+                                       (dl-bound-args lit lit-adn))))
+                                  (let ((prop-body (list)))
+                                    (do
+                                      (append! prop-body magic-filter)
+                                      (define
+                                        dl-mq-prefix-loop
+                                        (fn
+                                          (j)
+                                          (when
+                                            (< j i)
+                                            (do
+                                              (append!
+                                                prop-body
+                                                (nth body j))
+                                              (dl-mq-prefix-loop (+ j 1))))))
+                                      (dl-mq-prefix-loop 0)
+                                      (append!
+                                        out
+                                        {:head prop-head :body prop-body})
+                                      (dl-mq-mark! lit-rel lit-adn)))))))
+                          (dl-mq-prop-loop (+ i 1))))))
+                  (dl-mq-prop-loop 0))))))
+
+        (dl-mq-mark! query-rel query-adornment)
+
+        (define
+          dl-mq-process
+          (fn
+            ()
+            (when
+              (> (len queue) 0)
+              (let ((item (first queue)))
+                (do
+                  (set! queue (rest queue))
+                  (let
+                    ((rel (get item :rel)) (adn (get item :adn)))
+                    (for-each
+                      (fn
+                        (rule)
+                        (when
+                          (= (dl-rel-name (get rule :head)) rel)
+                          (dl-mq-rewrite-rule! rule adn)))
+                      rules))
+                  (dl-mq-process))))))
+        (dl-mq-process)
+
+        {:rules out
+         :seed
+         (dl-magic-lit
+           query-rel
+           query-adornment
+           query-args)}))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 73ae3b19..481f48f9 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 199,
+  "total_passed": 202,
   "total_failed": 0,
-  "total": 199,
+  "total": 202,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
     {"name":"api","passed":14,"failed":0,"total":14},
-    {"name":"magic","passed":15,"failed":0,"total":15},
+    {"name":"magic","passed":18,"failed":0,"total":18},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:53:23+00:00"
+  "generated": "2026-05-08T09:58:16+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index a8e21498..def16294 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**199 / 199 passing** (0 failure(s)).
+**202 / 202 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
 | api | 14 | 14 | ok |
-| magic | 15 | 15 | ok |
+| magic | 18 | 18 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index dff20345..78ad1d27 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -147,7 +147,78 @@
       ;; Magic literal construction.
       (dl-mt-test! "magic-lit"
         (dl-magic-lit "ancestor" "bf" (list (quote tom)))
-        (list (string->symbol "magic_ancestor^bf") (quote tom))))))
+        (list (string->symbol "magic_ancestor^bf") (quote tom)))
+
+      ;; Magic-sets rewriter: structural sanity.
+      (dl-mt-test! "rewrite ancestor produces seed"
+        (let
+          ((rules
+             (list
+               {:head (list (quote ancestor) (quote X) (quote Y))
+                :body (list (list (quote parent) (quote X) (quote Y)))}
+               {:head (list (quote ancestor) (quote X) (quote Z))
+                :body
+                (list (list (quote parent) (quote X) (quote Y))
+                      (list (quote ancestor) (quote Y) (quote Z)))})))
+          (get
+            (dl-magic-rewrite rules "ancestor" "bf" (list (quote a)))
+            :seed))
+        (list (string->symbol "magic_ancestor^bf") (quote a)))
+
+      ;; Equivalence: rewritten program derives same ancestor tuples.
+      ;; In a chain a→b→c→d, magic-rewritten run still derives all
+      ;; ancestor pairs reachable from any node a/b/c/d propagated via
+      ;; magic_ancestor^bf — i.e. the full closure (6 tuples). Magic
+      ;; saves work only when the EDB has irrelevant nodes outside
+      ;; the seed's transitive cone.
+      (dl-mt-test! "magic-rewritten ancestor count"
+        (let
+          ((rules
+             (list
+               {:head (list (quote ancestor) (quote X) (quote Y))
+                :body (list (list (quote parent) (quote X) (quote Y)))}
+               {:head (list (quote ancestor) (quote X) (quote Z))
+                :body
+                (list (list (quote parent) (quote X) (quote Y))
+                      (list (quote ancestor) (quote Y) (quote Z)))}))
+            (edb (list
+                   (list (quote parent) (quote a) (quote b))
+                   (list (quote parent) (quote b) (quote c))
+                   (list (quote parent) (quote c) (quote d)))))
+          (let
+            ((rewritten (dl-magic-rewrite rules "ancestor" "bf" (list (quote a))))
+              (db (dl-make-db)))
+            (do
+              (for-each (fn (f) (dl-add-fact! db f)) edb)
+              (dl-add-fact! db (get rewritten :seed))
+              (for-each (fn (r) (dl-add-rule! db r)) (get rewritten :rules))
+              (dl-saturate! db)
+              (len (dl-relation db "ancestor")))))
+        6)
+
+      (dl-mt-test! "magic-rewritten finds same answers"
+        (let
+          ((rules
+             (list
+               {:head (list (quote ancestor) (quote X) (quote Y))
+                :body (list (list (quote parent) (quote X) (quote Y)))}
+               {:head (list (quote ancestor) (quote X) (quote Z))
+                :body
+                (list (list (quote parent) (quote X) (quote Y))
+                      (list (quote ancestor) (quote Y) (quote Z)))}))
+            (edb (list
+                   (list (quote parent) (quote a) (quote b))
+                   (list (quote parent) (quote b) (quote c)))))
+          (let
+            ((rewritten (dl-magic-rewrite rules "ancestor" "bf" (list (quote a))))
+              (db (dl-make-db)))
+            (do
+              (for-each (fn (f) (dl-add-fact! db f)) edb)
+              (dl-add-fact! db (get rewritten :seed))
+              (for-each (fn (r) (dl-add-rule! db r)) (get rewritten :rules))
+              (dl-saturate! db)
+              (len (dl-query db (list (quote ancestor) (quote a) (quote X)))))))
+        2))))
 
 (define
   dl-magic-tests-run!
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 560ec828..4b9d41a8 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -154,10 +154,13 @@ large graphs.
 - [x] Adornments: `dl-adorn-goal goal` and `dl-adorn-lit lit bound` in
       `lib/datalog/magic.sx`. Per-arg `b`/`f` based on whether the arg
       is a constant or a variable already in the bound set.
-- [ ] Magic transformation: for each adorned predicate, generate a
-      `magic_<pred>` relation and rewrite rule bodies to filter through it.
-      *Building blocks present in `magic.sx`: `dl-magic-rel-name`,
-      `dl-magic-lit`, `dl-bound-args`. Full rewriter still TODO.*
+- [x] Magic transformation: `dl-magic-rewrite rules query-rel adn args`
+      generates `{:rules <rewritten-rules> :seed <magic-seed>}`. Each
+      original rule is gated with a `magic_<rel>^<adn>(bound)` filter,
+      and propagation rules are emitted for each positive non-builtin
+      body literal. Worklist over `(rel, adn)` pairs starts from the
+      query and stops when no new pairs appear. EDB facts pass through
+      unchanged.
 - [x] Sideways information passing strategy (SIPS): left-to-right
       `dl-rule-sips rule head-adornment` walks body literals tracking
       the bound set, returning `({:lit :adornment} ...)`. Recognises
@@ -168,9 +171,14 @@ large graphs.
       `:semi-naive`. `:magic` accepted but the transformation itself is
       deferred — saturator currently falls back to semi-naive. Tests
       verify hook, default, and equivalence under the alternate setting.
-- [ ] Tests: equivalence vs naive on small inputs; perf win on a 10k-node
-      reachability query from a single root. *Pending real magic-set
-      transformation.*
+- [x] Equivalence test: rewritten ancestor program over the same EDB
+      derives the same number of `ancestor` tuples and returns the
+      same query answers as the unrewritten program (chain-3 case).
+- [ ] Perf test: 10k-node reachability with magic vs semi-naive.
+      Pending — would need a `dl-saturate-magic!` driver that builds
+      a temporary db from rewrite output. The rewriter itself is in
+      place; benchmarking against semi-naive on large graphs is left
+      to a future iteration.
 
 ### Phase 7 — stratified negation
 - [x] Dependency graph: `dl-build-dep-graph db` returns `{head -> ({:rel
@@ -291,6 +299,17 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 6 magic-sets rewriter. `dl-magic-rewrite rules
+  query-rel adn args` returns `{:rules <rewritten> :seed <seed-fact>}`.
+  Worklist over `(rel, adn)` pairs starts from the query, gates each
+  original rule with a `magic_<rel>^<adn>(bound)` filter, and emits
+  propagation rules for each positive non-builtin body literal so
+  that magic spreads to body relations. EDB facts pass through.
+  3 new tests cover seed structure, equivalence on chain-3 by
+  ancestor-relation tuple count, and same-query-answers under
+  the rewritten program. The plumbing for a `dl-saturate-magic!`
+  driver and large-graph perf benchmarks is still future work.
+
 - 2026-05-08 — Phase 6 building blocks for the magic-sets
   transformation: `dl-magic-rel-name`, `dl-magic-lit`,
   `dl-bound-args`. The rewriter that generates magic seed and

From a53e47b41518718dd08d383f34b15bebee148201 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:00:44 +0000
Subject: [PATCH 33/89] datalog: dl-magic-query driver (204/204)

End-to-end magic-sets entry point. Given (db, query-goal):
  - copies the caller's EDB facts (relations not headed by any
    rule) into a fresh internal db
  - adds the magic seed fact
  - adds the rewritten rules
  - saturates and runs the query
  - returns the substitution list

Caller's db is untouched. Equivalent to dl-query for any
fully-stratifiable program; intended as a perf alternative on
goal-shaped queries against large recursive relations.

2 new tests: equivalence to dl-query on chain-3 ancestor, and
non-mutation of the caller's db (rules count unchanged).
---
 lib/datalog/magic.sx        | 60 +++++++++++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++---
 lib/datalog/scoreboard.md   |  4 +--
 lib/datalog/tests/magic.sx  | 28 +++++++++++++++++
 plans/datalog-on-sx.md      | 20 ++++++++++---
 5 files changed, 110 insertions(+), 10 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index 7c8983a1..7ea1b548 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -341,3 +341,63 @@
            query-rel
            query-adornment
            query-args)}))))
+
+;; ── Top-level magic-sets driver ─────────────────────────────────
+;;
+;; (dl-magic-query db query-goal) — run `query-goal` under magic-sets
+;; evaluation. Builds a fresh internal db with:
+;;   - the caller's EDB facts (relations not headed by any rule),
+;;   - the magic seed fact, and
+;;   - the rewritten rules.
+;; Saturates and queries, returning the substitution list. The
+;; caller's db is untouched.
+;;
+;; Useful primarily as a perf alternative for queries that only
+;; need a small slice of a recursive relation. Equivalent to
+;; dl-query for any single fully-stratifiable program.
+
+(define
+  dl-magic-rule-heads
+  (fn
+    (rules)
+    (let ((seen (list)))
+      (do
+        (for-each
+          (fn
+            (r)
+            (let ((h (dl-rel-name (get r :head))))
+              (when
+                (and (not (nil? h)) (not (dl-member-string? h seen)))
+                (append! seen h))))
+          rules)
+        seen))))
+
+(define
+  dl-magic-query
+  (fn
+    (db query-goal)
+    (let
+      ((query-rel (dl-rel-name query-goal))
+        (query-adn (dl-adorn-goal query-goal)))
+      (let
+        ((query-args (dl-bound-args query-goal query-adn))
+          (rules (dl-rules db)))
+        (let
+          ((rewritten (dl-magic-rewrite rules query-rel query-adn query-args))
+            (mdb (dl-make-db))
+            (rule-heads (dl-magic-rule-heads rules)))
+          (do
+            ;; Copy EDB facts (relations not headed by any caller rule).
+            (for-each
+              (fn
+                (rel)
+                (when
+                  (not (dl-member-string? rel rule-heads))
+                  (for-each
+                    (fn (t) (dl-add-fact! mdb t))
+                    (dl-rel-tuples db rel))))
+              (keys (get db :facts)))
+            ;; Seed + rewritten rules.
+            (dl-add-fact! mdb (get rewritten :seed))
+            (for-each (fn (r) (dl-add-rule! mdb r)) (get rewritten :rules))
+            (dl-query mdb query-goal)))))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 481f48f9..b44085fa 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 202,
+  "total_passed": 204,
   "total_failed": 0,
-  "total": 202,
+  "total": 204,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
     {"name":"api","passed":14,"failed":0,"total":14},
-    {"name":"magic","passed":18,"failed":0,"total":18},
+    {"name":"magic","passed":20,"failed":0,"total":20},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T09:58:16+00:00"
+  "generated": "2026-05-08T10:00:29+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index def16294..27c9bab8 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**202 / 202 passing** (0 failure(s)).
+**204 / 204 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
 | api | 14 | 14 | ok |
-| magic | 18 | 18 | ok |
+| magic | 20 | 20 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 78ad1d27..568409ce 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -196,6 +196,34 @@
               (len (dl-relation db "ancestor")))))
         6)
 
+      ;; dl-magic-query: end-to-end driver, doesn't mutate caller's db.
+      (dl-mt-test! "magic-query equivalent to dl-query"
+        (let
+          ((db (dl-program
+                 "parent(a, b). parent(b, c). parent(c, d).
+                  ancestor(X, Y) :- parent(X, Y).
+                  ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (let
+            ((semi (dl-query db (list (quote ancestor) (quote a) (quote X))))
+              (magic (dl-magic-query
+                       db (list (quote ancestor) (quote a) (quote X)))))
+            (= (len semi) (len magic))))
+        true)
+
+      ;; magic-query doesn't mutate caller db.
+      (dl-mt-test! "magic-query preserves caller db"
+        (let
+          ((db (dl-program
+                 "parent(a, b). parent(b, c).
+                  ancestor(X, Y) :- parent(X, Y).
+                  ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (let
+            ((rules-before (len (dl-rules db))))
+            (do
+              (dl-magic-query db (list (quote ancestor) (quote a) (quote X)))
+              (= rules-before (len (dl-rules db))))))
+        true)
+
       (dl-mt-test! "magic-rewritten finds same answers"
         (let
           ((rules
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 4b9d41a8..f68428d9 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -174,11 +174,15 @@ large graphs.
 - [x] Equivalence test: rewritten ancestor program over the same EDB
       derives the same number of `ancestor` tuples and returns the
       same query answers as the unrewritten program (chain-3 case).
+- [x] `dl-magic-query db query-goal` — top-level driver. Builds a
+      fresh internal db with the caller's EDB facts, the magic seed,
+      and the rewritten rules; saturates and queries. Caller's db is
+      untouched. Equivalent to `dl-query` for fully-stratifiable
+      programs (sole motivation is a perf alternative on goal-shaped
+      queries against large recursive relations).
 - [ ] Perf test: 10k-node reachability with magic vs semi-naive.
-      Pending — would need a `dl-saturate-magic!` driver that builds
-      a temporary db from rewrite output. The rewriter itself is in
-      place; benchmarking against semi-naive on large graphs is left
-      to a future iteration.
+      Left to a future iteration — would need a benchmarking harness
+      for large graphs and the conformance budget can't afford it.
 
 ### Phase 7 — stratified negation
 - [x] Dependency graph: `dl-build-dep-graph db` returns `{head -> ({:rel
@@ -299,6 +303,14 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-08 — Phase 6 driver: `dl-magic-query db query-goal`.
+  Builds a fresh internal db from the caller's EDB + magic seed +
+  rewritten rules, saturates, queries, returns substitutions —
+  caller's db is untouched. Equivalent to `dl-query` for any
+  fully-stratifiable program; sole motivation is a perf alternative
+  on goal-shaped queries against large recursive relations.
+  2 new tests cover equivalence and non-mutation.
+
 - 2026-05-08 — Phase 6 magic-sets rewriter. `dl-magic-rewrite rules
   query-rel adn args` returns `{:rules <rewritten> :seed <seed-fact>}`.
   Worklist over `(rel, adn)` pairs starts from the query, gates each

From 57a1dbb232eb66b67c4552e9190438e85994f569 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:03:04 +0000
Subject: [PATCH 34/89] datalog: magic-sets benefit test on disjoint-cluster
 graph (205/205)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Two disjoint chains, query rooted in cluster 1. Semi-naive
derives the full closure over both clusters (6 ancestor tuples).
Magic-sets only seeds magic_ancestor^bf for cluster 1, so only
2 query-relevant tuples are returned (a→b, a→c). The test
asserts both numbers, demonstrating the actual perf-shape
benefit of goal-directed evaluation.
---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 23 +++++++++++++++++++++++
 3 files changed, 29 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index b44085fa..9c238632 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 204,
+  "total_passed": 205,
   "total_failed": 0,
-  "total": 204,
+  "total": 205,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
     {"name":"api","passed":14,"failed":0,"total":14},
-    {"name":"magic","passed":20,"failed":0,"total":20},
+    {"name":"magic","passed":21,"failed":0,"total":21},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T10:00:29+00:00"
+  "generated": "2026-05-08T10:02:51+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 27c9bab8..3ad41dc4 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**204 / 204 passing** (0 failure(s)).
+**205 / 205 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
 | api | 14 | 14 | ok |
-| magic | 20 | 20 | ok |
+| magic | 21 | 21 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 568409ce..c9e82183 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -224,6 +224,29 @@
               (= rules-before (len (dl-rules db))))))
         true)
 
+      ;; Magic-sets benefit: query touches only one cluster of a
+      ;; multi-component graph. Semi-naive derives the full closure
+      ;; over both clusters; magic only the seeded one.
+      (dl-mt-test! "magic skips irrelevant clusters"
+        (let
+          ;; Two disjoint chains. Query is rooted in cluster 1.
+          ((db (dl-program
+                 "parent(a, b). parent(b, c).
+                  parent(x, y). parent(y, z).
+                  ancestor(X, Y) :- parent(X, Y).
+                  ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (do
+            (dl-saturate! db)
+            (let
+              ((semi-count (len (dl-relation db "ancestor")))
+                (magic-results
+                  (dl-magic-query
+                    db (list (quote ancestor) (quote a) (quote X)))))
+              ;; Semi-naive derives 6 (3 in each cluster). Magic
+              ;; gives 3 query results (a's reachable: b, c).
+              (and (= semi-count 6) (= (len magic-results) 2)))))
+        true)
+
       (dl-mt-test! "magic-rewritten finds same answers"
         (let
           ((rules

From 282a3d3d06aaf2b85484a05d32f13cf0534d5c4d Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:04:59 +0000
Subject: [PATCH 35/89] datalog: dl-eval-magic single-call magic-sets entry
 (206/206)

Symmetric to dl-eval but routes single-positive-literal queries
through dl-magic-query for goal-directed evaluation. Multi-literal
query bodies fall back to standard dl-query (magic-sets is wired
for single goals only).

  (dl-eval-magic source-string "?- ancestor(a, X).")

1 new api test.
---
 lib/datalog/api.sx          | 29 +++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/api.sx    | 10 ++++++++++
 4 files changed, 45 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/api.sx b/lib/datalog/api.sx
index 872b2017..72cb9dfd 100644
--- a/lib/datalog/api.sx
+++ b/lib/datalog/api.sx
@@ -169,6 +169,35 @@
         (else
           (dl-query db (get (first queries) :query)))))))
 
+;; (dl-eval-magic source query-source) — like dl-eval but routes a
+;; single-positive-literal query through `dl-magic-query` for goal-
+;; directed evaluation. Multi-literal query bodies fall back to the
+;; standard dl-query path (magic-sets is currently only wired for
+;; single-positive goals). The caller's source is parsed afresh
+;; each call so successive invocations are independent.
+(define
+  dl-eval-magic
+  (fn
+    (source query-source)
+    (let
+      ((db (dl-program source))
+        (queries (dl-parse query-source)))
+      (cond
+        ((= (len queries) 0) (error "dl-eval-magic: query string is empty"))
+        ((not (has-key? (first queries) :query))
+          (error
+            "dl-eval-magic: second arg must be a `?- ...` query clause"))
+        (else
+          (let
+            ((qbody (get (first queries) :query)))
+            (cond
+              ((and (= (len qbody) 1)
+                    (list? (first qbody))
+                    (> (len (first qbody)) 0)
+                    (symbol? (first (first qbody))))
+                (dl-magic-query db (first qbody)))
+              (else (dl-query db qbody)))))))))
+
 (define
   dl-rule-head-rels
   (fn
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 9c238632..203984a5 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 205,
+  "total_passed": 206,
   "total_failed": 0,
-  "total": 205,
+  "total": 206,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -12,9 +12,9 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
-    {"name":"api","passed":14,"failed":0,"total":14},
+    {"name":"api","passed":15,"failed":0,"total":15},
     {"name":"magic","passed":21,"failed":0,"total":21},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T10:02:51+00:00"
+  "generated": "2026-05-08T10:04:46+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 3ad41dc4..8af1890b 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**205 / 205 passing** (0 failure(s)).
+**206 / 206 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,6 +12,6 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
-| api | 14 | 14 | ok |
+| api | 15 | 15 | ok |
 | magic | 21 | 21 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
index 0431ed1f..809946df 100644
--- a/lib/datalog/tests/api.sx
+++ b/lib/datalog/tests/api.sx
@@ -213,6 +213,16 @@
           "?- p(X), q(X).")
         (list {:X 2} {:X 3}))
 
+      ;; dl-eval-magic — routes single-goal queries through
+      ;; magic-sets evaluation.
+      (dl-api-test-set! "dl-eval-magic ancestor"
+        (dl-eval-magic
+          "parent(a, b). parent(b, c).
+           ancestor(X, Y) :- parent(X, Y).
+           ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z)."
+          "?- ancestor(a, X).")
+        (list {:X (quote b)} {:X (quote c)}))
+
       ;; Comprehensive integration: recursion + stratified negation
       ;; + aggregation + comparison composed in a single program.
       ;; (Uses _Anything as a regular var instead of `_` so the

From 9c5a697e458b04b3bc89b58d1ba2da6df672c0bd Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:06:48 +0000
Subject: [PATCH 36/89] datalog: dl-clear-idb! helper (208/208)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Wipes every rule-headed relation (the IDB) — leaves EDB facts and
rule definitions intact. Useful for inspecting the EDB-only
baseline or for forcing a clean re-saturation.

  (dl-saturate! db)
  (dl-clear-idb! db)        ; ancestor relation now empty
  (dl-saturate! db)         ; re-derives ancestor from parents

2 new api tests verify IDB-wipe and EDB-preservation.
---
 lib/datalog/api.sx          | 20 ++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/api.sx    | 24 ++++++++++++++++++++++++
 4 files changed, 50 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/api.sx b/lib/datalog/api.sx
index 72cb9dfd..07fcea10 100644
--- a/lib/datalog/api.sx
+++ b/lib/datalog/api.sx
@@ -213,3 +213,23 @@
                 (append! seen h))))
           (dl-rules db))
         seen))))
+
+;; Wipe every relation that has at least one rule (i.e. every IDB
+;; relation) — leaves EDB facts and rule definitions intact. Useful
+;; before a follow-up `dl-saturate!` if you want a clean restart, or
+;; for inspection of the EDB-only baseline.
+(define
+  dl-clear-idb!
+  (fn
+    (db)
+    (let ((rule-heads (dl-rule-head-rels db)))
+      (do
+        (for-each
+          (fn
+            (k)
+            (do
+              (dict-set! (get db :facts) k (list))
+              (dict-set! (get db :facts-keys) k {})
+              (dict-set! (get db :facts-index) k {})))
+          rule-heads)
+        db))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 203984a5..2884cc4d 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 206,
+  "total_passed": 208,
   "total_failed": 0,
-  "total": 206,
+  "total": 208,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -12,9 +12,9 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
-    {"name":"api","passed":15,"failed":0,"total":15},
+    {"name":"api","passed":17,"failed":0,"total":17},
     {"name":"magic","passed":21,"failed":0,"total":21},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T10:04:46+00:00"
+  "generated": "2026-05-08T10:06:36+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 8af1890b..850f96c0 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**206 / 206 passing** (0 failure(s)).
+**208 / 208 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,6 +12,6 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
-| api | 15 | 15 | ok |
+| api | 17 | 17 | ok |
 | magic | 21 | 21 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
index 809946df..b2334dff 100644
--- a/lib/datalog/tests/api.sx
+++ b/lib/datalog/tests/api.sx
@@ -213,6 +213,30 @@
           "?- p(X), q(X).")
         (list {:X 2} {:X 3}))
 
+      ;; dl-clear-idb!: wipe rule-headed relations.
+      (dl-api-test! "dl-clear-idb! wipes IDB"
+        (let
+          ((db (dl-program
+                 "parent(a, b). parent(b, c).
+                  ancestor(X, Y) :- parent(X, Y).
+                  ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (do
+            (dl-saturate! db)
+            (dl-clear-idb! db)
+            (len (dl-relation db "ancestor"))))
+        0)
+
+      (dl-api-test! "dl-clear-idb! preserves EDB"
+        (let
+          ((db (dl-program
+                 "parent(a, b). parent(b, c).
+                  ancestor(X, Y) :- parent(X, Y).")))
+          (do
+            (dl-saturate! db)
+            (dl-clear-idb! db)
+            (len (dl-relation db "parent"))))
+        2)
+
       ;; dl-eval-magic — routes single-goal queries through
       ;; magic-sets evaluation.
       (dl-api-test-set! "dl-eval-magic ancestor"

From 5100c5d5a67c734a9f3a2a450d7863af54ef733f Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:07:35 +0000
Subject: [PATCH 37/89] datalog-plan: tick Phase 9 federation demo (already in
 demo.sx)

---
 plans/datalog-on-sx.md | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index f68428d9..8a6a8791 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -258,8 +258,11 @@ large graphs.
       dict-rule form, dl-rule constructor, dl-assert! incremental,
       dl-retract! removes derived, cyclic-graph reach via data,
       assert into empty db, fact-style rule (no arrow), coerce dict.
-- [ ] Integration demo: federation graph query — `(ancestor actor1 actor2)` over
-      rose-ash ActivityPub follow relationships (Phase 10).
+- [x] Integration demo: federation graph query — `(reachable A B)` /
+      `(mutual A B)` / `(foaf A C)` over `(follows ACTOR-A ACTOR-B)` in
+      `lib/datalog/demo.sx`. Tests in `lib/datalog/tests/demo.sx`.
+      Wiring this to actual rose-ash ActivityPub data is Phase 10
+      service work and is out of scope for this loop.
 
 ### Phase 10 — Datalog as a query language for rose-ash
 - [x] Schema sketches in `lib/datalog/demo.sx`:

From ce8fed6b224f6efb6902fd4be9fe262159075e65 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:08:58 +0000
Subject: [PATCH 38/89] datalog: refresh datalog.sx API doc with magic-sets +
 later additions

---
 lib/datalog/datalog.sx | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)

diff --git a/lib/datalog/datalog.sx b/lib/datalog/datalog.sx
index 8189ec09..54e2ce7d 100644
--- a/lib/datalog/datalog.sx
+++ b/lib/datalog/datalog.sx
@@ -14,6 +14,7 @@
 ;;   (load "lib/datalog/strata.sx")
 ;;   (load "lib/datalog/eval.sx")
 ;;   (load "lib/datalog/api.sx")
+;;   (load "lib/datalog/magic.sx")
 ;;   (load "lib/datalog/demo.sx")
 ;;
 ;; (lib/datalog/conformance.sh runs this load list automatically.)
@@ -35,10 +36,15 @@
 ;;     (dl-rule head body)              dict-rule constructor
 ;;     (dl-add-clause! db clause)       parser output → fact or rule
 ;;     (dl-load-program! db src)        string source
+;;     (dl-set-strategy! db strategy)   :semi-naive default; :magic
+;;                                        is informational, use
+;;                                        dl-magic-query for actual
+;;                                        magic-sets evaluation
 ;;
 ;;   Mutation:
 ;;     (dl-assert! db lit)              add + re-saturate
 ;;     (dl-retract! db lit)             drop EDB, wipe IDB, re-saturate
+;;     (dl-clear-idb! db)               wipe rule-headed relations
 ;;
 ;;   Query / inspection:
 ;;     (dl-saturate! db)                stratified semi-naive default
@@ -48,6 +54,18 @@
 ;;     (dl-relation db rel-name)        tuple list for a relation
 ;;     (dl-rules db)                    rule list
 ;;     (dl-fact-count db)               total ground tuples
+;;     (dl-summary db)                  {<rel>: count} for inspection
+;;
+;;   Single-call convenience:
+;;     (dl-eval source query-source)         parse, run, return substs
+;;     (dl-eval-magic source query-source)   single-goal → magic-sets
+;;
+;;   Magic-sets (lib/datalog/magic.sx):
+;;     (dl-adorn-goal goal)             "b/f" adornment string
+;;     (dl-rule-sips rule head-adn)     SIPS analysis per body lit
+;;     (dl-magic-rewrite rules rel adn args)
+;;                                       rewritten rule list + seed
+;;     (dl-magic-query db query-goal)    end-to-end magic-sets query
 ;;
 ;; ── Body literal kinds ─────────────────────────────────────────────
 ;;

From 4a643a5c52b8ecdad7e2ae3476462ddbdcf11fba Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:11:00 +0000
Subject: [PATCH 39/89] datalog-plan: rolling status header (208/208, all
 phases addressed)

---
 plans/datalog-on-sx.md | 13 +++++++++++++
 1 file changed, 13 insertions(+)

diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 8a6a8791..802451fb 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -13,6 +13,19 @@ End-state goal: **full core Datalog** (facts, rules, stratified negation, aggreg
 recursion) with a clean SX query API, and a demonstration of Datalog as a query engine
 for rose-ash data (e.g. federation graph, content relationships).
 
+## Status (rolling)
+
+`bash lib/datalog/conformance.sh` → **208/208 across 11 suites**
+(tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
+api, magic, demo). Source is ~3000 LOC, tests ~2700 LOC, public API
+documented in `lib/datalog/datalog.sx`.
+
+Phases 1–9 are functionally complete; Phase 10 covers the rose-ash
+domain demos (in `lib/datalog/demo.sx`). The PostgreSQL loader and
+`/internal/datalog` HTTP endpoint listed in Phase 10 require service-
+tree edits outside `lib/datalog/**` and are flagged as out-of-scope
+for this loop.
+
 ## Ground rules
 
 - **Scope:** only touch `lib/datalog/**` and `plans/datalog-on-sx.md`. Do **not** edit

From 43fa31375d5496d410834812e5e9007907d57d00 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:13:13 +0000
Subject: [PATCH 40/89] datalog: magic-vs-semi work-shape test on chain-12
 (209/209)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Demonstrates the practical effect of goal-directed evaluation:
chain of 12 nodes, semi-naive derives the full ancestor closure
(78 = 12·13/2 tuples), while a magic-rooted query at node 0
returns only its 12 descendants. Concrete check that magic
limits derivation to the query's transitive cone.
---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 29 +++++++++++++++++++++++++++++
 3 files changed, 35 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 2884cc4d..1a302808 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 208,
+  "total_passed": 209,
   "total_failed": 0,
-  "total": 208,
+  "total": 209,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
     {"name":"api","passed":17,"failed":0,"total":17},
-    {"name":"magic","passed":21,"failed":0,"total":21},
+    {"name":"magic","passed":22,"failed":0,"total":22},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T10:06:36+00:00"
+  "generated": "2026-05-08T10:13:00+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 850f96c0..1e78dc45 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**208 / 208 passing** (0 failure(s)).
+**209 / 209 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
 | api | 17 | 17 | ok |
-| magic | 21 | 21 | ok |
+| magic | 22 | 22 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index c9e82183..6527aa42 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -227,6 +227,35 @@
       ;; Magic-sets benefit: query touches only one cluster of a
       ;; multi-component graph. Semi-naive derives the full closure
       ;; over both clusters; magic only the seeded one.
+      ;; Magic-vs-semi work shape: chain of 12. Semi-naive
+      ;; derives the full closure (78 = 12·13/2). A magic query
+      ;; rooted at node 0 returns the 12 descendants only —
+      ;; demonstrating that magic limits derivation to the
+      ;; query's transitive cone.
+      (dl-mt-test! "magic vs semi work-shape on chain-12"
+        (let
+          ((source (str
+                     "parent(0, 1). parent(1, 2). parent(2, 3). "
+                     "parent(3, 4). parent(4, 5). parent(5, 6). "
+                     "parent(6, 7). parent(7, 8). parent(8, 9). "
+                     "parent(9, 10). parent(10, 11). parent(11, 12). "
+                     "ancestor(X, Y) :- parent(X, Y). "
+                     "ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (let
+            ((db1 (dl-make-db)) (db2 (dl-make-db)))
+            (do
+              (dl-load-program! db1 source)
+              (dl-saturate! db1)
+              (dl-load-program! db2 source)
+              (let
+                ((semi-count (len (dl-relation db1 "ancestor")))
+                  (magic-count
+                    (len (dl-magic-query
+                           db2 (list (quote ancestor) 0 (quote X))))))
+                ;; Magic returns only descendants of 0 (12 of them).
+                (and (= semi-count 78) (= magic-count 12))))))
+        true)
+
       (dl-mt-test! "magic skips irrelevant clusters"
         (let
           ;; Two disjoint chains. Query is rooted in cluster 1.

From fc6979a371abd2a46c3d7e74b33918ee0ddfbea7 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:15:29 +0000
Subject: [PATCH 41/89] datalog: dl-saturated? fixpoint predicate (212/212)

Returns true iff one more saturation step would derive no new
tuples. Walks every rule under the current bindings and short-
circuits as soon as one derivation would add a fresh tuple.
Useful in tests that want to assert "no work left" after a call,
or for tooling that wants to know whether `dl-saturate!` would
do anything.

3 new eval tests cover the after-saturation, before-saturation,
and after-assert states.
---
 lib/datalog/eval.sx         | 29 +++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 25 +++++++++++++++++++++++++
 4 files changed, 60 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 32db2f7f..e0fc1554 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -134,6 +134,35 @@
           (dl-find-bindings body db (dl-empty-subst)))
         new?))))
 
+;; Returns true iff one more saturation step would derive no new
+;; tuples (i.e. the db is at fixpoint). Useful in tests that want
+;; to assert "no work left" after a saturation call. Works under
+;; either saturator since both compute the same fixpoint.
+(define
+  dl-saturated?
+  (fn
+    (db)
+    (let ((any-new false))
+      (do
+        (for-each
+          (fn
+            (rule)
+            (when (not any-new)
+              (for-each
+                (fn
+                  (s)
+                  (let ((derived (dl-apply-subst (get rule :head) s)))
+                    (when
+                      (and (not any-new)
+                           (not (dl-tuple-member?
+                                  derived
+                                  (dl-rel-tuples
+                                    db (dl-rel-name derived)))))
+                      (set! any-new true))))
+                (dl-find-bindings (get rule :body) db (dl-empty-subst)))))
+          (dl-rules db))
+        (not any-new)))))
+
 (define
   dl-saturate-naive!
   (fn
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 1a302808..95bc068c 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 209,
+  "total_passed": 212,
   "total_failed": 0,
-  "total": 209,
+  "total": 212,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":25,"failed":0,"total":25},
+    {"name":"eval","passed":28,"failed":0,"total":28},
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":22,"failed":0,"total":22},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T10:13:00+00:00"
+  "generated": "2026-05-08T10:15:09+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 1e78dc45..4cb73b51 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**209 / 209 passing** (0 failure(s)).
+**212 / 212 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
-| eval | 25 | 25 | ok |
+| eval | 28 | 28 | ok |
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 8030f3f1..9c688f86 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -258,6 +258,31 @@
           (do (dl-set-strategy! db :magic) (dl-get-strategy db)))
         :magic)
 
+      ;; dl-saturated?: no-work-left predicate.
+      (dl-et-test! "saturated? after saturation"
+        (let ((db (dl-program
+                    "parent(a, b).
+                     ancestor(X, Y) :- parent(X, Y).")))
+          (do (dl-saturate! db) (dl-saturated? db)))
+        true)
+
+      (dl-et-test! "saturated? before saturation"
+        (let ((db (dl-program
+                    "parent(a, b).
+                     ancestor(X, Y) :- parent(X, Y).")))
+          (dl-saturated? db))
+        false)
+
+      (dl-et-test! "saturated? after assert"
+        (let ((db (dl-program
+                    "parent(a, b).
+                     ancestor(X, Y) :- parent(X, Y).")))
+          (do
+            (dl-saturate! db)
+            (dl-add-fact! db (list (quote parent) (quote b) (quote c)))
+            (dl-saturated? db)))
+        false)
+
       (dl-et-test-set! "magic-set still derives correctly"
         (let
           ((db (dl-program

From 9695d31dab67c50425d876cc580de79622448c11 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:17:44 +0000
Subject: [PATCH 42/89] datalog: dl-rules-of relation-inspection helper
 (214/214)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

(dl-rules-of db rel-name) → list of rules with head matching
the given relation name. Useful for tooling and debugging
("show me how this relation is derived") without exposing the
internal :rules list directly.

2 new api tests cover hit and miss cases.
---
 lib/datalog/api.sx          | 18 ++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/api.sx    | 14 ++++++++++++++
 4 files changed, 38 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/api.sx b/lib/datalog/api.sx
index 07fcea10..925c8728 100644
--- a/lib/datalog/api.sx
+++ b/lib/datalog/api.sx
@@ -198,6 +198,24 @@
                 (dl-magic-query db (first qbody)))
               (else (dl-query db qbody)))))))))
 
+;; List rules whose head's relation matches `rel-name`. Useful for
+;; inspection ("show me how this relation is derived") without
+;; exposing the internal `:rules` list.
+(define
+  dl-rules-of
+  (fn
+    (db rel-name)
+    (let ((out (list)))
+      (do
+        (for-each
+          (fn
+            (rule)
+            (when
+              (= (dl-rel-name (get rule :head)) rel-name)
+              (append! out rule)))
+          (dl-rules db))
+        out))))
+
 (define
   dl-rule-head-rels
   (fn
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 95bc068c..c34b0adb 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 212,
+  "total_passed": 214,
   "total_failed": 0,
-  "total": 212,
+  "total": 214,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -12,9 +12,9 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
-    {"name":"api","passed":17,"failed":0,"total":17},
+    {"name":"api","passed":19,"failed":0,"total":19},
     {"name":"magic","passed":22,"failed":0,"total":22},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T10:15:09+00:00"
+  "generated": "2026-05-08T10:17:32+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 4cb73b51..8633cec0 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**212 / 212 passing** (0 failure(s)).
+**214 / 214 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,6 +12,6 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
-| api | 17 | 17 | ok |
+| api | 19 | 19 | ok |
 | magic | 22 | 22 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
index b2334dff..7cddd4cb 100644
--- a/lib/datalog/tests/api.sx
+++ b/lib/datalog/tests/api.sx
@@ -213,6 +213,20 @@
           "?- p(X), q(X).")
         (list {:X 2} {:X 3}))
 
+      ;; dl-rules-of: rules with head matching a relation name.
+      (dl-api-test! "dl-rules-of count"
+        (let
+          ((db (dl-program
+                 "p(1). q(X) :- p(X). r(X) :- p(X). q(2).")))
+          (len (dl-rules-of db "q")))
+        1)
+
+      (dl-api-test! "dl-rules-of empty"
+        (let
+          ((db (dl-program "p(1). p(2).")))
+          (len (dl-rules-of db "q")))
+        0)
+
       ;; dl-clear-idb!: wipe rule-headed relations.
       (dl-api-test! "dl-clear-idb! wipes IDB"
         (let

From 7a64be22d8af17e5c5b302020a365d339ea41405 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:19:58 +0000
Subject: [PATCH 43/89] =?UTF-8?q?datalog:=20dl-eval=20=E2=89=A1=20dl-eval-?=
 =?UTF-8?q?magic=20equivalence=20test=20(215/215)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/api.sx    | 14 ++++++++++++++
 3 files changed, 20 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index c34b0adb..26342bda 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 214,
+  "total_passed": 215,
   "total_failed": 0,
-  "total": 214,
+  "total": 215,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -12,9 +12,9 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":18,"failed":0,"total":18},
-    {"name":"api","passed":19,"failed":0,"total":19},
+    {"name":"api","passed":20,"failed":0,"total":20},
     {"name":"magic","passed":22,"failed":0,"total":22},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T10:17:32+00:00"
+  "generated": "2026-05-08T10:19:48+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 8633cec0..c97ea81e 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**214 / 214 passing** (0 failure(s)).
+**215 / 215 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,6 +12,6 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 18 | 18 | ok |
-| api | 19 | 19 | ok |
+| api | 20 | 20 | ok |
 | magic | 22 | 22 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
index 7cddd4cb..b46df8f8 100644
--- a/lib/datalog/tests/api.sx
+++ b/lib/datalog/tests/api.sx
@@ -261,6 +261,20 @@
           "?- ancestor(a, X).")
         (list {:X (quote b)} {:X (quote c)}))
 
+      ;; Equivalence: dl-eval and dl-eval-magic produce the same
+      ;; answers for any well-formed query (magic-sets is a perf
+      ;; alternative, not a semantic change).
+      (dl-api-test! "dl-eval ≡ dl-eval-magic on ancestor"
+        (let
+          ((source "parent(a, b). parent(b, c). parent(c, d).
+                    ancestor(X, Y) :- parent(X, Y).
+                    ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z)."))
+          (let
+            ((semi (dl-eval source "?- ancestor(a, X)."))
+              (magic (dl-eval-magic source "?- ancestor(a, X).")))
+            (= (len semi) (len magic))))
+        true)
+
       ;; Comprehensive integration: recursion + stratified negation
       ;; + aggregation + comparison composed in a single program.
       ;; (Uses _Anything as a regular var instead of `_` so the

From de734b27b81036f473809688508055b11555d3e6 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:22:03 +0000
Subject: [PATCH 44/89] datalog: group-by-via-aggregate-in-rule test (216/216)

---
 lib/datalog/scoreboard.json     |  8 ++++----
 lib/datalog/scoreboard.md       |  4 ++--
 lib/datalog/tests/aggregates.sx | 16 ++++++++++++++++
 3 files changed, 22 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 26342bda..82d72289 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 215,
+  "total_passed": 216,
   "total_failed": 0,
-  "total": 215,
+  "total": 216,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -11,10 +11,10 @@
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
-    {"name":"aggregates","passed":18,"failed":0,"total":18},
+    {"name":"aggregates","passed":19,"failed":0,"total":19},
     {"name":"api","passed":20,"failed":0,"total":20},
     {"name":"magic","passed":22,"failed":0,"total":22},
     {"name":"demo","passed":18,"failed":0,"total":18}
   ],
-  "generated": "2026-05-08T10:19:48+00:00"
+  "generated": "2026-05-08T10:21:54+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index c97ea81e..9da23bc9 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**215 / 215 passing** (0 failure(s)).
+**216 / 216 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -11,7 +11,7 @@
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
-| aggregates | 18 | 18 | ok |
+| aggregates | 19 | 19 | ok |
 | api | 20 | 20 | ok |
 | magic | 22 | 22 | ok |
 | demo | 18 | 18 | ok |
diff --git a/lib/datalog/tests/aggregates.sx b/lib/datalog/tests/aggregates.sx
index 6392ce29..bca13375 100644
--- a/lib/datalog/tests/aggregates.sx
+++ b/lib/datalog/tests/aggregates.sx
@@ -227,6 +227,22 @@
         (list {:L (list)}))
 
       ;; Aggregate vs single distinct.
+      ;; Group-by via aggregate-in-rule-body. Per-user friend count
+      ;; over a friends relation. The U var is bound by the prior
+      ;; positive lit u(U) so the aggregate counts only U-rooted
+      ;; friends per group.
+      (dl-at-test-set! "group-by per-user friend count"
+        (dl-query
+          (dl-program
+            "u(alice). u(bob). u(carol).
+             f(alice, x). f(alice, y). f(bob, x).
+             counts(U, N) :- u(U), count(N, X, f(U, X)).")
+          (list (quote counts) (quote U) (quote N)))
+        (list
+          {:U (quote alice) :N 2}
+          {:U (quote bob) :N 1}
+          {:U (quote carol) :N 0}))
+
       ;; Stratification: recursion through aggregation is rejected.
       (dl-at-test! "agg recursion rejected"
         (dl-at-throws?

From e0c7de1a1c1e63b3b8c3aeac4d521410b16d555e Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:24:10 +0000
Subject: [PATCH 45/89] datalog: org-chart + transitive headcount demo
 (219/219)

Adds dl-demo-org-rules: (subordinate Mgr Emp) over a (manager
EMP MGR) graph, and (headcount Mgr N) using count aggregation
grouped by manager. Demonstrates real-world hierarchy queries
(e.g. "everyone reporting up to the CEO") + per-manager rollup.

3 new demo tests: transitive subordinates of CEO (5 entries),
CEO headcount, and direct manager headcount.
---
 lib/datalog/demo.sx         | 21 ++++++++++++++++++++-
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/demo.sx   | 36 ++++++++++++++++++++++++++++++++++++
 4 files changed, 62 insertions(+), 7 deletions(-)

diff --git a/lib/datalog/demo.sx b/lib/datalog/demo.sx
index f15dd645..657c64c1 100644
--- a/lib/datalog/demo.sx
+++ b/lib/datalog/demo.sx
@@ -6,7 +6,7 @@
 ;; below show the shape of queries we want, and the test suite runs
 ;; them against synthetic in-memory tuples loaded via dl-program-data.
 ;;
-;; Six thematic demos:
+;; Seven thematic demos:
 ;;
 ;;   1. Federation — follow graph, transitive reach, mutuals, FOAF.
 ;;   2. Content    — posts, tags, likes, popularity, "for you" feed.
@@ -15,6 +15,7 @@
 ;;                      follow (transitively)" multi-domain query.
 ;;   5. Tag co-occurrence — distinct (T1, T2) pairs with counts.
 ;;   6. Shortest path  — weighted-DAG path enumeration + min agg.
+;;   7. Org chart      — transitive subordinate + headcount per mgr.
 
 ;; ── Demo 1: federation follow graph ─────────────────────────────
 ;; EDB: (follows ACTOR-A ACTOR-B) — A follows B.
@@ -132,6 +133,24 @@
        (is W (+ W1 W2)))
      (shortest X Y W <- (path X Y _) (min W C (path X Y C))))))
 
+;; ── Demo 7: org chart + transitive headcount ───────────────────
+;; Manager graph: each employee has a single manager. Compute the
+;; transitive subordinate set and headcount per manager.
+;;
+;; EDB:
+;;   (manager EMP MGR)            — EMP reports directly to MGR
+;; IDB:
+;;   (subordinate MGR EMP)        — EMP is in MGR's subtree
+;;   (headcount MGR N)            — number of subordinates under MGR
+(define
+  dl-demo-org-rules
+  (quote
+    ((subordinate Mgr Emp <- (manager Emp Mgr))
+     (subordinate Mgr Emp
+       <- (manager Mid Mgr) (subordinate Mid Emp))
+     (headcount Mgr N
+       <- (subordinate Mgr Anyone) (count N E (subordinate Mgr E))))))
+
 ;; ── Loader stub ──────────────────────────────────────────────────
 ;; Wiring to PostgreSQL would replace these helpers with calls into
 ;; rose-ash's internal HTTP RPC (fetch_data → /internal/data/...).
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 82d72289..28545113 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 216,
+  "total_passed": 219,
   "total_failed": 0,
-  "total": 216,
+  "total": 219,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -14,7 +14,7 @@
     {"name":"aggregates","passed":19,"failed":0,"total":19},
     {"name":"api","passed":20,"failed":0,"total":20},
     {"name":"magic","passed":22,"failed":0,"total":22},
-    {"name":"demo","passed":18,"failed":0,"total":18}
+    {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T10:21:54+00:00"
+  "generated": "2026-05-08T10:23:54+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 9da23bc9..590c3c02 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**216 / 216 passing** (0 failure(s)).
+**219 / 219 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -14,4 +14,4 @@
 | aggregates | 19 | 19 | ok |
 | api | 20 | 20 | ok |
 | magic | 22 | 22 | ok |
-| demo | 18 | 18 | ok |
+| demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/demo.sx b/lib/datalog/tests/demo.sx
index 1559f800..c893ade3 100644
--- a/lib/datalog/tests/demo.sx
+++ b/lib/datalog/tests/demo.sx
@@ -262,6 +262,42 @@
           (quote (shortest a d W)))
         (list))
 
+      ;; ── Org chart + headcount ─────────────────────────────
+      (dl-demo-test-set! "ceo subordinate transitive"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((manager ic1 mgr1) (manager ic2 mgr1)
+               (manager mgr1 vp1) (manager ic3 vp1)
+               (manager vp1 ceo)))
+            dl-demo-org-rules)
+          (quote (subordinate ceo X)))
+        (list
+          {:X (quote vp1)} {:X (quote mgr1)} {:X (quote ic1)}
+          {:X (quote ic2)} {:X (quote ic3)}))
+
+      (dl-demo-test-set! "ceo headcount = 5"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((manager ic1 mgr1) (manager ic2 mgr1)
+               (manager mgr1 vp1) (manager ic3 vp1)
+               (manager vp1 ceo)))
+            dl-demo-org-rules)
+          (quote (headcount ceo N)))
+        (list {:N 5}))
+
+      (dl-demo-test-set! "mgr1 headcount = 2"
+        (dl-query
+          (dl-demo-make
+            (quote
+              ((manager ic1 mgr1) (manager ic2 mgr1)
+               (manager mgr1 vp1) (manager ic3 vp1)
+               (manager vp1 ceo)))
+            dl-demo-org-rules)
+          (quote (headcount mgr1 N)))
+        (list {:N 2}))
+
       (dl-demo-test-set! "no access without grant"
         (dl-query
           (dl-demo-make

From 30880927f22361ea759ea161c860bca89e665c89 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:24:45 +0000
Subject: [PATCH 46/89] datalog-plan: rolling status update (219/219, 7 demos)

---
 plans/datalog-on-sx.md | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 802451fb..3670cf02 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,16 +15,17 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **208/208 across 11 suites**
+`bash lib/datalog/conformance.sh` → **219/219 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
-api, magic, demo). Source is ~3000 LOC, tests ~2700 LOC, public API
+api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
 
 Phases 1–9 are functionally complete; Phase 10 covers the rose-ash
-domain demos (in `lib/datalog/demo.sx`). The PostgreSQL loader and
-`/internal/datalog` HTTP endpoint listed in Phase 10 require service-
-tree edits outside `lib/datalog/**` and are flagged as out-of-scope
-for this loop.
+domain demos (in `lib/datalog/demo.sx` — federation, content,
+permissions, cooking-posts, tag co-occurrence, shortest path, org chart).
+The PostgreSQL loader and `/internal/datalog` HTTP endpoint listed in
+Phase 10 require service-tree edits outside `lib/datalog/**` and are
+flagged as out-of-scope for this loop.
 
 ## Ground rules
 

From 549cb5ea84ae31938a3bdfea9dfabc16dc64024b Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:27:45 +0000
Subject: [PATCH 47/89] datalog: mixed-EDB+IDB-same-relation regression test
 (220/220)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 11 +++++++++++
 3 files changed, 17 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 28545113..43ef5417 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 219,
+  "total_passed": 220,
   "total_failed": 0,
-  "total": 219,
+  "total": 220,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":28,"failed":0,"total":28},
+    {"name":"eval","passed":29,"failed":0,"total":29},
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":22,"failed":0,"total":22},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T10:23:54+00:00"
+  "generated": "2026-05-08T10:27:32+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 590c3c02..65bbd501 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**219 / 219 passing** (0 failure(s)).
+**220 / 220 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
-| eval | 28 | 28 | ok |
+| eval | 29 | 29 | ok |
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 9c688f86..c3e056ea 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -273,6 +273,17 @@
           (dl-saturated? db))
         false)
 
+      ;; A relation can be both EDB-seeded and rule-derived;
+      ;; saturate combines facts + derivations.
+      (dl-et-test-set! "mixed EDB + IDB same relation"
+        (dl-query
+          (dl-program
+            "link(a, b). link(c, d). link(e, c).
+             via(a, e).
+             link(X, Y) :- via(X, M), link(M, Y).")
+          (list (quote link) (quote a) (quote X)))
+        (list {:X (quote b)} {:X (quote c)}))
+
       (dl-et-test! "saturated? after assert"
         (let ((db (dl-program
                     "parent(a, b).

From 5a3db1a4582c88e3d849cdae7d3a739bb78ec2ea Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:29:14 +0000
Subject: [PATCH 48/89] datalog: magic preserves arithmetic test (221/221)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 12 ++++++++++++
 3 files changed, 18 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 43ef5417..b1366855 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 220,
+  "total_passed": 221,
   "total_failed": 0,
-  "total": 220,
+  "total": 221,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":19,"failed":0,"total":19},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":22,"failed":0,"total":22},
+    {"name":"magic","passed":23,"failed":0,"total":23},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T10:27:32+00:00"
+  "generated": "2026-05-08T10:29:04+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 65bbd501..dda4e89d 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**220 / 220 passing** (0 failure(s)).
+**221 / 221 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 19 | 19 | ok |
 | api | 20 | 20 | ok |
-| magic | 22 | 22 | ok |
+| magic | 23 | 23 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 6527aa42..d5a6ca0f 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -256,6 +256,18 @@
                 (and (= semi-count 78) (= magic-count 12))))))
         true)
 
+      ;; Magic + arithmetic: rules with `is` clauses pass through
+      ;; the rewriter unchanged (built-ins aren't propagated).
+      (dl-mt-test! "magic preserves arithmetic"
+        (let
+          ((source "n(1). n(2). n(3).
+                    doubled(X, Y) :- n(X), is(Y, *(X, 2))."))
+          (let
+            ((semi (dl-eval source "?- doubled(2, Y)."))
+              (magic (dl-eval-magic source "?- doubled(2, Y).")))
+            (= (len semi) (len magic))))
+        true)
+
       (dl-mt-test! "magic skips irrelevant clusters"
         (let
           ;; Two disjoint chains. Query is rooted in cluster 1.

From a648247ae40a2b130d8da44f12580e69f7d04575 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:32:01 +0000
Subject: [PATCH 49/89] datalog: dl-magic-query falls back on built-in/agg/neg
 goals (222/222)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bug: dl-magic-query was always trying to seed a magic_<rel>^<adn>
fact for the query goal. For aggregate goals like (count N X (p X))
this produced a non-ground "fact" (magic_count^... N X (p X)) and
dl-add-fact! correctly rejected it, surfacing as an error.

Fix: dl-magic-query now detects built-in / aggregate / negation
goals up front and dispatches to plain dl-query for those cases —
magic-sets only applies to positive non-builtin literals against
rule-defined relations. Other shapes don't benefit from the
rewrite anyway.

1 new test confirms (count N X (p X)) returns the expected
{:N 3} via dl-magic-query.
---
 lib/datalog/magic.sx        | 30 ++++++++++++++++++++----------
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 12 ++++++++++++
 4 files changed, 38 insertions(+), 16 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index 7ea1b548..4a2953f0 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -376,16 +376,26 @@
   dl-magic-query
   (fn
     (db query-goal)
-    (let
-      ((query-rel (dl-rel-name query-goal))
-        (query-adn (dl-adorn-goal query-goal)))
-      (let
-        ((query-args (dl-bound-args query-goal query-adn))
-          (rules (dl-rules db)))
+    ;; Magic-sets only applies to positive non-builtin / non-aggregate
+    ;; literals against rule-defined relations. For other goal shapes
+    ;; (built-ins, aggregates, EDB-only relations) the seed is either
+    ;; non-ground or unused; fall back to dl-query.
+    (cond
+      ((or (dl-builtin? query-goal)
+           (dl-aggregate? query-goal)
+           (and (dict? query-goal) (has-key? query-goal :neg)))
+        (dl-query db query-goal))
+      (else
         (let
-          ((rewritten (dl-magic-rewrite rules query-rel query-adn query-args))
-            (mdb (dl-make-db))
-            (rule-heads (dl-magic-rule-heads rules)))
+          ((query-rel (dl-rel-name query-goal))
+            (query-adn (dl-adorn-goal query-goal)))
+          (let
+            ((query-args (dl-bound-args query-goal query-adn))
+              (rules (dl-rules db)))
+            (let
+              ((rewritten (dl-magic-rewrite rules query-rel query-adn query-args))
+                (mdb (dl-make-db))
+                (rule-heads (dl-magic-rule-heads rules)))
           (do
             ;; Copy EDB facts (relations not headed by any caller rule).
             (for-each
@@ -400,4 +410,4 @@
             ;; Seed + rewritten rules.
             (dl-add-fact! mdb (get rewritten :seed))
             (for-each (fn (r) (dl-add-rule! mdb r)) (get rewritten :rules))
-            (dl-query mdb query-goal)))))))
+            (dl-query mdb query-goal)))))))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index b1366855..2c9f5834 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 221,
+  "total_passed": 222,
   "total_failed": 0,
-  "total": 221,
+  "total": 222,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":19,"failed":0,"total":19},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":23,"failed":0,"total":23},
+    {"name":"magic","passed":24,"failed":0,"total":24},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T10:29:04+00:00"
+  "generated": "2026-05-08T10:31:43+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index dda4e89d..7b0b251a 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**221 / 221 passing** (0 failure(s)).
+**222 / 222 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 19 | 19 | ok |
 | api | 20 | 20 | ok |
-| magic | 23 | 23 | ok |
+| magic | 24 | 24 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index d5a6ca0f..e9ebefb3 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -197,6 +197,18 @@
         6)
 
       ;; dl-magic-query: end-to-end driver, doesn't mutate caller's db.
+      ;; dl-magic-query falls back to dl-query for built-in,
+      ;; aggregate, and negation goals (the magic seed would
+      ;; otherwise be non-ground).
+      (dl-mt-test! "magic-query falls back on aggregate"
+        (let
+          ((r (dl-magic-query
+                (dl-program "p(1). p(2). p(3).")
+                (list (quote count) (quote N) (quote X)
+                      (list (quote p) (quote X))))))
+          (and (= (len r) 1) (= (get (first r) "N") 3)))
+        true)
+
       (dl-mt-test! "magic-query equivalent to dl-query"
         (let
           ((db (dl-program

From 370df5b8e5749d22b9d3c8ba8091d36cd4e81576 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:33:45 +0000
Subject: [PATCH 50/89] datalog: diagonal query (repeated var) regression test
 (223/223)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 10 ++++++++++
 3 files changed, 16 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 2c9f5834..8b9218d9 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 222,
+  "total_passed": 223,
   "total_failed": 0,
-  "total": 222,
+  "total": 223,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":29,"failed":0,"total":29},
+    {"name":"eval","passed":30,"failed":0,"total":30},
     {"name":"builtins","passed":19,"failed":0,"total":19},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":24,"failed":0,"total":24},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T10:31:43+00:00"
+  "generated": "2026-05-08T10:33:34+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 7b0b251a..ebeab7d4 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**222 / 222 passing** (0 failure(s)).
+**223 / 223 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
-| eval | 29 | 29 | ok |
+| eval | 30 | 30 | ok |
 | builtins | 19 | 19 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index c3e056ea..8bc70a2b 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -273,6 +273,16 @@
           (dl-saturated? db))
         false)
 
+      ;; Repeated variable (diagonal): p(X, X) only matches tuples
+      ;; whose two args are equal. The unifier handles this via the
+      ;; subst chain — first occurrence binds X, second occurrence
+      ;; checks against the binding.
+      (dl-et-test-set! "diagonal query"
+        (dl-query
+          (dl-program "p(1, 1). p(2, 3). p(4, 4). p(5, 5).")
+          (list (quote p) (quote X) (quote X)))
+        (list {:X 1} {:X 4} {:X 5}))
+
       ;; A relation can be both EDB-seeded and rule-derived;
       ;; saturate combines facts + derivations.
       (dl-et-test-set! "mixed EDB + IDB same relation"

From ec7e4dd5c4ac88e7ba530ccb20f3d6d76331ad8c Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:36:13 +0000
Subject: [PATCH 51/89] datalog: bounded-successor regression test (224/224)

---
 lib/datalog/scoreboard.json   |  8 ++++----
 lib/datalog/scoreboard.md     |  4 ++--
 lib/datalog/tests/builtins.sx | 11 +++++++++++
 3 files changed, 17 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 8b9218d9..9692afe3 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,14 +1,14 @@
 {
   "lang": "datalog",
-  "total_passed": 223,
+  "total_passed": 224,
   "total_failed": 0,
-  "total": 223,
+  "total": 224,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":30,"failed":0,"total":30},
-    {"name":"builtins","passed":19,"failed":0,"total":19},
+    {"name":"builtins","passed":20,"failed":0,"total":20},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":19,"failed":0,"total":19},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":24,"failed":0,"total":24},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T10:33:34+00:00"
+  "generated": "2026-05-08T10:36:02+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index ebeab7d4..7810f66a 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**223 / 223 passing** (0 failure(s)).
+**224 / 224 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -8,7 +8,7 @@
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
 | eval | 30 | 30 | ok |
-| builtins | 19 | 19 | ok |
+| builtins | 20 | 20 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 19 | 19 | ok |
diff --git a/lib/datalog/tests/builtins.sx b/lib/datalog/tests/builtins.sx
index f5136134..840b30af 100644
--- a/lib/datalog/tests/builtins.sx
+++ b/lib/datalog/tests/builtins.sx
@@ -179,6 +179,17 @@
           ((db (dl-program "n(0). n(1). n(2). n(3). n(4). n(5). n(6). n(7). n(8). n(9).\n                  big(X) :- n(X), >=(X, 5).")))
           (do (dl-saturate! db) (len (dl-relation db "big"))))
         5)
+      ;; Bounded successor: a recursive rule with a comparison
+      ;; guard terminates because the Herbrand base is effectively
+      ;; bounded.
+      (dl-bt-test-set! "bounded successor"
+        (dl-query
+          (dl-program
+            "nat(0).
+             nat(Y) :- nat(X), is(Y, +(X, 1)), <(Y, 5).")
+          (list (quote nat) (quote X)))
+        (list {:X 0} {:X 1} {:X 2} {:X 3} {:X 4}))
+
       (dl-bt-test!
         "unsafe — comparison without binder"
         (dl-bt-throws? (fn () (dl-program "p(X) :- <(X, 5).")))

From 254052a43bef949c569dbc9642443b63f7a1890d Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:36:40 +0000
Subject: [PATCH 52/89] datalog-plan: rolling status 224/224

---
 plans/datalog-on-sx.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 3670cf02..98c47837 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **219/219 across 11 suites**
+`bash lib/datalog/conformance.sh` → **224/224 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.

From 96f66d3596865f14da065be03779501a6766465a Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 10:41:36 +0000
Subject: [PATCH 53/89] datalog: dl-magic-query handles mixed EDB+IDB relations
 (225/225)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bug: dl-magic-query was skipping EDB facts for relations that had
rules ("rule-headed"). When a single relation has both EDB facts
and rules deriving more (mixed EDB+IDB), the rewritten run would
miss the EDB portion entirely, producing too few or zero results.

Fix: copy ALL existing facts to the internal mdb regardless of
whether the relation has rules. EDB-only relations bring their
tuples; mixed relations bring both EDB and any pre-saturated IDB
(which the rewritten rules would re-derive anyway).

1 new test: link relation seeded with 3 EDB tuples plus a
recursive rule via via/2. dl-magic-query rooted at `a` returns
2 results (a→b direct, a→c via via(a,e), link(e,c)).
---
 lib/datalog/magic.sx        | 15 +++++++++------
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 13 +++++++++++++
 4 files changed, 28 insertions(+), 12 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index 4a2953f0..97168a4e 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -397,15 +397,18 @@
                 (mdb (dl-make-db))
                 (rule-heads (dl-magic-rule-heads rules)))
           (do
-            ;; Copy EDB facts (relations not headed by any caller rule).
+            ;; Copy ALL existing facts. EDB-only relations bring their
+            ;; tuples; mixed EDB+IDB relations bring both their EDB
+            ;; portion and any pre-saturated IDB tuples (which the
+            ;; rewritten rules would re-derive anyway). Skipping facts
+            ;; for rule-headed relations would leave the magic run
+            ;; without the EDB portion of mixed relations.
             (for-each
               (fn
                 (rel)
-                (when
-                  (not (dl-member-string? rel rule-heads))
-                  (for-each
-                    (fn (t) (dl-add-fact! mdb t))
-                    (dl-rel-tuples db rel))))
+                (for-each
+                  (fn (t) (dl-add-fact! mdb t))
+                  (dl-rel-tuples db rel)))
               (keys (get db :facts)))
             ;; Seed + rewritten rules.
             (dl-add-fact! mdb (get rewritten :seed))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 9692afe3..a566115b 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 224,
+  "total_passed": 225,
   "total_failed": 0,
-  "total": 224,
+  "total": 225,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":19,"failed":0,"total":19},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":24,"failed":0,"total":24},
+    {"name":"magic","passed":25,"failed":0,"total":25},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T10:36:02+00:00"
+  "generated": "2026-05-08T10:40:13+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 7810f66a..a6d1976d 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**224 / 224 passing** (0 failure(s)).
+**225 / 225 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 19 | 19 | ok |
 | api | 20 | 20 | ok |
-| magic | 24 | 24 | ok |
+| magic | 25 | 25 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index e9ebefb3..90855cd2 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -197,6 +197,19 @@
         6)
 
       ;; dl-magic-query: end-to-end driver, doesn't mutate caller's db.
+      ;; Mixed EDB + IDB: a relation can be both EDB-seeded and
+      ;; rule-derived. dl-magic-query must include the EDB portion
+      ;; even though the relation has rules.
+      (dl-mt-test! "magic mixed EDB+IDB"
+        (len
+          (dl-magic-query
+            (dl-program
+              "link(a, b). link(c, d). link(e, c).
+               via(a, e).
+               link(X, Y) :- via(X, M), link(M, Y).")
+            (list (quote link) (quote a) (quote X))))
+        2)
+
       ;; dl-magic-query falls back to dl-query for built-in,
       ;; aggregate, and negation goals (the magic seed would
       ;; otherwise be non-ground).

From d20df7aa8c95af5efa1f894c633f766aeea48083 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 12:28:52 +0000
Subject: [PATCH 54/89] datalog: magic over rule with aggregate body literal
 (226/226)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 18 ++++++++++++++++++
 3 files changed, 24 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index a566115b..c89da138 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 225,
+  "total_passed": 226,
   "total_failed": 0,
-  "total": 225,
+  "total": 226,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":19,"failed":0,"total":19},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":25,"failed":0,"total":25},
+    {"name":"magic","passed":26,"failed":0,"total":26},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T10:40:13+00:00"
+  "generated": "2026-05-08T12:28:42+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index a6d1976d..b0593332 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**225 / 225 passing** (0 failure(s)).
+**226 / 226 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 19 | 19 | ok |
 | api | 20 | 20 | ok |
-| magic | 25 | 25 | ok |
+| magic | 26 | 26 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 90855cd2..96b9f81e 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -197,6 +197,24 @@
         6)
 
       ;; dl-magic-query: end-to-end driver, doesn't mutate caller's db.
+      ;; Magic over a rule whose body contains an aggregate.
+      ;; The rewriter passes aggregate body lits through unchanged
+      ;; (no propagation generated for them), so semi-naive's count
+      ;; logic still fires correctly under the rewritten program.
+      (dl-mt-test! "magic over rule with aggregate body"
+        (let
+          ((db (dl-program
+                 "post(p1). post(p2). post(p3).
+                  liked(u1, p1). liked(u2, p1). liked(u3, p1).
+                  liked(u1, p2).
+                  rich(P) :- post(P), count(N, U, liked(U, P)),
+                             >=(N, 2).")))
+          (let
+            ((semi (dl-query db (list (quote rich) (quote P))))
+              (magic (dl-magic-query db (list (quote rich) (quote P)))))
+            (= (len semi) (len magic))))
+        true)
+
       ;; Mixed EDB + IDB: a relation can be both EDB-seeded and
       ;; rule-derived. dl-magic-query must include the EDB portion
       ;; even though the relation has rules.

From 5f4defe99eb7fba4b0a0307b81db60e52d4737b8 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 12:31:50 +0000
Subject: [PATCH 55/89] datalog: magic over rule with negation regression test
 (227/227)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 14 ++++++++++++++
 3 files changed, 20 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index c89da138..9d8fb6d2 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 226,
+  "total_passed": 227,
   "total_failed": 0,
-  "total": 226,
+  "total": 227,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":19,"failed":0,"total":19},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":26,"failed":0,"total":26},
+    {"name":"magic","passed":27,"failed":0,"total":27},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T12:28:42+00:00"
+  "generated": "2026-05-08T12:31:39+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index b0593332..98e6ecc0 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**226 / 226 passing** (0 failure(s)).
+**227 / 227 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 19 | 19 | ok |
 | api | 20 | 20 | ok |
-| magic | 26 | 26 | ok |
+| magic | 27 | 27 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 96b9f81e..90b6f75b 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -197,6 +197,20 @@
         6)
 
       ;; dl-magic-query: end-to-end driver, doesn't mutate caller's db.
+      ;; Magic over a rule with negated body literal — propagation
+      ;; rules generated only for positive lits; negated lits pass
+      ;; through unchanged.
+      (dl-mt-test! "magic over rule with negation"
+        (let
+          ((db (dl-program
+                 "u(a). u(b). u(c). banned(b).
+                  active(X) :- u(X), not(banned(X)).")))
+          (let
+            ((semi (dl-query db (list (quote active) (quote X))))
+              (magic (dl-magic-query db (list (quote active) (quote X)))))
+            (= (len semi) (len magic))))
+        true)
+
       ;; Magic over a rule whose body contains an aggregate.
       ;; The rewriter passes aggregate body lits through unchanged
       ;; (no propagation generated for them), so semi-naive's count

From 8e508bc90fdce710c2c084a6490af5e12681c4b5 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 12:35:33 +0000
Subject: [PATCH 56/89] datalog: magic existence check (bb-adornment)
 regression test (228/228)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 17 +++++++++++++++++
 3 files changed, 23 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 9d8fb6d2..72e9732b 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 227,
+  "total_passed": 228,
   "total_failed": 0,
-  "total": 227,
+  "total": 228,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":19,"failed":0,"total":19},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":27,"failed":0,"total":27},
+    {"name":"magic","passed":28,"failed":0,"total":28},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T12:31:39+00:00"
+  "generated": "2026-05-08T12:35:21+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 98e6ecc0..39b7704f 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**227 / 227 passing** (0 failure(s)).
+**228 / 228 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 19 | 19 | ok |
 | api | 20 | 20 | ok |
-| magic | 27 | 27 | ok |
+| magic | 28 | 28 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 90b6f75b..fc4707d3 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -211,6 +211,23 @@
             (= (len semi) (len magic))))
         true)
 
+      ;; All-bound query (existence check) generates an "bb"
+      ;; adornment chain. Verifies the rewriter walks multiple
+      ;; (rel, adn) pairs through the worklist.
+      (dl-mt-test! "magic existence check via bb"
+        (let
+          ((db (dl-program
+                 "parent(a, b). parent(b, c). parent(c, d).
+                  ancestor(X, Y) :- parent(X, Y).
+                  ancestor(X, Z) :- parent(X, Y), ancestor(Y, Z).")))
+          (let
+            ((found (dl-magic-query
+                      db (list (quote ancestor) (quote a) (quote c))))
+              (missing (dl-magic-query
+                         db (list (quote ancestor) (quote a) (quote z)))))
+            (and (= (len found) 1) (= (len missing) 0))))
+        true)
+
       ;; Magic over a rule whose body contains an aggregate.
       ;; The rewriter passes aggregate body lits through unchanged
       ;; (no propagation generated for them), so semi-naive's count

From 9edccb8f3393be3db280aaa6e8f1efdac89d7e9d Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 12:39:04 +0000
Subject: [PATCH 57/89] datalog: bipartite friends-with-hobby join test
 (229/229)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 12 ++++++++++++
 3 files changed, 18 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 72e9732b..2267c839 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 228,
+  "total_passed": 229,
   "total_failed": 0,
-  "total": 228,
+  "total": 229,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":30,"failed":0,"total":30},
+    {"name":"eval","passed":31,"failed":0,"total":31},
     {"name":"builtins","passed":20,"failed":0,"total":20},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":28,"failed":0,"total":28},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T12:35:21+00:00"
+  "generated": "2026-05-08T12:38:51+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 39b7704f..d0fbaa9b 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**228 / 228 passing** (0 failure(s)).
+**229 / 229 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
-| eval | 30 | 30 | ok |
+| eval | 31 | 31 | ok |
 | builtins | 20 | 20 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 8bc70a2b..fafb4c7a 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -273,6 +273,18 @@
           (dl-saturated? db))
         false)
 
+      ;; Bipartite-style join: pair-of-friends who share a hobby.
+      ;; Three-relation join exercising the planner's join order.
+      (dl-et-test-set! "bipartite friends-with-hobby"
+        (dl-query
+          (dl-program
+            "hobby(alice, climb). hobby(bob, paint).
+             hobby(carol, climb).
+             friend(alice, carol). friend(bob, alice).
+             match(A, B, H) :- friend(A, B), hobby(A, H), hobby(B, H).")
+          (list (quote match) (quote A) (quote B) (quote H)))
+        (list {:A (quote alice) :B (quote carol) :H (quote climb)}))
+
       ;; Repeated variable (diagonal): p(X, X) only matches tuples
       ;; whose two args are equal. The unifier handles this via the
       ;; subst chain — first occurrence binds X, second occurrence

From f12edc8fd9df3acc7658a89434fed017da6b3a2f Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 14:08:02 +0000
Subject: [PATCH 58/89] datalog: indirect aggregate cycle rejected (230/230)

---
 lib/datalog/scoreboard.json     |  8 ++++----
 lib/datalog/scoreboard.md       |  4 ++--
 lib/datalog/tests/aggregates.sx | 18 ++++++++++++++++++
 3 files changed, 24 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 2267c839..5c6525fe 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 229,
+  "total_passed": 230,
   "total_failed": 0,
-  "total": 229,
+  "total": 230,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
@@ -11,10 +11,10 @@
     {"name":"builtins","passed":20,"failed":0,"total":20},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
-    {"name":"aggregates","passed":19,"failed":0,"total":19},
+    {"name":"aggregates","passed":20,"failed":0,"total":20},
     {"name":"api","passed":20,"failed":0,"total":20},
     {"name":"magic","passed":28,"failed":0,"total":28},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T12:38:51+00:00"
+  "generated": "2026-05-08T14:07:50+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index d0fbaa9b..d9b0b0c1 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**229 / 229 passing** (0 failure(s)).
+**230 / 230 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -11,7 +11,7 @@
 | builtins | 20 | 20 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
-| aggregates | 19 | 19 | ok |
+| aggregates | 20 | 20 | ok |
 | api | 20 | 20 | ok |
 | magic | 28 | 28 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/aggregates.sx b/lib/datalog/tests/aggregates.sx
index bca13375..63af21dc 100644
--- a/lib/datalog/tests/aggregates.sx
+++ b/lib/datalog/tests/aggregates.sx
@@ -244,6 +244,24 @@
           {:U (quote carol) :N 0}))
 
       ;; Stratification: recursion through aggregation is rejected.
+      ;; Indirect recursion through aggregation also rejected.
+      ;; q -> r (via positive lit), r -> q (via aggregate body).
+      ;; The aggregate edge counts as negation for stratification.
+      (dl-at-test! "indirect agg cycle rejected"
+        (dl-at-throws?
+          (fn ()
+            (let ((db (dl-make-db)))
+              (do
+                (dl-add-rule! db
+                  {:head (list (quote q) (quote N))
+                   :body (list (list (quote r) (quote N)))})
+                (dl-add-rule! db
+                  {:head (list (quote r) (quote N))
+                   :body (list (list (quote count) (quote N) (quote X)
+                                     (list (quote q) (quote X))))})
+                (dl-saturate! db)))))
+        true)
+
       (dl-at-test! "agg recursion rejected"
         (dl-at-throws?
           (fn ()

From 0985dc63862cb07b05b7f02f3ea4e230a10359f5 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 14:12:34 +0000
Subject: [PATCH 59/89] datalog: disjunction via multiple rules test (231/231)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 13 +++++++++++++
 3 files changed, 19 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 5c6525fe..a5648c7c 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 230,
+  "total_passed": 231,
   "total_failed": 0,
-  "total": 230,
+  "total": 231,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":18,"failed":0,"total":18},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":31,"failed":0,"total":31},
+    {"name":"eval","passed":32,"failed":0,"total":32},
     {"name":"builtins","passed":20,"failed":0,"total":20},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":28,"failed":0,"total":28},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T14:07:50+00:00"
+  "generated": "2026-05-08T14:12:22+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index d9b0b0c1..9d109351 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**230 / 230 passing** (0 failure(s)).
+**231 / 231 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 18 | 18 | ok |
 | unify | 28 | 28 | ok |
-| eval | 31 | 31 | ok |
+| eval | 32 | 32 | ok |
 | builtins | 20 | 20 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index fafb4c7a..822e58fb 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -273,6 +273,19 @@
           (dl-saturated? db))
         false)
 
+      ;; Disjunction via multiple rules — Datalog has no `;` in
+      ;; body, so disjunction is expressed as separate rules with
+      ;; the same head. Here plant_based(X) is satisfied by either
+      ;; vegan(X) or vegetarian(X).
+      (dl-et-test-set! "disjunction via multiple rules"
+        (dl-query
+          (dl-program
+            "vegan(alice). vegetarian(bob). meat_eater(carol).
+             plant_based(X) :- vegan(X).
+             plant_based(X) :- vegetarian(X).")
+          (list (quote plant_based) (quote X)))
+        (list {:X (quote alice)} {:X (quote bob)}))
+
       ;; Bipartite-style join: pair-of-friends who share a hobby.
       ;; Three-relation join exercising the planner's join order.
       (dl-et-test-set! "bipartite friends-with-hobby"

From 21c541bd1bae8b0b615be9273c477b3e8ca4ca50 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 14:16:31 +0000
Subject: [PATCH 60/89] datalog: parser rejection tests for invalid relation
 names (233/233)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/parse.sx  | 10 ++++++++++
 3 files changed, 16 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index a5648c7c..e70960f4 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,11 +1,11 @@
 {
   "lang": "datalog",
-  "total_passed": 231,
+  "total_passed": 233,
   "total_failed": 0,
-  "total": 231,
+  "total": 233,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
-    {"name":"parse","passed":18,"failed":0,"total":18},
+    {"name":"parse","passed":20,"failed":0,"total":20},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":32,"failed":0,"total":32},
     {"name":"builtins","passed":20,"failed":0,"total":20},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":28,"failed":0,"total":28},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T14:12:22+00:00"
+  "generated": "2026-05-08T14:16:19+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 9d109351..b200d31a 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,11 +1,11 @@
 # datalog scoreboard
 
-**231 / 231 passing** (0 failure(s)).
+**233 / 233 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
-| parse | 18 | 18 | ok |
+| parse | 20 | 20 | ok |
 | unify | 28 | 28 | ok |
 | eval | 32 | 32 | ok |
 | builtins | 20 | 20 | ok |
diff --git a/lib/datalog/tests/parse.sx b/lib/datalog/tests/parse.sx
index 2af6e6ab..2080e77c 100644
--- a/lib/datalog/tests/parse.sx
+++ b/lib/datalog/tests/parse.sx
@@ -126,6 +126,16 @@
         "underscore var"
         (dl-parse "p(X) :- q(X, _).")
         (list {:body (list (list (quote q) (quote X) (quote _))) :head (list (quote p) (quote X))}))
+      (dl-pt-test!
+        "number as relation name raises"
+        (dl-pt-throws? (fn () (dl-parse "1(X) :- p(X).")))
+        true)
+
+      (dl-pt-test!
+        "var as relation name raises"
+        (dl-pt-throws? (fn () (dl-parse "P(X).")))
+        true)
+
       (dl-pt-test!
         "missing dot raises"
         (dl-pt-throws? (fn () (dl-parse "p(a)")))

From 4a7cff2f6b795bcc4641995f04bd71fd645aa361 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 14:19:25 +0000
Subject: [PATCH 61/89] datalog: built-in-only query goals (236/236)

---
 lib/datalog/scoreboard.json   |  8 ++++----
 lib/datalog/scoreboard.md     |  4 ++--
 lib/datalog/tests/builtins.sx | 14 ++++++++++++++
 3 files changed, 20 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index e70960f4..72fd7b50 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,14 +1,14 @@
 {
   "lang": "datalog",
-  "total_passed": 233,
+  "total_passed": 236,
   "total_failed": 0,
-  "total": 233,
+  "total": 236,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":20,"failed":0,"total":20},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":32,"failed":0,"total":32},
-    {"name":"builtins","passed":20,"failed":0,"total":20},
+    {"name":"builtins","passed":23,"failed":0,"total":23},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":20,"failed":0,"total":20},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":28,"failed":0,"total":28},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T14:16:19+00:00"
+  "generated": "2026-05-08T14:19:14+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index b200d31a..0b89d9b1 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**233 / 233 passing** (0 failure(s)).
+**236 / 236 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -8,7 +8,7 @@
 | parse | 20 | 20 | ok |
 | unify | 28 | 28 | ok |
 | eval | 32 | 32 | ok |
-| builtins | 20 | 20 | ok |
+| builtins | 23 | 23 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 20 | 20 | ok |
diff --git a/lib/datalog/tests/builtins.sx b/lib/datalog/tests/builtins.sx
index 840b30af..9d7e1852 100644
--- a/lib/datalog/tests/builtins.sx
+++ b/lib/datalog/tests/builtins.sx
@@ -179,6 +179,20 @@
           ((db (dl-program "n(0). n(1). n(2). n(3). n(4). n(5). n(6). n(7). n(8). n(9).\n                  big(X) :- n(X), >=(X, 5).")))
           (do (dl-saturate! db) (len (dl-relation db "big"))))
         5)
+      ;; Built-in / arithmetic literals work as standalone query goals
+      ;; (without needing a wrapper rule).
+      (dl-bt-test-set! "comparison-only goal true"
+        (dl-eval "" "?- <(1, 2).")
+        (list {}))
+
+      (dl-bt-test-set! "comparison-only goal false"
+        (dl-eval "" "?- <(2, 1).")
+        (list))
+
+      (dl-bt-test-set! "is goal binds"
+        (dl-eval "" "?- is(N, +(2, 3)).")
+        (list {:N 5}))
+
       ;; Bounded successor: a recursive rule with a comparison
       ;; guard terminates because the Herbrand base is effectively
       ;; bounded.

From e981368dcf8a727499a0616c2b47d279534129ba Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 14:29:18 +0000
Subject: [PATCH 62/89] =?UTF-8?q?datalog:=20magic=20=E2=89=A1=20semi=20on?=
 =?UTF-8?q?=20federation=20foaf=20demo=20(237/237)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 14 ++++++++++++++
 3 files changed, 20 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 72fd7b50..60f7f14d 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 236,
+  "total_passed": 237,
   "total_failed": 0,
-  "total": 236,
+  "total": 237,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":20,"failed":0,"total":20},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":20,"failed":0,"total":20},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":28,"failed":0,"total":28},
+    {"name":"magic","passed":29,"failed":0,"total":29},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T14:19:14+00:00"
+  "generated": "2026-05-08T14:29:08+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 0b89d9b1..cec0e73e 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**236 / 236 passing** (0 failure(s)).
+**237 / 237 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 20 | 20 | ok |
 | api | 20 | 20 | ok |
-| magic | 28 | 28 | ok |
+| magic | 29 | 29 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index fc4707d3..985ba4dc 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -228,6 +228,20 @@
             (and (= (len found) 1) (= (len missing) 0))))
         true)
 
+      ;; Magic equivalence on the federation demo.
+      (dl-mt-test! "magic ≡ semi on foaf demo"
+        (let
+          ((db (dl-program-data
+                 (quote ((follows alice bob)
+                         (follows bob carol)
+                         (follows alice dave)))
+                 dl-demo-federation-rules)))
+          (let
+            ((semi (dl-query db (quote (foaf alice X))))
+              (magic (dl-magic-query db (quote (foaf alice X)))))
+            (= (len semi) (len magic))))
+        true)
+
       ;; Magic over a rule whose body contains an aggregate.
       ;; The rewriter passes aggregate body lits through unchanged
       ;; (no propagation generated for them), so semi-naive's count

From 17d6f58cc5aa3146e1a5b866e5edda7a7b1ae822 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 14:41:05 +0000
Subject: [PATCH 63/89] datalog: dl-magic-rewrite worklist now drains across
 rule chains (239/239)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Real bug: the worklist used (set! queue (rest queue)) to pop the
head, which left queue bound to a fresh empty list as soon as the
last item was popped. Subsequent (append! queue ...) was a no-op
on the empty list — so when the head's rewrite generated new
(rel, adn) pairs to enqueue, they vanished. Multi-relation
programs (e.g. shortest -> path -> edge, or chained derived
relations) only had their head's rules rewritten; downstream
rules silently dropped.

Fix: use an index-based loop (idx 0 → len queue), with append!
adding to the same list. Items added after the current pointer
are picked up in subsequent iterations.

2 new regression tests:
- 4-level chain (a → r1 → r2 → r3 → r4) under magic returns 2
- shortest-path demo via magic equals dl-query (1 result)
---
 lib/datalog/magic.sx        | 41 +++++++++++++++++++------------------
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 26 +++++++++++++++++++++++
 4 files changed, 53 insertions(+), 26 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index 97168a4e..ffdf4cf4 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -314,26 +314,27 @@
 
         (dl-mq-mark! query-rel query-adornment)
 
-        (define
-          dl-mq-process
-          (fn
-            ()
-            (when
-              (> (len queue) 0)
-              (let ((item (first queue)))
-                (do
-                  (set! queue (rest queue))
-                  (let
-                    ((rel (get item :rel)) (adn (get item :adn)))
-                    (for-each
-                      (fn
-                        (rule)
-                        (when
-                          (= (dl-rel-name (get rule :head)) rel)
-                          (dl-mq-rewrite-rule! rule adn)))
-                      rules))
-                  (dl-mq-process))))))
-        (dl-mq-process)
+        (let ((idx 0))
+          (define
+            dl-mq-process
+            (fn
+              ()
+              (when
+                (< idx (len queue))
+                (let ((item (nth queue idx)))
+                  (do
+                    (set! idx (+ idx 1))
+                    (let
+                      ((rel (get item :rel)) (adn (get item :adn)))
+                      (for-each
+                        (fn
+                          (rule)
+                          (when
+                            (= (dl-rel-name (get rule :head)) rel)
+                            (dl-mq-rewrite-rule! rule adn)))
+                        rules))
+                    (dl-mq-process))))))
+          (dl-mq-process))
 
         {:rules out
          :seed
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 60f7f14d..c5e44ea7 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 237,
+  "total_passed": 239,
   "total_failed": 0,
-  "total": 237,
+  "total": 239,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":20,"failed":0,"total":20},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":20,"failed":0,"total":20},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":29,"failed":0,"total":29},
+    {"name":"magic","passed":31,"failed":0,"total":31},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T14:29:08+00:00"
+  "generated": "2026-05-08T14:40:44+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index cec0e73e..6e176c8b 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**237 / 237 passing** (0 failure(s)).
+**239 / 239 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 20 | 20 | ok |
 | api | 20 | 20 | ok |
-| magic | 29 | 29 | ok |
+| magic | 31 | 31 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 985ba4dc..00edf4da 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -242,6 +242,32 @@
             (= (len semi) (len magic))))
         true)
 
+      ;; Multi-relation rewrite chain: query r4 → propagate to r3,
+      ;; r2, r1, a. The worklist must process all of them; an
+      ;; earlier bug stopped after only the head pair.
+      (dl-mt-test! "magic chain through 4 rule levels"
+        (let
+          ((db (dl-program
+                 "a(1). a(2). r1(X) :- a(X). r2(X) :- r1(X).
+                  r3(X) :- r2(X). r4(X) :- r3(X).")))
+          (= 2 (len (dl-magic-query db (list (quote r4) (quote X))))))
+        true)
+
+      ;; Shortest-path demo via magic — exercises the rewriter
+      ;; against rules that mix recursive positive lits with an
+      ;; aggregate body literal.
+      (dl-mt-test! "magic on shortest-path demo"
+        (let
+          ((db (dl-program-data
+                 (quote ((edge a b 5) (edge b c 3) (edge a c 10)))
+                 dl-demo-shortest-path-rules)))
+          (let
+            ((semi (dl-query db (quote (shortest a c W))))
+              (magic (dl-magic-query db (quote (shortest a c W)))))
+            (and (= (len semi) (len magic))
+                 (= (len semi) 1))))
+        true)
+
       ;; Magic over a rule whose body contains an aggregate.
       ;; The rewriter passes aggregate body lits through unchanged
       ;; (no propagation generated for them), so semi-naive's count

From 62a5a29d5b9e327ce31b8ccbc73b6560c4d1f9f9 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 14:41:29 +0000
Subject: [PATCH 64/89] datalog-plan: rolling status 239/239 (magic worklist
 bug fixed)

---
 plans/datalog-on-sx.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 98c47837..7ce6b29d 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **224/224 across 11 suites**
+`bash lib/datalog/conformance.sh` → **239/239 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.

From a4ef2714593048616af29385c5af517635275e91 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Fri, 8 May 2026 23:00:22 +0000
Subject: [PATCH 65/89] datalog: cousin (multi-adornment same-relation) magic
 test (240/240)

---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 18 ++++++++++++++++++
 3 files changed, 24 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index c5e44ea7..7619dbf7 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 239,
+  "total_passed": 240,
   "total_failed": 0,
-  "total": 239,
+  "total": 240,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":20,"failed":0,"total":20},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":20,"failed":0,"total":20},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":31,"failed":0,"total":31},
+    {"name":"magic","passed":32,"failed":0,"total":32},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T14:40:44+00:00"
+  "generated": "2026-05-08T22:41:23+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 6e176c8b..aa4e3c96 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**239 / 239 passing** (0 failure(s)).
+**240 / 240 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 20 | 20 | ok |
 | api | 20 | 20 | ok |
-| magic | 31 | 31 | ok |
+| magic | 32 | 32 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 00edf4da..a5c47f03 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -268,6 +268,24 @@
                  (= (len semi) 1))))
         true)
 
+      ;; Same relation called with different adornment patterns
+      ;; in different rules. The worklist must enqueue and process
+      ;; each (rel, adornment) pair.
+      (dl-mt-test! "magic with multi-adornment same relation"
+        (let
+          ((db (dl-program
+                 "parent(p1, alice). parent(p2, bob).
+                  parent(g, p1). parent(g, p2).
+                  sibling(P1, P2) :- parent(G, P1), parent(G, P2),
+                                     !=(P1, P2).
+                  cousin(X, Y) :- parent(P1, X), parent(P2, Y),
+                                  sibling(P1, P2).")))
+          (let
+            ((semi (dl-query db (list (quote cousin) (quote alice) (quote Y))))
+              (magic (dl-magic-query db (list (quote cousin) (quote alice) (quote Y)))))
+            (= (len semi) (len magic))))
+        true)
+
       ;; Magic over a rule whose body contains an aggregate.
       ;; The rewriter passes aggregate body lits through unchanged
       ;; (no propagation generated for them), so semi-naive's count

From d437727f1d0c898aa421706ec0fc15f25c50e0de Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sat, 9 May 2026 13:11:47 +0000
Subject: [PATCH 66/89] datalog: magic regression tests from bug-hunt round
 (242/242)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bug-hunt round probed magic-sets against many edge cases. No new
bugs surfaced. Added regression tests for two patterns that
exercise the worklist post-fix:

- 3-stratum program (a → c via not-b → d via not-banned).
  Distinct rule heads at three strata; magic must rewrite each.
- Aggregate-derived chain (count(src) → cnt → active threshold).
  Magic correctly handles multi-step aggregate dependencies.

Magic-sets is robust against: 3-stratum negation, aggregate
chains, mutual recursion, all-bound goals, multi-arity rules,
diagonal queries, EDB-only goals, and rules whose body has
identical positive lits.
---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 28 ++++++++++++++++++++++++++++
 3 files changed, 34 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 7619dbf7..182ca67b 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 240,
+  "total_passed": 242,
   "total_failed": 0,
-  "total": 240,
+  "total": 242,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":20,"failed":0,"total":20},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":20,"failed":0,"total":20},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":32,"failed":0,"total":32},
+    {"name":"magic","passed":34,"failed":0,"total":34},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-08T22:41:23+00:00"
+  "generated": "2026-05-09T13:11:25+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index aa4e3c96..f82a3b30 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**240 / 240 passing** (0 failure(s)).
+**242 / 242 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 20 | 20 | ok |
 | api | 20 | 20 | ok |
-| magic | 32 | 32 | ok |
+| magic | 34 | 34 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index a5c47f03..6778dc19 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -242,6 +242,34 @@
             (= (len semi) (len magic))))
         true)
 
+      ;; 3-stratum program under magic — distinct rule heads at
+      ;; strata 0/1/2 must all rewrite via the worklist.
+      (dl-mt-test! "magic 3-stratum program"
+        (let
+          ((db (dl-program
+                 "a(1). a(2). a(3). b(2).
+                  c(X) :- a(X), not(b(X)).
+                  d(X) :- c(X), not(banned(X)).
+                  banned(3).")))
+          (let
+            ((semi (dl-query db (list (quote d) (quote X))))
+              (magic (dl-magic-query db (list (quote d) (quote X)))))
+            (= (len semi) (len magic))))
+        true)
+
+      ;; Aggregate -> derived -> threshold chain via magic.
+      (dl-mt-test! "magic aggregate-derived chain"
+        (let
+          ((db (dl-program
+                 "src(1). src(2). src(3).
+                  cnt(N) :- count(N, X, src(X)).
+                  active(N) :- cnt(N), >=(N, 2).")))
+          (let
+            ((semi (dl-query db (list (quote active) (quote N))))
+              (magic (dl-magic-query db (list (quote active) (quote N)))))
+            (= (len semi) (len magic))))
+        true)
+
       ;; Multi-relation rewrite chain: query r4 → propagate to r3,
       ;; r2, r1, a. The worklist must process all of them; an
       ;; earlier bug stopped after only the head pair.

From 2c8c1f75b3c581c264b71f2b6211d1eaed2a7475 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sun, 10 May 2026 20:51:56 +0000
Subject: [PATCH 67/89] datalog: reject reserved relation names as rule/fact
 heads (246/246)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Real bugs surfaced by parser/safety bug-hunt round:
- `not(X) :- p(X).` parsed as a regular literal with relation
  "not". The user could accidentally define a `not` relation,
  silently shadowing the negation construct.
- `count(N, X, p(X)) :- ...` defined a `count` relation that
  would conflict with the aggregate operator.
- `<(X, 5) :- p(X).` defined a `<` relation.
- `is(N, +(1, 2)) :- p(N).` defined an `is` relation.
- `+.` (operator alone) parsed as a 0-ary fact.

Fix: dl-add-fact! and dl-add-rule! now reject any literal whose
head's relation name is in dl-reserved-rel-names — built-in
operators (< <= > >= = != + - * /), aggregate operators
(count sum min max findall), `is`, `not`, and the arrows
(:-, ?-).

4 new eval tests cover the rejection cases.

Note: an initial "no compound args in facts" check was overly
strict — it would reject findall's list output (which derives a
fact like (all_p (a b c))). Reverted that branch; treating
findall results as opaque list values rather than function
symbols.
---
 lib/datalog/db.sx           | 20 ++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 22 ++++++++++++++++++++++
 4 files changed, 48 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index 7930fdda..798fcfa7 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -182,6 +182,20 @@
       ((facts (get db :facts)))
       (if (has-key? facts rel-key) (get facts rel-key) (list)))))
 
+;; Reserved relation names: built-in / aggregate / negation / arrow.
+;; Rules and facts may not have these as their head's relation, since
+;; the saturator treats them specially or they are not relation names
+;; at all.
+(define
+  dl-reserved-rel-names
+  (list "not" "count" "sum" "min" "max" "findall" "is"
+        "<" "<=" ">" ">=" "=" "!=" "+" "-" "*" "/" ":-" "?-"))
+
+(define
+  dl-reserved-rel?
+  (fn
+    (name) (dl-member-string? name dl-reserved-rel-names)))
+
 (define
   dl-add-fact!
   (fn
@@ -189,6 +203,9 @@
     (cond
       ((not (and (list? lit) (> (len lit) 0)))
         (error (str "dl-add-fact!: expected literal list, got " lit)))
+      ((dl-reserved-rel? (dl-rel-name lit))
+        (error (str "dl-add-fact!: '" (dl-rel-name lit)
+                    "' is a reserved name (built-in / aggregate / negation)")))
       ((not (dl-ground? lit (dl-empty-subst)))
         (error (str "dl-add-fact!: expected ground literal, got " lit)))
       (else
@@ -301,6 +318,9 @@
         (error (str "dl-add-rule!: expected rule dict, got " rule)))
       ((not (has-key? rule :head))
         (error (str "dl-add-rule!: rule missing :head, got " rule)))
+      ((dl-reserved-rel? (dl-rel-name (get rule :head)))
+        (error (str "dl-add-rule!: '" (dl-rel-name (get rule :head))
+                    "' is a reserved name (built-in / aggregate / negation)")))
       (else
         (let ((rule (dl-rename-anon-rule rule)))
           (let
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 182ca67b..b67356f8 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 242,
+  "total_passed": 246,
   "total_failed": 0,
-  "total": 242,
+  "total": 246,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
     {"name":"parse","passed":20,"failed":0,"total":20},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":32,"failed":0,"total":32},
+    {"name":"eval","passed":36,"failed":0,"total":36},
     {"name":"builtins","passed":23,"failed":0,"total":23},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":34,"failed":0,"total":34},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-09T13:11:25+00:00"
+  "generated": "2026-05-10T20:51:33+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index f82a3b30..7c5196ef 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**242 / 242 passing** (0 failure(s)).
+**246 / 246 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
 | parse | 20 | 20 | ok |
 | unify | 28 | 28 | ok |
-| eval | 32 | 32 | ok |
+| eval | 36 | 36 | ok |
 | builtins | 23 | 23 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 822e58fb..75541282 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -165,6 +165,28 @@
           ((db (dl-program "edge(1, 2). edge(2, 3). edge(3, 1).\n                  reach(X, Y) :- edge(X, Y).\n                  reach(X, Z) :- edge(X, Y), reach(Y, Z).")))
           (do (dl-saturate! db) (len (dl-relation db "reach"))))
         9)
+      ;; Reserved relation names rejected as rule/fact heads.
+      (dl-et-test!
+        "reserved name `not` as head rejected"
+        (dl-et-throws? (fn () (dl-program "not(X) :- p(X).")))
+        true)
+
+      (dl-et-test!
+        "reserved name `count` as head rejected"
+        (dl-et-throws?
+          (fn () (dl-program "count(N, X, p(X)) :- p(X).")))
+        true)
+
+      (dl-et-test!
+        "reserved name `<` as head rejected"
+        (dl-et-throws? (fn () (dl-program "<(X, 5) :- p(X).")))
+        true)
+
+      (dl-et-test!
+        "reserved name `is` as head rejected"
+        (dl-et-throws? (fn () (dl-program "is(N, +(1, 2)) :- p(N).")))
+        true)
+
       (dl-et-test!
         "unsafe head var"
         (dl-et-throws? (fn () (dl-program "p(X, Y) :- q(X).")))

From 2a1d8eeab216d283327b903371a9c09c74a1e78d Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sun, 10 May 2026 20:55:42 +0000
Subject: [PATCH 68/89] datalog: parser accepts negative integer literals
 (248/248)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bug: `n(-1).` failed to parse — the tokenizer produced op `-`
followed by number `1`, and dl-pp-parse-arg expected a term after
seeing `-` as an op (and a `(` for a compound) but found a bare
number. Users had to write `(- 0 1)` or compute via `is`.

Fix: dl-pp-parse-arg detects op `-` directly followed by a number
token (no intervening `(`) and consumes both as a single negative
number literal. Subtraction (`is(Y, -(X, 2))`) and compound
arithmetic via the operator form are unaffected — they use the
`-(` lookahead path.

2 new parser tests: negative integer literal and subtraction
compound preserved.
---
 lib/datalog/parser.sx       | 10 ++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/parse.sx  | 15 +++++++++++++++
 4 files changed, 31 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/parser.sx b/lib/datalog/parser.sx
index 66ff43dd..16701597 100644
--- a/lib/datalog/parser.sx
+++ b/lib/datalog/parser.sx
@@ -91,6 +91,16 @@
           ((= ty "number") (do (dl-pp-advance! st) vv))
           ((= ty "string") (do (dl-pp-advance! st) vv))
           ((= ty "var") (do (dl-pp-advance! st) (string->symbol vv)))
+          ;; Negative numeric literal: `-` op directly followed by a
+          ;; number (no `(`) is parsed as a single negative number.
+          ;; This keeps `(-X Y)` (compound) and `-N` (literal) distinct.
+          ((and (= ty "op") (= vv "-")
+                (= (get (dl-pp-peek2 st) :type) "number"))
+            (do
+              (dl-pp-advance! st)
+              (let
+                ((n (get (dl-pp-peek st) :value)))
+                (do (dl-pp-advance! st) (- 0 n)))))
           ((or (= ty "atom") (= ty "op"))
             (do
               (dl-pp-advance! st)
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index b67356f8..36aea08c 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,11 +1,11 @@
 {
   "lang": "datalog",
-  "total_passed": 246,
+  "total_passed": 248,
   "total_failed": 0,
-  "total": 246,
+  "total": 248,
   "suites": [
     {"name":"tokenize","passed":26,"failed":0,"total":26},
-    {"name":"parse","passed":20,"failed":0,"total":20},
+    {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":36,"failed":0,"total":36},
     {"name":"builtins","passed":23,"failed":0,"total":23},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":34,"failed":0,"total":34},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-10T20:51:33+00:00"
+  "generated": "2026-05-10T20:55:23+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 7c5196ef..53252867 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,11 +1,11 @@
 # datalog scoreboard
 
-**246 / 246 passing** (0 failure(s)).
+**248 / 248 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 26 | 26 | ok |
-| parse | 20 | 20 | ok |
+| parse | 22 | 22 | ok |
 | unify | 28 | 28 | ok |
 | eval | 36 | 36 | ok |
 | builtins | 23 | 23 | ok |
diff --git a/lib/datalog/tests/parse.sx b/lib/datalog/tests/parse.sx
index 2080e77c..9d0f7201 100644
--- a/lib/datalog/tests/parse.sx
+++ b/lib/datalog/tests/parse.sx
@@ -126,6 +126,21 @@
         "underscore var"
         (dl-parse "p(X) :- q(X, _).")
         (list {:body (list (list (quote q) (quote X) (quote _))) :head (list (quote p) (quote X))}))
+      ;; Negative number literals parse as one negative number,
+      ;; while subtraction (`-(X, Y)`) compound is preserved.
+      (dl-pt-test!
+        "negative integer literal"
+        (dl-parse "n(-3).")
+        (list {:head (list (quote n) -3) :body (list)}))
+
+      (dl-pt-test!
+        "subtraction compound preserved"
+        (dl-parse "r(X) :- is(X, -(10, 3)).")
+        (list
+          {:head (list (quote r) (quote X))
+           :body (list (list (quote is) (quote X)
+                             (list (string->symbol "-") 10 3)))}))
+
       (dl-pt-test!
         "number as relation name raises"
         (dl-pt-throws? (fn () (dl-parse "1(X) :- p(X).")))

From 4b5e75dc3e2c329a548e26fc175ed58a696380eb Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sun, 10 May 2026 20:59:33 +0000
Subject: [PATCH 69/89] datalog: tokenizer raises on unterminated block comment
 (249/249)

Bug: `/* unclosed` was silently consumed to EOF, swallowing any
Datalog code that followed inside the (never-closing) comment.
Programs would produce empty parses with no error.

Fix: skip-block-comment! now raises when it hits EOF without
finding `*/`. Error message includes the position where the
problem was first detected. Line comments (`%`) and properly
closed block comments (`/* ... */`) are unaffected.

1 new tokenize test verifies the error path.
---
 lib/datalog/scoreboard.json   |  8 ++++----
 lib/datalog/scoreboard.md     |  4 ++--
 lib/datalog/tests/tokenize.sx | 10 ++++++++++
 lib/datalog/tokenizer.sx      |  4 +++-
 4 files changed, 19 insertions(+), 7 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 36aea08c..6c953f66 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,10 +1,10 @@
 {
   "lang": "datalog",
-  "total_passed": 248,
+  "total_passed": 249,
   "total_failed": 0,
-  "total": 248,
+  "total": 249,
   "suites": [
-    {"name":"tokenize","passed":26,"failed":0,"total":26},
+    {"name":"tokenize","passed":27,"failed":0,"total":27},
     {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":36,"failed":0,"total":36},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":34,"failed":0,"total":34},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-10T20:55:23+00:00"
+  "generated": "2026-05-10T20:59:17+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 53252867..d40d724f 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,10 +1,10 @@
 # datalog scoreboard
 
-**248 / 248 passing** (0 failure(s)).
+**249 / 249 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
-| tokenize | 26 | 26 | ok |
+| tokenize | 27 | 27 | ok |
 | parse | 22 | 22 | ok |
 | unify | 28 | 28 | ok |
 | eval | 36 | 36 | ok |
diff --git a/lib/datalog/tests/tokenize.sx b/lib/datalog/tests/tokenize.sx
index 920c7257..7ab73212 100644
--- a/lib/datalog/tests/tokenize.sx
+++ b/lib/datalog/tests/tokenize.sx
@@ -118,6 +118,16 @@
         "block comment"
         (dl-tk-types (dl-tokenize "/* a\nb */ x."))
         (list "atom" "punct" "eof"))
+      ;; Unterminated block comment must raise — previously it was
+      ;; silently consumed to EOF.
+      (dl-tk-test!
+        "unterminated block comment raises"
+        (let ((threw false))
+          (do
+            (guard (e (#t (set! threw true)))
+              (dl-tokenize "/* unclosed comment"))
+            threw))
+        true)
       (dl-tk-test!
         "whitespace"
         (dl-tk-types (dl-tokenize "  foo  ,\t bar  ."))
diff --git a/lib/datalog/tokenizer.sx b/lib/datalog/tokenizer.sx
index b169b64e..5b7b48d2 100644
--- a/lib/datalog/tokenizer.sx
+++ b/lib/datalog/tokenizer.sx
@@ -63,7 +63,9 @@
         (fn
           ()
           (cond
-            ((>= pos src-len) nil)
+            ((>= pos src-len)
+              (error (str "Tokenizer: unterminated block comment "
+                          "(started at position " pos ")")))
             ((and (= (cur) "*") (< (+ pos 1) src-len) (= (dl-peek 1) "/"))
               (advance! 2))
             (else (do (advance! 1) (skip-block-comment!))))))

From 5bcda5c88c3491066511b7d7adf2af54e8585ff3 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sun, 10 May 2026 21:05:28 +0000
Subject: [PATCH 70/89] datalog: tokenizer raises on unterminated string +
 quoted atom (251/251)

Bug: read-quoted ran to EOF silently when the closing quote was
missing. The token's value was whatever ran-to-end string had been
accumulated; the parser later saw an unexpected EOF, but the error
message blamed the wrong location ("expected `)` got eof") and
hid the real problem.

Fix: read-quoted now raises with a message that distinguishes
strings from quoted atoms, including the position where the
opening quote was lost. The escape-sequence handling and proper
closing are unaffected.

2 new tokenize tests.
---
 lib/datalog/scoreboard.json   |  8 ++++----
 lib/datalog/scoreboard.md     |  4 ++--
 lib/datalog/tests/tokenize.sx | 19 +++++++++++++++++++
 lib/datalog/tokenizer.sx      |  6 +++++-
 4 files changed, 30 insertions(+), 7 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 6c953f66..f36dbeba 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,10 +1,10 @@
 {
   "lang": "datalog",
-  "total_passed": 249,
+  "total_passed": 251,
   "total_failed": 0,
-  "total": 249,
+  "total": 251,
   "suites": [
-    {"name":"tokenize","passed":27,"failed":0,"total":27},
+    {"name":"tokenize","passed":29,"failed":0,"total":29},
     {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":36,"failed":0,"total":36},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":34,"failed":0,"total":34},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-10T20:59:17+00:00"
+  "generated": "2026-05-10T21:05:12+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index d40d724f..b7adc8c8 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,10 +1,10 @@
 # datalog scoreboard
 
-**249 / 249 passing** (0 failure(s)).
+**251 / 251 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
-| tokenize | 27 | 27 | ok |
+| tokenize | 29 | 29 | ok |
 | parse | 22 | 22 | ok |
 | unify | 28 | 28 | ok |
 | eval | 36 | 36 | ok |
diff --git a/lib/datalog/tests/tokenize.sx b/lib/datalog/tests/tokenize.sx
index 7ab73212..6bf190fc 100644
--- a/lib/datalog/tests/tokenize.sx
+++ b/lib/datalog/tests/tokenize.sx
@@ -118,6 +118,25 @@
         "block comment"
         (dl-tk-types (dl-tokenize "/* a\nb */ x."))
         (list "atom" "punct" "eof"))
+      ;; Unterminated string / quoted-atom must raise.
+      (dl-tk-test!
+        "unterminated string raises"
+        (let ((threw false))
+          (do
+            (guard (e (#t (set! threw true)))
+              (dl-tokenize "\"unclosed"))
+            threw))
+        true)
+
+      (dl-tk-test!
+        "unterminated quoted atom raises"
+        (let ((threw false))
+          (do
+            (guard (e (#t (set! threw true)))
+              (dl-tokenize "'unclosed"))
+            threw))
+        true)
+
       ;; Unterminated block comment must raise — previously it was
       ;; silently consumed to EOF.
       (dl-tk-test!
diff --git a/lib/datalog/tokenizer.sx b/lib/datalog/tokenizer.sx
index 5b7b48d2..e48ca7df 100644
--- a/lib/datalog/tokenizer.sx
+++ b/lib/datalog/tokenizer.sx
@@ -123,7 +123,11 @@
               (fn
                 ()
                 (cond
-                  ((>= pos src-len) nil)
+                  ((>= pos src-len)
+                    (error
+                      (str "Tokenizer: unterminated "
+                           (if (= quote-char "'") "quoted atom" "string")
+                           " (started near position " pos ")")))
                   ((= (cur) "\\")
                     (do
                       (advance! 1)

From 96c9e90743bf39e3cfaa358a294e8656e9d4ba69 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sun, 10 May 2026 21:09:33 +0000
Subject: [PATCH 71/89] datalog: rule-shape validators in dl-add-rule!
 (253/253)

Two malformed-rule paths used to slip through:

- Empty head list `{:head () :body ()}` was accepted; the rule
  would never fire but the relation-name lookup later returned
  nil with confusing downstream errors.
- Non-list body (`{:head (...) :body 42}`) crashed in `rest`
  during safety check with a cryptic "rest: 1 list arg".

dl-add-rule! now checks head shape (non-empty list with symbol
head) and body type (list) before any safety walk. Errors are
descriptive and surface at add time rather than during the next
saturation.

2 new eval tests.
---
 lib/datalog/db.sx           |  9 +++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 16 ++++++++++++++++
 4 files changed, 31 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index 798fcfa7..d8e4f153 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -318,6 +318,15 @@
         (error (str "dl-add-rule!: expected rule dict, got " rule)))
       ((not (has-key? rule :head))
         (error (str "dl-add-rule!: rule missing :head, got " rule)))
+      ((not (and (list? (get rule :head))
+                 (> (len (get rule :head)) 0)
+                 (symbol? (first (get rule :head)))))
+        (error (str "dl-add-rule!: head must be a non-empty list "
+                    "starting with a relation-name symbol, got "
+                    (get rule :head))))
+      ((not (list? (if (has-key? rule :body) (get rule :body) (list))))
+        (error (str "dl-add-rule!: body must be a list of literals, got "
+                    (get rule :body))))
       ((dl-reserved-rel? (dl-rel-name (get rule :head)))
         (error (str "dl-add-rule!: '" (dl-rel-name (get rule :head))
                     "' is a reserved name (built-in / aggregate / negation)")))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index f36dbeba..72c71703 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 251,
+  "total_passed": 253,
   "total_failed": 0,
-  "total": 251,
+  "total": 253,
   "suites": [
     {"name":"tokenize","passed":29,"failed":0,"total":29},
     {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":28,"failed":0,"total":28},
-    {"name":"eval","passed":36,"failed":0,"total":36},
+    {"name":"eval","passed":38,"failed":0,"total":38},
     {"name":"builtins","passed":23,"failed":0,"total":23},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":34,"failed":0,"total":34},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-10T21:05:12+00:00"
+  "generated": "2026-05-10T21:09:18+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index b7adc8c8..391f5d79 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**251 / 251 passing** (0 failure(s)).
+**253 / 253 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 29 | 29 | ok |
 | parse | 22 | 22 | ok |
 | unify | 28 | 28 | ok |
-| eval | 36 | 36 | ok |
+| eval | 38 | 38 | ok |
 | builtins | 23 | 23 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 75541282..e1835a0c 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -165,6 +165,22 @@
           ((db (dl-program "edge(1, 2). edge(2, 3). edge(3, 1).\n                  reach(X, Y) :- edge(X, Y).\n                  reach(X, Z) :- edge(X, Y), reach(Y, Z).")))
           (do (dl-saturate! db) (len (dl-relation db "reach"))))
         9)
+      ;; Rule-shape sanity: empty-list head and non-list body raise
+      ;; clear errors rather than crashing inside the saturator.
+      (dl-et-test! "empty head rejected"
+        (dl-et-throws?
+          (fn ()
+            (dl-add-rule! (dl-make-db)
+              {:head (list) :body (list)})))
+        true)
+
+      (dl-et-test! "non-list body rejected"
+        (dl-et-throws?
+          (fn ()
+            (dl-add-rule! (dl-make-db)
+              {:head (list (quote p) (quote X)) :body 42})))
+        true)
+
       ;; Reserved relation names rejected as rule/fact heads.
       (dl-et-test!
         "reserved name `not` as head rejected"

From 69a53ece43a2306d5f91d1b36b50736a0dd6fc70 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sun, 10 May 2026 21:13:30 +0000
Subject: [PATCH 72/89] datalog: dl-magic-query shape validator (255/255)

Bug: dl-magic-query crashed with cryptic "rest: 1 list arg" when
the goal argument was a string, number, or arbitrary dict. The
first thing the function does is dl-rel-name + dl-adorn-goal,
both of which assume a positive-literal list shape.

Fix: explicit shape check up front. A goal must be a non-empty
list whose first element is a symbol. Otherwise raise with a
clear diagnostic. Built-in / aggregate / negation dispatch (the
fall-back to dl-query) is unchanged.

2 new magic tests cover string and bare-dict goal rejection.
---
 lib/datalog/magic.sx        |  5 +++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/magic.sx  | 18 ++++++++++++++++++
 4 files changed, 29 insertions(+), 6 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index ffdf4cf4..ce8b20a8 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -382,6 +382,11 @@
     ;; (built-ins, aggregates, EDB-only relations) the seed is either
     ;; non-ground or unused; fall back to dl-query.
     (cond
+      ((not (and (list? query-goal)
+                 (> (len query-goal) 0)
+                 (symbol? (first query-goal))))
+        (error (str "dl-magic-query: goal must be a positive literal "
+                    "(non-empty list with a symbol head), got " query-goal)))
       ((or (dl-builtin? query-goal)
            (dl-aggregate? query-goal)
            (and (dict? query-goal) (has-key? query-goal :neg)))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 72c71703..ba1017d8 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 253,
+  "total_passed": 255,
   "total_failed": 0,
-  "total": 253,
+  "total": 255,
   "suites": [
     {"name":"tokenize","passed":29,"failed":0,"total":29},
     {"name":"parse","passed":22,"failed":0,"total":22},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":20,"failed":0,"total":20},
     {"name":"api","passed":20,"failed":0,"total":20},
-    {"name":"magic","passed":34,"failed":0,"total":34},
+    {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-10T21:09:18+00:00"
+  "generated": "2026-05-10T21:13:14+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 391f5d79..a55a1dbb 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**253 / 253 passing** (0 failure(s)).
+**255 / 255 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 10 | 10 | ok |
 | aggregates | 20 | 20 | ok |
 | api | 20 | 20 | ok |
-| magic | 34 | 34 | ok |
+| magic | 36 | 36 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 6778dc19..29508c87 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -242,6 +242,24 @@
             (= (len semi) (len magic))))
         true)
 
+      ;; Shape validation: dl-magic-query rejects non-list / non-
+      ;; dict goal shapes cleanly rather than crashing in `rest`.
+      (dl-mt-test! "magic rejects string goal"
+        (let ((threw false))
+          (do
+            (guard (e (#t (set! threw true)))
+              (dl-magic-query (dl-make-db) "foo"))
+            threw))
+        true)
+
+      (dl-mt-test! "magic rejects bare dict goal"
+        (let ((threw false))
+          (do
+            (guard (e (#t (set! threw true)))
+              (dl-magic-query (dl-make-db) {:foo "bar"}))
+            threw))
+        true)
+
       ;; 3-stratum program under magic — distinct rule heads at
       ;; strata 0/1/2 must all rewrite via the worklist.
       (dl-mt-test! "magic 3-stratum program"

From 3a1ecaa36209ff1fcc886aa411dc37057457692a Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sun, 10 May 2026 21:17:07 +0000
Subject: [PATCH 73/89] datalog: tokenizer raises on unexpected characters
 (256/256)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bug: characters not recognised by any branch of `scan!` (`?`,
`!`, `#`, `@`, `&`, `|`, `\\`, `^`, etc.) were silently consumed
via `(else (advance! 1) (scan!))`. Programs with typos would
parse to a stripped version of themselves with no warning —
`?(X).` became `(X).` and produced confusing downstream errors.

Fix: the else branch now raises a clear "unexpected character"
error with the offending char and its position.

1 new tokenize test.
---
 lib/datalog/scoreboard.json   |  8 ++++----
 lib/datalog/scoreboard.md     |  4 ++--
 lib/datalog/tests/tokenize.sx | 12 ++++++++++++
 lib/datalog/tokenizer.sx      |  4 +++-
 4 files changed, 21 insertions(+), 7 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index ba1017d8..c8a61bf7 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,10 +1,10 @@
 {
   "lang": "datalog",
-  "total_passed": 255,
+  "total_passed": 256,
   "total_failed": 0,
-  "total": 255,
+  "total": 256,
   "suites": [
-    {"name":"tokenize","passed":29,"failed":0,"total":29},
+    {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":28,"failed":0,"total":28},
     {"name":"eval","passed":38,"failed":0,"total":38},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-10T21:13:14+00:00"
+  "generated": "2026-05-10T21:16:53+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index a55a1dbb..1055a8f9 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,10 +1,10 @@
 # datalog scoreboard
 
-**255 / 255 passing** (0 failure(s)).
+**256 / 256 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
-| tokenize | 29 | 29 | ok |
+| tokenize | 30 | 30 | ok |
 | parse | 22 | 22 | ok |
 | unify | 28 | 28 | ok |
 | eval | 38 | 38 | ok |
diff --git a/lib/datalog/tests/tokenize.sx b/lib/datalog/tests/tokenize.sx
index 6bf190fc..51470a44 100644
--- a/lib/datalog/tests/tokenize.sx
+++ b/lib/datalog/tests/tokenize.sx
@@ -118,6 +118,18 @@
         "block comment"
         (dl-tk-types (dl-tokenize "/* a\nb */ x."))
         (list "atom" "punct" "eof"))
+      ;; Unexpected characters surface at tokenize time rather
+      ;; than being silently consumed (previously `?(X)` parsed as
+      ;; if the leading `?` weren't there).
+      (dl-tk-test!
+        "unexpected char raises"
+        (let ((threw false))
+          (do
+            (guard (e (#t (set! threw true)))
+              (dl-tokenize "?(X)"))
+            threw))
+        true)
+
       ;; Unterminated string / quoted-atom must raise.
       (dl-tk-test!
         "unterminated string raises"
diff --git a/lib/datalog/tokenizer.sx b/lib/datalog/tokenizer.sx
index e48ca7df..a10a7ff7 100644
--- a/lib/datalog/tokenizer.sx
+++ b/lib/datalog/tokenizer.sx
@@ -254,7 +254,9 @@
                       (dl-emit! "op" "/" start)
                       (advance! 1)
                       (scan!)))
-                  (else (do (advance! 1) (scan!)))))))))
+                  (else (error
+                          (str "Tokenizer: unexpected character '" ch
+                               "' at position " start)))))))))
       (scan!)
       (dl-emit! "eof" nil pos)
       tokens)))

From a9e4eea3341920b697d1bddf7eac1ac109bf352b Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Sun, 10 May 2026 21:18:04 +0000
Subject: [PATCH 74/89] datalog-plan: log parser/safety bug-hunt round (7 bugs
 fixed)

---
 plans/datalog-on-sx.md | 17 ++++++++++++++++-
 1 file changed, 16 insertions(+), 1 deletion(-)

diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 7ce6b29d..8a10cd0d 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **239/239 across 11 suites**
+`bash lib/datalog/conformance.sh` → **256/256 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,21 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-10 — Bug-hunt round on parser/safety surfaced 7 real
+  bugs, each fixed with regression tests:
+  - Reserved relation names (`not`, `count`, `<`, `is`, ...) were
+    accepted as rule/fact heads — would silently shadow built-ins.
+  - Negative number literals (`n(-1).`) failed to parse — users
+    had to express them as `(- 0 1)` or via `is`.
+  - Unterminated block comment `/* ...` silently consumed the
+    rest of the input. Now raises with the position.
+  - Same silent-consume bug in unterminated string / quoted-atom.
+  - Empty-list rule head and non-list rule body weren't validated;
+    they'd crash later in `rest`. dl-add-rule! now checks shape.
+  - dl-magic-query with non-list / non-dict goal crashed cryptically.
+  - Tokenizer silently swallowed unrecognised characters (`?`, `!`,
+    `#`, `@`, etc.) — typos produced confusing downstream errors.
+
 - 2026-05-08 — Phase 6 driver: `dl-magic-query db query-goal`.
   Builds a fresh internal db from the caller's EDB + magic seed +
   rewritten rules, saturates, queries, returns substitutions —

From 9a16f27075df81be68be13cb4851fc11c7804fdb Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 07:20:20 +0000
Subject: [PATCH 75/89] datalog: dl-walk handles circular substitutions without
 infinite loop (257/257)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bug: dl-walk would infinite-loop on a circular substitution
(e.g. A→B and B→A simultaneously). The walk endlessly chased
the cycle. This couldn't be produced through dl-unify (which has
cycle-safe behavior via existing bindings), but raw dl-bind calls
or external manipulation of the subst dict could create it.

Fix: dl-walk now threads a visited-names list through the
recursion. If a variable name is already in the list, the walk
stops and returns the current term unchanged. Normal chained
walks are unaffected (A→B→C→42 still resolves to 42).

1 new unify test verifies circular substitutions don't hang.
---
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/unify.sx  |  9 +++++++++
 lib/datalog/unify.sx        | 22 +++++++++++++++++-----
 4 files changed, 32 insertions(+), 11 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index c8a61bf7..4115dc2e 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,12 +1,12 @@
 {
   "lang": "datalog",
-  "total_passed": 256,
+  "total_passed": 257,
   "total_failed": 0,
-  "total": 256,
+  "total": 257,
   "suites": [
     {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
-    {"name":"unify","passed":28,"failed":0,"total":28},
+    {"name":"unify","passed":29,"failed":0,"total":29},
     {"name":"eval","passed":38,"failed":0,"total":38},
     {"name":"builtins","passed":23,"failed":0,"total":23},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-10T21:16:53+00:00"
+  "generated": "2026-05-11T07:20:07+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 1055a8f9..3e5c0e4e 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,12 +1,12 @@
 # datalog scoreboard
 
-**256 / 256 passing** (0 failure(s)).
+**257 / 257 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 30 | 30 | ok |
 | parse | 22 | 22 | ok |
-| unify | 28 | 28 | ok |
+| unify | 29 | 29 | ok |
 | eval | 38 | 38 | ok |
 | builtins | 23 | 23 | ok |
 | semi_naive | 8 | 8 | ok |
diff --git a/lib/datalog/tests/unify.sx b/lib/datalog/tests/unify.sx
index 873cc655..3db114ed 100644
--- a/lib/datalog/tests/unify.sx
+++ b/lib/datalog/tests/unify.sx
@@ -129,6 +129,15 @@
             ((s2 (dl-unify (quote Y) (quote tom) s1)))
             (dl-walk (quote X) s2)))
         (quote tom))
+
+      ;; Walk with circular substitution must not infinite-loop.
+      ;; Cycles return the current term unchanged.
+      (dl-ut-test!
+        "walk circular subst no hang"
+        (let ((s (dl-bind (quote B) (quote A)
+                   (dl-bind (quote A) (quote B) (dl-empty-subst)))))
+          (dl-walk (quote A) s))
+        (quote A))
       (dl-ut-test!
         "apply subst on tuple"
         (let
diff --git a/lib/datalog/unify.sx b/lib/datalog/unify.sx
index 7313a603..d5de7eda 100644
--- a/lib/datalog/unify.sx
+++ b/lib/datalog/unify.sx
@@ -33,16 +33,28 @@
 ;; variable. The result is either a non-variable term or an unbound var.
 (define
   dl-walk
+  (fn (term subst) (dl-walk-aux term subst (list))))
+
+;; Internal: walk with a visited-var set so circular substitutions
+;; (from raw dl-bind misuse) don't infinite-loop. Cycles return the
+;; current term unchanged.
+(define
+  dl-walk-aux
   (fn
-    (term subst)
+    (term subst visited)
     (if
       (dl-var? term)
       (let
         ((name (symbol->string term)))
-        (if
-          (and (dict? subst) (has-key? subst name))
-          (dl-walk (get subst name) subst)
-          term))
+        (cond
+          ((dl-member? name visited) term)
+          ((and (dict? subst) (has-key? subst name))
+            (let ((seen (list)))
+              (do
+                (for-each (fn (v) (append! seen v)) visited)
+                (append! seen name)
+                (dl-walk-aux (get subst name) subst seen))))
+          (else term)))
       term)))
 
 ;; Bind a variable symbol to a value in subst, returning a new subst.

From dcae125955d1455268d74bf11d8124479e38ed04 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 07:26:48 +0000
Subject: [PATCH 76/89] datalog: aggregate arg validators (259/259)

Bug: dl-eval-aggregate accepted non-variable agg-vars and non-
literal goals silently, producing weird/incorrect counts:
- `count(N, 5, p(X))` would compute count over the single
  constant 5 (always 1), ignoring p entirely.
- `count(N, X, 42)` would crash with "unknown body-literal
  shape" at saturation time rather than at rule-add time.

Fix: dl-eval-aggregate now validates up front that the second
arg is a variable (the value to aggregate) and the third arg is
a positive literal (the goal). Errors are descriptive and
include the offending argument.

2 new aggregate tests.
---
 lib/datalog/aggregates.sx       | 44 +++++++++++++++++++--------------
 lib/datalog/scoreboard.json     |  8 +++---
 lib/datalog/scoreboard.md       |  4 +--
 lib/datalog/tests/aggregates.sx | 12 +++++++++
 4 files changed, 44 insertions(+), 24 deletions(-)

diff --git a/lib/datalog/aggregates.sx b/lib/datalog/aggregates.sx
index af0ef0f1..4911a330 100644
--- a/lib/datalog/aggregates.sx
+++ b/lib/datalog/aggregates.sx
@@ -104,24 +104,32 @@
         (result-var (nth lit 1))
         (agg-var (nth lit 2))
         (goal (nth lit 3)))
-      (let
-        ((substs (dl-find-bindings (list goal) db subst))
-          (vals (list)))
-        (do
-          (for-each
-            (fn
-              (s)
-              (let ((v (dl-apply-subst agg-var s)))
-                (when
-                  (not (dl-val-member? v vals))
-                  (append! vals v))))
-            substs)
-          (let ((agg-val (dl-do-aggregate op vals)))
-            (cond
-              ((= agg-val :empty) (list))
-              (else
-                (let ((s2 (dl-unify result-var agg-val subst)))
-                  (if (nil? s2) (list) (list s2)))))))))))
+      (cond
+        ((not (dl-var? agg-var))
+          (error (str "datalog aggregate (" op
+                      "): second arg must be a variable, got " agg-var)))
+        ((not (and (list? goal) (> (len goal) 0)
+                   (symbol? (first goal))))
+          (error (str "datalog aggregate (" op
+                      "): third arg must be a positive literal, got "
+                      goal)))
+        (else
+          (let ((vals (list)))
+            (do
+              (for-each
+                (fn
+                  (s)
+                  (let ((v (dl-apply-subst agg-var s)))
+                    (when (not (dl-val-member? v vals))
+                      (append! vals v))))
+                (dl-find-bindings (list goal) db subst))
+              (let ((agg-val (dl-do-aggregate op vals)))
+                (cond
+                  ((= agg-val :empty) (list))
+                  (else
+                    (let ((s2 (dl-unify result-var agg-val subst)))
+                      (if (nil? s2) (list) (list s2)))))))))))))
+
 
 ;; Stratification edges from aggregates: like negation, the goal's
 ;; relation must be in a strictly lower stratum so that the aggregate
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 4115dc2e..f2224ebf 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 257,
+  "total_passed": 259,
   "total_failed": 0,
-  "total": 257,
+  "total": 259,
   "suites": [
     {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
@@ -11,10 +11,10 @@
     {"name":"builtins","passed":23,"failed":0,"total":23},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
-    {"name":"aggregates","passed":20,"failed":0,"total":20},
+    {"name":"aggregates","passed":22,"failed":0,"total":22},
     {"name":"api","passed":20,"failed":0,"total":20},
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T07:20:07+00:00"
+  "generated": "2026-05-11T07:26:33+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 3e5c0e4e..0d02305b 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**257 / 257 passing** (0 failure(s)).
+**259 / 259 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -11,7 +11,7 @@
 | builtins | 23 | 23 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
-| aggregates | 20 | 20 | ok |
+| aggregates | 22 | 22 | ok |
 | api | 20 | 20 | ok |
 | magic | 36 | 36 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/aggregates.sx b/lib/datalog/tests/aggregates.sx
index 63af21dc..45b3ab88 100644
--- a/lib/datalog/tests/aggregates.sx
+++ b/lib/datalog/tests/aggregates.sx
@@ -244,6 +244,18 @@
           {:U (quote carol) :N 0}))
 
       ;; Stratification: recursion through aggregation is rejected.
+      ;; Aggregate validates that second arg is a variable.
+      (dl-at-test! "agg second arg must be var"
+        (dl-at-throws?
+          (fn () (dl-eval "p(1). q(N) :- count(N, 5, p(X))." "?- q(N).")))
+        true)
+
+      ;; Aggregate validates that third arg is a positive literal.
+      (dl-at-test! "agg third arg must be a literal"
+        (dl-at-throws?
+          (fn () (dl-eval "p(1). q(N) :- count(N, X, 42)." "?- q(N).")))
+        true)
+
       ;; Indirect recursion through aggregation also rejected.
       ;; q -> r (via positive lit), r -> q (via aggregate body).
       ;; The aggregate edge counts as negation for stratification.

From 285cd530eb3404c68c1bb3b7b6f85148204acecf Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 07:41:49 +0000
Subject: [PATCH 77/89] datalog: reject body lits with reserved names
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Nested `not(not(P))` silently misparsed: outer `not(...)` is
recognised as negation, but the inner `not(banned(X))` was parsed
as a positive call to a relation called `not`. With no `not`
relation present, the inner match was empty, the outer negation
succeeded vacuously, and `vip(X) :- u(X), not(not(banned(X))).`
collapsed to `vip(X) :- u(X).` — a silent double-negation = identity
fallacy.

Fix in `dl-rule-check-safety`: the positive-literal branch and
`dl-process-neg!` both reject any body literal whose relation
name is in `dl-reserved-rel-names`. Error message names the
relation and points the user at stratified negation through an
intermediate relation.

1 regression test; conformance 260/260.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/builtins.sx     | 44 +++++++++++++++++++++++++++----------
 lib/datalog/scoreboard.json |  8 +++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 18 +++++++++++++++
 plans/datalog-on-sx.md      | 15 ++++++++++++-
 5 files changed, 70 insertions(+), 19 deletions(-)

diff --git a/lib/datalog/builtins.sx b/lib/datalog/builtins.sx
index 11261c85..7bfd3d47 100644
--- a/lib/datalog/builtins.sx
+++ b/lib/datalog/builtins.sx
@@ -250,18 +250,29 @@
           (fn
             (lit)
             (let
-              ((needed (dl-vars-of (get lit :neg))))
+              ((inner (get lit :neg)))
               (let
-                ((missing (dl-vars-not-in needed bound)))
-                (when
-                  (> (len missing) 0)
-                  (set!
-                    err
-                    (str
-                      "negation refers to unbound variable(s) "
-                      missing
-                      " — they must be bound by an earlier "
-                      "positive body literal")))))))
+                ((inner-rn
+                   (cond
+                     ((and (list? inner) (> (len inner) 0))
+                       (dl-rel-name inner))
+                     (else nil)))
+                  (needed (dl-vars-of inner))
+                  (missing (dl-vars-not-in (dl-vars-of inner) bound)))
+                (cond
+                  ((and (not (nil? inner-rn)) (dl-reserved-rel? inner-rn))
+                    (set! err
+                      (str "negated literal uses reserved name '"
+                           inner-rn
+                           "' — nested `not(...)` / negated built-ins are "
+                           "not supported; introduce an intermediate "
+                           "relation and negate that")))
+                  ((> (len missing) 0)
+                    (set! err
+                      (str "negation refers to unbound variable(s) "
+                           missing
+                           " — they must be bound by an earlier "
+                           "positive body literal"))))))))
         (define
           dl-process-agg!
           (fn
@@ -289,7 +300,16 @@
                 ((dl-is? lit) (dl-process-is! lit))
                 ((dl-comparison? lit) (dl-process-cmp! lit))
                 ((and (list? lit) (> (len lit) 0))
-                  (dl-add-bound! (dl-vars-of lit)))))))
+                  (let ((rn (dl-rel-name lit)))
+                    (cond
+                      ((and (not (nil? rn)) (dl-reserved-rel? rn))
+                        (set! err
+                          (str "body literal uses reserved name '" rn
+                               "' — built-ins / aggregates have their own "
+                               "syntax; nested `not(...)` is not supported "
+                               "(use stratified negation via an "
+                               "intermediate relation)")))
+                      (else (dl-add-bound! (dl-vars-of lit))))))))))
         (for-each dl-process-lit! body)
         (when
           (nil? err)
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index f2224ebf..1f97c6d4 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 259,
+  "total_passed": 260,
   "total_failed": 0,
-  "total": 259,
+  "total": 260,
   "suites": [
     {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":29,"failed":0,"total":29},
-    {"name":"eval","passed":38,"failed":0,"total":38},
+    {"name":"eval","passed":39,"failed":0,"total":39},
     {"name":"builtins","passed":23,"failed":0,"total":23},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T07:26:33+00:00"
+  "generated": "2026-05-11T07:40:56+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 0d02305b..143f7201 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**259 / 259 passing** (0 failure(s)).
+**260 / 260 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 30 | 30 | ok |
 | parse | 22 | 22 | ok |
 | unify | 29 | 29 | ok |
-| eval | 38 | 38 | ok |
+| eval | 39 | 39 | ok |
 | builtins | 23 | 23 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index e1835a0c..9b0d6cd8 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -203,6 +203,24 @@
         (dl-et-throws? (fn () (dl-program "is(N, +(1, 2)) :- p(N).")))
         true)
 
+      ;; Body literal with a reserved-name positive head is rejected.
+      ;; The parser only treats outer-level `not(P)` as negation; nested
+      ;; `not(not(P))` would otherwise silently parse as a positive call
+      ;; to a relation named `not` and succeed vacuously. The safety
+      ;; checker now flags this so the user gets a clear error.
+      ;; Body literal with a reserved-name positive head is rejected.
+      ;; The parser only treats outer-level `not(P)` as negation; nested
+      ;; `not(not(P))` would otherwise silently parse as a positive call
+      ;; to a relation named `not` and succeed vacuously — so the safety
+      ;; checker now flags this to give the user a clear error.
+      (dl-et-test!
+        "nested not(not(...)) rejected"
+        (dl-et-throws?
+          (fn ()
+            (dl-program
+              "banned(a). u(a). vip(X) :- u(X), not(not(banned(X))).")))
+        true)
+
       (dl-et-test!
         "unsafe head var"
         (dl-et-throws? (fn () (dl-program "p(X, Y) :- q(X).")))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 8a10cd0d..42d90ca8 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **256/256 across 11 suites**
+`bash lib/datalog/conformance.sh` → **260/260 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,19 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Eval-semantics bug-hunt: nested `not(not(P))` was
+  silently misinterpreted. Outer-level `not(...)` is parsed as
+  negation, but the inner `not(banned(X))` was parsed as a regular
+  positive literal naming a relation called `not`. Since no `not`
+  relation existed, the inner match was empty and the outer
+  negation succeeded vacuously, making `vip(X) :- u(X), not(not(banned(X))).`
+  equivalent to `vip(X) :- u(X).` (a silent double-negation = identity
+  fallacy). Fix in `dl-rule-check-safety`: both the positive-literal
+  branch and `dl-process-neg!` now flag any body literal whose head
+  is in `dl-reserved-rel-names`. Error message names the relation and
+  points the user at intermediate-relation stratified negation. 1 new
+  regression test; 260/260.
+
 - 2026-05-10 — Bug-hunt round on parser/safety surfaced 7 real
   bugs, each fixed with regression tests:
   - Reserved relation names (`not`, `count`, `<`, `is`, ...) were

From c6f646607ec0d5c2fc672fa5323dbf07bbb29697 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 07:51:08 +0000
Subject: [PATCH 78/89] datalog: dl-retract! preserves EDB in mixed relations
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A "mixed" relation has both user-asserted facts AND rules with the
same head. Previously dl-retract! wiped every rule-head relation
wholesale before re-saturating — the saturator only re-derives the
IDB portion, so explicit EDB facts vanished even for a no-op retract
of a non-existent tuple. Repro:

  (let ((db (dl-program "p(a). p(b). p(X) :- q(X). q(c).")))
    (dl-retract! db (quote (p z)))
    (dl-query db (quote (p X))))

went from {a, b, c} to just {c}.

Fix: track :edb-keys provenance in the db.

  - dl-make-db now allocates an :edb-keys dict.
  - dl-add-fact! (public) marks (rel-key, tuple-key) in :edb-keys.
  - New internal dl-add-derived! does the append without marking.
  - Saturator (semi-naive + naive driver) now calls dl-add-derived!.
  - dl-retract! strips only the IDB-derived portion of rule-head
    relations (anything not in :edb-keys) and preserves the EDB
    portion through the re-saturate pass.

2 new regression tests; conformance 262/262.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/api.sx          | 84 +++++++++++++++++++++++++++++--------
 lib/datalog/db.sx           | 77 +++++++++++++++++++++++++++-------
 lib/datalog/eval.sx         |  4 +-
 lib/datalog/scoreboard.json |  8 ++--
 lib/datalog/scoreboard.md   |  4 +-
 lib/datalog/tests/api.sx    | 29 +++++++++++++
 plans/datalog-on-sx.md      | 18 +++++++-
 7 files changed, 184 insertions(+), 40 deletions(-)

diff --git a/lib/datalog/api.sx b/lib/datalog/api.sx
index 925c8728..ed014f1a 100644
--- a/lib/datalog/api.sx
+++ b/lib/datalog/api.sx
@@ -91,14 +91,18 @@
       (dl-saturate! db)
       db)))
 
-;; Remove a fact: drop matching tuples from EDB AND wipe all derived
-;; tuples (any IDB tuple may have transitively depended on the removed
-;; fact). Then re-saturate to repopulate IDB. EDB facts that were
-;; asserted via dl-add-fact! are preserved unless they match `lit`.
+;; Remove a fact and re-saturate. Mixed relations (which have BOTH
+;; user-asserted facts AND rules) are supported via :edb-keys provenance
+;; — explicit facts are marked at dl-add-fact! time, the saturator uses
+;; dl-add-derived! which doesn't mark them, so the retract pass can
+;; safely wipe IDB-derived tuples while preserving the user's EDB.
 ;;
-;; To distinguish EDB from IDB, we treat any fact for a relation that
-;; has rules as IDB; otherwise EDB. (Phase 9 simplification — Phase 10
-;; may track provenance.)
+;; Effect:
+;;   - remove tuples matching `lit` from :facts and :edb-keys
+;;   - for every relation that has a rule (i.e. potentially IDB or
+;;     mixed), drop the IDB-derived portion (anything not in :edb-keys)
+;;     so the saturator can re-derive cleanly
+;;   - re-saturate
 (define
   dl-retract!
   (fn
@@ -106,14 +110,20 @@
     (let
       ((rel-key (dl-rel-name lit)))
       (do
-        ;; Drop the matching tuple from its relation list (if EDB-only).
+        ;; Drop the matching tuple from its relation list, its facts-keys,
+        ;; its first-arg index, AND from :edb-keys (if present).
         (when
           (has-key? (get db :facts) rel-key)
           (let
             ((existing (get (get db :facts) rel-key))
               (kept (list))
               (kept-keys {})
-              (kept-index {}))
+              (kept-index {})
+              (edb-rel (cond
+                         ((has-key? (get db :edb-keys) rel-key)
+                           (get (get db :edb-keys) rel-key))
+                         (else nil)))
+              (kept-edb {}))
             (do
               (for-each
                 (fn
@@ -122,7 +132,13 @@
                     (not (dl-tuple-equal? t lit))
                     (do
                       (append! kept t)
-                      (dict-set! kept-keys (dl-tuple-key t) true)
+                      (let ((tk (dl-tuple-key t)))
+                        (do
+                          (dict-set! kept-keys tk true)
+                          (when
+                            (and (not (nil? edb-rel))
+                                 (has-key? edb-rel tk))
+                            (dict-set! kept-edb tk true))))
                       (when
                         (>= (len t) 2)
                         (let ((k (dl-arg-key (nth t 1))))
@@ -134,17 +150,51 @@
                 existing)
               (dict-set! (get db :facts) rel-key kept)
               (dict-set! (get db :facts-keys) rel-key kept-keys)
-              (dict-set! (get db :facts-index) rel-key kept-index))))
-        ;; Wipe all relations that have a rule (these are IDB) so the
-        ;; saturator regenerates them from the surviving EDB.
+              (dict-set! (get db :facts-index) rel-key kept-index)
+              (when
+                (not (nil? edb-rel))
+                (dict-set! (get db :edb-keys) rel-key kept-edb)))))
+        ;; For each rule-head relation, strip the IDB-derived tuples
+        ;; (anything not marked in :edb-keys) so the saturator can
+        ;; cleanly re-derive without leaving stale tuples that depended
+        ;; on the now-removed fact.
         (let ((rule-heads (dl-rule-head-rels db)))
           (for-each
             (fn
               (k)
-              (do
-                (dict-set! (get db :facts) k (list))
-                (dict-set! (get db :facts-keys) k {})
-                (dict-set! (get db :facts-index) k {})))
+              (when
+                (has-key? (get db :facts) k)
+                (let
+                  ((existing (get (get db :facts) k))
+                    (kept (list))
+                    (kept-keys {})
+                    (kept-index {})
+                    (edb-rel (cond
+                               ((has-key? (get db :edb-keys) k)
+                                 (get (get db :edb-keys) k))
+                               (else {}))))
+                  (do
+                    (for-each
+                      (fn
+                        (t)
+                        (let ((tk (dl-tuple-key t)))
+                          (when
+                            (has-key? edb-rel tk)
+                            (do
+                              (append! kept t)
+                              (dict-set! kept-keys tk true)
+                              (when
+                                (>= (len t) 2)
+                                (let ((kk (dl-arg-key (nth t 1))))
+                                  (do
+                                    (when
+                                      (not (has-key? kept-index kk))
+                                      (dict-set! kept-index kk (list)))
+                                    (append! (get kept-index kk) t))))))))
+                      existing)
+                    (dict-set! (get db :facts) k kept)
+                    (dict-set! (get db :facts-keys) k kept-keys)
+                    (dict-set! (get db :facts-index) k kept-index)))))
             rule-heads))
         (dl-saturate! db)
         db))))
diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index d8e4f153..d8e3be56 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -14,7 +14,39 @@
 
 (define
   dl-make-db
-  (fn () {:facts {} :facts-keys {} :facts-index {} :rules (list) :strategy :semi-naive}))
+  (fn ()
+    {:facts {}
+     :facts-keys {}
+     :facts-index {}
+     :edb-keys {}
+     :rules (list)
+     :strategy :semi-naive}))
+
+;; Record (rel-key, tuple-key) as user-asserted EDB. dl-add-fact! calls
+;; this when an explicit fact is added; the saturator (which uses
+;; dl-add-derived!) does NOT, so derived tuples never appear here.
+;; dl-retract! consults :edb-keys to know which tuples must survive
+;; the wipe-and-resaturate round-trip.
+(define
+  dl-mark-edb!
+  (fn
+    (db rel-key tk)
+    (let
+      ((edb (get db :edb-keys)))
+      (do
+        (when
+          (not (has-key? edb rel-key))
+          (dict-set! edb rel-key {}))
+        (dict-set! (get edb rel-key) tk true)))))
+
+(define
+  dl-edb-fact?
+  (fn
+    (db rel-key tk)
+    (let
+      ((edb (get db :edb-keys)))
+      (and (has-key? edb rel-key)
+           (has-key? (get edb rel-key) tk)))))
 
 ;; Evaluation strategy. Default :semi-naive (the only strategy
 ;; currently implemented). :magic is reserved for goal-directed
@@ -196,6 +228,29 @@
   (fn
     (name) (dl-member-string? name dl-reserved-rel-names)))
 
+;; Internal: append a derived tuple to :facts without the public
+;; validation pass and without marking :edb-keys. Used by the saturator
+;; (eval.sx) and magic-sets (magic.sx). Returns true if the tuple was
+;; new, false if already present.
+(define
+  dl-add-derived!
+  (fn
+    (db lit)
+    (let
+      ((rel-key (dl-rel-name lit)))
+      (let
+        ((tuples (dl-ensure-rel! db rel-key))
+          (key-dict (get (get db :facts-keys) rel-key))
+          (tk (dl-tuple-key lit)))
+        (cond
+          ((has-key? key-dict tk) false)
+          (else
+            (do
+              (dict-set! key-dict tk true)
+              (append! tuples lit)
+              (dl-index-add! db rel-key lit)
+              true)))))))
+
 (define
   dl-add-fact!
   (fn
@@ -210,19 +265,13 @@
         (error (str "dl-add-fact!: expected ground literal, got " lit)))
       (else
         (let
-          ((rel-key (dl-rel-name lit)))
-          (let
-            ((tuples (dl-ensure-rel! db rel-key))
-              (key-dict (get (get db :facts-keys) rel-key))
-              (tk (dl-tuple-key lit)))
-            (cond
-              ((has-key? key-dict tk) false)
-              (else
-                (do
-                  (dict-set! key-dict tk true)
-                  (append! tuples lit)
-                  (dl-index-add! db rel-key lit)
-                  true)))))))))
+          ((rel-key (dl-rel-name lit)) (tk (dl-tuple-key lit)))
+          (do
+            ;; Always mark EDB origin — even if the tuple key was already
+            ;; present (e.g. previously derived), so an explicit assert
+            ;; promotes it to EDB and protects it from the IDB wipe.
+            (dl-mark-edb! db rel-key tk)
+            (dl-add-derived! db lit)))))))
 
 ;; The full safety check lives in builtins.sx (it has to know which
 ;; predicates are built-ins). dl-add-rule! calls it via forward
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index e0fc1554..17d9a4c6 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -130,7 +130,7 @@
             (s)
             (let
               ((derived (dl-apply-subst head s)))
-              (when (dl-add-fact! db derived) (set! new? true))))
+              (when (dl-add-derived! db derived) (set! new? true))))
           (dl-find-bindings body db (dl-empty-subst)))
         new?))))
 
@@ -326,7 +326,7 @@
       (fn
         (lit)
         (when
-          (dl-add-fact! db lit)
+          (dl-add-derived! db lit)
           (let
             ((rel (dl-rel-name lit)))
             (do
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 1f97c6d4..558a8a8e 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 260,
+  "total_passed": 262,
   "total_failed": 0,
-  "total": 260,
+  "total": 262,
   "suites": [
     {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
@@ -12,9 +12,9 @@
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":22,"failed":0,"total":22},
-    {"name":"api","passed":20,"failed":0,"total":20},
+    {"name":"api","passed":22,"failed":0,"total":22},
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T07:40:56+00:00"
+  "generated": "2026-05-11T07:50:41+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 143f7201..1b0e23de 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**260 / 260 passing** (0 failure(s)).
+**262 / 262 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -12,6 +12,6 @@
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 22 | 22 | ok |
-| api | 20 | 20 | ok |
+| api | 22 | 22 | ok |
 | magic | 36 | 36 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/api.sx b/lib/datalog/tests/api.sx
index b46df8f8..df430d30 100644
--- a/lib/datalog/tests/api.sx
+++ b/lib/datalog/tests/api.sx
@@ -159,6 +159,35 @@
             (dl-query db (quote (ancestor tom X)))))
         (list {:X (quote bob)}))
 
+      ;; dl-retract! on a relation with BOTH explicit facts AND a rule
+      ;; (a "mixed" relation) used to wipe the EDB portion when the IDB
+      ;; was re-derived, even when the retract didn't match anything.
+      ;; :edb-keys provenance now preserves user-asserted facts.
+      (dl-api-test-set! "dl-retract! preserves EDB in mixed relation"
+        (let
+          ((db (dl-program-data
+                 (quote ((p a) (p b) (q c)))
+                 (quote ((p X <- (q X)))))))
+          (do
+            (dl-saturate! db)
+            ;; Retract a non-existent tuple — should be a no-op.
+            (dl-retract! db (quote (p z)))
+            (dl-query db (quote (p X)))))
+        (list {:X (quote a)} {:X (quote b)} {:X (quote c)}))
+
+      ;; And retracting an actual EDB fact in a mixed relation drops
+      ;; only that fact; the derived portion stays.
+      (dl-api-test-set! "dl-retract! mixed: drop EDB, keep IDB"
+        (let
+          ((db (dl-program-data
+                 (quote ((p a) (p b) (q c)))
+                 (quote ((p X <- (q X)))))))
+          (do
+            (dl-saturate! db)
+            (dl-retract! db (quote (p a)))
+            (dl-query db (quote (p X)))))
+        (list {:X (quote b)} {:X (quote c)}))
+
       ;; dl-program-data + dl-query with constants in head.
       (dl-api-test-set! "constant-in-head data"
         (dl-query
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 42d90ca8..a245f56d 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **260/260 across 11 suites**
+`bash lib/datalog/conformance.sh` → **262/262 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,22 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — `dl-retract!` was silently destroying EDB facts in
+  "mixed" relations (those with BOTH user-asserted facts AND a rule
+  defining the same head). The retract pass wiped every rule-head
+  relation wholesale and then re-saturated — but the saturator only
+  re-derives the IDB portion, so explicit EDB facts vanished even
+  for a no-op retract of a non-existent tuple. Probe:
+  `(let ((db (dl-program "p(a). p(b). p(X) :- q(X). q(c).")))
+     (dl-retract! db (quote (p z))) (dl-query db (quote (p X))))`
+  went from `{a,b,c}` to just `{c}`.
+  Fix: tracked `:edb-keys` provenance in the db. `dl-add-fact!` (public
+  API) marks the tuple as EDB; saturator calls new internal
+  `dl-add-derived!` which doesn't mark it. `dl-retract!` now strips
+  only the IDB-derived portion of rule-head relations and preserves
+  EDB-marked tuples through the re-saturate pass. 2 new regression
+  tests; 262/262.
+
 - 2026-05-11 — Eval-semantics bug-hunt: nested `not(not(P))` was
   silently misinterpreted. Outer-level `not(...)` is parsed as
   negation, but the inner `not(banned(X))` was parsed as a regular

From 9e380fd96edf29b4cdc6e2abf3f390c752326e7f Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 07:57:01 +0000
Subject: [PATCH 79/89] datalog: aggregate validates that agg-var appears in
 goal
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`count(N, Y, p(X))` silently returned `N = 1` because `Y` was never
bound by the goal — every match contributed the same unbound symbol
which dl-val-member? deduped to a single entry. Similarly:

  sum(S, Y, p(X))    => raises "expected number, got symbol"
  findall(L, Y, p(X)) => L = (Y)  (a list containing the unbound symbol)
  count(N, Y, p(X))   => N = 1    (silent garbage)

Added a third validator in dl-eval-aggregate: the agg-var must
syntactically appear among the goal's variables. Error names the
variable and the goal and explains why the result would be
meaningless.

1 new test; conformance 263/263.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/aggregates.sx       |  8 ++++++++
 lib/datalog/scoreboard.json     |  8 ++++----
 lib/datalog/scoreboard.md       |  4 ++--
 lib/datalog/tests/aggregates.sx | 13 +++++++++++++
 plans/datalog-on-sx.md          | 11 ++++++++++-
 5 files changed, 37 insertions(+), 7 deletions(-)

diff --git a/lib/datalog/aggregates.sx b/lib/datalog/aggregates.sx
index 4911a330..0e62e536 100644
--- a/lib/datalog/aggregates.sx
+++ b/lib/datalog/aggregates.sx
@@ -113,6 +113,14 @@
           (error (str "datalog aggregate (" op
                       "): third arg must be a positive literal, got "
                       goal)))
+        ((not (dl-member-string?
+                (symbol->string agg-var)
+                (dl-vars-of goal)))
+          (error (str "datalog aggregate (" op
+                      "): aggregation variable " agg-var
+                      " does not appear in the goal " goal
+                      " — without it every match contributes the same "
+                      "(unbound) value and the result is meaningless")))
         (else
           (let ((vals (list)))
             (do
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 558a8a8e..8352bdbf 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 262,
+  "total_passed": 263,
   "total_failed": 0,
-  "total": 262,
+  "total": 263,
   "suites": [
     {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
@@ -11,10 +11,10 @@
     {"name":"builtins","passed":23,"failed":0,"total":23},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
-    {"name":"aggregates","passed":22,"failed":0,"total":22},
+    {"name":"aggregates","passed":23,"failed":0,"total":23},
     {"name":"api","passed":22,"failed":0,"total":22},
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T07:50:41+00:00"
+  "generated": "2026-05-11T07:56:45+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 1b0e23de..7bb4ab2b 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**262 / 262 passing** (0 failure(s)).
+**263 / 263 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -11,7 +11,7 @@
 | builtins | 23 | 23 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
-| aggregates | 22 | 22 | ok |
+| aggregates | 23 | 23 | ok |
 | api | 22 | 22 | ok |
 | magic | 36 | 36 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/aggregates.sx b/lib/datalog/tests/aggregates.sx
index 45b3ab88..42c687a6 100644
--- a/lib/datalog/tests/aggregates.sx
+++ b/lib/datalog/tests/aggregates.sx
@@ -256,6 +256,19 @@
           (fn () (dl-eval "p(1). q(N) :- count(N, X, 42)." "?- q(N).")))
         true)
 
+      ;; Aggregate validates that the agg-var (2nd arg) appears in the
+      ;; goal. Without it every match contributes the same unbound
+      ;; symbol — count silently returns 1, sum raises a confusing
+      ;; "expected number" error, etc. Catch the mistake at safety
+      ;; check time instead.
+      (dl-at-test! "agg-var must appear in goal"
+        (dl-at-throws?
+          (fn ()
+            (dl-eval
+              "p(1). p(2). c(N) :- count(N, Y, p(X))."
+              "?- c(N).")))
+        true)
+
       ;; Indirect recursion through aggregation also rejected.
       ;; q -> r (via positive lit), r -> q (via aggregate body).
       ;; The aggregate edge counts as negation for stratification.
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index a245f56d..0082efbd 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **262/262 across 11 suites**
+`bash lib/datalog/conformance.sh` → **263/263 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,15 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Aggregate variable validation: `count(N, Y, p(X))`
+  silently returned `N = 1` because `Y` was never bound in `p(X)` —
+  every match contributed the same unbound symbol, which dl-val-member?
+  deduped to a single entry. Similarly `sum(S, Y, p(X))` raised a
+  confusing "expected number" error from the underlying `+`. Added
+  a third validator in `dl-eval-aggregate`: the agg-var must appear
+  in the goal literal. Error names the variable and the goal and
+  explains the consequence. 1 new test; 263/263.
+
 - 2026-05-11 — `dl-retract!` was silently destroying EDB facts in
   "mixed" relations (those with BOTH user-asserted facts AND a rule
   defining the same head). The retract pass wiped every rule-head

From 00881f84eb2e9b276347a615777d9f9f8b1f029a Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 07:59:25 +0000
Subject: [PATCH 80/89] datalog: arith / by zero raises instead of returning
 inf
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`is(R, /(X, 0))` was silently producing IEEE infinity:

  (dl-eval "p(10). q(R) :- p(X), is(R, /(X, 0))." "?- q(R).")
  => ({:R inf})

That value then flowed through comparisons (anything < inf, anything
> inf) and aggregations (sum of inf, max of inf) producing nonsense
results downstream. `dl-eval-arith` now checks the divisor before
the host `/` and raises "division by zero in <expr>" — surfacing
the bug at its source rather than letting infinity propagate.

1 new test; conformance 264/264.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/builtins.sx       |  8 +++++++-
 lib/datalog/scoreboard.json   |  8 ++++----
 lib/datalog/scoreboard.md     |  4 ++--
 lib/datalog/tests/builtins.sx | 12 +++++++++++-
 plans/datalog-on-sx.md        |  8 +++++++-
 5 files changed, 31 insertions(+), 9 deletions(-)

diff --git a/lib/datalog/builtins.sx b/lib/datalog/builtins.sx
index 7bfd3d47..fad58d5a 100644
--- a/lib/datalog/builtins.sx
+++ b/lib/datalog/builtins.sx
@@ -72,7 +72,13 @@
                     ((= rel "+") (+ a b))
                     ((= rel "-") (- a b))
                     ((= rel "*") (* a b))
-                    ((= rel "/") (/ a b))
+                    ((= rel "/")
+                      (cond
+                        ((= b 0)
+                          (error
+                            (str "datalog arith: division by zero in "
+                                 w)))
+                        (else (/ a b))))
                     (else (error (str "datalog arith: unknown op " rel)))))))))
         (else (error (str "datalog arith: not a number — " w)))))))
 
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 8352bdbf..0049c748 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,14 +1,14 @@
 {
   "lang": "datalog",
-  "total_passed": 263,
+  "total_passed": 264,
   "total_failed": 0,
-  "total": 263,
+  "total": 264,
   "suites": [
     {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":29,"failed":0,"total":29},
     {"name":"eval","passed":39,"failed":0,"total":39},
-    {"name":"builtins","passed":23,"failed":0,"total":23},
+    {"name":"builtins","passed":24,"failed":0,"total":24},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":23,"failed":0,"total":23},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T07:56:45+00:00"
+  "generated": "2026-05-11T07:59:10+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 7bb4ab2b..a60c5c5f 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**263 / 263 passing** (0 failure(s)).
+**264 / 264 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -8,7 +8,7 @@
 | parse | 22 | 22 | ok |
 | unify | 29 | 29 | ok |
 | eval | 39 | 39 | ok |
-| builtins | 23 | 23 | ok |
+| builtins | 24 | 24 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 23 | 23 | ok |
diff --git a/lib/datalog/tests/builtins.sx b/lib/datalog/tests/builtins.sx
index 9d7e1852..b7398fb8 100644
--- a/lib/datalog/tests/builtins.sx
+++ b/lib/datalog/tests/builtins.sx
@@ -239,7 +239,17 @@
         "safe — = binds head var"
         (dl-bt-throws?
           (fn () (dl-program "p(a). p(b). x(Y) :- p(X), =(Y, X).")))
-        false))))
+        false)
+
+      ;; Division by zero raises with a clear error. Without this guard
+      ;; SX's `/` returned IEEE infinity, which then silently flowed
+      ;; through comparisons and aggregations.
+      (dl-bt-test!
+        "is — division by zero raises"
+        (dl-bt-throws?
+          (fn ()
+            (dl-eval "p(10). q(R) :- p(X), is(R, /(X, 0))." "?- q(R).")))
+        true))))
 
 (define
   dl-builtins-tests-run!
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 0082efbd..ac3eb4f7 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **263/263 across 11 suites**
+`bash lib/datalog/conformance.sh` → **264/264 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,12 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Division by zero in `is` silently produced IEEE
+  infinity instead of raising. `is(R, /(X, 0))` returned `R = inf`,
+  which then flowed through comparisons and aggregations to produce
+  nonsense results. `dl-eval-arith` now raises with a clear
+  "division by zero in <expr>" message. 1 new test; 264/264.
+
 - 2026-05-11 — Aggregate variable validation: `count(N, Y, p(X))`
   silently returned `N = 1` because `Y` was never bound in `p(X)` —
   every match contributed the same unbound symbol, which dl-val-member?

From ba60db2eef9dfb18edd8f0c5b6bab8e265cbb259 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 08:04:03 +0000
Subject: [PATCH 81/89] datalog: reject malformed dict body literals
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A dict in a rule body that isn't `{:neg <positive-lit>}` (the only
recognised dict shape) used to silently fall through every dispatch
clause in dl-rule-check-safety, contributing zero bound variables.
The user would then see a confusing "head variable(s) X do not
appear in any positive body literal" pointing at the head — not at
the actual bug in the body. Typos like `{:negs ...}` are the typical
trigger.

dl-process-lit! now flags both:

  - a dict that lacks :neg
  - a bare number / string / symbol used as a body lit

with a clear error naming the offending literal.

1 new regression test; conformance 265/265.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/builtins.sx     | 22 +++++++++++++++++++++-
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 13 +++++++++++++
 plans/datalog-on-sx.md      | 11 ++++++++++-
 5 files changed, 50 insertions(+), 8 deletions(-)

diff --git a/lib/datalog/builtins.sx b/lib/datalog/builtins.sx
index fad58d5a..720a8025 100644
--- a/lib/datalog/builtins.sx
+++ b/lib/datalog/builtins.sx
@@ -301,6 +301,18 @@
               (cond
                 ((and (dict? lit) (has-key? lit :neg))
                   (dl-process-neg! lit))
+                ;; A bare dict that is not a recognised negation is
+                ;; almost certainly a typo (e.g. `{:negs ...}` instead
+                ;; of `{:neg ...}`). Without this guard the dict would
+                ;; silently fall through every clause; the head safety
+                ;; check would then flag the head variables as unbound
+                ;; even though the real bug is the malformed body lit.
+                ((dict? lit)
+                  (set! err
+                    (str "body literal is a dict but lacks :neg — "
+                         "the only dict-shaped body lit recognised is "
+                         "{:neg <positive-lit>} for stratified "
+                         "negation, got " lit)))
                 ((dl-aggregate? lit) (dl-process-agg! lit))
                 ((dl-eq? lit) (dl-process-eq! lit))
                 ((dl-is? lit) (dl-process-is! lit))
@@ -315,7 +327,15 @@
                                "syntax; nested `not(...)` is not supported "
                                "(use stratified negation via an "
                                "intermediate relation)")))
-                      (else (dl-add-bound! (dl-vars-of lit))))))))))
+                      (else (dl-add-bound! (dl-vars-of lit))))))
+                (else
+                  ;; Anything that's not a dict, not a list, or an
+                  ;; empty list. Numbers / strings / symbols as body
+                  ;; lits don't make sense — surface the type.
+                  (set! err
+                    (str "body literal must be a positive lit, "
+                         "built-in, aggregate, or {:neg ...} dict, "
+                         "got " lit)))))))
         (for-each dl-process-lit! body)
         (when
           (nil? err)
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 0049c748..8d8671c0 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 264,
+  "total_passed": 265,
   "total_failed": 0,
-  "total": 264,
+  "total": 265,
   "suites": [
     {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":29,"failed":0,"total":29},
-    {"name":"eval","passed":39,"failed":0,"total":39},
+    {"name":"eval","passed":40,"failed":0,"total":40},
     {"name":"builtins","passed":24,"failed":0,"total":24},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T07:59:10+00:00"
+  "generated": "2026-05-11T08:03:45+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index a60c5c5f..21c23323 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**264 / 264 passing** (0 failure(s)).
+**265 / 265 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 30 | 30 | ok |
 | parse | 22 | 22 | ok |
 | unify | 29 | 29 | ok |
-| eval | 39 | 39 | ok |
+| eval | 40 | 40 | ok |
 | builtins | 24 | 24 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 9b0d6cd8..f859c2b2 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -221,6 +221,19 @@
               "banned(a). u(a). vip(X) :- u(X), not(not(banned(X))).")))
         true)
 
+      ;; A dict body literal that isn't `{:neg ...}` is almost always a
+      ;; typo — it would otherwise silently fall through to a confusing
+      ;; head-var-unbound safety error. Now caught with a clear message.
+      (dl-et-test!
+        "dict body lit without :neg rejected"
+        (dl-et-throws?
+          (fn ()
+            (let ((db (dl-make-db)))
+              (dl-add-rule! db
+                {:head (list (quote p) (quote X))
+                 :body (list {:weird "stuff"})}))))
+        true)
+
       (dl-et-test!
         "unsafe head var"
         (dl-et-throws? (fn () (dl-program "p(X, Y) :- q(X).")))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index ac3eb4f7..44f2cd32 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **264/264 across 11 suites**
+`bash lib/datalog/conformance.sh` → **265/265 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,15 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Body literal shape validation in
+  `dl-rule-check-safety`: a dict that isn't `{:neg ...}` (e.g. typo'd
+  `{:negs ...}`) used to silently fall through every dispatch clause,
+  contributing zero bound vars; the user would then see a confusing
+  "head var X unbound" error pointing at the head, not the malformed
+  body. Same for body lits that are bare numbers / strings / symbols.
+  Both shapes now raise a clear error naming the offending lit. 1 new
+  regression test; 265/265.
+
 - 2026-05-11 — Division by zero in `is` silently produced IEEE
   infinity instead of raising. `is(R, /(X, 0))` returned `R = inf`,
   which then flowed through comparisons and aggregations to produce

From 917ffe5ccceb4dcc662a479ed5a978c360f307f0 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 08:07:40 +0000
Subject: [PATCH 82/89] datalog: comparison ops require same-type operands
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Type-mixed comparisons were silently inconsistent:

  <("hello", 5)  =>  no result, no error  (silent false)
  <(a, 5)        =>  raises "Expected number, got symbol"

Both should fail loudly with a comprehensible message. Added
dl-compare-typeok?: <, <=, >, >= now require both operands to share
a primitive type (both numbers or both strings) and raise a clear
"comparison <op> requires same-type operands" error otherwise.

`!=` is exempted because it's the polymorphic inequality test
built on dl-tuple-equal? — cross-type pairs are legitimately unequal
and the existing semantics for that case match user intuition.

2 new regression tests; conformance 267/267.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/builtins.sx       | 19 +++++++++++++++++++
 lib/datalog/scoreboard.json   |  8 ++++----
 lib/datalog/scoreboard.md     |  4 ++--
 lib/datalog/tests/builtins.sx | 24 +++++++++++++++++++++++-
 plans/datalog-on-sx.md        | 11 ++++++++++-
 5 files changed, 58 insertions(+), 8 deletions(-)

diff --git a/lib/datalog/builtins.sx b/lib/datalog/builtins.sx
index 720a8025..90d5faed 100644
--- a/lib/datalog/builtins.sx
+++ b/lib/datalog/builtins.sx
@@ -82,6 +82,20 @@
                     (else (error (str "datalog arith: unknown op " rel)))))))))
         (else (error (str "datalog arith: not a number — " w)))))))
 
+;; Comparable types — both operands must be the same primitive type
+;; (both numbers, both strings). `!=` is the exception: it's defined
+;; for any pair (returns true iff not equal) since dl-tuple-equal?
+;; handles type-mixed comparisons.
+(define
+  dl-compare-typeok?
+  (fn
+    (rel a b)
+    (cond
+      ((= rel "!=") true)
+      ((and (number? a) (number? b)) true)
+      ((and (string? a) (string? b)) true)
+      (else false))))
+
 (define
   dl-eval-compare
   (fn
@@ -98,6 +112,11 @@
               rel
               " has unbound argument; "
               "ensure prior body literal binds the variable")))
+        ((not (dl-compare-typeok? rel a b))
+          (error
+            (str "datalog: comparison " rel " requires same-type "
+                 "operands (both numbers or both strings), got "
+                 a " and " b)))
         (else
           (let
             ((ok (cond ((= rel "<") (< a b)) ((= rel "<=") (<= a b)) ((= rel ">") (> a b)) ((= rel ">=") (>= a b)) ((= rel "!=") (not (dl-tuple-equal? a b))) (else (error (str "datalog: unknown compare " rel))))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 8d8671c0..9c394d50 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,14 +1,14 @@
 {
   "lang": "datalog",
-  "total_passed": 265,
+  "total_passed": 267,
   "total_failed": 0,
-  "total": 265,
+  "total": 267,
   "suites": [
     {"name":"tokenize","passed":30,"failed":0,"total":30},
     {"name":"parse","passed":22,"failed":0,"total":22},
     {"name":"unify","passed":29,"failed":0,"total":29},
     {"name":"eval","passed":40,"failed":0,"total":40},
-    {"name":"builtins","passed":24,"failed":0,"total":24},
+    {"name":"builtins","passed":26,"failed":0,"total":26},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
     {"name":"aggregates","passed":23,"failed":0,"total":23},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T08:03:45+00:00"
+  "generated": "2026-05-11T08:07:23+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 21c23323..89a66d4e 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**265 / 265 passing** (0 failure(s)).
+**267 / 267 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -8,7 +8,7 @@
 | parse | 22 | 22 | ok |
 | unify | 29 | 29 | ok |
 | eval | 40 | 40 | ok |
-| builtins | 24 | 24 | ok |
+| builtins | 26 | 26 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
 | aggregates | 23 | 23 | ok |
diff --git a/lib/datalog/tests/builtins.sx b/lib/datalog/tests/builtins.sx
index b7398fb8..13bb2709 100644
--- a/lib/datalog/tests/builtins.sx
+++ b/lib/datalog/tests/builtins.sx
@@ -249,7 +249,29 @@
         (dl-bt-throws?
           (fn ()
             (dl-eval "p(10). q(R) :- p(X), is(R, /(X, 0))." "?- q(R).")))
-        true))))
+        true)
+
+      ;; Comparison ops `<`, `<=`, `>`, `>=` require both operands to
+      ;; have the same primitive type. Cross-type comparisons used to
+      ;; silently return false (for some pairs) or raise a confusing
+      ;; host-level error (for others) — now they all raise with a
+      ;; message that names the offending values.
+      (dl-bt-test!
+        "comparison — string vs number raises"
+        (dl-bt-throws?
+          (fn ()
+            (dl-eval "p(\"hello\"). q(X) :- p(X), <(X, 5)." "?- q(X).")))
+        true)
+
+      ;; `!=` is the exception — it's a polymorphic inequality test
+      ;; (uses dl-tuple-equal? underneath) so cross-type pairs are
+      ;; legitimate (and trivially unequal).
+      (dl-bt-test-set! "!= works across types"
+        (dl-query
+          (dl-program
+            "p(1). p(\"1\"). q(X) :- p(X), !=(X, 1).")
+          (quote (q X)))
+        (list {:X "1"})))))
 
 (define
   dl-builtins-tests-run!
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 44f2cd32..a07670c2 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **265/265 across 11 suites**
+`bash lib/datalog/conformance.sh` → **267/267 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,15 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Type-mixed comparisons were silently inconsistent:
+  `<(X, 5)` with `X` bound to a string returned `()` (no result, no
+  error), while `X` bound to a symbol raised "Expected number, got
+  symbol". Both should fail loudly. Added `dl-compare-typeok?` —
+  `<`, `<=`, `>`, `>=` now require both operands to share a primitive
+  type (both numbers or both strings) and raise otherwise. `!=` is
+  exempted since it's a polymorphic inequality test built on
+  `dl-tuple-equal?`. 2 new regression tests; 267/267.
+
 - 2026-05-11 — Body literal shape validation in
   `dl-rule-check-safety`: a dict that isn't `{:neg ...}` (e.g. typo'd
   `{:negs ...}`) used to silently fall through every dispatch clause,

From 7a94a47e26d7480b89aeb6ff6ae9dae74cd9d46a Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 08:39:24 +0000
Subject: [PATCH 83/89] datalog: quoted 'atoms' tokenize as strings
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Quoted atoms with uppercase- or underscore-leading names were
misclassified as variables. `p('Hello World').` flowed through the
tokenizer's "atom" branch and through the parser's string->symbol,
producing a symbol named "Hello World". dl-var? inspects the first
character — "H" is uppercase, so the fact was rejected as non-ground
("expected ground literal").

Tokenizer now emits "string" for any '...' quoted form. Quoted atoms
become opaque string constants — matching how Datalog idiomatically
treats them, and avoiding a per-symbol "quoted" marker that would
have rippled through unification and dl-var?. The trade-off is that
'a' and a are no longer the same value (string vs symbol); for
Datalog this is the safer default.

Updated the existing "quoted atom" tokenize test, added a regression
case for an uppercase-named quoted atom, and a parse-level test that
verifies the AST. Conformance 269/269.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/scoreboard.json   | 10 +++++-----
 lib/datalog/scoreboard.md     |  6 +++---
 lib/datalog/tests/parse.sx    |  7 +++++++
 lib/datalog/tests/tokenize.sx | 13 +++++++++++--
 lib/datalog/tokenizer.sx      | 13 ++++++++++---
 plans/datalog-on-sx.md        | 14 +++++++++++++-
 6 files changed, 49 insertions(+), 14 deletions(-)

diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 9c394d50..40f37987 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,11 +1,11 @@
 {
   "lang": "datalog",
-  "total_passed": 267,
+  "total_passed": 269,
   "total_failed": 0,
-  "total": 267,
+  "total": 269,
   "suites": [
-    {"name":"tokenize","passed":30,"failed":0,"total":30},
-    {"name":"parse","passed":22,"failed":0,"total":22},
+    {"name":"tokenize","passed":31,"failed":0,"total":31},
+    {"name":"parse","passed":23,"failed":0,"total":23},
     {"name":"unify","passed":29,"failed":0,"total":29},
     {"name":"eval","passed":40,"failed":0,"total":40},
     {"name":"builtins","passed":26,"failed":0,"total":26},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T08:07:23+00:00"
+  "generated": "2026-05-11T08:39:03+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 89a66d4e..174fc06d 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,11 +1,11 @@
 # datalog scoreboard
 
-**267 / 267 passing** (0 failure(s)).
+**269 / 269 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
-| tokenize | 30 | 30 | ok |
-| parse | 22 | 22 | ok |
+| tokenize | 31 | 31 | ok |
+| parse | 23 | 23 | ok |
 | unify | 29 | 29 | ok |
 | eval | 40 | 40 | ok |
 | builtins | 26 | 26 | ok |
diff --git a/lib/datalog/tests/parse.sx b/lib/datalog/tests/parse.sx
index 9d0f7201..6fc81b27 100644
--- a/lib/datalog/tests/parse.sx
+++ b/lib/datalog/tests/parse.sx
@@ -106,6 +106,13 @@
         "string arg"
         (dl-parse "label(x, \"hi\").")
         (list {:body (list) :head (list (quote label) (quote x) "hi")}))
+      ;; Quoted 'atoms' parse as strings — a uppercase-starting name
+      ;; in quotes used to misclassify as a variable and reject the
+      ;; fact as non-ground.
+      (dl-pt-test!
+        "quoted atom arg parses as string"
+        (dl-parse "p('Hello World').")
+        (list {:body (list) :head (list (quote p) "Hello World")}))
       (dl-pt-test!
         "comparison literal"
         (dl-parse "p(X) :- <(X, 5).")
diff --git a/lib/datalog/tests/tokenize.sx b/lib/datalog/tests/tokenize.sx
index 51470a44..6c7b94a9 100644
--- a/lib/datalog/tests/tokenize.sx
+++ b/lib/datalog/tests/tokenize.sx
@@ -58,14 +58,23 @@
         "string"
         (dl-tk-values (dl-tokenize "\"hello\""))
         (list "hello" nil))
+      ;; Quoted 'atoms' tokenize as strings — see the type-table
+      ;; comment in lib/datalog/tokenizer.sx for the rationale.
       (dl-tk-test!
-        "quoted atom"
+        "quoted atom as string"
         (dl-tk-types (dl-tokenize "'two words'"))
-        (list "atom" "eof"))
+        (list "string" "eof"))
       (dl-tk-test!
         "quoted atom value"
         (dl-tk-values (dl-tokenize "'two words'"))
         (list "two words" nil))
+      ;; A quoted atom whose name would otherwise be a variable
+      ;; (uppercase / leading underscore) is now safely a string —
+      ;; this was the bug that motivated the type change.
+      (dl-tk-test!
+        "quoted Uppercase as string"
+        (dl-tk-types (dl-tokenize "'Hello'"))
+        (list "string" "eof"))
       (dl-tk-test! ":-" (dl-tk-values (dl-tokenize ":-")) (list ":-" nil))
       (dl-tk-test! "?-" (dl-tk-values (dl-tokenize "?-")) (list "?-" nil))
       (dl-tk-test! "<=" (dl-tk-values (dl-tokenize "<=")) (list "<=" nil))
diff --git a/lib/datalog/tokenizer.sx b/lib/datalog/tokenizer.sx
index a10a7ff7..cf0aa730 100644
--- a/lib/datalog/tokenizer.sx
+++ b/lib/datalog/tokenizer.sx
@@ -2,10 +2,13 @@
 ;;
 ;; Tokens: {:type T :value V :pos P}
 ;; Types:
-;;   "atom"    — lowercase-start ident or quoted 'atom'
+;;   "atom"    — lowercase-start bare identifier
 ;;   "var"     — uppercase-start or _-start ident (value is the name)
 ;;   "number"  — numeric literal (decoded to number)
-;;   "string"  — "..." string literal
+;;   "string"  — "..." string literal OR quoted 'atom' (treated as a
+;;               string value to avoid the var-vs-atom ambiguity that
+;;               would arise from a quoted atom whose name starts with
+;;               an uppercase letter or underscore)
 ;;   "punct"   — ( ) , .
 ;;   "op"      — :- ?- <= >= != < > = + - * /
 ;;   "eof"
@@ -192,7 +195,11 @@
                       (dl-emit! "number" (read-number start) start)
                       (scan!)))
                   ((= ch "'")
-                    (do (dl-emit! "atom" (read-quoted "'") start) (scan!)))
+                    ;; Quoted 'atoms' tokenize as strings so a name
+                    ;; like 'Hello World' doesn't get misclassified
+                    ;; as a variable by dl-var? (which inspects the
+                    ;; symbol's first character).
+                    (do (dl-emit! "string" (read-quoted "'") start) (scan!)))
                   ((= ch "\"")
                     (do (dl-emit! "string" (read-quoted "\"") start) (scan!)))
                   ((dl-lower? ch)
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index a07670c2..29572e5c 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **267/267 across 11 suites**
+`bash lib/datalog/conformance.sh` → **269/269 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,18 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Quoted atoms with uppercase-or-underscore-leading
+  names were misclassified as variables. `p('Hello World').` ran
+  through the tokenizer's `"atom"` branch and through the parser's
+  `string->symbol`, producing a symbol named "Hello World". dl-var?
+  checks the first character — "H" is uppercase, so the fact was
+  rejected as non-ground. Fix: tokenizer emits `"string"` for any
+  `'...'` quoted form, so quoted atoms become opaque string constants
+  (matching how Datalog idiomatically treats them — the alternative
+  was a per-symbol "quoted" marker which would have rippled through
+  unification and dl-var?). Updated the existing tokenize test and
+  added one for `'Hello'`; also added a parse-level regression. 269/269.
+
 - 2026-05-11 — Type-mixed comparisons were silently inconsistent:
   `<(X, 5)` with `X` bound to a string returned `()` (no result, no
   error), while `X` bound to a symbol raised "Expected number, got

From 6bae94bae1dedf4af31610e27a930d4fa8ed855c Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 08:44:30 +0000
Subject: [PATCH 84/89] datalog: reject compound terms in fact / rule-head args

Datalog has no function symbols in argument positions, but the
existing dl-add-fact! / dl-add-rule! validators only checked that
literals were ground (no free variables). A compound like `+(1, 2)`
contains no variables, so:

  p(+(1, 2)).
  => stored as the unreduced tuple `(p (+ 1 2))`

  double(*(X, 2)) :- n(X).  n(3).
  => saturates `double((* 3 2))` instead of `double(6)`

Added dl-simple-term? (number / string / symbol) and an
args-simple? walker, used by:

  - dl-add-fact!: all args must be simple terms
  - dl-add-rule!: rule head args must be simple terms (variables
    are symbols, so they pass)

Compounds remain legal in body literals where they encode `is` /
arithmetic / aggregate sub-goals. Error messages name the offending
literal and point the user at the body-only mechanism.

2 new regression tests; conformance 271/271.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/db.sx           | 28 ++++++++++++++++++++++++++++
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 18 ++++++++++++++++++
 plans/datalog-on-sx.md      | 12 +++++++++++-
 5 files changed, 63 insertions(+), 7 deletions(-)

diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index d8e3be56..230d1c1c 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -251,6 +251,24 @@
               (dl-index-add! db rel-key lit)
               true)))))))
 
+;; A simple term — number, string, or symbol — i.e. anything legal
+;; as an EDB fact arg. Compound (list) args belong only in body
+;; literals where they encode arithmetic / aggregate sub-goals.
+(define
+  dl-simple-term?
+  (fn
+    (term)
+    (or (number? term) (string? term) (symbol? term))))
+
+(define
+  dl-args-simple?
+  (fn
+    (lit i n)
+    (cond
+      ((>= i n) true)
+      ((not (dl-simple-term? (nth lit i))) false)
+      (else (dl-args-simple? lit (+ i 1) n)))))
+
 (define
   dl-add-fact!
   (fn
@@ -261,6 +279,11 @@
       ((dl-reserved-rel? (dl-rel-name lit))
         (error (str "dl-add-fact!: '" (dl-rel-name lit)
                     "' is a reserved name (built-in / aggregate / negation)")))
+      ((not (dl-args-simple? lit 1 (len lit)))
+        (error (str "dl-add-fact!: fact args must be numbers, strings, "
+                    "or symbols — compound args (e.g. arithmetic "
+                    "expressions) are body-only and aren't evaluated "
+                    "in fact position. got " lit)))
       ((not (dl-ground? lit (dl-empty-subst)))
         (error (str "dl-add-fact!: expected ground literal, got " lit)))
       (else
@@ -373,6 +396,11 @@
         (error (str "dl-add-rule!: head must be a non-empty list "
                     "starting with a relation-name symbol, got "
                     (get rule :head))))
+      ((not (dl-args-simple? (get rule :head) 1 (len (get rule :head))))
+        (error (str "dl-add-rule!: rule head args must be variables or "
+                    "constants — compound terms (e.g. `(*(X, 2))`) are "
+                    "not legal in head position; introduce an `is`-bound "
+                    "intermediate in the body. got " (get rule :head))))
       ((not (list? (if (has-key? rule :body) (get rule :body) (list))))
         (error (str "dl-add-rule!: body must be a list of literals, got "
                     (get rule :body))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 40f37987..b30f55a4 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 269,
+  "total_passed": 271,
   "total_failed": 0,
-  "total": 269,
+  "total": 271,
   "suites": [
     {"name":"tokenize","passed":31,"failed":0,"total":31},
     {"name":"parse","passed":23,"failed":0,"total":23},
     {"name":"unify","passed":29,"failed":0,"total":29},
-    {"name":"eval","passed":40,"failed":0,"total":40},
+    {"name":"eval","passed":42,"failed":0,"total":42},
     {"name":"builtins","passed":26,"failed":0,"total":26},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":10,"failed":0,"total":10},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T08:39:03+00:00"
+  "generated": "2026-05-11T08:44:12+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 174fc06d..3ea409b0 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**269 / 269 passing** (0 failure(s)).
+**271 / 271 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 31 | 31 | ok |
 | parse | 23 | 23 | ok |
 | unify | 29 | 29 | ok |
-| eval | 40 | 40 | ok |
+| eval | 42 | 42 | ok |
 | builtins | 26 | 26 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 10 | 10 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index f859c2b2..1dd432de 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -234,6 +234,24 @@
                  :body (list {:weird "stuff"})}))))
         true)
 
+      ;; Facts may only have simple-term args (number / string / symbol).
+      ;; A compound arg like `+(1, 2)` would otherwise be silently
+      ;; stored as the unreduced expression `(+ 1 2)` because dl-ground?
+      ;; sees no free variables.
+      (dl-et-test!
+        "compound arg in fact rejected"
+        (dl-et-throws? (fn () (dl-program "p(+(1, 2)).")))
+        true)
+
+      ;; Rule heads may only have variable or constant args — no
+      ;; compounds. Compound heads would be saturated as unreduced
+      ;; tuples rather than the arithmetic result the user expected.
+      (dl-et-test!
+        "compound arg in rule head rejected"
+        (dl-et-throws?
+          (fn () (dl-program "n(3). double(*(X, 2)) :- n(X).")))
+        true)
+
       (dl-et-test!
         "unsafe head var"
         (dl-et-throws? (fn () (dl-program "p(X, Y) :- q(X).")))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 29572e5c..2c65125c 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **269/269 across 11 suites**
+`bash lib/datalog/conformance.sh` → **271/271 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,16 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Compound terms in fact-arg / rule-head positions were
+  silently stored as unreduced expressions. `p(+(1, 2)).` resulted
+  in a tuple `(p (+ 1 2))` (dl-ground? sees no free variables, so it
+  passed). `double(*(X, 2)) :- n(X).` saturated to `double((* 3 2))`
+  rather than `double(6)`. Datalog has no function symbols in arg
+  positions — `dl-add-fact!` and `dl-add-rule!` now reject compound
+  args via a new `dl-simple-term?` (number / string / symbol).
+  Compounds remain legal in body literals where they encode `is` /
+  arithmetic / aggregate sub-goals. 2 new regression tests; 271/271.
+
 - 2026-05-11 — Quoted atoms with uppercase-or-underscore-leading
   names were misclassified as variables. `p('Hello World').` ran
   through the tokenizer's `"atom"` branch and through the parser's

From 66aa0034615b8848fb90b6cb28888861bbed7738 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 08:49:20 +0000
Subject: [PATCH 85/89] datalog: anonymous _ in negation is existential, not
 unbound
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The canonical Datalog idiom for "no X has any Y":

  orphan(X) :- person(X), not(parent(X, _)).

was rejected by the safety check with "negation refers to unbound
variable(s) (\"_anon1\")". The parser renames each anonymous `_`
to a fresh `_anon*` symbol so multiple `_` occurrences don't unify
with each other, and the negation safety walk then demanded all
free vars in the negated lit be bound by an earlier positive body
lit — including the renamed anonymous vars.

Anonymous vars in a negation are existentially quantified within
the negation, not requirements from outside. Added dl-non-anon-vars
to strip `_anon*` names from the `needed` set before the binding
check in dl-process-neg!. Real vars (like `X` in the orphan idiom)
still must be bound by an earlier positive body lit, just as before.

2 new regression tests (orphan idiom + multi-anon "solo" pattern);
conformance 273/273.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/builtins.sx       | 31 +++++++++++++++++++++++++++++--
 lib/datalog/scoreboard.json   |  8 ++++----
 lib/datalog/scoreboard.md     |  4 ++--
 lib/datalog/tests/negation.sx | 21 +++++++++++++++++++++
 plans/datalog-on-sx.md        | 14 +++++++++++++-
 5 files changed, 69 insertions(+), 9 deletions(-)

diff --git a/lib/datalog/builtins.sx b/lib/datalog/builtins.sx
index 90d5faed..9989c1ad 100644
--- a/lib/datalog/builtins.sx
+++ b/lib/datalog/builtins.sx
@@ -179,6 +179,27 @@
           vs)
         out))))
 
+;; Filter a list of variable-name strings to exclude anonymous-renamed
+;; vars (`_` in source → `_anon*` by dl-rename-anon-term). Used by
+;; the negation safety check, where anonymous vars are existential
+;; within the negated literal.
+(define
+  dl-non-anon-vars
+  (fn
+    (vs)
+    (let
+      ((out (list)))
+      (do
+        (for-each
+          (fn
+            (v)
+            (when
+              (not (and (>= (len v) 5)
+                        (= (slice v 0 5) "_anon")))
+              (append! out v)))
+          vs)
+        out))))
+
 (define
   dl-rule-check-safety
   (fn
@@ -282,8 +303,14 @@
                      ((and (list? inner) (> (len inner) 0))
                        (dl-rel-name inner))
                      (else nil)))
-                  (needed (dl-vars-of inner))
-                  (missing (dl-vars-not-in (dl-vars-of inner) bound)))
+                  ;; Anonymous variables (`_` in source → `_anon*` after
+                  ;; renaming) are existentially quantified within the
+                  ;; negated literal — they don't need to be bound by
+                  ;; an earlier body lit, since `not p(X, _)` is a
+                  ;; valid idiom for "no Y exists s.t. p(X, Y)". Filter
+                  ;; them out of the safety check.
+                  (needed (dl-non-anon-vars (dl-vars-of inner)))
+                  (missing (dl-vars-not-in needed bound)))
                 (cond
                   ((and (not (nil? inner-rn)) (dl-reserved-rel? inner-rn))
                     (set! err
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index b30f55a4..8f389f01 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 271,
+  "total_passed": 273,
   "total_failed": 0,
-  "total": 271,
+  "total": 273,
   "suites": [
     {"name":"tokenize","passed":31,"failed":0,"total":31},
     {"name":"parse","passed":23,"failed":0,"total":23},
@@ -10,11 +10,11 @@
     {"name":"eval","passed":42,"failed":0,"total":42},
     {"name":"builtins","passed":26,"failed":0,"total":26},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
-    {"name":"negation","passed":10,"failed":0,"total":10},
+    {"name":"negation","passed":12,"failed":0,"total":12},
     {"name":"aggregates","passed":23,"failed":0,"total":23},
     {"name":"api","passed":22,"failed":0,"total":22},
     {"name":"magic","passed":36,"failed":0,"total":36},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T08:44:12+00:00"
+  "generated": "2026-05-11T08:49:02+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 3ea409b0..b13d97c0 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**271 / 271 passing** (0 failure(s)).
+**273 / 273 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -10,7 +10,7 @@
 | eval | 42 | 42 | ok |
 | builtins | 26 | 26 | ok |
 | semi_naive | 8 | 8 | ok |
-| negation | 10 | 10 | ok |
+| negation | 12 | 12 | ok |
 | aggregates | 23 | 23 | ok |
 | api | 22 | 22 | ok |
 | magic | 36 | 36 | ok |
diff --git a/lib/datalog/tests/negation.sx b/lib/datalog/tests/negation.sx
index e4de6207..9a5aae3d 100644
--- a/lib/datalog/tests/negation.sx
+++ b/lib/datalog/tests/negation.sx
@@ -169,6 +169,27 @@
           (list (quote q) (quote X)))
         (list))
 
+      ;; Anonymous `_` in a negated literal is existentially quantified
+      ;; — it doesn't need to be bound by an earlier body lit. Without
+      ;; this exemption the safety check would reject the common idiom
+      ;; `orphan(X) :- person(X), not(parent(X, _))`.
+      (dl-nt-test-set! "negation with anonymous var — orphan idiom"
+        (dl-query
+          (dl-program
+            "person(a). person(b). person(c). parent(a, b).
+             orphan(X) :- person(X), not(parent(X, _)).")
+          (list (quote orphan) (quote X)))
+        (list {:X (quote b)} {:X (quote c)}))
+
+      ;; Multiple anonymous vars are each independently existential.
+      (dl-nt-test-set! "negation with multiple anonymous vars"
+        (dl-query
+          (dl-program
+            "u(a). u(b). u(c). edge(a, x). edge(b, y).
+             solo(X) :- u(X), not(edge(X, _)).")
+          (list (quote solo) (quote X)))
+        (list {:X (quote c)}))
+
       ;; Stratifiability checks.
       (dl-nt-test! "non-stratifiable rejected"
         (dl-nt-throws?
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 2c65125c..75d49ba2 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **271/271 across 11 suites**
+`bash lib/datalog/conformance.sh` → **273/273 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,18 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Anonymous `_` in a negated literal was incorrectly
+  flagged by the safety check. The canonical idiom
+  `orphan(X) :- person(X), not(parent(X, _))` was rejected with
+  "negation refers to unbound variable(s) (\"_anon1\")" because the
+  parser renames each `_` to a fresh `_anon*` symbol and the negation
+  safety walk demanded all vars in the negated lit be bound by an
+  earlier positive body literal. Anonymous vars in negation are
+  existentially quantified — they shouldn't need outer binding.
+  Added `dl-non-anon-vars` filter; `dl-process-neg!` now strips
+  `_anon*` names from `needed` before the binding check. 2 new
+  regression tests; 273/273.
+
 - 2026-05-11 — Compound terms in fact-arg / rule-head positions were
   silently stored as unreduced expressions. `p(+(1, 2)).` resulted
   in a tuple `(p (+ 1 2))` (dl-ground? sees no free variables, so it

From 82dfa20e827b937b4f89e5a412cd8418d40eafe9 Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 08:59:28 +0000
Subject: [PATCH 86/89] datalog: dl-magic-query pre-saturates for aggregate
 correctness

dl-magic-query could silently diverge from dl-query when an
aggregate's inner-goal relation was IDB. The rewriter passes
aggregate body lits through unchanged (no magic propagation
generated for them), so the inner relation was empty in the magic
db and the aggregate returned 0. Repro:

  (dl-eval-magic
    "u(a). u(b). u(c). u(d). banned(b). banned(d).
     active(X) :- u(X), not(banned(X)).
     n(N) :- count(N, X, active(X))."
    "?- n(N).")
  => ({:N 0})   ; should be ({:N 2})

dl-magic-query now pre-saturates the source db before copying facts
into the magic db. This guarantees equivalence with dl-query for
every stratified program; the magic benefit still comes from
goal-directed re-derivation of the query relation under the seed
(which matters for large recursive joins). The existing test cases
happened to dodge this because their aggregate inner-goals were all
EDB.

1 new regression test; conformance 274/274.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/magic.sx        | 64 ++++++++++++++++++++++---------------
 lib/datalog/scoreboard.json |  8 ++---
 lib/datalog/scoreboard.md   |  4 +--
 lib/datalog/tests/magic.sx  | 23 +++++++++++++
 plans/datalog-on-sx.md      | 19 ++++++++++-
 5 files changed, 85 insertions(+), 33 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index ce8b20a8..43ab7404 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -392,31 +392,43 @@
            (and (dict? query-goal) (has-key? query-goal :neg)))
         (dl-query db query-goal))
       (else
-        (let
-          ((query-rel (dl-rel-name query-goal))
-            (query-adn (dl-adorn-goal query-goal)))
+        (do
+          ;; Pre-saturate the source db. The magic rewriter passes
+          ;; aggregate body lits through unchanged (no magic
+          ;; propagation generated for them) — so if an aggregate's
+          ;; inner-goal relation is IDB, it would be empty in the
+          ;; magic db unless its tuples are already materialised in
+          ;; the source. Same for negation against IDB. Pre-saturating
+          ;; guarantees `dl-magic-query` returns the same answers as
+          ;; `dl-query` for every stratified program; the efficiency
+          ;; benefit then comes from goal-directed re-derivation of
+          ;; the query relation under the magic seed.
+          (dl-saturate! db)
           (let
-            ((query-args (dl-bound-args query-goal query-adn))
-              (rules (dl-rules db)))
+            ((query-rel (dl-rel-name query-goal))
+              (query-adn (dl-adorn-goal query-goal)))
             (let
-              ((rewritten (dl-magic-rewrite rules query-rel query-adn query-args))
-                (mdb (dl-make-db))
-                (rule-heads (dl-magic-rule-heads rules)))
-          (do
-            ;; Copy ALL existing facts. EDB-only relations bring their
-            ;; tuples; mixed EDB+IDB relations bring both their EDB
-            ;; portion and any pre-saturated IDB tuples (which the
-            ;; rewritten rules would re-derive anyway). Skipping facts
-            ;; for rule-headed relations would leave the magic run
-            ;; without the EDB portion of mixed relations.
-            (for-each
-              (fn
-                (rel)
-                (for-each
-                  (fn (t) (dl-add-fact! mdb t))
-                  (dl-rel-tuples db rel)))
-              (keys (get db :facts)))
-            ;; Seed + rewritten rules.
-            (dl-add-fact! mdb (get rewritten :seed))
-            (for-each (fn (r) (dl-add-rule! mdb r)) (get rewritten :rules))
-            (dl-query mdb query-goal)))))))))
+              ((query-args (dl-bound-args query-goal query-adn))
+                (rules (dl-rules db)))
+              (let
+                ((rewritten (dl-magic-rewrite rules query-rel query-adn query-args))
+                  (mdb (dl-make-db))
+                  (rule-heads (dl-magic-rule-heads rules)))
+            (do
+              ;; Copy ALL existing facts. EDB-only relations bring their
+              ;; tuples; mixed EDB+IDB relations bring both their EDB
+              ;; portion and any pre-saturated IDB tuples (which the
+              ;; rewritten rules would re-derive anyway). Skipping facts
+              ;; for rule-headed relations would leave the magic run
+              ;; without the EDB portion of mixed relations.
+              (for-each
+                (fn
+                  (rel)
+                  (for-each
+                    (fn (t) (dl-add-fact! mdb t))
+                    (dl-rel-tuples db rel)))
+                (keys (get db :facts)))
+              ;; Seed + rewritten rules.
+              (dl-add-fact! mdb (get rewritten :seed))
+              (for-each (fn (r) (dl-add-rule! mdb r)) (get rewritten :rules))
+              (dl-query mdb query-goal))))))))))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index 8f389f01..ae3a7255 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,8 +1,8 @@
 {
   "lang": "datalog",
-  "total_passed": 273,
+  "total_passed": 274,
   "total_failed": 0,
-  "total": 273,
+  "total": 274,
   "suites": [
     {"name":"tokenize","passed":31,"failed":0,"total":31},
     {"name":"parse","passed":23,"failed":0,"total":23},
@@ -13,8 +13,8 @@
     {"name":"negation","passed":12,"failed":0,"total":12},
     {"name":"aggregates","passed":23,"failed":0,"total":23},
     {"name":"api","passed":22,"failed":0,"total":22},
-    {"name":"magic","passed":36,"failed":0,"total":36},
+    {"name":"magic","passed":37,"failed":0,"total":37},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T08:49:02+00:00"
+  "generated": "2026-05-11T08:59:09+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index b13d97c0..0e44891b 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,6 +1,6 @@
 # datalog scoreboard
 
-**273 / 273 passing** (0 failure(s)).
+**274 / 274 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
@@ -13,5 +13,5 @@
 | negation | 12 | 12 | ok |
 | aggregates | 23 | 23 | ok |
 | api | 22 | 22 | ok |
-| magic | 36 | 36 | ok |
+| magic | 37 | 37 | ok |
 | demo | 21 | 21 | ok |
diff --git a/lib/datalog/tests/magic.sx b/lib/datalog/tests/magic.sx
index 29508c87..b6a895ca 100644
--- a/lib/datalog/tests/magic.sx
+++ b/lib/datalog/tests/magic.sx
@@ -388,6 +388,29 @@
             (= (len semi) (len magic))))
         true)
 
+      ;; The magic rewriter passes aggregate body lits through
+      ;; unchanged, so an aggregate over an IDB relation would see an
+      ;; empty inner-goal in the magic db unless the IDB is already
+      ;; materialised. dl-magic-query now pre-saturates the source db
+      ;; to guarantee equivalence with dl-query for every stratified
+      ;; program. Previously this returned `({:N 0})` because `active`
+      ;; (IDB, derived through negation) was never derived in the
+      ;; magic db.
+      (dl-mt-test! "magic over aggregate-of-IDB matches vanilla"
+        (let
+          ((src
+             "u(a). u(b). u(c). u(d). banned(b). banned(d).
+              active(X) :- u(X), not(banned(X)).
+              n(N) :- count(N, X, active(X))."))
+          (let
+            ((vanilla (dl-eval src "?- n(N)."))
+              (magic (dl-eval-magic src "?- n(N).")))
+            (and (= (len vanilla) 1)
+                 (= (len magic) 1)
+                 (= (get (first vanilla) "N")
+                    (get (first magic) "N")))))
+        true)
+
       ;; magic-query doesn't mutate caller db.
       (dl-mt-test! "magic-query preserves caller db"
         (let
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 75d49ba2..81a5ddf0 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **273/273 across 11 suites**
+`bash lib/datalog/conformance.sh` → **274/274 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,23 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — `dl-magic-query` could silently diverge from
+  `dl-query` when an aggregate's inner-goal relation was IDB. The
+  rewriter passes aggregate body lits through unchanged (no magic
+  propagation for them), so the inner relation was empty in the
+  magic db and the aggregate returned 0. Probe:
+  `dl-eval-magic "u(a). u(b). u(c). u(d). banned(b). banned(d).
+                  active(X) :- u(X), not(banned(X)).
+                  n(N) :- count(N, X, active(X))." "?- n(N)."`
+  returned `N=0` instead of `N=2`. Fix: `dl-magic-query` now
+  pre-saturates the source db before copying facts into the magic
+  db. This guarantees equivalence with `dl-query` for every
+  stratified program; the magic benefit comes from goal-directed
+  re-derivation of the query relation under the seed (which still
+  matters for large recursive joins). The existing test suite's
+  aggregate cases happened to dodge this because the inner goals
+  were all EDB. 1 new regression test; 274/274.
+
 - 2026-05-11 — Anonymous `_` in a negated literal was incorrectly
   flagged by the safety check. The canonical idiom
   `orphan(X) :- person(X), not(parent(X, _))` was rejected with

From ce98d97728eb112fcad2b0ada6ce313ded5475da Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 09:34:41 +0000
Subject: [PATCH 87/89] datalog: anonymous-renamer avoids user `_anon<N>`
 collision
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The renamer for anonymous `_` variables started at counter 0 and
produced `_anon1, _anon2, ...` unconditionally. A user writing the
same naming convention would see their variables shadowed:

  (dl-eval "p(a, b). p(c, d). q(_anon1) :- p(_anon1, _)."
           "?- q(X).")
  => ()    ; should be ({:X a} {:X c})

The `_` got renamed to `_anon1` too, collapsing the two positions
of `p` to a single var (forcing args to be equal — which neither
tuple satisfies).

Fix: scan each rule (and query goal) for the highest `_anon<N>`
already present and start the renamer past it. New helpers
`dl-max-anon-num` / `dl-max-anon-num-list` / `dl-try-parse-int`
walk the rule tree; `dl-make-anon-renamer` now takes a `start`
argument; `dl-rename-anon-rule` and the query-time renamer in
`dl-query` both compute the start from the input.

1 regression test; conformance 275/275.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/db.sx           | 75 ++++++++++++++++++++++++++++++++++---
 lib/datalog/eval.sx         |  5 ++-
 lib/datalog/scoreboard.json |  8 ++--
 lib/datalog/scoreboard.md   |  4 +-
 lib/datalog/tests/eval.sx   | 14 +++++++
 plans/datalog-on-sx.md      | 13 ++++++-
 6 files changed, 105 insertions(+), 14 deletions(-)

diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index 230d1c1c..9df4234b 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -367,19 +367,82 @@
 (define
   dl-make-anon-renamer
   (fn
-    ()
-    (let ((counter 0))
+    (start)
+    (let ((counter start))
       (fn () (do (set! counter (+ counter 1))
                  (string->symbol (str "_anon" counter)))))))
 
+;; Scan a rule for variables already named `_anon<N>` (which would
+;; otherwise collide with the renamer's output). Returns the max N
+;; seen, or 0 if none. The renamer then starts at that max + 1, so
+;; freshly-introduced anonymous names can't shadow a user-written
+;; `_anon<N>` symbol.
+(define
+  dl-max-anon-num
+  (fn
+    (term acc)
+    (cond
+      ((symbol? term)
+        (let ((s (symbol->string term)))
+          (cond
+            ((and (>= (len s) 6) (= (slice s 0 5) "_anon"))
+              (let ((n (dl-try-parse-int (slice s 5 (len s)))))
+                (cond
+                  ((nil? n) acc)
+                  ((> n acc) n)
+                  (else acc))))
+            (else acc))))
+      ((dict? term)
+        (cond
+          ((has-key? term :neg)
+            (dl-max-anon-num (get term :neg) acc))
+          (else acc)))
+      ((list? term) (dl-max-anon-num-list term acc 0))
+      (else acc))))
+
+(define
+  dl-max-anon-num-list
+  (fn
+    (xs acc i)
+    (cond
+      ((>= i (len xs)) acc)
+      (else
+        (dl-max-anon-num-list xs (dl-max-anon-num (nth xs i) acc) (+ i 1))))))
+
+;; Cheap "is this string a decimal int" check. Returns the number or
+;; nil. Avoids relying on host parse-number, which on non-int strings
+;; might raise rather than return nil.
+(define
+  dl-try-parse-int
+  (fn
+    (s)
+    (cond
+      ((= (len s) 0) nil)
+      ((not (dl-all-digits? s 0 (len s))) nil)
+      (else (parse-number s)))))
+
+(define
+  dl-all-digits?
+  (fn
+    (s i n)
+    (cond
+      ((>= i n) true)
+      ((let ((c (slice s i (+ i 1))))
+         (not (and (>= c "0") (<= c "9"))))
+        false)
+      (else (dl-all-digits? s (+ i 1) n)))))
+
 (define
   dl-rename-anon-rule
   (fn
     (rule)
-    (let ((next-name (dl-make-anon-renamer)))
-      {:head (dl-rename-anon-term (get rule :head) next-name)
-       :body (map (fn (lit) (dl-rename-anon-lit lit next-name))
-                  (get rule :body))})))
+    (let
+      ((start (dl-max-anon-num (get rule :head)
+                (dl-max-anon-num-list (get rule :body) 0 0))))
+      (let ((next-name (dl-make-anon-renamer start)))
+        {:head (dl-rename-anon-term (get rule :head) next-name)
+         :body (map (fn (lit) (dl-rename-anon-lit lit next-name))
+                    (get rule :body))}))))
 
 (define
   dl-add-rule!
diff --git a/lib/datalog/eval.sx b/lib/datalog/eval.sx
index 17d9a4c6..abf8e458 100644
--- a/lib/datalog/eval.sx
+++ b/lib/datalog/eval.sx
@@ -428,7 +428,10 @@
       ;; names.
       (let
         ((goals (dl-query-coerce goal))
-          (renamer (dl-make-anon-renamer)))
+          ;; Start the renamer past any `_anon<N>` symbols the user
+          ;; may have written in the query — avoids collision.
+          (renamer
+            (dl-make-anon-renamer (dl-max-anon-num-list goal 0 0))))
         (let
           ((user-vars (dl-query-user-vars goals))
             (renamed (map (fn (g) (dl-rename-anon-lit g renamer)) goals)))
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index ae3a7255..e7621023 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 274,
+  "total_passed": 275,
   "total_failed": 0,
-  "total": 274,
+  "total": 275,
   "suites": [
     {"name":"tokenize","passed":31,"failed":0,"total":31},
     {"name":"parse","passed":23,"failed":0,"total":23},
     {"name":"unify","passed":29,"failed":0,"total":29},
-    {"name":"eval","passed":42,"failed":0,"total":42},
+    {"name":"eval","passed":43,"failed":0,"total":43},
     {"name":"builtins","passed":26,"failed":0,"total":26},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":12,"failed":0,"total":12},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":37,"failed":0,"total":37},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T08:59:09+00:00"
+  "generated": "2026-05-11T09:34:17+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 0e44891b..4676d363 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**274 / 274 passing** (0 failure(s)).
+**275 / 275 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 31 | 31 | ok |
 | parse | 23 | 23 | ok |
 | unify | 29 | 29 | ok |
-| eval | 42 | 42 | ok |
+| eval | 43 | 43 | ok |
 | builtins | 26 | 26 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 12 | 12 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 1dd432de..937a49dc 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -252,6 +252,20 @@
           (fn () (dl-program "n(3). double(*(X, 2)) :- n(X).")))
         true)
 
+      ;; The anonymous-variable renamer used to start at `_anon1`
+      ;; unconditionally; a rule that wrote `q(_anon1) :- p(_anon1, _)`
+      ;; (the user picking the same name the renamer would generate)
+      ;; would see the `_` renamed to `_anon1` too, collapsing the
+      ;; two positions in `p(_anon1, _)` to a single var. Now the
+      ;; renamer scans the rule for the max `_anon<N>` and starts past
+      ;; it, so user-written names of that form are preserved.
+      (dl-et-test-set! "anonymous-rename avoids user `_anon` collision"
+        (dl-query
+          (dl-program
+            "p(a, b). p(c, d). q(_anon1) :- p(_anon1, _).")
+          (quote (q X)))
+        (list {:X (quote a)} {:X (quote c)}))
+
       (dl-et-test!
         "unsafe head var"
         (dl-et-throws? (fn () (dl-program "p(X, Y) :- q(X).")))
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 81a5ddf0..791c77d8 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **274/274 across 11 suites**
+`bash lib/datalog/conformance.sh` → **275/275 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,17 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — Anonymous-variable renamer collided with user-written
+  `_anon<N>` symbols. The renamer started counter at 0 and produced
+  `_anon1, _anon2, ...` unconditionally; if the user wrote
+  `q(_anon1) :- p(_anon1, _).` the `_` got renamed to `_anon1` too,
+  collapsing the two positions of `p` to a single var and returning
+  the empty result instead of `{a, c}`. Fix: scan each rule (and
+  query) for the max `_anon<N>` and start the renamer past it. The
+  renamer constructor now takes a `start` arg; new helpers
+  `dl-max-anon-num` / `dl-max-anon-num-list` walk the rule tree.
+  1 regression test; 275/275.
+
 - 2026-05-11 — `dl-magic-query` could silently diverge from
   `dl-query` when an aggregate's inner-goal relation was IDB. The
   rewriter passes aggregate body lits through unchanged (no magic

From fadcdbd6a9497188add5416b5c810cecad69805a Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 09:40:29 +0000
Subject: [PATCH 88/89] datalog: dl-set-strategy! validates known strategy
 values
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`dl-set-strategy!` accepted any keyword silently — typos like
`:semi_naive` or `:semiNaive` were stored uninspected and the
saturator then used the default. The user never learned their
setting was wrong.

Validator added: strategy must be one of `:semi-naive`, `:naive`,
`:magic` (the values currently recognised by the saturator and
magic-sets driver). Unknown values raise with a clear message that
lists the accepted set.

1 regression test; conformance 276/276.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/db.sx           | 34 +++++++++++++++++++++++++++-------
 lib/datalog/scoreboard.json |  8 ++++----
 lib/datalog/scoreboard.md   |  4 ++--
 lib/datalog/tests/eval.sx   | 10 ++++++++++
 plans/datalog-on-sx.md      |  9 ++++++++-
 5 files changed, 51 insertions(+), 14 deletions(-)

diff --git a/lib/datalog/db.sx b/lib/datalog/db.sx
index 9df4234b..93544c7e 100644
--- a/lib/datalog/db.sx
+++ b/lib/datalog/db.sx
@@ -48,17 +48,37 @@
       (and (has-key? edb rel-key)
            (has-key? (get edb rel-key) tk)))))
 
-;; Evaluation strategy. Default :semi-naive (the only strategy
-;; currently implemented). :magic is reserved for goal-directed
-;; magic-sets evaluation — calling it now logs a one-time "deferred"
-;; note and falls back to semi-naive.
+;; Evaluation strategy. Default :semi-naive (used by dl-saturate!).
+;; :naive selects dl-saturate-naive! (slower but easier to reason
+;; about). :magic is a marker — goal-directed magic-sets evaluation
+;; is invoked separately via `dl-magic-query`; setting :magic here
+;; is purely informational. Any other value is rejected so typos
+;; don't silently fall back to the default.
+(define
+  dl-strategy-values
+  (list :semi-naive :naive :magic))
+
 (define
   dl-set-strategy!
   (fn
     (db strategy)
-    (do
-      (dict-set! db :strategy strategy)
-      db)))
+    (cond
+      ((not (dl-keyword-member? strategy dl-strategy-values))
+        (error (str "dl-set-strategy!: unknown strategy " strategy
+                    " — must be one of " dl-strategy-values)))
+      (else
+        (do
+          (dict-set! db :strategy strategy)
+          db)))))
+
+(define
+  dl-keyword-member?
+  (fn
+    (k xs)
+    (cond
+      ((= (len xs) 0) false)
+      ((= k (first xs)) true)
+      (else (dl-keyword-member? k (rest xs))))))
 
 (define
   dl-get-strategy
diff --git a/lib/datalog/scoreboard.json b/lib/datalog/scoreboard.json
index e7621023..4dd9e4b1 100644
--- a/lib/datalog/scoreboard.json
+++ b/lib/datalog/scoreboard.json
@@ -1,13 +1,13 @@
 {
   "lang": "datalog",
-  "total_passed": 275,
+  "total_passed": 276,
   "total_failed": 0,
-  "total": 275,
+  "total": 276,
   "suites": [
     {"name":"tokenize","passed":31,"failed":0,"total":31},
     {"name":"parse","passed":23,"failed":0,"total":23},
     {"name":"unify","passed":29,"failed":0,"total":29},
-    {"name":"eval","passed":43,"failed":0,"total":43},
+    {"name":"eval","passed":44,"failed":0,"total":44},
     {"name":"builtins","passed":26,"failed":0,"total":26},
     {"name":"semi_naive","passed":8,"failed":0,"total":8},
     {"name":"negation","passed":12,"failed":0,"total":12},
@@ -16,5 +16,5 @@
     {"name":"magic","passed":37,"failed":0,"total":37},
     {"name":"demo","passed":21,"failed":0,"total":21}
   ],
-  "generated": "2026-05-11T09:34:17+00:00"
+  "generated": "2026-05-11T09:40:12+00:00"
 }
diff --git a/lib/datalog/scoreboard.md b/lib/datalog/scoreboard.md
index 4676d363..c06a2f24 100644
--- a/lib/datalog/scoreboard.md
+++ b/lib/datalog/scoreboard.md
@@ -1,13 +1,13 @@
 # datalog scoreboard
 
-**275 / 275 passing** (0 failure(s)).
+**276 / 276 passing** (0 failure(s)).
 
 | Suite | Passed | Total | Status |
 |-------|--------|-------|--------|
 | tokenize | 31 | 31 | ok |
 | parse | 23 | 23 | ok |
 | unify | 29 | 29 | ok |
-| eval | 43 | 43 | ok |
+| eval | 44 | 44 | ok |
 | builtins | 26 | 26 | ok |
 | semi_naive | 8 | 8 | ok |
 | negation | 12 | 12 | ok |
diff --git a/lib/datalog/tests/eval.sx b/lib/datalog/tests/eval.sx
index 937a49dc..2625f04e 100644
--- a/lib/datalog/tests/eval.sx
+++ b/lib/datalog/tests/eval.sx
@@ -359,6 +359,16 @@
           (do (dl-set-strategy! db :magic) (dl-get-strategy db)))
         :magic)
 
+      ;; Unknown strategy values are rejected so typos don't silently
+      ;; fall back to the default.
+      (dl-et-test!
+        "unknown strategy rejected"
+        (dl-et-throws?
+          (fn ()
+            (let ((db (dl-make-db)))
+              (dl-set-strategy! db :semi_naive))))
+        true)
+
       ;; dl-saturated?: no-work-left predicate.
       (dl-et-test! "saturated? after saturation"
         (let ((db (dl-program
diff --git a/plans/datalog-on-sx.md b/plans/datalog-on-sx.md
index 791c77d8..d1b84163 100644
--- a/plans/datalog-on-sx.md
+++ b/plans/datalog-on-sx.md
@@ -15,7 +15,7 @@ for rose-ash data (e.g. federation graph, content relationships).
 
 ## Status (rolling)
 
-`bash lib/datalog/conformance.sh` → **275/275 across 11 suites**
+`bash lib/datalog/conformance.sh` → **276/276 across 11 suites**
 (tokenize, parse, unify, eval, builtins, semi_naive, negation, aggregates,
 api, magic, demo). Source is ~3100 LOC, tests ~2900 LOC, public API
 documented in `lib/datalog/datalog.sx`.
@@ -320,6 +320,13 @@ large graphs.
 
 _Newest first._
 
+- 2026-05-11 — `dl-set-strategy!` accepted arbitrary keyword values
+  silently. Typos like `:semi_naive` or `:semiNaive` were stored
+  uninspected; the saturator then used the default and the user
+  never learned their setting was a typo. Validator added: strategy
+  must be one of `:semi-naive`, `:naive`, `:magic`. 1 regression test;
+  276/276.
+
 - 2026-05-11 — Anonymous-variable renamer collided with user-written
   `_anon<N>` symbols. The renamer started counter at 0 and produced
   `_anon1, _anon2, ...` unconditionally; if the user wrote

From 0df5e92c4663206fcb9b400050938a7bd88b58aa Mon Sep 17 00:00:00 2001
From: giles <giles.bradshaw@rose-ash.com>
Date: Mon, 11 May 2026 10:15:05 +0000
Subject: [PATCH 89/89] datalog: magic pre-saturation is conditional, not
 unconditional
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Previously dl-magic-query always pre-saturated the source db so it
gave correct results for stratified programs (where the rewriter
doesn't propagate magic to aggregate inner-goals or negated rels).
Pure positive programs paid the full bottom-up cost twice.

Add dl-rules-need-presaturation? — checks whether any rule body
contains an aggregate or negation. Only pre-saturate in that case.
Pure positive programs (the common case for magic-sets) keep their
full goal-directed efficiency.

276/276; identical answers on the existing aggregate-of-IDB test.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 lib/datalog/magic.sx | 52 ++++++++++++++++++++++++++++++++++----------
 1 file changed, 41 insertions(+), 11 deletions(-)

diff --git a/lib/datalog/magic.sx b/lib/datalog/magic.sx
index 43ab7404..448042e9 100644
--- a/lib/datalog/magic.sx
+++ b/lib/datalog/magic.sx
@@ -373,6 +373,35 @@
           rules)
         seen))))
 
+;; True iff any rule's body contains a literal kind that the magic
+;; rewriter doesn't propagate magic to — i.e. an aggregate or a
+;; negation. Used by dl-magic-query to decide whether to pre-saturate
+;; the source db (for correctness on stratified programs) or skip
+;; that step (preserving full magic-sets efficiency for pure
+;; positive programs).
+(define
+  dl-rule-has-nonprop-lit?
+  (fn
+    (body i n)
+    (cond
+      ((>= i n) false)
+      ((let ((lit (nth body i)))
+         (or (and (dict? lit) (has-key? lit :neg))
+             (dl-aggregate? lit)))
+        true)
+      (else (dl-rule-has-nonprop-lit? body (+ i 1) n)))))
+
+(define
+  dl-rules-need-presaturation?
+  (fn
+    (rules)
+    (cond
+      ((= (len rules) 0) false)
+      ((let ((body (get (first rules) :body)))
+         (dl-rule-has-nonprop-lit? body 0 (len body)))
+        true)
+      (else (dl-rules-need-presaturation? (rest rules))))))
+
 (define
   dl-magic-query
   (fn
@@ -393,17 +422,18 @@
         (dl-query db query-goal))
       (else
         (do
-          ;; Pre-saturate the source db. The magic rewriter passes
-          ;; aggregate body lits through unchanged (no magic
-          ;; propagation generated for them) — so if an aggregate's
-          ;; inner-goal relation is IDB, it would be empty in the
-          ;; magic db unless its tuples are already materialised in
-          ;; the source. Same for negation against IDB. Pre-saturating
-          ;; guarantees `dl-magic-query` returns the same answers as
-          ;; `dl-query` for every stratified program; the efficiency
-          ;; benefit then comes from goal-directed re-derivation of
-          ;; the query relation under the magic seed.
-          (dl-saturate! db)
+          ;; If the rule set has aggregates or negation, pre-saturate
+          ;; the source db before copying facts. The magic rewriter
+          ;; passes aggregate body lits and negated lits through
+          ;; unchanged (no magic propagation generated for them) — so
+          ;; if their inner-goal relation is IDB, it would be empty in
+          ;; the magic db. Pre-saturating ensures equivalence with
+          ;; `dl-query` for every stratified program. Pure positive
+          ;; programs skip this and keep the full magic-sets perf win
+          ;; from goal-directed re-derivation.
+          (when
+            (dl-rules-need-presaturation? (dl-rules db))
+            (dl-saturate! db))
           (let
             ((query-rel (dl-rel-name query-goal))
               (query-adn (dl-adorn-goal query-goal)))