Files
rose-ash/spec/canonical.sx
giles e6d7a08f8c Add canonical serialization and content identity spec
spec/canonical.sx defines:
- canonical-serialize: deterministic s-expression serialization
  (sorted dict keys, normalized numbers, minimal escaping)
- content-id: SHA3-256 of canonical form = CID of any s-expression
- Bytecode module format: (sxbc version source-hash (code ...))
- Provenance records linking source CID → bytecode CID → compiler CID

The CID is the identity model for SX. A component, a bytecode module,
a test suite — anything expressed as an s-expression — is addressable
by content hash. Annotation layers (source maps, variable names, test
results, documentation) reference CIDs without polluting the artifacts.

Requires host primitives: sha3-256, sort. Tests in test-canonical.sx.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
2026-03-27 14:35:33 +00:00

118 lines
2.5 KiB
Plaintext

(define
canonical-serialize
:effects ()
(fn
(val)
(case
(type-of val)
"nil"
"nil"
"boolean"
(if val "true" "false")
"number"
(canonical-number val)
"string"
(str "\"" (escape-string val) "\"")
"symbol"
(symbol-name val)
"keyword"
(str ":" (keyword-name val))
"list"
(str "(" (join " " (map canonical-serialize val)) ")")
"dict"
(canonical-dict val)
:else (str val))))
(define
canonical-number
:effects ()
(fn
(n)
(let
((s (str n)))
(if
(ends-with? s ".0")
(slice s 0 (- (len s) 2))
(if
(contains-char? s ".")
(let
((trimmed (trim-right s "0")))
(if (ends-with? trimmed ".") (str trimmed "0") trimmed))
s)))))
(define
canonical-dict
:effects ()
(fn
(d)
(let
((sorted-keys (sort (keys d))))
(str
"{"
(join
" "
(reduce
(fn
(acc key)
(concat
acc
(list (str ":" key) (canonical-serialize (dict-get d key)))))
(list)
sorted-keys))
"}"))))
(define
content-id
:effects ()
(fn (expr) (sha3-256 (canonical-serialize expr))))
(define
content-id-short
:effects ()
(fn (expr) (slice (content-id expr) 0 16)))
(define
make-bytecode-module
:effects ()
(fn
(version source-hash code)
(list (quote sxbc) version source-hash code)))
(define
bytecode-module?
:effects ()
(fn
(expr)
(and (list? expr) (>= (len expr) 4) (= (first expr) (quote sxbc)))))
(define bytecode-module-version :effects () (fn (m) (nth m 1)))
(define bytecode-module-source-hash :effects () (fn (m) (nth m 2)))
(define bytecode-module-code :effects () (fn (m) (nth m 3)))
(define
make-code-object
:effects ()
(fn
(arity upvalue-count bytecode constants)
(let
((parts (list (quote code))))
(when (> arity 0) (set! parts (concat parts (list :arity arity))))
(when
(> upvalue-count 0)
(set! parts (concat parts (list :upvalue-count upvalue-count))))
(concat parts (list :bytecode bytecode :constants constants)))))
(define
make-provenance
:effects ()
(fn
(source-cid bytecode-cid compiler-cid timestamp)
(list
(quote provenance)
:source-cid source-cid
:bytecode-cid bytecode-cid
:compiler-cid compiler-cid
:timestamp timestamp)))