#lang racket/base


(require racket/contract/base)


(provide
 (struct-out terminal-derivation)
 (struct-out nonterminal-derivation)
 (struct-out datum-label)
 (contract-out
  [parser-derivation? predicate/c]
  [parser-derivation-first-terminal (-> parser-derivation? any/c)]
  [parser-derivation-last-terminal (-> parser-derivation? any/c)]
  [parser-derivation
   (case->
    (-> any/c terminal-derivation?)
    (-> derivation-label? parser-derivation? #:rest (listof parser-derivation?)
        nonterminal-derivation?))]
  [parser-derivation->syntax (-> parser-derivation? syntax?)]
  [derivation-label? predicate/c]
  [cut-label cut-label?]
  [cut-label? predicate/c]
  [splice-label splice-label?]
  [splice-label? predicate/c]
  [syntax-label? predicate/c]
  [syntax-label
   (->* (any/c) (#:properties hash? #:expression-properties hash?) syntax-label?)]
  [syntax-label-value (-> syntax-label? any/c)]
  [syntax-label-properties (-> syntax-label? hash?)]
  [syntax-label-expression-properties (-> syntax-label? hash?)]))


(require racket/match
         racket/sequence
         racket/struct
         rebellion/collection/vector
         rebellion/private/static-name
         yaragg/base/token)


(module+ test
  (require (submod "..")
           racket/syntax-srcloc
           rackunit))


;@----------------------------------------------------------------------------------------------------


;; Recognizes both kinds of derivation tree nodes: terminal and nonterminal derivations.
(define (parser-derivation? v)
  (or (terminal-derivation? v) (nonterminal-derivation? v)))


;; A (Terminal-Derivation V) represents a terminal that was matched by the grammar. It contains the
;; value V of the (Token T V) that was matched.
(struct terminal-derivation (value) #:transparent)


;; A (Nonterminal-Derivation V L) represents a nonterminal that was matched by the grammar. It
;; contains the label of type L of the production rule that matched, and an immutable vector of
;; subderivations.
;;
;; The guard accepts any sequence of at least one parser derivation for the children and stores the
;; result of converting it with sequence->vector, so callers may pass a list. The custom write
;; procedure prints the node in constructor style with the children listed inline after the label.
(struct nonterminal-derivation (label children)
  #:guard
  (let ([contract-guard (struct-guard/c any/c (sequence/c parser-derivation? #:min-count 1))])
    (λ (label children name)
      (let-values ([(label children) (contract-guard label children name)])
        (values label (sequence->vector children)))))
  #:transparent
  #:property prop:custom-print-quotable 'never
  #:methods gen:custom-write
  [(define write-proc
     (make-constructor-style-printer
      (λ (_) 'nonterminal-derivation)
      (λ (this)
        (cons (nonterminal-derivation-label this)
              (vector->list (nonterminal-derivation-children this))))))])


;; Convenience constructor for derivations.
;;
;;   (parser-derivation value)                -> a terminal derivation wrapping value
;;   (parser-derivation label child more ...) -> a nonterminal derivation with the given label and
;;                                               at least one child derivation
(define parser-derivation
  (case-lambda
    [(value) (terminal-derivation value)]
    [(label first-child . children)
     (nonterminal-derivation label (cons first-child children))]))


;; Returns the value of the leftmost terminal in the derivation tree, found by repeatedly descending
;; into the first child of each nonterminal.
(define (parser-derivation-first-terminal derivation)
  (match derivation
    [(terminal-derivation value) value]
    [(nonterminal-derivation _ (vector first-child _ ...))
     (parser-derivation-first-terminal first-child)]))


;; Returns the value of the rightmost terminal in the derivation tree, found by repeatedly descending
;; into the last child of each nonterminal.
(define (parser-derivation-last-terminal derivation)
  (match derivation
    [(terminal-derivation value) value]
    [(nonterminal-derivation _ (vector _ ... last-child))
     (parser-derivation-last-terminal last-child)]))


(module+ test
  (test-case (name-string parser-derivation-first-terminal)

    (test-case "terminal"
      (check-equal? (parser-derivation-first-terminal (terminal-derivation 1)) 1))

    (test-case "nonterminal of terminals"
      (define derivation
        (parser-derivation
         (datum-label 'a)
         (parser-derivation 1)
         (parser-derivation 2)
         (parser-derivation 3)))
      (check-equal? (parser-derivation-first-terminal derivation) 1))

    (test-case "nonterminal of nonterminals and terminals"
      (define derivation
        (parser-derivation
         (datum-label 'a)
         (parser-derivation (datum-label 'b) (parser-derivation 1))
         (parser-derivation 2)
         (parser-derivation 3)))
      (check-equal? (parser-derivation-first-terminal derivation) 1)))

  (test-case (name-string parser-derivation-last-terminal)

    (test-case "terminal"
      (check-equal? (parser-derivation-last-terminal (terminal-derivation 1)) 1))

    (test-case "nonterminal of terminals"
      (define derivation
        (parser-derivation
         (datum-label 'a)
         (parser-derivation 1)
         (parser-derivation 2)
         (parser-derivation 3)))
      (check-equal? (parser-derivation-last-terminal derivation) 3))

    (test-case "nonterminal of nonterminals and terminals"
      (define derivation
        (parser-derivation
         (datum-label 'a)
         (parser-derivation 1)
         (parser-derivation 2)
         (parser-derivation (datum-label 'b) (parser-derivation 3))))
      (check-equal? (parser-derivation-last-terminal derivation) 3))))


;; Recognizes the four kinds of labels a nonterminal derivation may carry: the cut label, the splice
;; label, datum labels, and syntax labels.
(define (derivation-label? v)
  (or (cut-label? v) (splice-label? v) (datum-label? v) (syntax-label? v)))


;; The cut label is a single shared value (the struct's constructor is kept private). When a
;; derivation is converted to a datum or syntax object, a nonterminal labeled with it contributes
;; nothing to the output.
(struct cut-label () #:transparent #:constructor-name constructor:cut-label #:omit-define-syntaxes)
(define cut-label (constructor:cut-label))


;; The splice label is a single shared value (the struct's constructor is kept private). When a
;; derivation is converted to a datum or syntax object, the children of a nonterminal labeled with
;; it are inserted directly into the enclosing node's output.
(struct splice-label ()
  #:transparent #:constructor-name constructor:splice-label #:omit-define-syntaxes)
(define splice-label (constructor:splice-label))


;; A datum label wraps the value that becomes the head of the list produced for its nonterminal by
;; parser-derivation->datum.
(struct datum-label (value) #:transparent)


;; A syntax label carries the value that becomes the head of the syntax list produced for its
;; nonterminal by parser-derivation->syntax, along with two immutable hashes of syntax properties:
;;
;;   expression-properties -- attached to the syntax object for the whole (label child ...) list
;;   properties            -- attached to the syntax object for the label itself
;;
;; NOTE: the positional field order is (value expression-properties properties). Anything calling
;; constructor:syntax-label must pass arguments in that order.
(struct syntax-label (value expression-properties properties)
  #:transparent
  #:constructor-name constructor:syntax-label
  #:omit-define-syntaxes
  #:guard
  (struct-guard/c any/c
                  (hash/c any/c any/c #:immutable #true #:flat? #true)
                  (hash/c any/c any/c #:immutable #true #:flat? #true)))


;; Public constructor for syntax labels. Both property hashes default to the empty hash.
(define (syntax-label value
                      #:properties [properties (hash)]
                      #:expression-properties [expression-properties (hash)])
  ;; Arguments are passed in the struct's field order. Previously the two hashes were passed the
  ;; other way around, so syntax-label-properties returned the expression properties (and vice
  ;; versa) and parser-derivation->syntax attached each set to the wrong syntax object.
  (constructor:syntax-label value expression-properties properties))


;; Converts a derivation whose terminals are syntax tokens into a single syntax object.
;;
;;   * A terminal becomes the result of syntax-token->syntax on its token.
;;   * A cut-labeled nonterminal contributes nothing.
;;   * A splice-labeled nonterminal contributes the conversions of its children, in order, directly
;;     to its parent.
;;   * A syntax-labeled nonterminal becomes a syntax list (label child ...). The label's syntax is
;;     located at the first token of the nonterminal with a span of zero, and the list's location
;;     runs from the first token's position to the last token's end position. First and last tokens
;;     are taken from the whole subtree, including any children that are cut from the output.
;;
;; There is no clause for datum-labeled nonterminals, so match raises an error when one is
;; encountered. Match also raises an error if the top-level derivation does not convert to exactly
;; one syntax object (for instance, when the root is cut, or is a splice of several children).
(define (parser-derivation->syntax derivation)
  ;; Returns the list of syntax objects that the given derivation contributes to its parent.
  (define (->splice derivation)
    (match derivation
      [(terminal-derivation t) (list (syntax-token->syntax t))]
      [(nonterminal-derivation (? cut-label?) _) '()]
      [(nonterminal-derivation (? splice-label?) children)
       (for*/list ([child (in-vector children)]
                   [stx (in-list (->splice child))])
         stx)]
      [(nonterminal-derivation (? syntax-label? label) children)
       (define first-token (parser-derivation-first-terminal derivation))
       ;; The label does not correspond to any source text, so it gets a zero-width location at the
       ;; start of the expression.
       (define label-location
         (srcloc (syntax-token-source first-token)
                 (syntax-token-line first-token)
                 (syntax-token-column first-token)
                 (syntax-token-position first-token)
                 0))
       (define label-stx
         (for/fold ([stx (datum->syntax #false (syntax-label-value label) label-location #false)])
                   ([(key value) (in-hash (syntax-label-properties label))])
           (syntax-property stx key value)))
       (define children-syntaxes
         (for*/list ([child (in-vector children)]
                     [spliced-child (in-list (->splice child))])
           spliced-child))
       (define last-token (parser-derivation-last-terminal derivation))
       (define expression-location
         (srcloc (syntax-token-source first-token)
                 (syntax-token-line first-token)
                 (syntax-token-column first-token)
                 (syntax-token-position first-token)
                 (- (syntax-token-end-position last-token) (syntax-token-position first-token))))
       (define expression-stx
         (datum->syntax #false (cons label-stx children-syntaxes) expression-location #false))
       (list
        (for/fold ([expression-stx expression-stx])
                  ([(key value) (in-hash (syntax-label-expression-properties label))])
          (syntax-property expression-stx key value)))]))
  (define top-level-stxs (->splice derivation))
  (match top-level-stxs
    [(list stx) stx]))


;; Converts a derivation into a plain datum.
;;
;;   * A terminal becomes its value.
;;   * A cut-labeled nonterminal contributes nothing.
;;   * A splice-labeled nonterminal contributes the conversions of its children, in order, directly
;;     to its parent.
;;   * A datum-labeled nonterminal becomes a list whose head is the label's value and whose tail is
;;     the conversions of its children.
;;
;; There is no clause for syntax-labeled nonterminals, so match raises an error when one is
;; encountered. Match also raises an error if the top-level derivation does not convert to exactly
;; one datum.
(define (parser-derivation->datum derivation)
  ;; Returns the list of data that the given derivation contributes to its parent.
  (define (->splice derivation)
    (match derivation
      [(terminal-derivation t) (list t)]
      [(nonterminal-derivation (? cut-label?) _) '()]
      [(nonterminal-derivation (? splice-label?) children)
       (for*/list ([child (in-vector children)]
                   [datum (in-list (->splice child))])
         datum)]
      [(nonterminal-derivation (datum-label value) children)
       (define child-data
         (for*/list ([child (in-vector children)]
                     [spliced-child (in-list (->splice child))])
           spliced-child))
       (list (cons value child-data))]))
  (define top-level-data (->splice derivation))
  (match top-level-data
    [(list datum) datum]))


(module+ test
  (test-case (name-string parser-derivation->datum)

    (test-case "datum terminals"
      (define derivation (parser-derivation 'a))
      (check-equal? (parser-derivation->datum derivation) 'a))

    (test-case "datum nonterminals"
      (define derivation
        (parser-derivation
         (datum-label 'a)
         (parser-derivation 'b)
         (parser-derivation 'c)
         (parser-derivation 'd)))
      (check-equal? (parser-derivation->datum derivation) '(a b c d)))

    (test-case "datum cuts"
      (define derivation
        (parser-derivation
         (datum-label 'a)
         (parser-derivation cut-label (parser-derivation 'b))
         (parser-derivation 'c)
         (parser-derivation cut-label (parser-derivation 'd))))
      (check-equal? (parser-derivation->datum derivation) '(a c)))

    (test-case "datum splices"
      (define derivation
        (parser-derivation
         (datum-label 'a)
         (parser-derivation 'b)
         (parser-derivation
          splice-label
          (parser-derivation 'c1)
          (parser-derivation 'c2)
          (parser-derivation 'c3))
         (parser-derivation 'd)))
      (check-equal? (parser-derivation->datum derivation) '(a b c1 c2 c3 d))))

  (test-case "syntax-label property accessors"
    ;; Regression test: each accessor must return the hash passed under the matching keyword.
    (define label
      (syntax-label 'a
                    #:properties (hash 'label-key 'label-value)
                    #:expression-properties (hash 'expression-key 'expression-value)))
    (check-equal? (syntax-label-value label) 'a)
    (check-equal? (syntax-label-properties label) (hash 'label-key 'label-value))
    (check-equal? (syntax-label-expression-properties label)
                  (hash 'expression-key 'expression-value)))

  (test-case (name-string parser-derivation->syntax)

    (test-case "syntax terminals"
      (define derivation (parser-derivation (syntax-token 'a #:position 1 #:span 1)))
      (define actual (parser-derivation->syntax derivation))
      (check-equal? (syntax->datum actual) 'a)
      (check-equal? (syntax-srcloc actual) (srcloc #false #false #false 1 1)))

    (test-case "syntax nonterminals"
      (define derivation
        (parser-derivation
         (syntax-label 'a)
         (parser-derivation (syntax-token 'b #:position 1 #:span 1))
         (parser-derivation (syntax-token 'c #:position 2 #:span 1))
         (parser-derivation (syntax-token 'd #:position 3 #:span 1))))
      (define actual (parser-derivation->syntax derivation))
      (check-equal? (syntax->datum actual) '(a b c d))
      (check-equal? (syntax-srcloc actual) (srcloc #false #false #false 1 3)))

    (test-case "syntax cuts"
      (define derivation
        (parser-derivation
         (syntax-label 'a)
         (parser-derivation cut-label (parser-derivation (syntax-token 'b #:position 1 #:span 1)))
         (parser-derivation (syntax-token 'c #:position 2 #:span 1))
         (parser-derivation
          cut-label (parser-derivation (syntax-token 'd #:position 3 #:span 1)))))
      (define actual (parser-derivation->syntax derivation))
      (check-equal? (syntax->datum actual) '(a c))
      (check-equal? (syntax-srcloc actual) (srcloc #false #false #false 1 3)))

    (test-case "syntax splices"
      (define derivation
        (parser-derivation
         (syntax-label 'a)
         (parser-derivation (syntax-token 'b #:position 1 #:span 1))
         (parser-derivation
          splice-label
          (parser-derivation (syntax-token 'c1 #:position 2 #:span 1))
          (parser-derivation (syntax-token 'c2 #:position 3 #:span 1))
          (parser-derivation (syntax-token 'c3 #:position 4 #:span 1)))
         (parser-derivation (syntax-token 'd #:position 5 #:span 1))))
      (define actual (parser-derivation->syntax derivation))
      (check-equal? (syntax->datum actual) '(a b c1 c2 c3 d))
      (check-equal? (syntax-srcloc actual) (srcloc #false #false #false 1 5)))

    (test-case "syntax label and expression properties"
      ;; Regression test: label properties belong on the label's syntax object and expression
      ;; properties belong on the enclosing list's syntax object, never the other way around.
      (define derivation
        (parser-derivation
         (syntax-label 'a
                       #:properties (hash 'label-key 'label-value)
                       #:expression-properties (hash 'expression-key 'expression-value))
         (parser-derivation (syntax-token 'b #:position 1 #:span 1))))
      (define actual (parser-derivation->syntax derivation))
      (define label-stx (car (syntax-e actual)))
      (check-equal? (syntax-property actual 'expression-key) 'expression-value)
      (check-false (syntax-property actual 'label-key))
      (check-equal? (syntax-property label-stx 'label-key) 'label-value)
      (check-false (syntax-property label-stx 'expression-key)))))