streamline decode
parent
95478ba824
commit
7c138d2915
@ -1,30 +1,61 @@
|
|||||||
#lang racket/base
|
#lang racket/base
|
||||||
(require racket/contract xml txexpr)
|
(require xml txexpr sugar/define)
|
||||||
(require "decode/fast.rkt" "predicates.rkt" "decode/typography-fast.rkt")
|
(require "predicates.rkt" "decode/typography.rkt")
|
||||||
|
|
||||||
(provide to-string (contract-out [register-block-tag (symbol? . -> . void?)]
|
(provide (all-from-out "decode/typography.rkt"))
|
||||||
[decode ((xexpr/c) ;; use xexpr/c for contract on nx because it gives better error messages
|
|
||||||
|
|
||||||
;; todo: how to write more specific contracts for these procedures?
|
|
||||||
;; e.g., string-proc should be restricted to procs that accept a string as input
|
;; to-string: coerce x to a string.
;; A string is returned unchanged. The empty list becomes "", and symbols,
;; numbers, paths and chars are converted with the matching conversion below.
;; Every other value ends in the handler, which raises
;; "Pollen parser: can't convert <x> to string".
;; NOTE(review): the else branch calls (error) with no arguments; it appears to
;; rely on that call failing so that the exn:fail? handler supplies the message.
;; NOTE(review): the ";; and return a string as output" row below looks like it
;; belongs to the old side of the diff, not to this definition.
(define+provide (to-string x)
|
||||||
;; and return a string as output
|
(if (string? x)
|
||||||
|
x ; fast exit for strings
|
||||||
|
(with-handlers ([exn:fail? (λ(exn) (error (format "Pollen parser: can't convert ~v to ~a" x 'string)))])
|
||||||
|
(cond
|
||||||
|
[(equal? '() x) ""]
|
||||||
|
[(symbol? x) (symbol->string x)]
|
||||||
|
[(number? x) (number->string x)]
|
||||||
|
[(path? x) (path->string x)]
|
||||||
|
[(char? x) (format "~a" x)]
|
||||||
|
[else (error)])))) ; put this last so other xexprish things don't get caught
|
||||||
|
|
||||||
|
;; register-block-tag: hand TAG to append-block-tag.
;; Contract: takes a symbol, returns void.
(define+provide/contract (register-block-tag tag)
  (-> symbol? void?)
  (append-block-tag tag))
|
||||||
|
|
||||||
|
|
||||||
|
;; decoder wireframe
|
||||||
|
;; decode: walk nx and pass each part to a caller-supplied procedure.
;;
;; Contract (new column): nx must satisfy xexpr/c; the optional keywords take a
;; list (#:exclude-xexpr-tags) or a procedure (all others); the result is a txexpr.
;; Every procedure keyword defaults to (λ(x)x); #:exclude-xexpr-tags defaults to '().
;;
;; The loop starts from (validate-txexpr? nx) and dispatches on what x is:
;;   txexpr    - split into tag, attr and elements. If the tag is a member of
;;               excluded-xexpr-tags, x is returned untouched. Otherwise the three
;;               parts are each run through the loop, reassembled with make-txexpr,
;;               and given to block-xexpr-proc when block-xexpr? holds, else to
;;               inline-xexpr-proc.
;;   tag       - xexpr-tag-proc
;;   attrs     - xexpr-attrs-proc
;;   elements  - xexpr-elements-proc on the whole list, then the loop on each member
;;   string    - string-proc
;;   otherwise - raises "decode: can't decode" with the offending value
;; NOTE(review): validate-txexpr? is not defined in this view; presumably it
;; returns nx when valid - confirm against the txexpr library.
;; NOTE(review): rows such as "[typogrify ...]" interleaved below appear to come
;; from the old side of the diff (the removed contract-out list), not from this
;; definition.
(define+provide/contract (decode nx
|
||||||
|
#:exclude-xexpr-tags [excluded-xexpr-tags '()]
|
||||||
|
#:xexpr-tag-proc [xexpr-tag-proc (λ(x)x)]
|
||||||
|
#:xexpr-attrs-proc [xexpr-attrs-proc (λ(x)x)]
|
||||||
|
#:xexpr-elements-proc [xexpr-elements-proc (λ(x)x)]
|
||||||
|
#:block-xexpr-proc [block-xexpr-proc (λ(x)x)]
|
||||||
|
#:inline-xexpr-proc [inline-xexpr-proc (λ(x)x)]
|
||||||
|
#:string-proc [string-proc (λ(x)x)])
|
||||||
|
((xexpr/c)
|
||||||
(#:exclude-xexpr-tags list?
|
(#:exclude-xexpr-tags list?
|
||||||
#:xexpr-tag-proc procedure?
|
#:xexpr-tag-proc procedure?
|
||||||
#:xexpr-attrs-proc procedure?
|
#:xexpr-attrs-proc procedure?
|
||||||
#:xexpr-elements-proc procedure?
|
#:xexpr-elements-proc procedure?
|
||||||
#:block-xexpr-proc procedure?
|
#:block-xexpr-proc procedure?
|
||||||
#:inline-xexpr-proc procedure?
|
#:inline-xexpr-proc procedure?
|
||||||
#:string-proc procedure?)
|
#:string-proc procedure?) . ->* . txexpr?)
|
||||||
. ->* . txexpr?)]
|
|
||||||
|
|
||||||
[typogrify (string? . -> . string?)]
|
(let loop ([x (validate-txexpr? nx)])
|
||||||
[nonbreaking-last-space ((txexpr?) (#:nbsp string? #:minimum-word-length integer?) . ->* . txexpr?)]
|
(cond
|
||||||
[wrap-hanging-quotes ((txexpr?) (#:single-prepend list? #:double-prepend list?) . ->* . txexpr?)]
|
[(txexpr? x) (let-values([(tag attr elements) (txexpr->values x)])
|
||||||
[convert-linebreaks ((txexpr-elements?) (#:newline string?) . ->* . txexpr-elements?)]
|
(if (member tag excluded-xexpr-tags)
|
||||||
[whitespace? (any/c . -> . boolean?)]
|
x ; let x pass through untouched
|
||||||
[paragraph-break? ((any/c) (#:pattern pregexp?) . ->* . boolean?)]
|
(let ([decoded-xexpr (apply make-txexpr (map loop (list tag attr elements)))])
|
||||||
[merge-newlines (list? . -> . list?)]
|
((if (block-xexpr? decoded-xexpr)
|
||||||
[prep-paragraph-flow (txexpr-elements? . -> . txexpr-elements?)]
|
block-xexpr-proc
|
||||||
[wrap-paragraph ((txexpr-elements?) (#:tag symbol?) . ->* . block-xexpr?)]
|
inline-xexpr-proc) decoded-xexpr))))]
|
||||||
[detect-paragraphs (txexpr-elements? . -> . txexpr-elements?)]
|
[(txexpr-tag? x) (xexpr-tag-proc x)]
|
||||||
))
|
[(txexpr-attrs? x) (xexpr-attrs-proc x)]
|
||||||
|
;; need this for operations that may depend on context in list
|
||||||
|
[(txexpr-elements? x) (map loop (xexpr-elements-proc x))]
|
||||||
|
[(string? x) (string-proc x)]
|
||||||
|
;; if something has made it through undecoded, that's a problem
|
||||||
|
[else (error "decode: can't decode" x)])))
|
||||||
|
|
||||||
|
@ -1,63 +0,0 @@
|
|||||||
#lang racket/base
|
|
||||||
(require racket/match xml)
|
|
||||||
(require "../tools.rkt" "../predicates.rkt" txexpr "typography-fast.rkt")
|
|
||||||
|
|
||||||
|
|
||||||
(provide (all-defined-out) (all-from-out "typography-fast.rkt"))
|
|
||||||
|
|
||||||
;; general way of coercing to string
|
|
||||||
;; to-string: coerce x to a string.
;;
;; x       - a string, the empty list, a symbol, a number, a path or a char
;; returns - x itself when it is already a string; "" for the empty list;
;;           otherwise the textual form produced by the matching conversion
;; raises  - exn:fail with "Pollen parser: can't convert <x> to string" for
;;           any other kind of value
;;
;; The unsupported case raises its message directly. The earlier form called
;; (error) with no arguments and depended on a catch-all exn:fail? handler to
;; replace that failure with the message.
(define (to-string x)
  (cond
    [(string? x) x] ; fast exit for strings
    [(null? x) ""]
    [(symbol? x) (symbol->string x)]
    [(number? x) (number->string x)]
    [(path? x) (path->string x)]
    [(char? x) (string x)]
    ;; keep this last so other xexprish things don't get caught
    [else (error (format "Pollen parser: can't convert ~v to ~a" x 'string))]))
|
|
||||||
|
|
||||||
|
|
||||||
;; register-block-tag: add TAG to the list of block tags by passing it to
;; append-block-tag.
;; It sits with the predicates because it changes a predicate globally.
(define register-block-tag
  (λ (tag)
    (append-block-tag tag)))
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
;; decoder wireframe
|
|
||||||
;; decode: walk a tagged X-expression and pass each part to a caller-supplied hook.
;;
;; nx must satisfy txexpr?; otherwise an error is raised before any work is done.
;; Keywords:
;;   #:exclude-xexpr-tags   tags whose txexprs are returned untouched (default '())
;;   #:xexpr-tag-proc       applied to every tag
;;   #:xexpr-attrs-proc     applied to every attribute list
;;   #:xexpr-elements-proc  applied to every element list before its members are decoded
;;   #:block-xexpr-proc     applied to a rebuilt txexpr that satisfies block-xexpr?
;;   #:inline-xexpr-proc    applied to every other rebuilt txexpr
;;   #:string-proc          applied to every string
;; Each procedure keyword defaults to the identity function.
(define (decode nx
                #:exclude-xexpr-tags [excluded-xexpr-tags '()]
                #:xexpr-tag-proc [xexpr-tag-proc (λ(x)x)]
                #:xexpr-attrs-proc [xexpr-attrs-proc (λ(x)x)]
                #:xexpr-elements-proc [xexpr-elements-proc (λ(x)x)]
                #:block-xexpr-proc [block-xexpr-proc (λ(x)x)]
                #:inline-xexpr-proc [inline-xexpr-proc (λ(x)x)]
                #:string-proc [string-proc (λ(x)x)])
  ;; refuse anything that is not a complete txexpr
  (unless (txexpr? nx)
    (error (format "decode: ~v not a full txexpr" nx)))

  (let walk ([node nx])
    (cond
      [(txexpr? node)
       (let-values ([(tag attrs elements) (txexpr->values node)])
         (cond
           ;; excluded tags pass through exactly as they came in
           [(member tag excluded-xexpr-tags) node]
           [else
            ;; decode tag, attributes and elements in that order, then reassemble
            (let* ([rebuilt (make-txexpr (walk tag) (walk attrs) (walk elements))]
                   [finish (if (block-xexpr? rebuilt)
                               block-xexpr-proc
                               inline-xexpr-proc)])
              (finish rebuilt))]))]
      [(txexpr-tag? node) (xexpr-tag-proc node)]
      [(txexpr-attrs? node) (xexpr-attrs-proc node)]
      ;; the elements hook sees the whole list first, because it may depend on
      ;; context within the list
      [(txexpr-elements? node) (map walk (xexpr-elements-proc node))]
      [(string? node) (string-proc node)]
      ;; anything that reaches this point went through undecoded
      [else (error "Can't decode" node)])))
|
|
||||||
|
|
Loading…
Reference in New Issue