You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
pollen/pollen/private/external/output.rkt

342 lines
15 KiB
Racket

#lang racket/base
(require racket/promise
racket/contract/base
pollen/setup) ; to get splicing char
#|
161017:
This is a slightly amended version of scribble/text/output
that cooperates with the project splicing character.
Ordinarily, when the output function comes across a list, it will splice it into the surrounding string.
This version will also splice lists that begin with the splicing char.
|#
(provide
outputable/c
(contract-out
[output (->* (outputable/c) (output-port?) void?)]))
;; See also `provide-special` below
;; Outputs values for the `scribble/text' language:
;; - several atomic values are printed as in `display',
;; - promises, thunks, and boxes are indirections for the value they contain
;; (useful in various cases),
;; - some "special" values are used for controlling output (eg, flushing,
;; prefix changes, etc),
;; - specifically, `block's delimit indentation levels, `splice's do not,
;; - lists (more generally, pairs) are like either one depending on the context
;; (same as blocks/splices when inside a `block'/`splice'), at the toplevel
;; they default to blocks.
;;
;; Uses global state because `output' is wrapped around each expression in a
;; scribble/text file so this is much more convenient than wrapping the whole
;; module's body in a `list' (which will be difficult with definitions etc).
;; The state is a pair of prefixes -- one that is the prefix for the current
;; value (which gets extended with nested blocks), and the other is the prefix
;; for the current "line" (which is reset after a newline). The line-prefix is
;; needed because a line can hold a block, which means that the line-prefix
;; will apply for the contents of the block including newlines in it. This
;; state is associated with a port via a hash table. Another state that is
;; used is the port's column position, which is maintained by the system (when
;; line counts are enabled) -- this is used to tell what part of a prefix is
;; already displayed.
;;
;; Each prefix is either an integer (for a number of spaces) or a string. The
;; prefix mechanism can be disabled by using #f for the global prefix, and in
;; this case the line prefix can have (cons pfx lpfx) so it can be restored --
;; used by `disable-prefix' and `restore-prefix' resp. (This is different from
;; a 0 prefix -- #f means that no prefix will be accumulated).
;;
(define (output x [p (current-output-port)])
;; these are the global prefix and the one that is local to the current line
(define pfxs (port->state p))
;; the current mode for lists
(define list=block? #t)
;; the low-level string output function (can change with `with-writer')
(define write write-string)
;; to get the output column
(define (getcol) (let-values ([(line col pos) (port-next-location p)]) col))
;; total size of the two prefixes
(define (2pfx-length pfx1 pfx2)
(if (and pfx1 pfx2)
(+ (if (number? pfx1) pfx1 (string-length pfx1))
(if (number? pfx2) pfx2 (string-length pfx2)))
0))
;; combines a prefix with a target column to get to
(define (pfx+col pfx)
(and pfx (let ([col (getcol)])
(cond [(number? pfx) (max pfx col)]
[(>= (string-length pfx) col) pfx]
[else (string-append
pfx (make-spaces (- col (string-length pfx))))]))))
;; adds two prefixes
(define (pfx+ pfx1 pfx2)
(and pfx1 pfx2
(if (and (number? pfx1) (number? pfx2)) (+ pfx1 pfx2)
(string-append (if (number? pfx1) (make-spaces pfx1) pfx1)
(if (number? pfx2) (make-spaces pfx2) pfx2)))))
;; prints two prefixes
(define (output-pfx col pfx1 pfx2)
(define-syntax-rule (->str pfx) (if (number? pfx) (make-spaces pfx) pfx))
(define-syntax-rule (show pfx) ; optimize when not needed
(unless (eq? pfx 0) (write (->str pfx) p)))
(when (and pfx1 pfx2)
(if (eq? 0 col)
(begin (show pfx1) (show pfx2))
(let ([len1 (if (number? pfx1) pfx1 (string-length pfx1))])
(cond [(< col len1) (write (->str pfx1) p col) (show pfx2)]
[(= col len1) (show pfx2)]
[(eq? 0 pfx2)]
[else
(let ([col (- col len1)]
[len2 (if (number? pfx2) pfx2 (string-length pfx2))])
(when (< col len2) (write (->str pfx2) p col)))])))))
;; the basic printing unit: strings
(define (output-string x)
(define pfx (mcar pfxs))
(if (not pfx) ; prefix disabled?
(write x p)
(let ([len (string-length x)]
[nls (regexp-match-positions* #rx"\n" x)])
(let loop ([start 0] [nls nls] [lpfx (mcdr pfxs)] [col (getcol)])
(cond [(pair? nls)
(define nl (car nls))
(if (regexp-match? #rx"^ *$" x start (car nl))
(newline p) ; only spaces before the end of the line
(begin (output-pfx col pfx lpfx)
(write x p start (cdr nl))))
(loop (cdr nl) (cdr nls) 0 0)]
;; last substring from here (always set lpfx state when done)
[(start . = . len)
(set-mcdr! pfxs lpfx)]
[(col . > . (2pfx-length pfx lpfx))
(set-mcdr! pfxs lpfx)
;; the prefix was already shown, no accumulation needed
(write x p start)]
[else
(define m (regexp-match-positions #rx"^ +" x start))
;; accumulate spaces to lpfx, display if it's not all spaces
(define lpfx* (if m (pfx+ lpfx (- (cdar m) (caar m))) lpfx))
(set-mcdr! pfxs lpfx*)
(unless (and m (= len (cdar m)))
(output-pfx col pfx lpfx*)
;; the spaces were already added to lpfx
(write x p (if m (cdar m) start)))])))))
;; blocks and splices
(define (output-block c)
(define pfx (mcar pfxs))
(define lpfx (mcdr pfxs))
(define npfx (pfx+col (pfx+ pfx lpfx)))
(set-mcar! pfxs npfx) (set-mcdr! pfxs 0)
(if (list? c)
(let ([c (if (eq? (setup:splicing-tag) (car c)) ; patch to cooperate with splicing char
(cdr c)
c)])
(for ([c (in-list c)]) (loop c)))
(begin (loop (car c)) (loop (cdr c))))
(set-mcar! pfxs pfx) (set-mcdr! pfxs lpfx))
(define (output-splice c)
(for-each loop c))
;; main loop
(define (loop x)
(cond
;; no output for these
[(or (void? x) (not x) (null? x)) (void)]
;; for lists and pairs the current line prefix is added to the global
;; one, then output the contents recursively (no need to change the
;; state, since we pass the values in the loop, and we'd need to restore
;; it afterwards anyway)
[(pair? x) (if list=block? (output-block x) (output-splice x))]
;; delayed values
[(and (procedure? x) (procedure-arity-includes? x 0)) (loop (x))]
[(promise? x) (loop (force x))]
[(box? x) (loop (unbox x))]
;; special output wrappers
[(special? x)
(define c (special-contents x))
(case (special-flag x)
;; preserve tailness & avoid `set!' for blocks/splices if possible
[(block) (if list=block?
(output-block c)
(begin (set! list=block? #t)
(output-block c)
(set! list=block? #f)))]
[(splice) (if list=block?
(begin (set! list=block? #f)
(output-splice c)
(set! list=block? #t))
(output-splice c))]
[(flush) ; useful before `disable-prefix'
(output-pfx (getcol) (mcar pfxs) (mcdr pfxs))]
[(disable-prefix) ; save the previous pfxs
(define pfx (mcar pfxs))
(define lpfx (mcdr pfxs))
(set-mcar! pfxs #f) (set-mcdr! pfxs (cons pfx lpfx))
(for-each loop c)
(set-mcar! pfxs pfx) (set-mcdr! pfxs lpfx)]
[(restore-prefix) ; restore the previous pfxs
(define pfx (mcar pfxs))
(define lpfx (mcdr pfxs))
(define npfx (pfx+col (if (and (not pfx) (pair? lpfx))
(pfx+ (car lpfx) (cdr lpfx))
(pfx+ pfx lpfx))))
(set-mcar! pfxs npfx) (set-mcdr! pfxs 0)
(for-each loop c)
(set-mcar! pfxs pfx) (set-mcdr! pfxs lpfx)]
[(add-prefix) ; add to the current prefix (unless it's #f)
(define pfx (mcar pfxs))
(define lpfx (mcdr pfxs))
(define npfx (pfx+ (pfx+col (pfx+ pfx lpfx)) (car c)))
(set-mcar! pfxs npfx) (set-mcdr! pfxs 0)
(for-each loop (cdr c))
(set-mcar! pfxs pfx) (set-mcdr! pfxs lpfx)]
[(set-prefix)
(define pfx (mcar pfxs))
(define lpfx (mcdr pfxs))
(set-mcar! pfxs (car c)) (set-mcdr! pfxs 0)
(for-each loop (cdr c))
(set-mcar! pfxs pfx) (set-mcdr! pfxs lpfx)]
[(with-writer)
(define old write)
(set! write (or (car c) write-string))
(for-each loop (cdr c))
(set! write old)]
#; ; no need for this hack yet
[(with-writer-change)
;; The function gets the old writer and return a new one (useful to
;; save the current writer and restore it inside). Could also be
;; used to extend a writer, but that shows why a customizable writer
;; is a bad choice: instead, it should be a list of substitutions
;; that can be extended more conveniently. A simple implementation
;; would be to chain functions that do substitutions. But that runs
;; into problems when functions want to substitute the same thing,
;; and worse: when the output of one function would get substituted
;; again by another. Another approach would be to join matcher
;; regexps with "|" after wrapping each one with parens, then find
;; out which one matched by looking at the result and applying its
;; substitution, but the problem with that is that is that it forbids
;; having parens in the regexps -- this could be fixed by not
;; parenthesizing each expression, and instead running the found
;; match against each of the input regexps to find the matching one,
;; but that can be very inefficient. Yet another issue is that in
;; some cases we might *want* the "worse" feature mentioned earlier:
;; for example, when we want to do some massaging of the input texts
;; yet still have the result encoded for HTML output -- so perhaps
;; the simple approach is still better. The only difference from the
;; current `with-writer' is using a substituting function, so it can
;; be composed with the current one instead of replacing it
;; completely.
(define old write)
(set! write ((car c) write))
(for-each loop (cdr c))
(set! write old)]
[else (error 'output "unknown special value flag: ~e"
(special-flag x))])]
[else
(output-string
(cond [(string? x) x]
[(bytes? x) (bytes->string/utf-8 x)]
[(symbol? x) (symbol->string x)]
[(path? x) (path->string x)]
[(keyword? x) (keyword->string x)]
[(number? x) (number->string x)]
[(char? x) (string x)]
;; generic fallback: throw an error (could use `display' so new
;; values can define how they're shown, but the same
;; functionality can be achieved with thunks and prop:procedure)
[else (error 'output "don't know how to render value: ~v" x)]))]))
;;
(port-count-lines! p)
(loop x)
(void))
(define port->state
(let ([t (make-weak-hasheq)]
[last '(#f #f)]) ; cache for the last port, to avoid a hash lookup
(λ (p)
(if (eq? p (car last)) (cdr last)
(let ([s (or (hash-ref t p #f)
(let ([s (mcons 0 0)]) (hash-set! t p s) s))])
(set! last (cons p s))
s)))))
;; special constructs
(define-struct special (flag contents))
(define-syntax define/provide-special
(syntax-rules ()
[(_ (name))
(begin (provide (contract-out [name (->* () () #:rest (listof outputable/c) any/c)]))
(define (name . contents)
(make-special 'name contents)))]
[(_ (name [x ctc] ...))
(begin (provide (contract-out [name (->* (ctc ...) () #:rest (listof outputable/c) any/c)]))
(define (name x ... . contents)
(make-special 'name (list* x ... contents))))]
[(_ name)
(begin (provide name)
(define name (make-special 'name #f)))]))
(define/provide-special (block))
(define/provide-special (splice))
(define/provide-special flush)
(define/provide-special (disable-prefix))
(define/provide-special (restore-prefix))
(define/provide-special (add-prefix [pfx (or/c string? exact-nonnegative-integer?)]))
(define/provide-special (set-prefix [pfx (or/c string? exact-nonnegative-integer?)]))
(define/provide-special (with-writer [writer (or/c #f (->* (string? output-port?) (exact-nonnegative-integer? exact-nonnegative-integer?) any/c))]))
#; ; no need for this hack yet
(define/provide-special (with-writer-change writer))
(define make-spaces ; (efficiently)
(let ([t (make-hasheq)] [v (make-vector 200 #f)])
(λ (n)
(or (if (< n 200) (vector-ref v n) (hash-ref t n #f))
(let ([spaces (make-string n #\space)])
(if (< n 200) (vector-set! v n spaces) (hash-set! t n spaces))
spaces)))))
;; Convenient utilities
(provide add-newlines)
(define (add-newlines list #:sep [sep "\n"])
(define r
(let loop ([list list])
(if (null? list)
null
(let ([1st (car list)])
(if (or (not 1st) (void? 1st))
(loop (cdr list))
(list* sep 1st (loop (cdr list))))))))
(if (null? r) r (cdr r)))
(provide split-lines)
(define (split-lines list)
(let loop ([list list] [cur '()] [r '()])
(cond
[(null? list) (reverse (cons (reverse cur) r))]
[(equal? "\n" (car list)) (loop (cdr list) '() (cons (reverse cur) r))]
[else (loop (cdr list) (cons (car list) cur) r)])))
(define outputable/c
(lambda (v) #t)
;; too expensive:
#;
(recursive-contract
(or/c void?
#f
null?
(cons/c outputable/c outputable/c)
(-> outputable/c)
promise?
(box/c outputable/c)
special?
string?
bytes?
symbol?
path?
keyword?
number?
char?)))