pollen/decode.rkt

#lang racket/base
(require racket/contract racket/list racket/string racket/match)
(require (only-in racket/format ~a))
(require (only-in racket/bool nor))
(require (only-in xml xexpr/c))
(module+ test (require rackunit))

(require "tools.rkt")
(provide (all-defined-out))

;; split list into list of sublists using test-proc
(define/contract (splitf-at* xs split-test)
  ;; todo: better error message when split-test is not a predicate
  (list? predicate/c . -> . (listof list?))
  (define (&splitf-at* xs [acc '()]) ; use acc for tail recursion
    (if (empty? xs) 
        ;; reverse because accumulation is happening backward 
        ;; (because I'm using cons to push latest match onto front of list)
        (reverse acc)
        (let-values ([(item rest) 
                      ;; drop matching elements from front
                      ;; then split on nonmatching 
                      ;; = nonmatching item + other elements (which will start with matching)
                      (splitf-at (dropf xs split-test) (compose1 not split-test))])
          ;; recurse, and store new item in accumulator
          (&splitf-at* rest (cons item acc)))))
  
  ;; trim off elements matching split-test
  (&splitf-at* (trim xs split-test)))

(module+ test
  (check-equal? (splitf-at* '(1 2 3 4 5 6) even?) '((1)(3)(5)))
  (check-equal? (splitf-at* '("foo" " " "bar" "\n" "\n" "ino") whitespace?) '(("foo")("bar")("ino"))))


;; Find adjacent newline characters in a list and merge them into one item
;; Scribble, by default, makes each newline a separate list item
;; In practice, this is worthless.
(define/contract (merge-newlines x)
  (list? . -> . list?)
  (define (newline? x)
    (and (string? x) (equal? "\n" x)))
  (define (not-newline? x)
    (not (newline? x)))
  
  (define (really-merge-newlines xs [acc '()])
    (if (empty? xs)
        acc
        ;; Try to peel the newlines off the front.
        (let-values ([(leading-newlines remainder) (splitf-at xs newline?)])
          (if (not (empty? leading-newlines)) ; if you got newlines ...
              ;; combine them into a string and append them to the accumulator, 
              ;; and recurse on the rest
              (really-merge-newlines remainder (append acc (list (string-join leading-newlines ""))))
              ;; otherwise peel off elements up to the next newline, append them to accumulator,
              ;; and recurse on the rest
              (really-merge-newlines (dropf remainder not-newline?) 
                                     (append acc (takef remainder not-newline?)))))))
  
  (cond
    [(list? x) (really-merge-newlines (map merge-newlines x))]
    [else x]))

(module+ test
  (check-equal? (merge-newlines '(p "\n" "foo" "\n" "\n" "bar" (em "\n" "\n" "\n"))) 
                '(p "\n" "foo" "\n\n" "bar" (em "\n\n\n"))))


;; todo: add native support for list-xexpr
;; decode triple newlines to list items


;; convert numbers to strings
;; maybe this isn't necessary
(define (stringify x)
  (map-tree (λ(i) (if (number? i) (->string i) i)) x))

(module+ test
  (check-equal? (stringify '(p 1 2 "foo" (em 4 "bar"))) '(p "1" "2" "foo" (em "4" "bar"))))


;; trim from beginning & end of list
(define (trim items test-proc)
  (list? procedure? . -> . list?)
  (dropf-right (dropf items test-proc) test-proc))

(module+ test
  (check-equal? (trim (list "\n" " " 1 2 3 "\n") whitespace?) '(1 2 3))
  (check-equal? (trim (list 1 3 2 4 5 6 8 9 13) odd?) '(2 4 5 6 8)))


;; decoder wireframe
(define/contract (decode nx
                         #:exclude-xexpr-tags [excluded-xexpr-tags '()]
                         #:xexpr-tag-proc [xexpr-tag-proc (λ(x)x)]
                         #:xexpr-attr-proc [xexpr-attr-proc (λ(x)x)]
                         #:xexpr-elements-proc [xexpr-elements-proc (λ(x)x)]
                         #:block-xexpr-proc [block-xexpr-proc (λ(x)x)]
                         #:inline-xexpr-proc [inline-xexpr-proc (λ(x)x)]
                         #:string-proc [string-proc (λ(x)x)])
  ;; use xexpr/c for contract because it gives better error messages
  ((xexpr/c) (#:exclude-xexpr-tags list?
                                   #:xexpr-tag-proc procedure?
                                   #:xexpr-attr-proc procedure?
                                   #:xexpr-elements-proc procedure?
                                   #:block-xexpr-proc procedure?
                                   #:inline-xexpr-proc procedure?
                                   #:string-proc procedure?)
             . ->* . tagged-xexpr?)
  (when (not (tagged-xexpr? nx))
    (error (format "decode: ~v not a full tagged-xexpr" nx)))
  
  
  (define (&decode x)
    (cond
      [(tagged-xexpr? x) (let-values([(tag attr elements) (break-tagged-xexpr x)]) 
                           (if (tag . in? . excluded-xexpr-tags)    
                               x ; let x pass through untouched
                               (let ([decoded-xexpr (apply make-tagged-xexpr 
                                             (map &decode (list tag attr elements)))])
                                 ((if (block-xexpr? decoded-xexpr)
                                      block-xexpr-proc
                                      inline-xexpr-proc) decoded-xexpr))))]
      [(xexpr-tag? x) (xexpr-tag-proc x)]
      [(xexpr-attr? x) (xexpr-attr-proc x)]
      ;; need this for operations that may depend on context in list
      [(xexpr-elements? x) (map &decode (xexpr-elements-proc x))]
      [(string? x) (string-proc x)]
      ;; if something has made it through undecoded, that's a problem
      [else (error "Can't decode" x)]))
  
  
  (&decode nx))
sun eve 11 years ago			`#lang racket/base`
Upgrading decode 11 years ago			`(require racket/contract racket/list racket/string racket/match)`
mon eve 11 years ago			`(require (only-in racket/format ~a))`
			`(require (only-in racket/bool nor))`
			`(require (only-in xml xexpr/c))`
sun eve 11 years ago			`(module+ test (require rackunit))`

renamings: convert named-xexpr to tagged-xexpr, name to tag, content to elements 11 years ago			`(require "tools.rkt")`
sun eve 11 years ago			`(provide (all-defined-out))`

added contracts & tests 11 years ago			`;; split list into list of sublists using test-proc`
various tidying. all files compile now. 11 years ago			`(define/contract (splitf-at* xs split-test)`
			`;; todo: better error message when split-test is not a predicate`
			`(list? predicate/c . -> . (listof list?))`
			`(define (&splitf-at* xs [acc '()]) ; use acc for tail recursion`
			`(if (empty? xs)`
			`;; reverse because accumulation is happening backward`
			`;; (because I'm using cons to push latest match onto front of list)`
			`(reverse acc)`
decode improvements 11 years ago			`(let-values ([(item rest)`
various tidying. all files compile now. 11 years ago			`;; drop matching elements from front`
			`;; then split on nonmatching`
			`;; = nonmatching item + other elements (which will start with matching)`
			`(splitf-at (dropf xs split-test) (compose1 not split-test))])`
			`;; recurse, and store new item in accumulator`
			`(&splitf-at* rest (cons item acc)))))`

			`;; trim off elements matching split-test`
			`(&splitf-at* (trim xs split-test)))`
added contracts & tests 11 years ago
			`(module+ test`
			`(check-equal? (splitf-at* '(1 2 3 4 5 6) even?) '((1)(3)(5)))`
			`(check-equal? (splitf-at* '("foo" " " "bar" "\n" "\n" "ino") whitespace?) '(("foo")("bar")("ino"))))`

decode improvements 11 years ago

sun eve 11 years ago			`;; Find adjacent newline characters in a list and merge them into one item`
			`;; Scribble, by default, makes each newline a separate list item`
			`;; In practice, this is worthless.`
			`(define/contract (merge-newlines x)`
			`(list? . -> . list?)`
			`(define (newline? x)`
			`(and (string? x) (equal? "\n" x)))`
			`(define (not-newline? x)`
			`(not (newline? x)))`

			`(define (really-merge-newlines xs [acc '()])`
			`(if (empty? xs)`
			`acc`
			`;; Try to peel the newlines off the front.`
			`(let-values ([(leading-newlines remainder) (splitf-at xs newline?)])`
			`(if (not (empty? leading-newlines)) ; if you got newlines ...`
			`;; combine them into a string and append them to the accumulator,`
			`;; and recurse on the rest`
			`(really-merge-newlines remainder (append acc (list (string-join leading-newlines ""))))`
			`;; otherwise peel off elements up to the next newline, append them to accumulator,`
			`;; and recurse on the rest`
			`(really-merge-newlines (dropf remainder not-newline?)`
mon eve 11 years ago			`(append acc (takef remainder not-newline?)))))))`
sun eve 11 years ago
			`(cond`
			`[(list? x) (really-merge-newlines (map merge-newlines x))]`
			`[else x]))`

			`(module+ test`
			`(check-equal? (merge-newlines '(p "\n" "foo" "\n" "\n" "bar" (em "\n" "\n" "\n")))`
			`'(p "\n" "foo" "\n\n" "bar" (em "\n\n\n"))))`


fix? 11 years ago
decode improvements 11 years ago			`;; todo: add native support for list-xexpr`
			`;; decode triple newlines to list items`
conflicting commit 11 years ago
tues eve 11 years ago
Upgrading decode 11 years ago			`;; convert numbers to strings`
			`;; maybe this isn't necessary`
			`(define (stringify x)`
tues eve 11 years ago			`(map-tree (λ(i) (if (number? i) (->string i) i)) x))`

			`(module+ test`
			`(check-equal? (stringify '(p 1 2 "foo" (em 4 "bar"))) '(p "1" "2" "foo" (em "4" "bar"))))`


decode improvements 11 years ago			`;; trim from beginning & end of list`
			`(define (trim items test-proc)`
			`(list? procedure? . -> . list?)`
			`(dropf-right (dropf items test-proc) test-proc))`

			`(module+ test`
			`(check-equal? (trim (list "\n" " " 1 2 3 "\n") whitespace?) '(1 2 3))`
			`(check-equal? (trim (list 1 3 2 4 5 6 8 9 13) odd?) '(2 4 5 6 8)))`


Upgrading decode 11 years ago			`;; decoder wireframe`
			`(define/contract (decode nx`
renamings: convert named-xexpr to tagged-xexpr, name to tag, content to elements 11 years ago			`#:exclude-xexpr-tags [excluded-xexpr-tags '()]`
			`#:xexpr-tag-proc [xexpr-tag-proc (λ(x)x)]`
Upgrading decode 11 years ago			`#:xexpr-attr-proc [xexpr-attr-proc (λ(x)x)]`
renamings: convert named-xexpr to tagged-xexpr, name to tag, content to elements 11 years ago			`#:xexpr-elements-proc [xexpr-elements-proc (λ(x)x)]`
Upgrading decode 11 years ago			`#:block-xexpr-proc [block-xexpr-proc (λ(x)x)]`
			`#:inline-xexpr-proc [inline-xexpr-proc (λ(x)x)]`
change pollen language to export a hash called 'metas (rather than storing metas as xexprs within main) 11 years ago			`#:string-proc [string-proc (λ(x)x)])`
tues eve 11 years ago			`;; use xexpr/c for contract because it gives better error messages`
various tidying. all files compile now. 11 years ago			`((xexpr/c) (#:exclude-xexpr-tags list?`
added contracts & tests 11 years ago			`#:xexpr-tag-proc procedure?`
			`#:xexpr-attr-proc procedure?`
			`#:xexpr-elements-proc procedure?`
			`#:block-xexpr-proc procedure?`
			`#:inline-xexpr-proc procedure?`
change pollen language to export a hash called 'metas (rather than storing metas as xexprs within main) 11 years ago			`#:string-proc procedure?)`
renamings: convert named-xexpr to tagged-xexpr, name to tag, content to elements 11 years ago			`. ->* . tagged-xexpr?)`
			`(when (not (tagged-xexpr? nx))`
			`(error (format "decode: ~v not a full tagged-xexpr" nx)))`
Upgrading decode 11 years ago
fix? 11 years ago
tues eve 11 years ago			`(define (&decode x)`
Upgrading decode 11 years ago			`(cond`
renamings: convert named-xexpr to tagged-xexpr, name to tag, content to elements 11 years ago			`[(tagged-xexpr? x) (let-values([(tag attr elements) (break-tagged-xexpr x)])`
various tidying. all files compile now. 11 years ago			`(if (tag . in? . excluded-xexpr-tags)`
			`x ; let x pass through untouched`
			`(let ([decoded-xexpr (apply make-tagged-xexpr`
			`(map &decode (list tag attr elements)))])`
added contracts & tests 11 years ago			`((if (block-xexpr? decoded-xexpr)`
			`block-xexpr-proc`
			`inline-xexpr-proc) decoded-xexpr))))]`
renamings: convert named-xexpr to tagged-xexpr, name to tag, content to elements 11 years ago			`[(xexpr-tag? x) (xexpr-tag-proc x)]`
Upgrading decode 11 years ago			`[(xexpr-attr? x) (xexpr-attr-proc x)]`
various tidying. all files compile now. 11 years ago			`;; need this for operations that may depend on context in list`
renamings: convert named-xexpr to tagged-xexpr, name to tag, content to elements 11 years ago			`[(xexpr-elements? x) (map &decode (xexpr-elements-proc x))]`
Upgrading decode 11 years ago			`[(string? x) (string-proc x)]`
various tidying. all files compile now. 11 years ago			`;; if something has made it through undecoded, that's a problem`
			`[else (error "Can't decode" x)]))`
tues eve 11 years ago
Upgrading decode 11 years ago
change pollen language to export a hash called 'metas (rather than storing metas as xexprs within main) 11 years ago			`(&decode nx))`