You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
typesetting/quad2/unicode/unicode-class-prep.rkt

55 lines
2.3 KiB
Racket

#lang debug racket/base
(require (for-syntax racket/base)
racket/match
racket/port
racket/string)
(module+ reader
(require syntax/strip-context)
(provide (rename-out [rs read-syntax]))
(define (rs name ip)
(define src-lines (port->lines ip))
(define pred-id (string->symbol (string-trim (cadr src-lines))))
(define lines
(for*/list ([line (in-list (cddr src-lines))]
[str (in-value (string-trim (string-trim line #px"#.*" #:left? #false)))]
#:when (non-empty-string? str))
(match-define (list* codepoints tag _) (string-split str ";"))
;; codepoints might be a single value, an x..y range, or two values (base value and modifier)
;; we want to ignore the modifier
(define cp-or-range (match (string-split (string-trim codepoints) " ")
[(list cp-or-range) cp-or-range]
[(list cp modifiers ...) cp]))
(list (map (λ (str) (string->number (string-trim str) 16)) (string-split cp-or-range ".."))
(string->symbol (string-trim tag)))))
(strip-context
(with-syntax ([PRED-ID pred-id]
[LINES lines])
#'(module _ quad/unicode/unicode-class-prep
PRED-ID
. LINES)))))
(define-syntax (make-cond stx)
(syntax-case stx ()
[(_ ID VAL) #'(eq? ID VAL)] ;; I believe `eq?` is OK because a codepoint is a fixnum
[(_ ID LVAL RVAL) #'(<= LVAL ID RVAL)]))
(provide (rename-out [mb #%module-begin])
(except-out (all-from-out racket/base) #%module-begin))
(define-syntax (mb stx)
(syntax-case stx ()
[(_ PRED-ID (VALS RES) ...)
#'(#%module-begin
(provide PRED-ID)
(define (PRED-ID x)
(define cint (let loop ([x x])
(match x
[(? char? c) (char->integer c)]
[(? string? s) #:when (= 1 (string-length s))
(loop (car (string->list s)))]
[(? integer?) x]
[_ (raise-argument-error 'PRED-ID "integer, character, or one-character string" x)])))
(cond
[(make-cond cint . VALS) 'RES] ...
[else #f])))]))