Fancier lexing for lexing fanciers.
(define-lex-abbrev regex-chars (char-set "()*+?.^$|<!=[]"))

(define lex
  (lexer
   ;; one or more newlines become a NEWLINE token
   [(:+ "\n") (token 'NEWLINE lexeme)]
   ;; a comment runs from ";" up to (but not including) the next newline
   [(from/stop-before ";" "\n") (token 'COMMENT #:skip? #t)]
   ;; runs of whitespace are tokenized but skipped by the parser
   [(:+ whitespace) (token 'SP lexeme #:skip? #t)]
   ;; reserved regex characters pass through as literal string tokens
   [regex-chars lexeme]
   ;; any other letter becomes a LITERAL token
   [alphabetic (token 'LITERAL lexeme)]))
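As a quick sanity check, we can feed this lexer a sample string with apply-port-proc from brag/support (used again in the hints below), which repeatedly applies the lexer to a port or string and gathers the tokens into a list:

(apply-port-proc lex "ab;note\ncd")

Per the rules above, we should get a LITERAL token for each letter, a skipped COMMENT token for ;note, and a NEWLINE token.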
The token structure type lets us create tokens that cooperate specially with a brag parser. The first field of the structure is the token's type, which is what the grammar matches against. The second field is the token's value, which is what actually gets inserted into the parse tree.
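For instance, this hypothetical token would match a quoted "+" in a grammar, while 'plus is what would land in the parse tree:

(token "+" 'plus)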
Symbolic token names (written in ALL CAPS by convention) classify sets of tokens (like identifiers, numbers, or strings). In the grammar, these names are referenced without surrounding quotes:
#lang brag
top : ("x" | FOO)+
We make a token with a symbolic name by passing a symbol as the first argument, and the token value as the second:
(token 'FOO 42)
So when we feed these tokens to our parser:
(parse-to-datum (list "x" (token 'FOO 42)))
We get this result:
'(top "x" 42)
The lexer supports many useful matching operators, e.g. :+, from/stop-before, char-set, and alphabetic.
define-lex-abbrev lets us assign names to lexer patterns. This can be handy for defining a set of “reserved” characters that are assigned special meaning in our language.
token structures with #:skip? #t are ignored by a brag parser.
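We can see the skipping behavior with the top grammar from above, by sketching an extra SP token into the input:

(parse-to-datum (list "x" (token 'SP " " #:skip? #t) (token 'FOO 42)))

The skipped token never reaches the grammar, so the result is still '(top "x" 42).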
Make a language called algebra that can evaluate the source below. Implement f and g as functions; implement f(zz,zz), g(10), and g(23) as function applications. A # denotes a line comment.
Don’t worry about generalizing the grammar (we’ll do that in the next project). Just make it good enough to run the sample.
Example:
#lang algebra
fun f(x,y) = x + y
# fun f(x,y) = x * y
fun g(zz) = f(zz,zz)
g(10)
g(23)
Result:
20
46
Hint: Starter files (the language module, then "grammar.rkt"):
#lang br/quicklang
(require brag/support "grammar.rkt")
(provide top fun expr app)

(module+ reader
  (provide read-syntax))

(define-lex-abbrev reserved-toks
  (:or #;···))

(define tokenize-1
  (lexer
   [whitespace #;···]
   [(from/stop-before "#" "\n") #;···]
   [reserved-toks #;···]
   [(:+ alphabetic) #;···]
   [(:+ (char-set "0123456789")) #;···]))

(define-macro top #;···)

(define-macro-cases fun
  #;···)

(define-macro-cases expr
  #;···)

(define-macro app #;···)

(define (read-syntax src ip)
  (define parse-tree (parse src (λ () (tokenize-1 ip))))
  (strip-bindings
   (with-syntax ([PT parse-tree])
     #'(module algebra-mod algebra
         PT))))
#lang brag
top : # ···
fun : # ···
expr : # ···
app : # ···
Hint: In the lexer, assign symbolic token names to your identifiers (like ID) and integers (like INT).
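One plausible shape for those rules, to slot into the tokenize-1 skeleton above (the string->symbol and string->number conversions are assumptions, though they match the token values shown in the last hint below):

[(:+ alphabetic) (token 'ID (string->symbol lexeme))]
[(:+ (char-set "0123456789")) (token 'INT (string->number lexeme))]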
Hint: In the lexer, make tokens with #:skip? #true to ignore parts of the source that serve no purpose (for instance, whitespace and comments). Then you don't have to handle them in the grammar.
Hint: In the grammar, use cuts to remove tokens that serve no further purpose. (For instance, reserved tokens can often be discarded.) Then you don’t have to handle them in the expander.
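In brag, a cut is a slash before a grammar element: the element is still matched, but omitted from the parse tree. A hypothetical rule, not part of the algebra grammar:

#lang brag
# "let" and "=" are matched but never appear in the parse tree
stmt : /"let" ID /"=" INT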
Hint: You don’t need to implement multiplication to run the test file. (Do you see why?)
Hint: In the expander, you can leverage interposition points. For instance, #%app is the hook Racket inserts at every function application, so if you need a macro called app that handles function applications in your program, you could do:
(define-macro (app ARG ...) #'(#%app ARG ...))
Or equivalently:
(define-macro app #'#%app)
Hint: At the REPL, you can feed test cases to your tokenizer like so:
(apply-port-proc tokenize-1 "g(23)")
Result:
(list (token-struct 'ID 'g #f #f #f #f #f) "(" (token-struct 'INT 23 #f #f #f #f #f) ")")
You can feed test cases to your parser like so:
(parse-to-datum (apply-port-proc tokenize-1 "g(23)"))
Result:
'(top (app g 23))
A little knowledge is still dangerous.