phc-graph/flexible-with2.hl.rkt

392 lines
17 KiB
Racket

#lang hyper-literate #:♦ (dotlambda/unhygienic . type-expander/lang)
♦title[#:style manual-doc-style ;#:style (with-html5 manual-doc-style)
#:tag "flexible-with"
#:tag-prefix "phc-graph/flexible-with"]{Flexible functional
modification and extension of records}
♦(chunks-toc-prefix
'("(lib phc-graph/scribblings/phc-graph-implementation.scrbl)"
"phc-graph/flexible-with"))
♦section{Goals}
Our goal here is to have strongly typed records, with row polymorphism (a
♦racket[Rest] row type variable can range over multiple possibly-present
fields), and structural type equivalence (two record types are identical if
they have the same fields, and these fields have the same types).
♦section{Overview}
We represent flexible records using a tree, where the leaves are field values.
Every field which occurs anywhere in the program is assigned a constant index.
This index determines which leaf is used to store that field's values. In
order to avoid storing a huge tree for every tree-record, the actual fields
are captured by a closure, and the tree is lazily generated (node by node)
upon access.
The type for a flexible record can support row polymorphism: the types of
fields which may optionally be present are represented by polymorphic type
variables. Note that this means that not just one row type variable is used, but
several. We define below facilities to automatically generate this list of
polymorphic type variables. In order to avoid having a huge number of type
variables, a branch containing only optional fields can be collapsed into a
single type variable. An exception to this rule is when a field needs to be
added by the user code in the middle of a branch: in this case the branch may
not be collapsed.
♦section{Type of a tree-record, with a hole}
♦CHUNK[<tree-type-with-replacement>
;; tree-type-with-replacement : builds (as a syntax object) a nest of
;; `Pairof` types around `last`.
;;
;;   n    - node index; it is halved at every step, and its parity decides
;;          on which side of the new `Pairof` the accumulated type goes
;;          (even: accumulated type in the car, odd: in the cdr).
;;   last - syntax object for the type placed at the innermost position.
;;   τ*   - list of syntax objects, consumed front to back; each one becomes
;;          the other component of the `Pairof` built at that step.
;;
;; The result is `last` itself once `τ*` is exhausted.
(define-for-syntax (tree-type-with-replacement n last τ*)
  (let climb ([index n] [type-so-far last] [siblings τ*])
    ;; The division is performed before the emptiness test on purpose, so
    ;; that it happens on every step, including the final one.
    (define-values (parent bit) (quotient/remainder index 2))
    (if (null? siblings)
        type-so-far
        (let ([sibling (car siblings)])
          (climb parent
                 (if (zero? bit)
                     #`(Pairof #,type-so-far #,sibling)
                     #`(Pairof #,sibling #,type-so-far))
                 (cdr siblings))))))]
♦section{Functionally updating a tree-record}
♦subsection{Adding and modifying fields}
Since we only deal with functional updates of immutable records, modifying a
field does little more than discarding the old value, and injecting the new
value instead into the new, updated record.
Adding a new field is done using the same exact operation: missing fields are
denoted by a special value, ♦racket['NONE], while present fields are
represented as instances of the polymorphic struct ♦racket[(Some T)]. Adding a
new field is therefore as simple as discarding the old ♦racket['NONE] marker,
and replacing it with the new value, wrapped with ♦racket[Some]. A field
update would instead discard the old instance of ♦racket[Some], and replace it
with a new one.
♦CHUNK[<make-replace-in-tree-body>
;; Expression fragment spliced into the body generated by
;; define-replace-in-tree; it relies on `i`, `low-names` and
;; `τ*-limited+T-next` being bound at the splice site.
;;
;; For node 1 the replacement itself (wrapped in a promise) is the result.
;; Otherwise the second element of `(to-bits i)` selects `replace-right`
;; (true) or `replace-left` (false), and the updater of the node whose bits
;; are those of `i` without that second element is passed to the selected
;; helper.
;; NOTE(review): `to-bits` / `from-bits` are presumably provided by
;; "flexible-with-utils.hl.rkt" and use a most-significant-bit-first list of
;; booleans -- confirm.
(cond
  [(= i 1)
   #'(delay/pure/stateless replacement)]
  [else
   (define bits (to-bits i))
   (define next (from-bits (cons #t (cddr bits))))
   (define go-right? (cadr bits))
   (define/with-syntax next-id (vector-ref low-names (sub1 next)))
   (define/with-syntax replace-in-child
     (if go-right? #'replace-right #'replace-left))
   #`(replace-in-child (inst next-id #,@τ*-limited+T-next)
                       tree-thunk
                       replacement)])]
♦CHUNK[<define-replace-in-tree>
;; replace-right : lazily rebuilds a pair, keeping its car unchanged and
;; replacing its cdr.
;;
;;   next-id     - updater applied to the old cdr (re-wrapped in a promise)
;;                 and to `replacement`; it returns a promise for the new cdr.
;;   tree-thunk  - promise for the pair to update.
;;   replacement - value handed down, untouched, to `next-id`.
;;
;; Returns a promise; nothing is forced until that promise is forced.
(: replace-right (∀ (A B C R) (→ (→ (Promise B) R (Promise C))
                                 (Promise (Pairof A B))
                                 R
                                 (Promise (Pairof A C)))))
(define-pure/stateless
  #:∀ (A B C R)
  (replace-right [next-id : (→ (Promise B) R (Promise C))]
                 [tree-thunk : (Promise (Pairof A B))]
                 [replacement : R])
  (delay/pure/stateless
   (let ([tree (force tree-thunk)])
     (let ([left-subtree (car tree)]
           [right-subtree (cdr tree)])
       (cons left-subtree
             (force (next-id (delay/pure/stateless right-subtree)
                             replacement)))))))
;; replace-left : lazily rebuilds a pair, keeping its cdr unchanged and
;; replacing its car.
;;
;;   next-id     - updater applied to the old car (re-wrapped in a promise)
;;                 and to `replacement`; it returns a promise for the new car.
;;   tree-thunk  - promise for the pair to update.
;;   replacement - value handed down, untouched, to `next-id`.
;;
;; Returns a promise; nothing is forced until that promise is forced.
(: replace-left (∀ (A B C R) (→ (→ (Promise A) R (Promise C))
                                (Promise (Pairof A B))
                                R
                                (Promise (Pairof C B)))))
(define-pure/stateless
  #:∀ (A B C R)
  (replace-left [next-id : (→ (Promise A) R (Promise C))]
                [tree-thunk : (Promise (Pairof A B))]
                [replacement : R])
  (delay/pure/stateless
   (let ([tree (force tree-thunk)])
     (let ([left-subtree (car tree)]
           [right-subtree (cdr tree)])
       (cons (force (next-id (delay/pure/stateless left-subtree)
                             replacement))
             right-subtree)))))
;; define-replace-in-tree : generates the definitions of the three updaters
;; attached to node `i` of the tree.
;;
;;   low-names, names, rm-names
;;          - vectors of identifiers; entry `(sub1 i)` names, respectively,
;;            the raw updater, the "set field" function and the "remove
;;            field" function of node `i`.
;;   τ*     - list of type-variable identifiers; only the first `depth` of
;;            them are used for node `i`.
;;   i      - index of the node (1 designates the root).
;;   depth  - number of type variables needed for node `i`.
;;
;; The generated code:
;;   * provides `name` and `rm-name`;
;;   * defines a type alias (under a fresh name) for a promise of the tree
;;     whose position `i` holds `T`;
;;   * defines `low-name`, which stores `replacement` as-is at position `i`;
;;   * defines `name`, which stores `(Some replacement)`;
;;   * defines `rm-name`, which stores 'NONE.
(define-for-syntax (define-replace-in-tree low-names names rm-names τ* i depth)
  (define/with-syntax name (vector-ref names (sub1 i)))
  (define/with-syntax rm-name (vector-ref rm-names (sub1 i)))
  (define/with-syntax low-name (vector-ref low-names (sub1 i)))
  (define/with-syntax tree-type-with-replacement-name
    (gensym 'tree-type-with-replacement))
  (define τ*-limited (take τ* depth))
  ;; Type arguments used by <make-replace-in-tree-body> when instantiating
  ;; the updater of the node one level closer to the hole: one type variable
  ;; fewer, followed by T.
  (define τ*-limited+T-next (if (= depth 0)
                                (list #'T)
                                (append (take τ* (sub1 depth)) (list #'T))))
  #`(begin
      (provide name rm-name)
      (define-type (tree-type-with-replacement-name #,@τ*-limited T)
        (Promise #,(tree-type-with-replacement i #'T τ*-limited)))
      (: low-name
         (∀ (#,@τ*-limited T)
            (→ (tree-type-with-replacement-name #,@τ*-limited Any)
               T
               (tree-type-with-replacement-name #,@τ*-limited T))))
      (define-pure/stateless
        #:∀ (#,@τ*-limited T)
        (low-name [tree-thunk : (tree-type-with-replacement-name #,@τ*-limited Any)]
                  [replacement : T])
        : (Promise #,(tree-type-with-replacement i #'T τ*-limited))
        #,<make-replace-in-tree-body>)
      (: name
         (∀ (#,@τ*-limited T)
            (→ (tree-type-with-replacement-name #,@τ*-limited Any)
               T
               (tree-type-with-replacement-name #,@τ*-limited (Some T)))))
      (define (name tree-thunk replacement)
        (low-name tree-thunk (Some replacement)))
      (: rm-name
         (∀ (#,@τ*-limited)
            (→ (tree-type-with-replacement-name #,@τ*-limited (Some Any))
               (tree-type-with-replacement-name #,@τ*-limited 'NONE))))
      (define (rm-name tree-thunk)
        (low-name tree-thunk 'NONE))))]
♦section{Auxiliary values}
The following sections reuse a few values which are derived from the list of
fields:
♦CHUNK[<utils>
;; Values derived from the list of all fields. This chunk must be spliced
;; where the pattern variable `field` is bound (with one level of ellipsis).
;;
;;   all-fields  - syntax list of every field identifier.
;;   depth-above - (ceiling-log2 <number of fields>).
;;                 NOTE(review): `ceiling-log2` is presumably provided by
;;                 "flexible-with-utils.hl.rkt" -- confirm.
;;   offset      - 2^depth-above; the j-th field (counting from 0) is
;;                 associated with node index offset + j.
;;   i*-above    - node indices 1 .. offset - 1, i.e. those below `offset`.
;;   names, rm-names, low-names
;;               - vectors in which entry (k - 1) is the identifier generated
;;                 for node k: a dash-prefixed numbered name for the indices
;;                 in `i*-above`, and a name derived from the field (with the
;;                 field's lexical context) for the remaining indices.
(define all-fields #'(field …))
(define depth-above (ceiling-log2 (length (syntax->list all-fields))))
(define offset (expt 2 depth-above))
(define i*-above (range 1 offset))
(define names (list->vector
               (append (map (λ (i) (format-id #'here "-with-~a" i))
                            i*-above)
                       (stx-map (λ (f) (format-id f "with-~a" f))
                                all-fields))))
(define rm-names (list->vector
                  (append (map (λ (i) (format-id #'here "-without-~a" i))
                               i*-above)
                          (stx-map (λ (f) (format-id f "without-~a" f))
                                   all-fields))))
(define low-names (list->vector
                   (append (map (λ (i) (format-id #'here "-u-with-~a" i))
                                i*-above)
                           (stx-map (λ (f) (format-id f "u-with-~a" f))
                                    all-fields))))]
♦section{Type of a tree-record}
♦CHUNK[<τ-tree-with-fields>
;; τ-tree-with-fields : computes the type of the tree holding exactly the
;; given fields.
;;
;;   struct-fields - syntax list of the fields which are present; each of
;;                   them must also appear in `fields`.
;;   fields        - syntax list of all the known fields; the position of a
;;                   field in this list determines its node index.
;;
;; Returns a quasiquoted s-expression (with the field identifiers embedded)
;; made of nested `Pairof`, with `(Some field)` at the position of each
;; present field and 'NONE for subtrees which contain no present field.
(define-for-syntax (τ-tree-with-fields struct-fields fields)
  (define/with-syntax (struct-field …) struct-fields)
  (define/with-syntax (field …) fields)
  <utils>
  ;; Same field -> node index table as the one built in define-struct↔tree.
  (define lookup
    (make-free-id-table
     (for/list ([n (in-syntax all-fields)]
                [i (in-naturals)])
       (cons n (+ i offset)))))
  ;; (field . index) pairs sorted by increasing index; `f` below consumes
  ;; them in that order while walking the tree from left to right.
  (define fields+indices
    (sort (stx-map λ.(cons % (free-id-table-ref lookup %))
                   #'(struct-field …))
          <
          #:key cdr))
  (define up (* offset 2))
  ;; Like in convert-fields, but with Pairof
  (define (f i)
    ;(displayln (list i '/ up (syntax->datum #`#,fields+indices)))
    (if (and (pair? fields+indices) (= i (cdar fields+indices)))
        (begin0
          `(Some ,(caar fields+indices))
          (set! fields+indices (cdr fields+indices)))
        (if (>= (* i 2) up) ;; DEPTH
            ''NONE
            ;; The left child must be visited before the right one, since
            ;; both visits consume `fields+indices`.
            `(Pairof ,(f (* i 2))
                     ,(f (add1 (* i 2)))))))
  (f 1))]
♦section{Conversion to and from record-trees}
♦CHUNK[<define-struct↔tree>
;; define-struct↔tree : generates the two converters between the fields of a
;; record and its tree representation.
;;
;;   offset      - node index associated with the first element of
;;                 `all-fields`.
;;   all-fields  - syntax list of all the known fields.
;;   τ*          - not used by this function.
;;   struct-name - identifier from which the converter names are derived:
;;                 <struct-name>→tree and tree→<struct-name>.
;;   fields      - syntax list of the fields of this record; each of them
;;                 must also appear in `all-fields`.
;;
;; The generated <struct-name>→tree takes one argument per field and returns
;; a promise for the tree; tree→<struct-name> takes such a promise and
;; returns the field values as multiple values.
(define-for-syntax (define-struct↔tree
                     offset all-fields τ* struct-name fields)
  (define/with-syntax (field …) fields)
  (define/with-syntax fields→tree-name
    (format-id struct-name "~a→tree" struct-name))
  (define/with-syntax tree→fields-name
    (format-id struct-name "tree→~a" struct-name))
  ;; Field -> node index table.
  (define lookup
    (make-free-id-table
     (for/list ([n (in-syntax all-fields)]
                [i (in-naturals)])
       (cons n (+ i offset)))))
  ;; (field . index) pairs sorted by increasing index, as expected by
  ;; convert-fields and convert-back-fields.
  (define fields+indices
    (sort (stx-map λ.(cons % (free-id-table-ref lookup %))
                   fields)
          <
          #:key cdr))
  #`(begin
      (: fields→tree-name (∀ (field …)
                             (→ field …
                                (Promise #,(τ-tree-with-fields #'(field …)
                                                               all-fields)))))
      (define (fields→tree-name field …)
        (delay/pure/stateless
         #,(convert-fields (* offset 2) fields+indices)))
      (: tree→fields-name (∀ (field …)
                             (→ (Promise #,(τ-tree-with-fields #'(field …)
                                                               all-fields))
                                (Values field …))))
      (define (tree→fields-name tree-thunk)
        (define tree (force tree-thunk))
        #,(convert-back-fields (* offset 2) fields+indices))))]
♦subsection{Creating a new tree-record}
♦CHUNK[<convert-fields>
;; convert-fields : builds the expression which constructs a tree from the
;; field values.
;;
;;   up             - exclusive upper bound for node indices: a node `i`
;;                    with (* i 2) >= up has no children.
;;   fields+indices - list of (field . index) pairs, sorted by increasing
;;                    index.
;;
;; Returns an s-expression made of nested `cons` calls, with `(Some field)`
;; at the node of each listed field and 'NONE for the nodes without
;; children which hold no field.
(define-for-syntax (convert-fields up fields+indices)
  ;; Fields which have not been placed in the tree yet.
  (define pending fields+indices)
  (define (build i)
    (cond
      [(and (pair? pending) (= i (cdar pending)))
       (let ([id (caar pending)])
         (set! pending (cdr pending))
         `(Some ,id))]
      [(>= (* i 2) up) ;; DEPTH
       ''NONE]
      [else
       ;; let* makes the left-before-right order explicit: both calls
       ;; consume `pending`.
       (let* ([left (build (* i 2))]
              [right (build (add1 (* i 2)))])
         `(cons ,left ,right))]))
  (build 1))]
♦subsection{Extracting all the fields from a tree-record}
We traverse the tree in preorder, and accumulate definitions naming the
interesting subparts of the trees (those where there are fields).
♦CHUNK[<convert-back-fields>
;; convert-back-fields : builds the code which extracts the field values
;; from a tree bound to the identifier `tree`.
;;
;;   up             - exclusive upper bound for node indices: a node `i`
;;                    with (* i 2) >= up has no children.
;;   fields+indices - list of (field . index) pairs, sorted by increasing
;;                    index.
;;
;; Returns the syntax of a `begin` form containing one
;; `(define subtree-N (car/cdr parent))` per subtree on the way to a listed
;; field, followed by `(values (Some-v subtree) ...)` with one accessor per
;; field, in the order of `fields+indices`.
(define-for-syntax (convert-back-fields up fields+indices)
  (define pending fields+indices)
  ;; Accessor expressions, most recent first (reversed at the end).
  (define accessors '())
  ;; Definitions of the subtrees; a parent's definitions are pushed after
  ;; those of its descendants, hence end up before them in the list.
  (define bindings '())
  ;; Returns #t when the subtree rooted at node `i` (named by `t`) contains
  ;; at least one of the listed fields, #f otherwise.
  (define (visit i t)
    (cond
      [(and (pair? pending) (= i (cdar pending)))
       (set! accessors (cons #`(Some-v #,t) accessors))
       (set! pending (cdr pending))
       #t]
      [(>= (* i 2) up) ;; DEPTH
       #f]
      [else
       (define left-t (string->symbol (format "subtree-~a" (* i 2))))
       (define right-t (string->symbol (format "subtree-~a" (add1 (* i 2)))))
       (define left? (visit (* i 2) left-t))
       (define right? (visit (add1 (* i 2)) right-t))
       (when left?
         (set! bindings (cons #`(define #,left-t (car #,t)) bindings)))
       (when right?
         (set! bindings (cons #`(define #,right-t (cdr #,t)) bindings)))
       (or left? right?)]))
  (visit 1 #'tree)
  #`(begin #,@bindings (values . #,(reverse accessors))))]
♦section{Defining the converters and accessors for each known record type}
♦CHUNK[<define-trees>
;; define-trees : transformer procedure which generates all the definitions
;; for a set of fields and of record types.
;;
;; Expected shape of `stx`:
;;   (_ bt-fields-id (field …) [struct struct-field …] …)
;; where `bt-fields-id` names the type expander to define, `(field …)` lists
;; all the known fields, and each bracketed clause gives a record name
;; followed by its fields. Note that the first element of `stx` is itself
;; bound to `bt-fields-id` by the pattern below.
(define-for-syntax (define-trees stx)
  (syntax-case stx ()
    [(bt-fields-id (field …) [struct struct-field …] …)
     (let ()
       <utils>
       ;; One type variable per level of the tree: τ0 .. τ<depth-above>.
       (define ∀-types (map λ.(format-id #'here "τ~a" %)
                            (range (add1 depth-above))))
       ;; One group of updaters per node (inner nodes and fields alike).
       (define total-nb-functions (vector-length names))
       <define-trees-result>)]))]
♦CHUNK[<bt-fields-type>
;; bt-fields-type : returns the transformer used for the type expander
;; defined in <define-trees-result>.
;;
;;   fields - syntax list of all the known fields.
;;
;; The returned procedure turns `(_ . fs)` into a type polymorphic in the
;; identifiers `fs`: a promise for the tree in which exactly the fields `fs`
;; are present.
(define-for-syntax (bt-fields-type fields)
  (λ (stx)
    (syntax-case stx ()
      [(_ . fs)
       #`(∀ fs (Promise #,(τ-tree-with-fields #'fs
                                              fields)))])))]
♦CHUNK[<define-trees-result>
;; Code generated by define-trees; this fragment relies on the bindings
;; introduced by <utils> and by the body of define-trees. It produces:
;;   * the type expander `bt-fields-id`;
;;   * the updaters of every node, from 1 to `total-nb-functions`;
;;   * the converters of every declared record.
;; NOTE(review): `floor-log2` is presumably provided by
;; "flexible-with-utils.hl.rkt" -- confirm.
#`(begin
    (define-type-expander bt-fields-id
      (bt-fields-type #'#,(syntax-local-introduce #'(field …))))
    #,@(map λ.(define-replace-in-tree low-names
                                      names rm-names ∀-types % (floor-log2 %))
            (range 1 (add1 total-nb-functions)))
    ;; Disabled: the removal functions are generated by
    ;; define-replace-in-tree (as `rm-name`) instead.
    #;#,@(map λ.(define-remove-in-tree rm-names ∀-types % (floor-log2 %))
              (range 1 (add1 total-nb-functions)))
    #,@(map λ.(define-struct↔tree
                offset all-fields ∀-types %1 %2)
            (syntax->list #'(struct …))
            (syntax->list #'([struct-field …] …))))]
♦subsection{Putting it all together}
♦chunk[<maybe>
;; Wrapper for a value of type T, stored in its single field `v`.
(struct (T) Some ([v : T]) #:transparent)
;; Either a wrapped value of type T, or the symbol 'NONE.
(define-type (Maybe T) (U (Some T) 'NONE))]
♦chunk[<*>
;; Main chunk: dependencies, exports, then the other chunks in the order in
;; which they are spliced into the module.
(require delay-pure
         "flexible-with-utils.hl.rkt"
         ;; At phase 1, the ellipsis of syntax patterns and templates is
         ;; written `…` instead of `...`.
         (for-syntax (rename-in racket/base [... …])
                     syntax/stx
                     racket/syntax
                     racket/list
                     syntax/id-table
                     racket/sequence)
         (for-meta 2 racket/base))
(provide (for-syntax define-trees)
         ;; For tests:
         (struct-out Some)
         ;;DEBUG:
         (for-syntax τ-tree-with-fields)
         )
<maybe>
<tree-type-with-replacement>
<define-replace-in-tree>
;<define-remove-in-tree>
<convert-fields>
<convert-back-fields>
<τ-tree-with-fields>
<define-struct↔tree>
<define-trees>
<bt-fields-type>]
♦include-section[(submod "flexible-with-utils.hl.rkt" doc)]