whalesong/resource/coerse-content-bytes.rkt
2011-09-04 17:58:56 -04:00

22 lines
717 B
Racket

#lang racket/base
(provide coerse-content-bytes)
;; We need at least version 1.2 of the html-parsing library, because
;; there's a nasty bug in 1.0.
(require (planet neil/html-parsing:1:2)
(planet neil/html-writing))
;; coerse-content-bytes: path bytes -> bytes
;; Given some bytes, we may need to do some data validation or cleanup.
;; In particular, when the file's HTML, we need to make sure we're
;; storing syntactically valid HTML.
(define (coerse-content-bytes a-path bytes)
(cond
[(regexp-match #rx"\\.html$"
(path->string a-path))
(define op (open-output-bytes))
(write-html (html->xexp (open-input-bytes bytes)) op)
(get-output-bytes op)]
[else
bytes]))