no message

original commit: fdd4883bef661bfd92969bc7a825ba9f31f6625c
This commit is contained in:
Robby Findler 2001-04-09 20:34:51 +00:00
parent 85317e5400
commit 9fd3522c22

View File

@ -1,433 +1,442 @@
(unit/sig help:search^
(import help:doc-position^ (module search mzscheme
mzlib:function^) (require (lib "unitsig.ss")
"sig.ss"
"../help-sig.ss"
(lib "list.ss"))
; Define an order for the documentation: (provide search@)
; and the names of the standard documentation
(define-values (standard-html-doc-position known-manuals)
(let ([pr (require-library "docpos.ss" "help")])
(values (car pr) (cdr pr))))
(define (html-doc-position x) (define search@
(or (user-defined-doc-position x) (unit/sig search^
(standard-html-doc-position x))) (import help:doc-position^)
; These are set by reset-doc-lists: ; Define an order for the documentation:
;; docs, doc-names and doc-kinds are parallel lists. doc-kinds ; and the names of the standard documentation
;; distinguishes between the two variants of docs. (define-values (standard-html-doc-position known-manuals)
;; docs : (list-of (union string (list string string))) (let ([pr (require-library "docpos.ss" "help")])
(define docs null) (values (car pr) (cdr pr))))
;; doc-names : (list-of string)
(define doc-names null) (define (html-doc-position x)
;; doc-kinds : (list-of symbol) (or (user-defined-doc-position x)
(define doc-kinds null) (standard-html-doc-position x)))
;; doc-collection-date : ??
(define doc-collection-date #f) ; These are set by reset-doc-lists:
; docs, doc-names and doc-kinds are parallel lists. doc-kinds
(define colldocs (require-library "colldocs.ss" "help")) ; distinguishes between the two variants of docs.
; docs : (list-of (union string (list string string)))
(define re:title (regexp "<[tT][iI][tT][lL][eE]>(.*)</[tT][iI][tT][lL][eE]>")) (define docs null)
; doc-names : (list-of string)
;; get-std-doc-title : string -> string (define doc-names null)
;; gets the standard title of the documentation, from the ; doc-kinds : (list-of symbol)
;; known docs list. (define doc-kinds null)
(define (get-std-doc-title path doc) ; doc-collection-date : ??
(let ([a (assoc doc known-manuals)]) (define doc-collection-date #f)
(if a
(cdr a) (define colldocs (require-library "colldocs.ss" "help"))
(let ([index-file (build-path path doc "index.htm")])
(if (file-exists? index-file) (define re:title (regexp "<[tT][iI][tT][lL][eE]>(.*)</[tT][iI][tT][lL][eE]>"))
(call-with-input-file index-file
(lambda (port) ; get-std-doc-title : string -> string
(let loop () ; gets the standard title of the documentation, from the
(let ([l (read-line port)]) ; known docs list.
(cond (define (get-std-doc-title path doc)
[(eof-object? l) (let ([a (assoc doc known-manuals)])
doc] (if a
[(regexp-match re:title l) (cdr a)
=> (let ([index-file (build-path path doc "index.htm")])
(lambda (m) (if (file-exists? index-file)
(apply (call-with-input-file index-file
string (lambda (port)
(map (lambda (x) (if (char-whitespace? x) #\space x)) (let loop ()
(string->list (cadr m)))))] (let ([l (read-line port)])
[else (loop)]))))) (cond
doc))))) [(eof-object? l)
doc]
[(regexp-match re:title l)
(define (reset-doc-lists) =>
; Locate standard HTML documentation (lambda (m)
(define-values (std-docs std-doc-names) (apply
(let* ([path (with-handlers ([void (lambda (x) #f)]) string
(collection-path "doc"))]) (map (lambda (x) (if (char-whitespace? x) #\space x))
(if path (string->list (cadr m)))))]
(let* ([doc-collections (directory-list path)] [else (loop)])))))
[docs (map (lambda (x) (build-path path x)) doc-collections)] doc)))))
[doc-names (map (lambda (x) (get-std-doc-title path x)) doc-collections)])
;; Order the standard docs:
(let ([ordered (quicksort (define (reset-doc-lists)
(map cons docs doc-names) ; Locate standard HTML documentation
(lambda (a b) (define-values (std-docs std-doc-names)
(< (html-doc-position (cdr a)) (let* ([path (with-handlers ([void (lambda (x) #f)])
(html-doc-position (cdr b)))))]) (collection-path "doc"))])
(values (map car ordered) (map cdr ordered)))) (if path
(values null null)))) (let* ([doc-collections (directory-list path)]
[docs (map (lambda (x) (build-path path x)) doc-collections)]
; Check collections for doc.txt files: [doc-names (map (lambda (x) (get-std-doc-title path x)) doc-collections)])
(define-values (txt-docs txt-doc-names) ; Order the standard docs:
(colldocs quicksort)) (let ([ordered (quicksort
(map cons docs doc-names)
(set! docs (append std-docs txt-docs)) (lambda (a b)
(set! doc-names (append (< (html-doc-position (cdr a))
std-doc-names (html-doc-position (cdr b)))))])
(map (lambda (s) (format "the ~a collection" s)) (values (map car ordered) (map cdr ordered))))
txt-doc-names))) (values null null))))
(set! doc-kinds (append (map (lambda (x) 'html) std-docs) (map (lambda (x) 'text) txt-docs)))
; Check collections for doc.txt files:
(with-handlers ([void (lambda (x) (define-values (txt-docs txt-doc-names)
(set! doc-collection-date 'none))]) (colldocs quicksort))
(set! doc-collection-date
(file-or-directory-modify-seconds (set! docs (append std-docs txt-docs))
(collection-path "doc"))))) (set! doc-names (append
std-doc-names
(define MAX-HIT-COUNT 300) (map (lambda (s) (format "the ~a collection" s))
txt-doc-names)))
(define (clean-html s) (set! doc-kinds (append (map (lambda (x) 'html) std-docs) (map (lambda (x) 'text) txt-docs)))
(regexp-replace*
"&[^;]*;" (with-handlers ([void (lambda (x)
(regexp-replace* (set! doc-collection-date 'none))])
"<[^>]*>" (set! doc-collection-date
(regexp-replace* (file-or-directory-modify-seconds
"&amp;" (collection-path "doc")))))
(regexp-replace*
"&gt;" (define MAX-HIT-COUNT 300)
(regexp-replace*
"&lt;" (define (clean-html s)
s (regexp-replace*
"<") "&[^;]*;"
">") (regexp-replace*
"\\&") "<[^>]*>"
"") (regexp-replace*
"")) "&amp;"
(regexp-replace*
(define not-break? (lambda (x) (not (exn:misc:user-break? x)))) "&gt;"
(regexp-replace*
; One lock for all hash table operations is good enough "&lt;"
(define ht-lock (make-semaphore 1)) s
"<")
(define (with-hash-table ht key compute) ">")
(dynamic-wind "\\&")
(lambda () (semaphore-wait ht-lock)) "")
(lambda () ""))
(let ([sym (string->symbol key)])
(hash-table-get (define not-break? (lambda (x) (not (exn:misc:user-break? x))))
ht
sym ; One lock for all hash table operations is good enough
(lambda () (define ht-lock (make-semaphore 1))
(let ([v (compute)])
(hash-table-put! ht sym v) (define (with-hash-table ht key compute)
v))))) (dynamic-wind
(lambda () (semaphore-post ht-lock)))) (lambda () (semaphore-wait ht-lock))
(lambda ()
(define html-keywords (make-hash-table)) (let ([sym (string->symbol key)])
(define (load-html-keywords doc) (hash-table-get
(with-hash-table ht
html-keywords sym
doc (lambda ()
(lambda () (let ([v (compute)])
(with-handlers ([not-break? (lambda (x) null)]) (hash-table-put! ht sym v)
(with-input-from-file (build-path doc "keywords") v)))))
read))))) (lambda () (semaphore-post ht-lock))))
(define html-indices (make-hash-table)) (define html-keywords (make-hash-table))
(define (load-html-index doc) (define (load-html-keywords doc)
(with-hash-table (with-hash-table
html-indices html-keywords
doc doc
(lambda () (lambda ()
(with-handlers ([not-break? (lambda (x) null)]) (with-handlers ([not-break? (lambda (x) null)])
(with-input-from-file (build-path doc "hdindex") (with-input-from-file (build-path doc "keywords")
read))))) read)))))
(define (parse-txt-file doc ht handle-one) (define html-indices (make-hash-table))
(with-hash-table (define (load-html-index doc)
ht (with-hash-table
doc html-indices
(lambda () doc
(with-handlers ([not-break? (lambda (x) null)]) (lambda ()
(with-input-from-file doc (with-handlers ([not-break? (lambda (x) null)])
(lambda () (with-input-from-file (build-path doc "hdindex")
(let loop ([start 0]) read)))))
(let* ([r (read-line (current-input-port) 'any)]
[next (if (eof-object? r) (define (parse-txt-file doc ht handle-one)
start (with-hash-table
(+ start (string-length r) 1))]) ht
(cond doc
[(eof-object? r) null] (lambda ()
[(handle-one r start) => (lambda (vs) (append vs (loop next)))] (with-handlers ([not-break? (lambda (x) null)])
[else (loop next)]))))))))) (with-input-from-file doc
(lambda ()
(define re:keyword-line (regexp "^>")) (let loop ([start 0])
(define text-keywords (make-hash-table)) (let* ([r (read-line (current-input-port) 'any)]
(define (load-txt-keywords doc) [next (if (eof-object? r)
(parse-txt-file start
(apply build-path doc) (+ start (string-length r) 1))])
text-keywords (cond
(lambda (r start) [(eof-object? r) null]
(cond [(handle-one r start) => (lambda (vs) (append vs (loop next)))]
[(regexp-match re:keyword-line r) [else (loop next)])))))))))
(let* ([p (open-input-string (substring r 1 (string-length r)))]
[entry (parameterize ([read-accept-bar-quote #f]) (define re:keyword-line (regexp "^>"))
(read p))] (define text-keywords (make-hash-table))
[key (let loop ([entry entry]) (define (load-txt-keywords doc)
(cond (parse-txt-file
[(symbol? entry) entry] (apply build-path doc)
[(pair? entry) (if (eq? (car entry) 'quote) text-keywords
(loop (cadr entry)) (lambda (r start)
(loop (car entry)))] (cond
[else (error "bad entry")]))] [(regexp-match re:keyword-line r)
[content (if (symbol? entry) (let* ([p (open-input-string (substring r 1 (string-length r)))]
(with-handlers ([not-break? (lambda (x) #f)]) [entry (parameterize ([read-accept-bar-quote #f])
(let ([s (read p)]) (read p))]
(if (eq? s '::) [key (let loop ([entry entry])
(read p) (cond
#f))) [(symbol? entry) entry]
#f)]) [(pair? entry) (if (eq? (car entry) 'quote)
(list (loop (cadr entry))
; Make the keyword entry: (loop (car entry)))]
(list (symbol->string key) ; the keyword name [else (error "bad entry")]))]
(let ([p (open-output-string)]) [content (if (symbol? entry)
(if content (with-handlers ([not-break? (lambda (x) #f)])
(display content p) (let ([s (read p)])
(if (and (pair? entry) (if (eq? s '::)
(eq? (car entry) 'quote)) (read p)
(fprintf p "'~s" (cadr entry)) #f)))
(display entry p))) #f)])
(get-output-string p)) ; the text to display (list
(cadr doc) ; file ; Make the keyword entry:
start ; label (a position in this case) (list (symbol->string key) ; the keyword name
"doc.txt")))] ; title (let ([p (open-output-string)])
[else #f])))) (if content
(display content p)
(define re:index-line (regexp "_([^_]*)_(.*)")) (if (and (pair? entry)
(define text-indices (make-hash-table)) (eq? (car entry) 'quote))
(define (load-txt-index doc) (fprintf p "'~s" (cadr entry))
(parse-txt-file (display entry p)))
(apply build-path doc) (get-output-string p)) ; the text to display
text-indices (cadr doc) ; file
(lambda (r start) start ; label (a position in this case)
(cond "doc.txt")))] ; title
[(regexp-match re:index-line r) [else #f]))))
=> (lambda (m)
(let loop ([m m]) (define re:index-line (regexp "_([^_]*)_(.*)"))
(let ([s (cadr m)]) (define text-indices (make-hash-table))
(cons (define (load-txt-index doc)
; Make an index entry: (parse-txt-file
(cons s start) (apply build-path doc)
(let ([m (regexp-match re:index-line (caddr m))]) text-indices
(if m (lambda (r start)
(loop m) (cond
null))))))] [(regexp-match re:index-line r)
[else #f])))) => (lambda (m)
(let loop ([m m])
(define re:splitter (regexp "^ *([^ ]+)(.*)")) (let ([s (cadr m)])
(define (split-words s) (cons
(let ([m (regexp-match re:splitter s)]) ; Make an index entry:
(if m (cons s start)
(cons (cadr m) (let ([m (regexp-match re:index-line (caddr m))])
(split-words (caddr m))) (if m
null))) (loop m)
null))))))]
(define (non-regexp s) [else #f]))))
(list->string
(apply (define re:splitter (regexp "^ *([^ ]+)(.*)"))
append (define (split-words s)
(map (let ([m (regexp-match re:splitter s)])
(lambda (c) (if m
(cond (cons (cadr m)
[(memq c '(#\$ #\| #\\ #\[ #\] #\. #\* #\? #\+ #\( #\) #\^)) (split-words (caddr m)))
(list #\\ c)] null)))
[(char-alphabetic? c)
(list #\[ (char-upcase c) (char-downcase c) #\])] (define (non-regexp s)
[else (list c)])) (list->string
(string->list s))))) (apply
append
(define (doc-collections-changed) (map
(set! doc-collection-date #f)) (lambda (c)
(cond
(define re:url-dir (regexp "^([^/]*)/(.*)$")) [(memq c '(#\$ #\| #\\ #\[ #\] #\. #\* #\? #\+ #\( #\) #\^))
(define (combine-path/url-path path url-path) (list #\\ c)]
(let loop ([path path] [(char-alphabetic? c)
[url-path url-path]) (list #\[ (char-upcase c) (char-downcase c) #\])]
(cond [else (list c)]))
[(regexp-match re:url-dir url-path) (string->list s)))))
=>
(lambda (m) (define (doc-collections-changed)
(let* ([url-dir (cadr m)] (set! doc-collection-date #f))
[rest (caddr m)]
[dir (define re:url-dir (regexp "^([^/]*)/(.*)$"))
(cond (define (combine-path/url-path path url-path)
[(string=? ".." url-dir) 'up] (let loop ([path path]
[(string=? "." url-dir) 'same] [url-path url-path])
[(string=? "" url-dir) 'same] (cond
[else url-dir])]) [(regexp-match re:url-dir url-path)
(loop (build-path path dir) =>
rest)))] (lambda (m)
[else (build-path path url-path)]))) (let* ([url-dir (cadr m)]
[rest (caddr m)]
;; do-search : ((? -> ?) [dir
;; ?? (cond
;; boolean [(string=? ".." url-dir) 'up]
;; boolean [(string=? "." url-dir) 'same]
;; ?? [(string=? "" url-dir) 'same]
;; (-> A) ;; doesn't return [else url-dir])])
;; (?? -> ??) (loop (build-path path dir)
;; (?? -> ??) rest)))]
;; (?? ?? ?? ?? ?? ?? -> ??) [else (build-path path url-path)])))
;; ->
;; (union string #f)) ; do-search : ((? -> ?)
(define (do-search given-find search-level regexp? exact? ckey maxxed-out ; ??
add-doc-section add-kind-section add-choice) ; boolean
; When new docs are installed, the directory's modification date changes: ; boolean
(unless (eq? doc-collection-date 'none) ; ??
(when (or (not doc-collection-date) ; (-> A) ; doesn't return
(> (file-or-directory-modify-seconds (collection-path "doc")) ; (?? -> ??)
doc-collection-date)) ; (?? -> ??)
(reset-doc-lists))) ; (?? ?? ?? ?? ?? ?? -> ??)
(let* ([hit-count 0] ; ->
[string-finds (list given-find)] ; (union string #f))
[finds (cond (define (do-search given-find search-level regexp? exact? ckey maxxed-out
[exact? (list given-find)] add-doc-section add-kind-section add-choice)
[regexp? (list (regexp given-find))] ; When new docs are installed, the directory's modification date changes:
[else (let ([wl (split-words given-find)]) (unless (eq? doc-collection-date 'none)
(set! string-finds wl) (when (or (not doc-collection-date)
(map regexp (map non-regexp wl)))])]) (> (file-or-directory-modify-seconds (collection-path "doc"))
(for-each doc-collection-date))
(lambda (doc doc-name doc-kind) (reset-doc-lists)))
(define found-one #f) (let* ([hit-count 0]
(define (found kind) [string-finds (list given-find)]
(unless found-one [finds (cond
(add-doc-section doc-name ckey)) [exact? (list given-find)]
(unless (equal? found-one kind) [regexp? (list (regexp given-find))]
(set! found-one kind) [else (let ([wl (split-words given-find)])
(add-kind-section kind ckey)) (set! string-finds wl)
(set! hit-count (add1 hit-count)) (map regexp (map non-regexp wl)))])])
(unless (< hit-count MAX-HIT-COUNT) (for-each
(maxxed-out))) (lambda (doc doc-name doc-kind)
(define found-one #f)
;; Keyword search (define (found kind)
(let ([keys (case doc-kind (unless found-one
[(html) (load-html-keywords doc)] (add-doc-section doc-name ckey))
[(text) (load-txt-keywords doc)] (unless (equal? found-one kind)
[else null])] (set! found-one kind)
[add-key-choice (lambda (v) (add-kind-section kind ckey))
(found "keyword entries") (set! hit-count (add1 hit-count))
(add-choice (unless (< hit-count MAX-HIT-COUNT)
(car v) ; key (maxxed-out)))
(cadr v) ; display
(list-ref v 4) ; title ; Keyword search
(if (eq? 'text doc-kind) (let ([keys (case doc-kind
(apply build-path doc) [(html) (load-html-keywords doc)]
(build-path doc (list-ref v 2))) ; file [(text) (load-txt-keywords doc)]
(list-ref v 3) ; label [else null])]
ckey))]) [add-key-choice (lambda (v)
(found "keyword entries")
(unless regexp? (add-choice
(for-each (car v) ; key
(lambda (v) (cadr v) ; display
(when (string=? given-find (car v)) (list-ref v 4) ; title
(add-key-choice v))) (if (eq? 'text doc-kind)
keys)) (apply build-path doc)
(unless (or exact? (null? finds)) (build-path doc (list-ref v 2))) ; file
(for-each (list-ref v 3) ; label
(lambda (v) ckey))])
(when (andmap (lambda (find) (regexp-match find (car v))) finds)
(unless (and (not regexp?) (string=? given-find (car v))) (unless regexp?
(add-key-choice v)))) (for-each
keys))) (lambda (v)
;; Index search (when (string=? given-find (car v))
(unless (< search-level 1) (add-key-choice v)))
(let ([index (case doc-kind keys))
[(html) (load-html-index doc)] (unless (or exact? (null? finds))
[(text) (load-txt-index doc)] (for-each
[else null])] (lambda (v)
[add-index-choice (lambda (name desc) (when (andmap (lambda (find) (regexp-match find (car v))) finds)
(case doc-kind (unless (and (not regexp?) (string=? given-find (car v)))
[(html) (add-key-choice v))))
(found "index entries") keys)))
(add-choice "" name ; Index search
(list-ref desc 2) (unless (< search-level 1)
(combine-path/url-path doc (list-ref desc 0)) (let ([index (case doc-kind
(list-ref desc 1) [(html) (load-html-index doc)]
ckey)] [(text) (load-txt-index doc)]
[(text) [else null])]
(found "index entries") [add-index-choice (lambda (name desc)
(add-choice "" name (case doc-kind
"indexed content" [(html)
(apply build-path doc) (found "index entries")
desc (add-choice "" name
ckey)]))]) (list-ref desc 2)
(when index (combine-path/url-path doc (list-ref desc 0))
(unless regexp? (list-ref desc 1)
(for-each ckey)]
(lambda (v) [(text)
(when (string=? given-find (car v)) (found "index entries")
(add-index-choice (car v) (cdr v)))) (add-choice "" name
index)) "indexed content"
(unless (or exact? (null? finds)) (apply build-path doc)
(for-each desc
(lambda (v) ckey)]))])
(when (andmap (lambda (find) (regexp-match find (car v))) finds) (when index
(unless (and (not regexp?) (string=? given-find (car v))) (unless regexp?
(add-index-choice (car v) (cdr v))))) (for-each
index))))) (lambda (v)
;; Content Search (when (string=? given-find (car v))
(unless (or (< search-level 2) exact? (null? finds)) (add-index-choice (car v) (cdr v))))
(let ([files (case doc-kind index))
[(html) (with-handlers ([not-break? (lambda (x) null)]) (unless (or exact? (null? finds))
(map (lambda (x) (build-path doc x)) (for-each
(filter (lambda (v)
(lambda (x) (file-exists? (build-path doc x))) (when (andmap (lambda (find) (regexp-match find (car v))) finds)
(directory-list doc))))] (unless (and (not regexp?) (string=? given-find (car v)))
[(text) (list (apply build-path doc))] (add-index-choice (car v) (cdr v)))))
[else null])]) index)))))
(for-each ; Content Search
(lambda (f) (unless (or (< search-level 2) exact? (null? finds))
(with-handlers ([not-break? (lambda (x) #f)]) (let ([files (case doc-kind
(with-input-from-file f [(html) (with-handlers ([not-break? (lambda (x) null)])
(lambda () (map (lambda (x) (build-path doc x))
(let loop () (filter
(let ([pos (file-position (current-input-port))] (lambda (x) (file-exists? (build-path doc x)))
[r (read-line)]) (directory-list doc))))]
(unless (eof-object? r) [(text) (list (apply build-path doc))]
(let ([m (andmap (lambda (find) (regexp-match find r)) finds)]) [else null])])
(when m (for-each
(found "text") (lambda (f)
(add-choice (car m) (with-handlers ([not-break? (lambda (x) #f)])
; Strip leading space and clean HTML (with-input-from-file f
(regexp-replace (lambda ()
"^ [ ]*" (let loop ()
(if (eq? doc-kind 'html) (let ([pos (file-position (current-input-port))]
(clean-html r) [r (read-line)])
r) (unless (eof-object? r)
"") (let ([m (andmap (lambda (find) (regexp-match find r)) finds)])
"content" (when m
f (found "text")
(if (eq? doc-kind 'text) pos "NO TAG") (add-choice (car m)
ckey))) ; Strip leading space and clean HTML
(loop)))))))) (regexp-replace
files)))) "^ [ ]*"
docs doc-names doc-kinds) (if (eq? doc-kind 'html)
(if (= 0 hit-count) (clean-html r)
(apply r)
string-append "")
"Nothing found for " "content"
(cond f
[(null? string-finds) (list "the empty search.")] (if (eq? doc-kind 'text) pos "NO TAG")
[else ckey)))
(append (loop))))))))
(cons (format "\"~a\"" (car string-finds)) files))))
(map (lambda (i) (format " and \"~a\"" i)) docs doc-names doc-kinds)
(cdr string-finds))) (if (= 0 hit-count)
(list "."))])) (apply
#f)))) string-append
"Nothing found for "
(cond
[(null? string-finds) (list "the empty search.")]
[else
(append
(cons (format "\"~a\"" (car string-finds))
(map (lambda (i) (format " and \"~a\"" i))
(cdr string-finds)))
(list "."))]))
#f))))))