Changed BibTeX parser to recognize any sequence of words starting with a lower case letter as the "von"-like part of the author name

This commit is contained in:
Georges Dupéron 2017-05-18 11:45:40 +02:00
parent d34569cebe
commit 05f85e8463

View File

@ -225,8 +225,9 @@
(author-name (trim one) (trim two) #:suffix (trim suffix))] (author-name (trim one) (trim two) #:suffix (trim suffix))]
[(pregexp #px"^(.*),(.*)$" (list _ two one)) [(pregexp #px"^(.*),(.*)$" (list _ two one))
(author-name (string-trim one) (string-trim two))] (author-name (string-trim one) (string-trim two))]
[(pregexp #px"^(.*) (von|de la|van der) (.*)$" (list _ one von-like two)) [(pregexp #px"^(.*?)\\s+(\\p{Ll}[^\\s]*(\\s+\\p{Ll}[^\\s]*)*)\\s+(.*)$" (list _ one von-like _ two))
(author-name (string-trim one) (string-append von-like " " (string-trim two)))] (author-name (string-trim one)
(string-append (string-trim von-like) " " (string-trim two)))]
[space-separated [space-separated
(match (regexp-split #px"\\s+" space-separated) (match (regexp-split #px"\\s+" space-separated)
[(list one) (org-author-name one)] [(list one) (org-author-name one)]
@ -380,6 +381,24 @@
(authors (authors
(author-name "James Jack" "van der Earl Jones"))) (author-name "James Jack" "van der Earl Jones")))
(check
print-as-equal-string?
(parse-author "James Jack von de la Earl Jones")
(authors
(author-name "James Jack" "von de la Earl Jones")))
(check
print-as-equal-string?
(parse-author "James Jack di Earl Jones")
(authors
(author-name "James Jack" "di Earl Jones")))
(check
print-as-equal-string?
(parse-author "First fOn bER Last")
(authors
(author-name "First" "fOn bER Last")))
(check (check
print-as-equal-string? print-as-equal-string?
(parse-author "Deci, Edward L. and Robert J. Vallerand and Pelletier, Luc G. and Ryan, Jr, Richard M.") (parse-author "Deci, Edward L. and Robert J. Vallerand and Pelletier, Luc G. and Ryan, Jr, Richard M.")