X-Git-Url: https://git.donarmstrong.com/?a=blobdiff_plain;f=scm%2Fencoding.scm;h=9a441ac8816aa8ce1a58a4e84f9823b60fbb66e8;hb=c74bf739ec32b015c711c460aa831092a08478b3;hp=09ed12a368f16e5dc1ec42ce4dde9e93545fb942;hpb=9b7d53f2929f6ac0b4f3cfc488f0a58e758c5090;p=lilypond.git diff --git a/scm/encoding.scm b/scm/encoding.scm index 09ed12a368..9a441ac881 100644 --- a/scm/encoding.scm +++ b/scm/encoding.scm @@ -1,122 +1,60 @@ ;;;; encoding.scm -- font encoding ;;;; ;;;; source file of the GNU LilyPond music typesetter -;;;; -;;;; (c) 2004 Jan Nieuwenhuizen - -;; WIP -;; cp /usr/share/texmf/dvips/base/*.enc mf/out -;; cp /usr/share/texmf/dvips/tetex/*.enc mf/out -;; encoding.ly: -;; #(display (reencode-string "adobe" "latin1" "hellö fóebär")) -;; - - -(define (read-encoding-file filename) - "Read .enc file, returning a vector of symbols." - (let* ((raw (ly:gulp-file filename)) - (string (regexp-substitute/global #f "%[^\n]*" raw 'pre "" 'post)) - (start (string-index string #\[)) - (end (string-index string #\])) - (ps-lst (string-tokenize (substring string (+ start 1) end))) - (lst (map (lambda (x) (substring x 1)) ps-lst)) - (vector (list->vector lst))) - - vector)) - -(define (make-encoding-table encoding-vector) - "Return a hash table mapping names to chars. ENCODING-VECTOR is a -vector of symbols." - - (let* ((h (make-hash-table 256))) - - (for-each - (lambda (i) - (hash-set! h (vector-ref encoding-vector i) - (integer->char i))) - (iota 256)) - - h)) - -(define-public (reencode-string permutation str) - "Apply PERMUTATION, a vector of [0..256) -> char, to STR" - (string-map (lambda (chr) - (vector-ref permutation (char->integer chr))) - str)) - -(define-public (encoding-permutation input-encoding - output-encoding) - - "Contruct a permutation by applying output-encoding after input-encoding " - (list->vector - (map - (lambda (chr) - (let* - ((new-char (hash-ref output-encoding - (vector-ref input-encoding (char->integer chr)) #f))) - - ;; substitute space for unknown characters. - (if (char? new-char) - new-char - #\ ))) - (iota 256)))) - - -(define (get-coding-from-file filename) - "Read FILENAME, return a list containing encoding vector and table" - - (let* - ((vec (read-encoding-file filename)) - (tab (make-encoding-table vec))) - (list vec tab))) - -;; coding-alist maps NAME -> (list VECTOR TAB) -(define coding-alist - - (map (lambda (x) - (cons (car x) - (delay (get-coding-from-file (cdr x))))) - - '( - ;; teTeX - ("TeX typewriter text" . "09fbbfac.enc") ;; cmtt10 - ("TeX math symbols" . "10037936.enc") ;; cmbsy - ("ASCII caps and digits" . "1b6d048e.enc") ;; cminch - ("TeX math italic" . "aae443f0.enc") ;; cmmi10 - ("TeX extended ASCII" . "d9b29452.enc") - ("TeX text" . "f7b6d320.enc") - ("TeX text without f-ligatures" . "0ef0afca.enc") - ("Extended TeX Font Encoding - Latin" . "tex256.enc") - - ("T1" . "tex256.enc") - - ;; for testing -- almost adome - ("adobe" . "ad.enc") - ("latin1" . "cork.enc") - - ;; LilyPond. - ("feta braces" . "feta-braces0.enc") - ("feta number" . "feta-nummer10.enc") - ("feta music" . "feta20.enc") - ("parmesan music" . "parmesan20.enc")) - )) - -(define (get-coding coding-name) - (force (assoc-get coding-name coding-alist ))) - -(define (get-coding-vector coding-name) - (car (get-coding coding-name))) - -(define (get-coding-table coding-name) - (cadr (get-coding coding-name))) - - -;;; what's this for? --hwn -(define-public (encoded-index font-coding input-coding code) - (format (current-error-port) "CODE: ~S\n" code) - (let* ((font (get-coding-table font-coding)) - (in (get-coding-vector input-coding)) - (char (vector-ref in code))) - (format (current-error-port) "CHAR: ~S\n" char) - (hash-ref font char))) - +;;;; +;;;; (c) 2004--2009 Jan Nieuwenhuizen + +(define-public latin1-coding-vector + #(.notdef .notdef .notdef .notdef .notdef .notdef .notdef .notdef + .notdef .notdef .notdef .notdef .notdef .notdef .notdef .notdef + .notdef .notdef .notdef .notdef .notdef .notdef .notdef .notdef + .notdef .notdef .notdef .notdef .notdef .notdef .notdef .notdef + %% 0x20 + space exclam quotedbl numbersign dollar percent ampersand quoteright + parenleft parenright asterisk plus comma hyphen period slash + zero one two three four five six seven + eight nine colon semicolon less equal greater question + %% 0x40 + at A B C D E F G + H I J K L M N O + P Q R S T U V W + X Y Z bracketleft backslash bracketright asciicircum underscore + %% 0x60 + `quoteleft a b c d e f g + h i j k l m n o + p q r s t u v w + x y z braceleft bar braceright asciitilde .notdef + %% 0x80 + .notdef .notdef .notdef .notdef .notdef .notdef .notdef .notdef + .notdef .notdef .notdef .notdef .notdef .notdef .notdef .notdef + dotlessi grave acute circumflex tilde macron breve dotaccent + dieresis .notdef ring cedilla .notdef hungarumlaut ogonek caron + %% 0xA0 + space exclamdown cent sterling currency yen brokenbar section + dieresis copyright ordfeminine guillemotleft logicalnot hyphen registered macron + degree plusminus twosuperior threesuperior acute mu paragraph periodcentered + cedilla onesuperior ordmasculine guillemotright onequarter onehalf threequarters questiondown + %% 0xC0 + Agrave Aacute Acircumflex Atilde Adieresis Aring AE Ccedilla + Egrave Eacute Ecircumflex Edieresis Igrave Iacute Icircumflex Idieresis + Eth Ntilde Ograve Oacute Ocircumflex Otilde Odieresis multiply + Oslash Ugrave Uacute Ucircumflex Udieresis Yacute Thorn germandbls + %% 0xE0 + agrave aacute acircumflex atilde adieresis aring ae ccedilla + egrave eacute ecircumflex edieresis igrave iacute icircumflex idieresis + eth ntilde ograve oacute ocircumflex otilde odieresis divide + oslash ugrave uacute ucircumflex udieresis yacute thorn ydieresis)) + + +(define-public (decode-byte-string str) + "Return vector of glyphname symbols that correspond to string, +assuming that STR is byte-coded using ENCODING-NAME." + + (let* ((len (string-length str)) + (output-vector (make-vector len '.notdef))) + (do + ((idx 0 (1+ idx))) + ((>= idx len) output-vector) + (vector-set! output-vector idx + (vector-ref latin1-coding-vector + (char->integer (string-ref str idx)))))))