From: ntakahas Date: Thu, 12 Jul 2007 12:04:10 +0000 (+0000) Subject: Rewritten with new algorithm. X-Git-Tag: REL-1-4-0~6 X-Git-Url: http://git.chise.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=32669b01fd7792108453e33e39b172bd795e771e;p=m17n%2Fm17n-db.git Rewritten with new algorithm. --- diff --git a/FLT/KNDA-OTF.flt b/FLT/KNDA-OTF.flt index b4fe1be..2eab1e8 100644 --- a/FLT/KNDA-OTF.flt +++ b/FLT/KNDA-OTF.flt @@ -30,131 +30,133 @@ (font (nil nil unicode-bmp :otf=knda=rphf))) (category - ;; C: general consonant + ;; C: consonant (except for RA) ;; R: RA + ;; n: NUKTA ;; H: HALANT - ;; u: MATRA (above) - ;; b: MATRA (below) - ;; p: MATRA (post) - ;; t: MATRA (two-part) - ;; T: MATRA (three-part) + ;; u: vowel sign (above) + ;; b: vowel sign (below) + ;; p: vowel sign (post) + ;; l: length mark ;; a: vowel modifier (post) ;; V: independent vowel ;; N: ZWNJ (ZERO WIDTH NON-JOINER) ;; J: ZWJ (ZERO WIDTH JOINER) - ;; E: ELSE - ;; - (0x200C ?N) ; ZWNJ - (0x200D ?J) ; ZWJ - (0x0964 ?E) ; DANDA - (0x0965 ?E) ; DOUBLE DANDA - (0x0C80 0x0CFF ?E) ; ELSE - (0x0C82 0x0C83 ?a) ; SIGN ANUSVARA, VISARGA + ;; X: generic + (0x0C80 0x0CFF ?X) ; generic + (0x0C82 0x0C83 ?a) ; SIGN ANUSVARA .. VISARGA (0x0C85 0x0C94 ?V) ; LETTER A .. LETTER AU (0x0C95 0x0CB9 ?C) ; LETTER KA .. LETTER HA (0x0CB0 ?R) ; LETTER RA (0x0CBC ?n) ; SIGN NUKTA - (0x0CBE ?p) ; VOWEL SIGN AA (post) - (0x0CBF ?u) ; VOWEL SIGN I (above) - (0x0CC0 ?t) ; VOWEL SIGN II (two-part) - (0x0CC1 0x0CC4 ?p) ; VOWEL SIGN U, UU, R, RR (post) - (0x0CC6 ?u) ; VOWEL SIGN E (above) - (0x0CC7 0x0CCA ?t) ; VOWEL SIGN EE, AI, O (two-part) - (0x0CCB ?T) ; VOWEL SIGN OO (three-part) - (0x0CCC ?u) ; VOWEL SIGN AU (above) - (0x0CCD ?H) ; SIGN VIRAMA (HALANT) - (0x0CD5 0x0CD6 ?l) ; LENGTH MARK (length post) + (0x0CBE ?p) ; VOWEL SIGN AA + (0x0CBF ?u) ; VOWEL SIGN I + (0x0CC1 0x0CC4 ?p) ; VOWEL SIGN U .. RR + (0x0CC6 ?u) ; VOWEL SIGN E + (0x0CCC ?u) ; VOWEL SIGN AU + (0x0CCD ?H) ; SIGN VIRAMA + (0x0CD5 0x0CD6 ?l) ; LENGTH MARK .. AI LENGTH MARK (0x0CDE ?C) ; LETTER FA (LLLA) - (0x0CE0 0x0CE1 ?V) ; LETTER VOCALIC RR, LL - (0x0CE2 0x0CE3 ?b) ; VOWEL SIGN VOCALIC L, LL - (0x0CFD ?Z) ; internal use - (0x0CFE ?Y) ; internal use - (0x0CFF ?X) ; internal use + (0x0CE0 0x0CE1 ?V) ; LETTER VOCALIC RR .. LL + (0x0CE2 0x0CE3 ?b) ; VOWEL SIGN VOCALIC L .. LL + (0x0964 0x0965 ?X) ; DANDA .. DOUBLE DANDA + (0x200C ?N) ; ZWNJ + (0x200D ?J) ; ZWJ ) -;; Step 1 : Syllable identification and Halant movement. +;; Preprocessing (generator (0 (cond - ;; A syllable containing a three-part vowel sign. - ("([CR]J?n?(H[CR]n?)*)(T)(a)?" - < | (1 move-base-Halant) (3 0x0CC6 0x0CC2 0x0CD5) (4 =) | >) - - ;; A syllable containing a two-part vowel sign. - ("([CR]J?n?(H[CR]n?)*)(t)(a)?" - < | (1 move-base-Halant) (3 two-part) (4 =) | >) - - ;; A syllable ending with vowel signs and/or a vowel modifier. - ("([CR]J?n?(H[CR]n?)*)([ubpl]+a?|a)" - < | (1 move-base-Halant) (3 = *) | >) + ;; Decompose two-part and three-part vowels + ((0x0CC0) + 0x0CBF 0x0CD5) + ((0x0CC7) + 0x0CC6 0x0CD5) + ((0x0CC8) + 0x0CC6 0x0CD6) + ((0x0CCA) + 0x0CC6 0x0CC2) + ((0x0CCB) + 0x0CC6 0x0CC2 0x0CD5) + ;; Move ZWJ between RA and HARANT. + ("(R)(J)(H)" + (2 =) (1 =) (3 =)) + ("." =)) + *)) - ;; Forced Halant form. - ("([CR]n?H)N" - < | (1 move-base-Halant) | >) +;; Syllable identification. +;; Apply 'nukt' and 'akhn' before reordering. - ;; A syllable without a vowel sign nor a vowel modifier. - ("[CR]J?n?(H[CR]n?)*H?" - < | move-base-Halant | >) +(generator + (0 + (cond + ;; A syllable with an above vowel sign. + ;;1 2 3 4 + ("(J)?([CR]n?(H[CR]n?)*)(up?l?a?)" + < | (1 =) (2 otf:knda=nukt,akhn+) (4 = *) | >) + + ;; A syllable with a post- or below vowel sign. + ;;1 2 3 4 5 + ("(J)?([CR]n?(H[CR]n?)*)(p|b)(a)?" + < | (1 =) (2 otf:knda=nukt,akhn+) (4 =) (5 =) | >) + + ;; A syllable with a vowel modifier, but without vowel signs. + ;;1 2 3 4 + ("(J)?([CR]n?(H[CR]n?)*)(a)" + < | (1 =) (2 otf:knda=nukt,akhn+) (4 =) | >) + + ;; No vowel signs, no vowel modifiers. + ;;1 2 3 4 + ("(J)?([CR]n?(H[CR]n?)*)(H|HN)?" + < | (1 =) (2 otf:knda=nukt,akhn+) (4 = *) | >) ;; A syllable starting with an independent vowel. ("Va?" - < | = * | > ) + < | = * | >) ("." =)) - *) - - ;; Move Halant on the base consonant to the tail if the syllable ends - ;; with a consonant. - ;; A leading 0x0CFF means Halant movement. - ;; A leading 0x0CFE means a syllable ending with a Halant. - ;; A leading 0x0CFD means Halant & Reph movements. - (move-base-Halant - (cond - (".*H$" - 0x0CFE = *) - ("(RH)([CR]n?)$" - 0x0CFD (2 = *) (1 = =)) - ("(RH)([CR]n?)(H)(.*)" - 0x0CFD (2 = *) (4 = *) (3 =) (1 = =)) - ("(R)J(H)(.*)" - 0x0CFF (1 =) (3 = *) (2 =)) - ("(Cn?)(H)(.*)" - 0x0CFF (1 = *) (3 = *) (2 =)) - (".*" - = *))) - - ;; Divide a two-part Matra into elements. - (two-part - (cond - ((0x0CC0) 0x0CBF 0x0CD5) - ((0x0CC7) 0x0CC6 0x0CD5) - ((0x0CC8) 0x0CC6 0x0CD6) - ((0x0CCA) 0x0CC6 0x0CC2))) - ) + *)) -;; Step 2 : Move Matra if applicable. -;; The base consonant in a Halant-ending syllable is changed into Halant form. +;; Reordering. The base consonant is always the first one, because +;; all Kannada consonants have a below form. (generator (0 (cond - ;; 1 2 3 4 5 6 7 8 - (" Z([CR]n?)([CRnH]*)(RH)(u)?(b)?(p)?(l*)(a)? " - | (1 = *) (4 =) (5 =) (6 =) (2 = *) (7 = *) (3 otf:knda=rphf) (8 =) |) - ;; 1 2 3 4 5 6 7 - (" X([CR]n?)([CRnH]*)(u)?(b)?(p)?(l*)(a)? " - | (1 = *) (3 =) (4 =) (5 =) (2 = *) (6 = *) (7 =) |) - (" Y([CR]n?H)([^ ]*) " - ;; Kedage-n.ttf lacks the haln feature, so "otf:knda=haln" does not work. - | (1 otf:knda=~rphf,~blwf,*) (2 = *) |) + ;; 1 2 34 5 6 7 8 + (" (RH)?(.)((H.)*)(u|b)?(p)?(l)?(a)? " + | (2 =) (5 =) (6 =) (3 move-h) (7 =) (1 otf:knda=rphf+) (8 =) |) + + ;; A syllable ending with a halant. + ;; 1 2 34 + (" (RH)?(.H)((.H)*)N? " + ;; WORKAROUND : Kedage fonts produce halant form with 'psts'. + | (2 otf:knda=haln,psts+)(3 = *) (1 otf:knda=rphf+) |) + + ;; No reph movement if preceded by a ZWJ. + ;; 1 23 4 5 6 + (" J(.)((H.)*)(u|b)?(p)?(l?a?) " + | (1 =) (4 =) (5 =) (2 move-h) (6 = *) |) + + ;; 1 23 + (" J(.H)((.H)*)N? " + | (1 otf:knda=haln,psts+) (2 = *) |) + ("." =)) - *)) + *) -;; Step 3 : Drive OTF tables. + (move-h + (cond + ("(H)(.+)" + (2 = *) (1 =))))) + +;; Apply other OTF features. (generator (0 (cond - (" ([^ ]*) " - (1 otf:knda=~rphf,*)) + (" ([^ ]+) " + (1 otf:knda=blwf,abvs,blws,psts)) + ("." [ otf:knda=+ ])) *))