File: //usr/share/m17n/th-pattachote.mim
;; th-pattachote.mim -- Thai input method with Pattachote keyboard layout
;; Copyright (C) 2006, 2007, 2008, 2009
;;   National Institute of Advanced Industrial Science and Technology (AIST)
;;   Registration Number H15PRO112
;; This file is part of the m17n database; a sub-part of the m17n
;; library.
;; The m17n library is free software; you can redistribute it and/or
;; modify it under the terms of the GNU Lesser General Public License
;; as published by the Free Software Foundation; either version 2.1 of
;; the License, or (at your option) any later version.
;; The m17n library is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
;; Lesser General Public License for more details.
;; You should have received a copy of the GNU Lesser General Public
;; License along with the m17n library; if not, write to the Free
;; Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
;; 02110-1301, USA.
(input-method th pattachote)
(description "Thai input method simulating the Pattachote keyboard
with WTT 2.0 input sequence correction.
The correction algorithm follows the one shown in the following 
  <http://linux.thai.net/~thep/th-xim/>
")
(title "ท")
(variable
 (level (_"Acceptance level
The level of character sequence acceptance defined in WTT 2.0.
0 accepts any key sequence.  2 accepts only orthographic ones.
1 is somewhere between.")
	1 0 1 2))
(include (th kesmanee) macro)
(map
 (map
  ("!" "+")
  ("\"" "ฑ")
  ("#" "/")
  ("$" ",")
  ("%" "?")
  ("&" "_")
  ("'" "ข")
  ("(" "(")
  (")" ")")
  ("*" ".")
  ("+" "%")
  ("," "ะ")
  ("-" "๑")
  ("." "จ")
  ("/" "พ")
  ("0" "๐")
  ("1" "=")
  ("2" "๒")
  ("3" "๓")
  ("4" "๔")
  ("5" "๕")
  ("6" "ู")
  ("7" "๗")
  ("8" "๘")
  ("9" "๙")
  (":" "ฆ")
  (";" "ไ")
  ("<" "ฟ")
  ("=" "๖")
  (">" "ฉ")
  ("?" "ฬ")
  ("@" "\"")
  ("A" "๋")
  ("B" "ฺ")
  ("C" "ฐ")
  ("D" "ำ")
  ("E" "ๆ")
  ("F" "ณ")
  ("G" "์")
  ("H" "ื")
  ("I" "ซ")
  ("J" "ผ")
  ("K" "ช")
  ("L" "โ")
  ("M" "ฮ")
  ("N" "ศ")
  ("O" "ถ")
  ("P" "ฒ")
  ("Q" "๊")
  ("R" "ญ")
  ("S" "ธ")
  ("T" "ษ")
  ("U" "ฝ")
  ("V" "ภ")
  ("W" "ฤ")
  ("X" "ฏ")
  ("Y" "ึ")
  ("Z" "ฎ")
  ("[" "ใ")
  ("\\" "ๅ")
  ("]" "ฌ")
  ("^" "ุ")
  ("_" "-")
  ("`" "_")
  ("a" "้")
  ("b" "ิ")
  ("c" "ล")
  ("d" "ง")
  ("e" "ย")
  ("f" "ก")
  ("g" "ั")
  ("h" "ี")
  ("i" "ม")
  ("j" "า")
  ("k" "น")
  ("l" "เ")
  ("m" "ส")
  ("n" "ค")
  ("o" "ว")
  ("p" "แ")
  ("q" "็")
  ("r" "อ")
  ("s" "ท")
  ("t" "ร")
  ("u" "ด")
  ("v" "ห")
  ("w" "ต")
  ("x" "ป")
  ("y" "่")
  ("z" "บ")
  ("{" "ฯ")
  ("|" "ํ")
  ("}" "ฦ")
  ("~" "฿")))
(state
 (init
  (map
   (delete @<)
   (pushback 1)
   (shift main)))
 
 (main
  (map
   (set x @-3)
   (set y @-2)
   (set z @-1)
   (set arg1 y)
   (set arg2 z)
   (cp)
   (cond
    ((= ret 1)) ;; CP(y,z) succeeded.
    (1
     (ac)
     (cond
      ((= ret 1)) ;; AC(y,z) succeeded.
      (1
       ;; WTT-based input sequence correction starts here.
       ;; begin
       ;; if CP(x,z) then
       (set arg1 x)
       (set arg2 z)
       (cp)
       (cond
	((= ret 1)
	 ;; if CP(z,y) then
	 (set arg1 z)
	 (set arg2 y)
	 (cp)
	 (cond
	  ((= ret 1)
	   ;; reorder(y -> zy)
	   (delete @-2)
	   (insert z)
	   (insert y))
	  ;; elif CP(x,y) then
	  (1
	   (set arg1 x)
	   (set arg2 y)
	   (cp)
	   (cond
	    ((= ret 1)
	     ;; replace(y -> z)
	     (delete @-2)
	     (insert z))
	    ;; elif y is FV1 and z is TONE then
	    ((& (| (= y 0x0E30) (= y 0x0E32) (= y 0x0E33))
		(>= z 0x0E48)
		(<= z 0x0E4B))
	     ;; reorder(y -> zy)
	     (delete @-2)
	     (insert z)
	     (insert y))
	    ;; else
	    ;; reject(z)
	    (1
	     (delete @-1))
	    ;;endif
	    ))))
	;; elif AC(x,z) then
	(1
	 (set arg1 x)
	 (set arg2 z)
	 (ac)
	 (cond
	  ((& (= ret 1)
	      ;; Only Thai characters should be replaced.
	      (& (>= y 0x0E01) (<= y 0x0E5B))
	      (& (>= z 0x0E01) (<= z 0x0E5B)))
	   ;; replace(y -> z)
	   (delete @-2)
	   (insert z))
	  ;; else
	  ;; reject(z)
	  (1
	   (delete @-1))
	  ;; endif
	  )))
       ;; end
       ))))
   ;; Now we commit the preedit chars that are fixed.
   (set w @-1)
   (cond
    ;; If surrounding text is supported, commit the only char in preedit.
    ((> @-0 -2)
     (commit))
    ;; If the last char is CTRL or NON, we can commit everything.
    ((| (& (>= w 0x0000) (<= w 0x0E00))
	(= w 0x0E2F)
	(= w 0x0E3F)
	(= w 0x0E46)
	(>= w 0x0E4F))
     (commit))
    ;; If the last char is CONS, we can commit everything but the last
    ;; unless the second last is FV3.
    ((| (& (>= w 0x0E01) (<= w 0x0E23))
	(= w 0x0E25)
	(& (>= w 0x0E27) (<= w 0x0E2E)))
     (cond
      ((| (= @-2 0x0E24) (= @-2 0x0E26))
       ; not commit yet
       )
      (1
       (delete @-1)
       (commit)
       (insert w))))
    ;; If the last char is LV, FV2 or FV3, we can commit
    ;; everything but the last.
    ((| (& (>= w 0x0E40) (<= w 0x0E45))
	(= w 0x0E24)
	(= w 0x0E26))
     (delete @-1)
     (commit)
     (insert w))
    ;; If the last char is FV1 (excluding AM) and ...
    ((| (= w 0x0E30) (= w 0x0E32))
     (delete @-1)
     (set v @-1)
     (cond
      ;; ... the before last is CONS, we can commit other than the
      ;; last two.
      ((| (& (>= v 0x0E01) (<= v 0x0E23))
	  (= v 0x0E25)
	  (& (>= v 0x0E27) (<= v 0x0E2E)))
       (delete @-1)
       (commit)
       (insert v)
       (insert w))
      ;; ... else if the before last is not CONS, we can commit
      ;; everything but the last.
      (1
       (commit)
       (insert w))))
    ))))
;; Local Variables:
;; coding: utf-8
;; mode: emacs-lisp
;; End: