From: Kenichi Handa Date: Fri, 25 Aug 2000 01:47:27 +0000 (+0000) Subject: Renamed from skkdic-utl.el. X-Git-Tag: emacs-pretest-21.0.90~1983 X-Git-Url: http://git.eshelyaron.com/gitweb/?a=commitdiff_plain;h=383a3ccf9fa4f5a69f421de38e0c7731c8569c5d;p=emacs.git Renamed from skkdic-utl.el. Provide ja-dic-utl instead of skkdic-utl. (skkdic-lookup-key): Load ja-dic/ja-dic, not skkdic/skkdic. --- diff --git a/lisp/international/ja-dic-utl.el b/lisp/international/ja-dic-utl.el new file mode 100644 index 00000000000..8c5cd8dde44 --- /dev/null +++ b/lisp/international/ja-dic-utl.el @@ -0,0 +1,216 @@ +;;; ja-dic-utl.el --- Utilities for handling Japanese dictionary (SKK-JISYO.L) + +;; Copyright (C) 1995, 2000 Electrotechnical Laboratory, JAPAN. +;; Licensed to the Free Software Foundation. + +;; Keywords: mule, multilingual, Japanese + +;; This file is part of GNU Emacs. + +;; GNU Emacs is free software; you can redistribute it and/or modify +;; it under the terms of the GNU General Public License as published by +;; the Free Software Foundation; either version 2, or (at your option) +;; any later version. + +;; GNU Emacs is distributed in the hope that it will be useful, +;; but WITHOUT ANY WARRANTY; without even the implied warranty of +;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +;; GNU General Public License for more details. + +;; You should have received a copy of the GNU General Public License +;; along with GNU Emacs; see the file COPYING. If not, write to the +;; Free Software Foundation, Inc., 59 Temple Place - Suite 330, +;; Boston, MA 02111-1307, USA. + +;;; Commentary: + +;; This file provides a generic function to look up a Japanese +;; dictionary of SKK format. +;; +;; SKK is a free Japanese input method running on Mule created by +;; Masahiko Sato . The Emacs Lisp +;; library kkc.el provides a facility to convert a Japanese kana +;; string to a kanji-kana-mixed string by using SKK's dictionary. +;; +;; The original SKK dictionary SKK-JISYO.L is converted to ja-dic.el +;; by ja-dic-cnv.el. We get entries of the dictionary in four +;; variables (listed below) by loading that file (or byte-compiled +;; version ja-dic.elc). + +;;; Code: + +;; The following four variables are set by loading ja-dic.el[c]. +(defvar skkdic-okuri-ari nil + "Nested alist for OKURI-ARI entries of SKK dictionary.") + +(defvar skkdic-postfix nil + "Nested alist for SETSUBIJI (postfix) entries of SKK dictionary.") + +(defvar skkdic-prefix nil + "Nested alist SETTOUJI (prefix) entries of SKK dictionary.") + +(defvar skkdic-okuri-nasi nil + "Nested alist for OKURI-NASI entries of SKK dictionary.") + +(defconst skkdic-okurigana-table + '((?ぁ . ?a) (?あ . ?a) (?ぃ . ?i) (?い . ?i) (?ぅ . ?u) + (?う . ?u) (?ぇ . ?e) (?え . ?e) (?ぉ . ?o) (?お . ?o) + (?か . ?k) (?が . ?g) (?き . ?k) (?ぎ . ?g) (?く . ?k) + (?ぐ . ?g) (?け . ?k) (?げ . ?g) (?こ . ?k) (?ご . ?g) + (?さ . ?s) (?ざ . ?z) (?し . ?s) (?じ . ?j) (?す . ?s) + (?ず . ?z) (?せ . ?s) (?ぜ . ?z) (?そ . ?s) (?ぞ . ?z) + (?た . ?t) (?だ . ?d) (?ち . ?t) (?ぢ . ?d) (?っ . ?t) + (?つ . ?t) (?づ . ?d) (?て . ?t) (?で . ?d) (?と . ?t) (?ど . ?d) + (?な . ?n) (?に . ?n) (?ぬ . ?n) (?ね . ?n) (?の . ?n) + (?は . ?h) (?ば . ?b) (?ぱ . ?p) (?ひ . ?h) (?び . ?b) + (?ぴ . ?p) (?ふ . ?h) (?ぶ . ?b) (?ぷ . ?p) (?へ . ?h) + (?べ . ?b) (?ぺ . ?p) (?ほ . ?h) (?ぼ . ?b) (?ぽ . ?p) + (?ま . ?m) (?み . ?m) (?む . ?m) (?め . ?m) (?も . ?m) + (?ゃ . ?y) (?や . ?y) (?ゅ . ?y) (?ゆ . ?y) (?ょ . ?y) (?よ . ?y) + (?ら . ?r) (?り . ?r) (?る . ?r) (?れ . ?r) (?ろ . ?r) + (?わ . ?w) (?ゐ . ?w) (?ゑ . ?w) (?を . ?w) + (?ん . ?n) + ) + "Alist of Okuriganas vs trailing ASCII letters in OKURI-ARI entry.") + +(defun skkdic-merge-head-and-tail (heads tails postfix) + (let ((min-len 2) + l) + (while heads + (if (or (not postfix) + (>= (length (car heads)) min-len)) + (let ((tail tails)) + (while tail + (if (or postfix + (>= (length (car tail)) min-len)) + (setq l (cons (concat (car heads) (car tail)) l))) + (setq tail (cdr tail))))) + (setq heads (cdr heads))) + l)) + +(defconst skkdic-jisx0208-hiragana-block (nth 1 (split-char ?あ))) + +(defun skkdic-lookup-key (seq len &optional postfix prefer-noun) + "Return a list of conversion string for sequence SEQ of length LEN. + +SEQ is a vector of Kana characters to be converted by SKK dictionary. +If LEN is shorter than the length of KEYSEQ, the first LEN keys in SEQ +are took into account. + +Optional 3rd arg POSTFIX non-nil means SETSUBIJI (postfix) are also +considered to find conversion strings. + +Optional 4th arg PREFER-NOUN non-nil means that the conversions +without okurigana are placed at the head of the returned list." + (or skkdic-okuri-nasi + (condition-case err + (load-library "ja-dic/ja-dic") + (error (ding) + (with-output-to-temp-buffer "*Help*" + (princ "The library `ja-dic' can't be loaded. + +The most common case is that you have not yet installed the library +included in LEIM (Libraries of Emacs Input Method) which is +distributed separately from Emacs. + +LEIM is available from the same ftp directory as Emacs.")) + (signal (car err) (cdr err))))) + + (let ((vec (make-vector len 0)) + (i 0) + entry) + ;; At first, generate vector VEC from SEQ for looking up SKK + ;; alists. Nth element in VEC corresponds to Nth element in SEQ. + ;; The values are decided as follows. + ;; If SEQ[N] is `ー', VEC[N] is 0, + ;; else if SEQ[N] is a Hiragana character, VEC[N] is: + ;; ((The 2nd position code of SEQ[N]) - 32), + ;; else VEC[N] is 128. + (while (< i len) + (let ((ch (aref seq i)) + elts) + (if (= ch ?ー) + (aset vec i 0) + (setq elts (split-char ch)) + (if (and (eq (car elts) 'japanese-jisx0208) + (= (nth 1 elts) skkdic-jisx0208-hiragana-block)) + (aset vec i (- (nth 2 elts) 32)) + (aset vec i 128)))) + (setq i (1+ i))) + + ;; Search OKURI-NASI entries. + (setq entry (lookup-nested-alist vec skkdic-okuri-nasi len 0 t)) + (if (consp (car entry)) + (setq entry (copy-sequence (car entry))) + (setq entry nil)) + + (if postfix + ;; Search OKURI-NASI entries with postfixes. + (let ((break (max (- len (car skkdic-postfix)) 1)) + entry-head entry-postfix entry2) + (while (< break len) + (if (and (setq entry-head + (lookup-nested-alist vec skkdic-okuri-nasi + break 0 t)) + (consp (car entry-head)) + (setq entry-postfix + (lookup-nested-alist vec skkdic-postfix + len break t)) + (consp (car entry-postfix)) + (setq entry2 (skkdic-merge-head-and-tail + (car entry-head) (car entry-postfix) t))) + (if entry + (nconc entry entry2) + (setq entry entry2))) + (setq break (1+ break))))) + + ;; Search OKURI-NASI entries with prefixes. + (let ((break (min (car skkdic-prefix) (- len 2))) + entry-prefix entry-tail entry2) + (while (> break 0) + (if (and (setq entry-prefix + (lookup-nested-alist vec skkdic-prefix break 0 t)) + (consp (car entry-prefix)) + (setq entry-tail + (lookup-nested-alist vec skkdic-okuri-nasi len break t)) + (consp (car entry-tail)) + (setq entry2 (skkdic-merge-head-and-tail + (car entry-prefix) (car entry-tail) nil))) + (progn + (if entry + (nconc entry entry2) + (setq entry entry2)))) + (setq break (1- break)))) + + ;; Search OKURI-ARI entries. + (let ((okurigana (assq (aref seq (1- len)) skkdic-okurigana-table)) + orig-element entry2) + (if okurigana + (progn + (setq orig-element (aref vec (1- len))) + (aset vec (1- len) (- (cdr okurigana))) + (if (and (setq entry2 (lookup-nested-alist vec skkdic-okuri-ari + len 0 t)) + (consp (car entry2))) + (progn + (setq entry2 (copy-sequence (car entry2))) + (let ((l entry2) + (okuri (char-to-string (aref seq (1- len))))) + (while l + (setcar l (concat (car l) okuri)) + (setq l (cdr l))) + (if entry + (if prefer-noun + (nconc entry entry2) + (setq entry2 (nreverse entry2)) + (nconc entry2 entry) + (setq entry entry2)) + (setq entry (nreverse entry2)))))) + (aset vec (1- len) orig-element)))) + + entry)) + +;; +(provide 'ja-dic-utl) + +;; ja-dic-utl.el ends here