PATH:
usr
/
lib64
/
aspell-0.60
# phonetic_english.h - phonetic transformation rules for use with phonetic.c # Copyright (C) 2000 Björn Jacke # # This rule set is based on Lawrence Phillips' original metaphone # algorithm with modifications made by Michael Kuhn in his # C implementation, more modifications by Björn Jacke when # converting the algorithm to a rule set and minor # touch ups by Kevin Atkinson # # This library is free software; you can redistribute it and/or # modify it under the terms of the GNU Lesser General Public # License version 2.1 as published by the Free Software Foundation; # # This library is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU # Lesser General Public License for more details. # # You should have received a copy of the GNU Lesser General Public # License along with this library; if not, write to the Free Software # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA # # Björn Jacke may be reached by email at bjoern.jacke@gmx.de # # Changelog: # # 2000-01-05 Björn Jacke <bjoern.jacke@gmx.de> # - first version with translation rules derived from # metaphone.cc distributed with aspell 0.28.3 # - "TH" is now represented as "@" because "0" is a # meta character # - removed TH(!vowel) --> T; always use TH --> # instead # - dropped "^AE" -> "E" (redundant) # - "ing" is transformed to "N", not "NK" # - "SCH(EO)" transforms to "SK" now # - added R --> SILENT if (after a vowel) and no (vowel or # "y" follows) like in "Marcy" or "abort" # - H is SILENT in RH at beginning of words # - H is SILENT if vowel leads and "Y" follows # - some ".OUGH.." --> ...F exceptions added # - "^V" transforms to "W" # 2000-01-07 Kevin Atkinson <kevinatk@home.com> # Converted from header to data file. 
# version 1.1 AH(AEIOUY)-^ *H AR(AEIOUY)-^ *R A(HR)^ * A^ * AH(AEIOUY)- H AR(AEIOUY)- R A(HR) _ BB- _ B B CQ- _ CIA X CH X C(EIY)- S CK K COUGH^ KF CC< C C K DG(EIY) K DD- _ D T �< E EH(AEIOUY)-^ *H ER(AEIOUY)-^ *R E(HR)^ * ENOUGH^$ *NF E^ * EH(AEIOUY)- H ER(AEIOUY)- R E(HR) _ FF- _ F F GN^ N GN$ N GNS$ NS GNED$ N GH(AEIOUY)- K GH _ GG9 K G K H H IH(AEIOUY)-^ *H IR(AEIOUY)-^ *R I(HR)^ * I^ * ING6 N IH(AEIOUY)- H IR(AEIOUY)- R I(HR) _ J K KN^ N KK- _ K K LAUGH^ LF LL- _ L L MB$ M MM M M M NN- _ N N OH(AEIOUY)-^ *H OR(AEIOUY)-^ *R O(HR)^ * O^ * OH(AEIOUY)- H OR(AEIOUY)- R O(HR) _ PH F PN^ N PP- _ P P Q K RH^ R ROUGH^ RF RR- _ R R SCH(EOU)- SK SC(IEY)- S SH X SI(AO)- X SS- _ S S TI(AO)- X TH @ TCH-- _ TOUGH^ TF TT- _ T T UH(AEIOUY)-^ *H UR(AEIOUY)-^ *R U(HR)^ * U^ * UH(AEIOUY)- H UR(AEIOUY)- R U(HR) _ V^ W V F WR^ R WH^ W W(AEIOU)- W X^ S X KS Y(AEIOU)- Y ZZ- _ Z S #The rules in a different view: # # Exceptions: # # Beginning of word: "gn", "kn-", "pn-", "wr-" ----> drop first letter # "Aebersold", "Gnagy", "Knuth", "Pniewski", "Wright" # # Beginning of word: "x" ----> change to "s" # as in "Deng Xiaopeng" # # Beginning of word: "wh-" ----> change to "w" # as in "Whalen" # Beginning of word: leading vowels are transformed to "*" # # "[crt]ough" and "enough" are handled separately because of "F" sound # # # A --> A at beginning # _ otherwise # # B --> B unless at the end of word after "m", as in "dumb", "McComb" # # C --> X (sh) if "-cia-" or "-ch-" # S if "-ci-", "-ce-", or "-cy-" # SILENT if "-sci-", "-sce-", or "-scy-", or "-cq-" # K otherwise, including in "-sch-" # # D --> K if in "-dge-", "-dgy-", or "-dgi-" # T otherwise # # E --> A at beginnig # _ SILENT otherwise # # F --> F # # G --> SILENT if in "-gh-" and not at end or before a vowel # in "-gn" or "-gned" or "-gns" # in "-dge-" etc., as in above rule # K if before "i", or "e", or "y" if not double "gg" # # K otherwise (incl. "GG"!) 
# # H --> SILENT if after vowel and no vowel or "Y" follows # or after "-ch-", "-sh-", "-ph-", "-th-", "-gh-" # or after "rh-" at beginning # H otherwise # # I --> A at beginning # _ SILENT otherwise # # J --> K # # K --> SILENT if after "c" # K otherwise # # L --> L # # M --> M # # N --> N # # O --> A at beginning # _ SILENT otherwise # # P --> F if before "h" # P otherwise # # Q --> K # # R --> SILENT if after vowel and no vowel or "Y" follows # R otherwise # # S --> X (sh) if before "h" or in "-sio-" or "-sia-" # SK if followed by "ch(eo)" (SCH(EO)) # S otherwise # # T --> X (sh) if "-tia-" or "-tio-" # @ (th) if before "h" # silent if in "-tch-" # T otherwise # # U --> A at beginning # _ SILENT otherwise # # V --> W if first letter of word # F otherwise # # W --> SILENT if not followed by a vowel # W if followed by a vowel # # X --> KS # # Y --> SILENT if not followed by a vowel # Y if followed by a vowel # # Z --> S
[+]
..
[-] cp1257.cmap
[edit]
[-] split.kbd
[edit]
[-] en_US-w_accents.multi
[edit]
[-] dvorak.kbd
[edit]
[-] iso-8859-11.cmap
[edit]
[-] en_GB-ise.multi
[edit]
[-] markdown-filter.info
[edit]
[-] en_GB-variant_0.rws
[edit]
[-] en-variant_1.multi
[edit]
[-] english-w_accents.alias
[edit]
[-] en_GB-ize-wo_accents.multi
[edit]
[-] english-wo_accents.alias
[edit]
[-] cp1251.cset
[edit]
[-] british-ise-w_accents.alias
[edit]
[-] cp1256.cset
[edit]
[-] iso-8859-9.cmap
[edit]
[-] iso-8859-13.cset
[edit]
[-] en-w_accents.multi
[edit]
[-] texinfo.amf
[edit]
[-] koi8-u.cset
[edit]
[-] en-variant_2.rws
[edit]
[-] iso-8859-15.cset
[edit]
[-] cp1250.cmap
[edit]
[-] en_CA-variant_1.rws
[edit]
[-] context-filter.info
[edit]
[-] british-w_accents.alias
[edit]
[-] british-ise.alias
[edit]
[-] nroff-filter.info
[edit]
[-] cp1255.cset
[edit]
[-] british.alias
[edit]
[-] en_AU-variant_0.multi
[edit]
[-] en_US-variant_1.multi
[edit]
[-] australian-variant_0.alias
[edit]
[-] en-w_accents-only.rws
[edit]
[-] australian-wo_accents.alias
[edit]
[-] en_AU.multi
[edit]
[-] british-ize-w_accents.alias
[edit]
[-] ccpp.amf
[edit]
[-] iso-8859-10.cset
[edit]
[-] en-variant_1.rws
[edit]
[-] cp1257.cset
[edit]
[-] en_GB.multi
[edit]
[-] texinfo-filter.so
[edit]
[-] en_GB-variant_1.multi
[edit]
[-] canadian-variant_0.alias
[edit]
[-] en_CA-variant_1.multi
[edit]
[-] en_GB-w_accents.multi
[edit]
[-] en_US-wo_accents-only.rws
[edit]
[-] english-variant_0.alias
[edit]
[-] en.dat
[edit]
[-] cp1254.cmap
[edit]
[-] en_CA-wo_accents-only.rws
[edit]
[-] sgml-filter.so
[edit]
[-] nroff-filter.so
[edit]
[-] context-filter.so
[edit]
[-] koi8-u.cmap
[edit]
[-] en-wo_accents.multi
[edit]
[-] english-variant_2.alias
[edit]
[-] en-variant_2.multi
[edit]
[-] australian-variant_1.alias
[edit]
[-] en_AU-wo_accents.multi
[edit]
[-] iso-8859-14.cset
[edit]
[-] american-variant_1.alias
[edit]
[-] en_GB-ize-wo_accents-only.rws
[edit]
[-] comment.amf
[edit]
[-] en_AU-w_accents.multi
[edit]
[-] cp1254.cset
[edit]
[-] tex-filter.info
[edit]
[-] en_GB-ize-w_accents.multi
[edit]
[-] en_GB-ise-w_accents.multi
[edit]
[-] en_AU-variant_0.rws
[edit]
[-] british-variant_0.alias
[edit]
[-] british-wo_accents.alias
[edit]
[-] texinfo-filter.info
[edit]
[-] koi8-r.cmap
[edit]
[-] en.multi
[edit]
[-] en-wo_accents-only.rws
[edit]
[-] iso-8859-5.cset
[edit]
[-] en_US.multi
[edit]
[-] english-variant_1.alias
[edit]
[-] en-common.rws
[edit]
[-] email-filter.so
[edit]
[-] cp1250.cset
[edit]
[-] cp1258.cset
[edit]
[-] en_GB-variant_0.multi
[edit]
[-] canadian-variant_1.alias
[edit]
[-] iso-8859-16.cmap
[edit]
[-] canadian-w_accents.alias
[edit]
[-] en_AU-variant_1.multi
[edit]
[-] cp1253.cmap
[edit]
[-] perl.amf
[edit]
[-] en_GB-ise-wo_accents.multi
[edit]
[-] cp1255.cmap
[edit]
[-] american-variant_0.alias
[edit]
[-] standard.kbd
[edit]
[-] cp1252.cmap
[edit]
[-] iso-8859-7.cmap
[edit]
[-] iso-8859-8.cmap
[edit]
[-] en_US-w_accents-only.rws
[edit]
[-] british-ize-wo_accents.alias
[edit]
[-] canadian.alias
[edit]
[-] email-filter.info
[edit]
[-] cp1251.cmap
[edit]
[-] british-variant_1.alias
[edit]
[-] iso-8859-9.cset
[edit]
[-] iso-8859-4.cset
[edit]
[-] en_AU-w_accents-only.rws
[edit]
[-] canadian-wo_accents.alias
[edit]
[-] en_CA.multi
[edit]
[-] australian-w_accents.alias
[edit]
[-] html-filter.info
[edit]
[-] american.alias
[edit]
[-] en_GB-ise-wo_accents-only.rws
[edit]
[-] iso-8859-1.cmap
[edit]
[-] cp1253.cset
[edit]
[-] en_GB-ize-w_accents-only.rws
[edit]
[-] iso-8859-13.cmap
[edit]
[-] iso-8859-3.cset
[edit]
[-] iso-8859-4.cmap
[edit]
[-] markdown.amf
[edit]
[-] iso-8859-2.cmap
[edit]
[-] iso-8859-1.cset
[edit]
[-] en_CA-w_accents.multi
[edit]
[-] en_affix.dat
[edit]
[-] en_US-wo_accents.multi
[edit]
[-] en_AU-wo_accents-only.rws
[edit]
[-] en_phonet.dat
[edit]
[-] cp1256.cmap
[edit]
[-] iso-8859-2.cset
[edit]
[-] none.amf
[edit]
[-] american-w_accents.alias
[edit]
[-] en-variant_0.rws
[edit]
[-] en_CA-w_accents-only.rws
[edit]
[-] sgml-filter.info
[edit]
[-] sgml.amf
[edit]
[-] american-wo_accents.alias
[edit]
[-] en_US-variant_0.multi
[edit]
[-] iso-8859-14.cmap
[edit]
[-] en_AU-variant_1.rws
[edit]
[-] british-ise-wo_accents.alias
[edit]
[-] en_GB-ise-w_accents-only.rws
[edit]
[-] email.amf
[edit]
[-] html.amf
[edit]
[-] iso-8859-6.cset
[edit]
[-] iso-8859-11.cset
[edit]
[-] en_CA-variant_0.rws
[edit]
[-] cp1258.cmap
[edit]
[-] iso-8859-7.cset
[edit]
[-] british-ize.alias
[edit]
[-] nroff.amf
[edit]
[-] iso-8859-5.cmap
[edit]
[-] iso-8859-15.cmap
[edit]
[-] australian.alias
[edit]
[-] en_GB-variant_1.rws
[edit]
[-] en_CA-variant_0.multi
[edit]
[-] markdown-filter.so
[edit]
[-] en_GB-wo_accents.multi
[edit]
[-] cp1252.cset
[edit]
[-] english.alias
[edit]
[-] iso-8859-10.cmap
[edit]
[-] iso-8859-3.cmap
[edit]
[-] tex-filter.so
[edit]
[-] iso-8859-8.cset
[edit]
[-] en-variant_0.multi
[edit]
[-] tex.amf
[edit]
[-] url.amf
[edit]
[-] en_GB-ize.multi
[edit]
[-] koi8-r.cset
[edit]
[-] iso-8859-16.cset
[edit]
[-] en_CA-wo_accents.multi
[edit]
[-] iso-8859-6.cmap
[edit]