mirror of
https://github.com/FirebirdSQL/firebird.git
synced 2025-01-24 00:03:03 +01:00
57 lines
1.9 KiB
Plaintext
57 lines
1.9 KiB
Plaintext
|
// -*- Coding: utf-8; -*-
|
||
|
//--------------------------------------------------------------------
|
||
|
// Copyright (c) 1999-2004, International Business Machines
|
||
|
// Corporation and others. All Rights Reserved.
|
||
|
//--------------------------------------------------------------------
|
||
|
// THIS IS A MACHINE-GENERATED FILE
|
||
|
// Tool: \icu4j\src\com\ibm\icu\dev\tool\translit\dumpICURules.bat
|
||
|
// Source: \icu4j\src\com\ibm\icu\impl\data/Transliterator_Latin_NumericPinyin.txt
|
||
|
// Date: Fri May 28 17:07:31 2004
|
||
|
//--------------------------------------------------------------------
|
||
|
|
||
|
// Latin_NumericPinyin
|
||
|
|
||
|
// Resource entry holding the Latin <-> NumericPinyin transliteration rules.
// Each quoted string inside Rule is one rule-set statement; rules using '>'
// apply in the forward direction and rules using '<' in the reverse direction.
t_Latn_NPinyn {
|
||
|
Rule {
|
||
|
//--------------------------------------------------------------------
|
||
|
//--------------------------------------------------------------------
|
||
|
|
||
|
// According to the pinyin definitions I've been able to find:
|
||
|
// 'a', 'e' are the preferred bases
|
||
|
// otherwise 'o'
|
||
|
// otherwise last vowel
|
||
|
|
||
|
// The trailing forms of syllables are the following:
|
||
|
// "a", "ai", "ao", "an", "ang",
|
||
|
// "o", "ou", "ong",
|
||
|
// "e", "ei", "er", "en", "eng",
|
||
|
// "i", "ia", "iao", "ie", "iu", "ian", "in", "iang", "ing", "iong",
|
||
|
// "u", "ua", "uo", "uai", "ui", "uan", "un", "uang", "ueng",
|
||
|
// "ü", "üe", "üan", "ün"
|
||
|
// so the letters the tone will 'hop' over are the ones named in the forward rules below: i, o, n, u, "on", "ng", and the 'r' of "er".
|
||
|
|
||
|
// Forward pass starts with NFD so that a tone mark is a separate combining
|
||
|
// character after its base letter; the ID in parentheses (NFC) is the one
|
||
|
// given for the reverse direction.
"::NFD (NFC);"
|
||
|
// $tone: the combining marks treated as tone marks -- U+0304 macron,
|
||
|
// U+0301 acute, U+030C caron, U+0300 grave, U+0306 breve.
"$tone = [\u0304\u0301\u030C\u0300\u0306] ;"
|
||
|
|
||
|
// Move the tone to the end of a syllable, and convert to number
|
||
|
// NOTE(review): &tone-digit and &digit-tone are defined outside this file;
|
||
|
// presumably they map a tone mark to a digit 1-5 and back -- confirm.
|
||
|
// "er": with 'e' as left context, a tone mark followed by 'r' becomes
|
||
|
// 'r' followed by the converted tone.
"e {($tone) r} > r &tone-digit($1);"
|
||
|
// A tone mark followed by one of i, o, n, u, "on" or "ng": that trailing
|
||
|
// element ($2) is emitted first, then the converted tone.
"($tone) ( [i o n u {o n} {n g}]) > $2 &tone-digit($1);"
|
||
|
// Any other tone mark is converted where it stands.
"($tone) > &tone-digit($1);"
|
||
|
|
||
|
// The following backs up until it finds the right vowel, then deposits the tone
|
||
|
|
||
|
// $vowel: the Latin vowels, including u-umlaut, in both cases.
"$vowel = [aAeEiIoOuUüÜ];"
|
||
|
// $consonant: every ASCII letter that is not in $vowel.
"$consonant = [[a-z A-Z] - [$vowel]];"
|
||
|
// $digit: the digits accepted as tone numbers.
"$digit = [1-5];"
|
||
|
// Reverse rules: the right-hand side is matched, the left-hand side is
|
||
|
// produced. Here: a/e ($1), then any vowels and consonants ($2), then the
|
||
|
// digit ($3) -- the converted tone is placed directly after the a/e.
"$1 &digit-tone($3) $2 < ([aAeE]) ($vowel* $consonant*) ($digit);"
|
||
|
// Otherwise an 'o' followed by vowels other than a/e, then consonants and
|
||
|
// the digit -- the converted tone is placed directly after the 'o'.
"$1 &digit-tone($3) $2 < ([oO]) ([$vowel-[aeAE]]* $consonant*) ($digit);"
|
||
|
// Otherwise a vowel followed only by consonants and the digit (i.e. the
|
||
|
// last vowel) -- the converted tone is placed directly after that vowel.
"$1 &digit-tone($3) $2 < ($vowel) ($consonant*) ($digit);"
|
||
|
// Fallback: a digit directly preceded by any letter (left context) is
|
||
|
// converted in place.
"&digit-tone($1) < [:letter:] {($digit)};"
|
||
|
|
||
|
// Closing normalization: NFC in the forward direction; the ID in
|
||
|
// parentheses (NFD) is the one given for the reverse direction.
"::NFC (NFD);"
|
||
|
|
||
|
|
||
|
|
||
|
}
|
||
|
}
|