Skip to content

Commit 3e8e338

Browse files
committed
Treat Javanese Taling (U+A9BA) as kConsonant in validate_grapheme
1 parent a6c6b34 commit 3e8e338

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

src/training/validate_grapheme.cpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -52,7 +52,7 @@ Validator::CharClass ValidateGrapheme::UnicodeToCharClass(char32 ch) const {
5252
if (u_hasBinaryProperty(ch, UCHAR_GRAPHEME_LINK)) return CharClass::kVirama;
5353
if (u_isUWhiteSpace(ch)) return CharClass::kWhitespace;
5454
// Workaround for Javanese Aksara's Taling, do not label it as a combiner
55-
if (ch == 0xa9ba) return CharClass::kOther;
55+
if (ch == 0xa9ba) return CharClass::kConsonant;
5656
int char_type = u_charType(ch);
5757
if (char_type == U_NON_SPACING_MARK || char_type == U_ENCLOSING_MARK ||
5858
char_type == U_COMBINING_SPACING_MARK || ch == kZeroWidthNonJoiner ||

src/training/validate_javanese.cpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -75,7 +75,7 @@ Validator::CharClass ValidateJavanese::UnicodeToCharClass(char32 ch) const {
7575
if (off == 0x33) return CharClass::kNukta; // A9B3 CECAK TELU
7676
if (off == 0x34) return CharClass::kMatraPiece; // A9B4 TARUNG two part vowels
7777
if (off <= 0x39) return CharClass::kMatra;
78-
if (off <= 0x3a) return CharClass::kMatraPiece; // A9BA TALING
78+
if (off <= 0x3a) return CharClass::kConsonant; // A9BA TALING - pre base vowel
7979
if (off <= 0x3d) return CharClass::kMatra;
8080
if (off <= 0x3f) return CharClass::kNukta; // A9BE-A9BF PENGKAL-CAKRA medial consonants
8181
if (off == 0x40) return CharClass::kVirama; // A9C0 PANGKON

0 commit comments

Comments
 (0)