/*
 * Code points of punctuation characters.
 *
 * The per-entry labels match those used in punct_attributes, so the two
 * tables presumably correspond index-for-index -- keep them in the same
 * order (TODO confirm against the lookup code).  The final 0 entry
 * presumably serves as the end-of-table marker.
 */
static const unsigned short punct_chars[] = {
	0x00a1, // inverted exclamation
	0x00bf, // inverted question
	0x055b, // Armenian emphasis mark
	0
};
static const unsigned int punct_attributes[] = { | static const unsigned int punct_attributes[] = { | ||||
CLAUSE_SEMICOLON | CLAUSE_OPTIONAL_SPACE_AFTER, // inverted exclamation | CLAUSE_SEMICOLON | CLAUSE_OPTIONAL_SPACE_AFTER, // inverted exclamation | ||||
CLAUSE_SEMICOLON | CLAUSE_OPTIONAL_SPACE_AFTER, // inverted question | CLAUSE_SEMICOLON | CLAUSE_OPTIONAL_SPACE_AFTER, // inverted question | ||||
CLAUSE_PERIOD | CLAUSE_PUNCTUATION_IN_WORD, // Armenian emphasis mark | |||||
0 | 0 | ||||
}; | }; | ||||
{ | { | ||||
printf("testing Armenian (Armn) script classification\n"); | printf("testing Armenian (Armn) script classification\n"); | ||||
assert(clause_type_from_codepoint(0x055B) == (CLAUSE_PERIOD | CLAUSE_PUNCTUATION_IN_WORD)); | |||||
assert(clause_type_from_codepoint(0x055B) == (CLAUSE_EXCLAMATION | CLAUSE_PUNCTUATION_IN_WORD)); | |||||
assert(clause_type_from_codepoint(0x055C) == (CLAUSE_EXCLAMATION | CLAUSE_PUNCTUATION_IN_WORD)); | assert(clause_type_from_codepoint(0x055C) == (CLAUSE_EXCLAMATION | CLAUSE_PUNCTUATION_IN_WORD)); | ||||
assert(clause_type_from_codepoint(0x055D) == CLAUSE_COMMA); | assert(clause_type_from_codepoint(0x055D) == CLAUSE_COMMA); | ||||
assert(clause_type_from_codepoint(0x055E) == (CLAUSE_QUESTION | CLAUSE_PUNCTUATION_IN_WORD)); | assert(clause_type_from_codepoint(0x055E) == (CLAUSE_QUESTION | CLAUSE_PUNCTUATION_IN_WORD)); |