/* * Copyright 2010, The Android Open Source Project * Copyright 2010, Google Inc. All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * * Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "harfbuzz-external.h" #include <unicode/uchar.h> #include <unicode/utypes.h> /* We use ICU APIs to get the character's Unicode property. This module replaces the harfbuzz-unicode-tables.c which is using static Unicode tables. */ static int hb_category_for_char(HB_UChar32 ch) { switch (u_charType(ch)) { case U_CONTROL_CHAR: return HB_Other_Control; case U_FORMAT_CHAR: return HB_Other_Format; case U_UNASSIGNED: return HB_Other_NotAssigned; case U_PRIVATE_USE_CHAR: return HB_Other_PrivateUse; case U_SURROGATE: return HB_Other_Surrogate; case U_LOWERCASE_LETTER: return HB_Letter_Lowercase; case U_MODIFIER_LETTER: return HB_Letter_Modifier; case U_OTHER_LETTER: return HB_Letter_Other; case U_TITLECASE_LETTER: return HB_Letter_Titlecase; case U_UPPERCASE_LETTER: return HB_Letter_Uppercase; case U_COMBINING_SPACING_MARK: return HB_Mark_SpacingCombining; case U_ENCLOSING_MARK: return HB_Mark_Enclosing; case U_NON_SPACING_MARK: return HB_Mark_NonSpacing; case U_DECIMAL_DIGIT_NUMBER : return HB_Number_DecimalDigit; case U_LETTER_NUMBER: return HB_Number_Letter; case U_OTHER_NUMBER: return HB_Number_Other; case U_CONNECTOR_PUNCTUATION: return HB_Punctuation_Connector; case U_DASH_PUNCTUATION: return HB_Punctuation_Dash; case U_END_PUNCTUATION: return HB_Punctuation_Close; case U_FINAL_PUNCTUATION: return HB_Punctuation_FinalQuote; case U_INITIAL_PUNCTUATION: return HB_Punctuation_InitialQuote; case U_OTHER_PUNCTUATION: return HB_Punctuation_Other; case U_START_PUNCTUATION: return HB_Punctuation_Open; case U_CURRENCY_SYMBOL: return HB_Symbol_Currency; case U_MODIFIER_SYMBOL: return HB_Symbol_Modifier; case U_MATH_SYMBOL: return HB_Symbol_Math; case U_OTHER_SYMBOL: return HB_Symbol_Other; case U_LINE_SEPARATOR: return HB_Separator_Line; case U_PARAGRAPH_SEPARATOR: return HB_Separator_Paragraph; case U_SPACE_SEPARATOR: return HB_Separator_Space; default: return HB_Symbol_Other; } } HB_LineBreakClass HB_GetLineBreakClass(HB_UChar32 ch) { switch ((ULineBreak)u_getIntPropertyValue(ch, UCHAR_LINE_BREAK)) { case U_LB_MANDATORY_BREAK: return HB_LineBreak_BK; case U_LB_CARRIAGE_RETURN: return HB_LineBreak_CR; case U_LB_LINE_FEED: return HB_LineBreak_LF; case U_LB_COMBINING_MARK: return HB_LineBreak_CM; case U_LB_SURROGATE: return HB_LineBreak_SG; case U_LB_ZWSPACE: return HB_LineBreak_ZW; case U_LB_INSEPARABLE: return HB_LineBreak_IN; case U_LB_GLUE: return HB_LineBreak_GL; case U_LB_CONTINGENT_BREAK: return HB_LineBreak_AL; case U_LB_SPACE: return HB_LineBreak_SP; case U_LB_BREAK_AFTER: return HB_LineBreak_BA; case U_LB_BREAK_BEFORE: return HB_LineBreak_BB; case U_LB_BREAK_BOTH: return HB_LineBreak_B2; case U_LB_HYPHEN: return HB_LineBreak_HY; case U_LB_NONSTARTER: return HB_LineBreak_NS; case U_LB_OPEN_PUNCTUATION: return HB_LineBreak_OP; case U_LB_CLOSE_PUNCTUATION: return HB_LineBreak_CL; case U_LB_QUOTATION: return HB_LineBreak_QU; case U_LB_EXCLAMATION: return HB_LineBreak_EX; case U_LB_IDEOGRAPHIC: return HB_LineBreak_ID; case U_LB_NUMERIC: return HB_LineBreak_NU; case U_LB_INFIX_NUMERIC: return HB_LineBreak_IS; case U_LB_BREAK_SYMBOLS: return HB_LineBreak_SY; case U_LB_ALPHABETIC: return HB_LineBreak_AL; case U_LB_PREFIX_NUMERIC: return HB_LineBreak_PR; case U_LB_POSTFIX_NUMERIC: return HB_LineBreak_PO; case U_LB_COMPLEX_CONTEXT: return HB_LineBreak_SA; case U_LB_AMBIGUOUS: return HB_LineBreak_AL; case U_LB_UNKNOWN: return HB_LineBreak_AL; case U_LB_NEXT_LINE: return HB_LineBreak_AL; case U_LB_WORD_JOINER: return HB_LineBreak_WJ; case U_LB_JL: return HB_LineBreak_JL; case U_LB_JV: return HB_LineBreak_JV; case U_LB_JT: return HB_LineBreak_JT; case U_LB_H2: return HB_LineBreak_H2; case U_LB_H3: return HB_LineBreak_H3; default: return HB_LineBreak_AL; } } int HB_GetUnicodeCharCombiningClass(HB_UChar32 ch) { return u_getCombiningClass(ch); } void HB_GetUnicodeCharProperties(HB_UChar32 ch, HB_CharCategory *category, int *combiningClass) { *category = hb_category_for_char(ch); *combiningClass = u_getCombiningClass(ch); } HB_CharCategory HB_GetUnicodeCharCategory(HB_UChar32 ch) { return hb_category_for_char(ch); }