blob: d07b60b5257edc022979671b13416d0a32517b38 [file] [log] [blame]
/*
* Copyright 2010, The Android Open Source Project
* Copyright 2010, Google Inc. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "harfbuzz-external.h"
#include <unicode/uchar.h>
#include <unicode/utypes.h>
/*
We use ICU APIs to get the character's Unicode property.
This module replaces the harfbuzz-unicode-tables.c which is
using static Unicode tables.
*/
static int
hb_category_for_char(HB_UChar32 ch) {
switch (u_charType(ch)) {
case U_CONTROL_CHAR:
return HB_Other_Control;
case U_FORMAT_CHAR:
return HB_Other_Format;
case U_UNASSIGNED:
return HB_Other_NotAssigned;
case U_PRIVATE_USE_CHAR:
return HB_Other_PrivateUse;
case U_SURROGATE:
return HB_Other_Surrogate;
case U_LOWERCASE_LETTER:
return HB_Letter_Lowercase;
case U_MODIFIER_LETTER:
return HB_Letter_Modifier;
case U_OTHER_LETTER:
return HB_Letter_Other;
case U_TITLECASE_LETTER:
return HB_Letter_Titlecase;
case U_UPPERCASE_LETTER:
return HB_Letter_Uppercase;
case U_COMBINING_SPACING_MARK:
return HB_Mark_SpacingCombining;
case U_ENCLOSING_MARK:
return HB_Mark_Enclosing;
case U_NON_SPACING_MARK:
return HB_Mark_NonSpacing;
case U_DECIMAL_DIGIT_NUMBER :
return HB_Number_DecimalDigit;
case U_LETTER_NUMBER:
return HB_Number_Letter;
case U_OTHER_NUMBER:
return HB_Number_Other;
case U_CONNECTOR_PUNCTUATION:
return HB_Punctuation_Connector;
case U_DASH_PUNCTUATION:
return HB_Punctuation_Dash;
case U_END_PUNCTUATION:
return HB_Punctuation_Close;
case U_FINAL_PUNCTUATION:
return HB_Punctuation_FinalQuote;
case U_INITIAL_PUNCTUATION:
return HB_Punctuation_InitialQuote;
case U_OTHER_PUNCTUATION:
return HB_Punctuation_Other;
case U_START_PUNCTUATION:
return HB_Punctuation_Open;
case U_CURRENCY_SYMBOL:
return HB_Symbol_Currency;
case U_MODIFIER_SYMBOL:
return HB_Symbol_Modifier;
case U_MATH_SYMBOL:
return HB_Symbol_Math;
case U_OTHER_SYMBOL:
return HB_Symbol_Other;
case U_LINE_SEPARATOR:
return HB_Separator_Line;
case U_PARAGRAPH_SEPARATOR:
return HB_Separator_Paragraph;
case U_SPACE_SEPARATOR:
return HB_Separator_Space;
default:
return HB_Symbol_Other;
}
}
HB_LineBreakClass
HB_GetLineBreakClass(HB_UChar32 ch) {
switch ((ULineBreak)u_getIntPropertyValue(ch, UCHAR_LINE_BREAK)) {
case U_LB_MANDATORY_BREAK:
return HB_LineBreak_BK;
case U_LB_CARRIAGE_RETURN:
return HB_LineBreak_CR;
case U_LB_LINE_FEED:
return HB_LineBreak_LF;
case U_LB_COMBINING_MARK:
return HB_LineBreak_CM;
case U_LB_SURROGATE:
return HB_LineBreak_SG;
case U_LB_ZWSPACE:
return HB_LineBreak_ZW;
case U_LB_INSEPARABLE:
return HB_LineBreak_IN;
case U_LB_GLUE:
return HB_LineBreak_GL;
case U_LB_CONTINGENT_BREAK:
return HB_LineBreak_AL;
case U_LB_SPACE:
return HB_LineBreak_SP;
case U_LB_BREAK_AFTER:
return HB_LineBreak_BA;
case U_LB_BREAK_BEFORE:
return HB_LineBreak_BB;
case U_LB_BREAK_BOTH:
return HB_LineBreak_B2;
case U_LB_HYPHEN:
return HB_LineBreak_HY;
case U_LB_NONSTARTER:
return HB_LineBreak_NS;
case U_LB_OPEN_PUNCTUATION:
return HB_LineBreak_OP;
case U_LB_CLOSE_PUNCTUATION:
return HB_LineBreak_CL;
case U_LB_QUOTATION:
return HB_LineBreak_QU;
case U_LB_EXCLAMATION:
return HB_LineBreak_EX;
case U_LB_IDEOGRAPHIC:
return HB_LineBreak_ID;
case U_LB_NUMERIC:
return HB_LineBreak_NU;
case U_LB_INFIX_NUMERIC:
return HB_LineBreak_IS;
case U_LB_BREAK_SYMBOLS:
return HB_LineBreak_SY;
case U_LB_ALPHABETIC:
return HB_LineBreak_AL;
case U_LB_PREFIX_NUMERIC:
return HB_LineBreak_PR;
case U_LB_POSTFIX_NUMERIC:
return HB_LineBreak_PO;
case U_LB_COMPLEX_CONTEXT:
return HB_LineBreak_SA;
case U_LB_AMBIGUOUS:
return HB_LineBreak_AL;
case U_LB_UNKNOWN:
return HB_LineBreak_AL;
case U_LB_NEXT_LINE:
return HB_LineBreak_AL;
case U_LB_WORD_JOINER:
return HB_LineBreak_WJ;
case U_LB_JL:
return HB_LineBreak_JL;
case U_LB_JV:
return HB_LineBreak_JV;
case U_LB_JT:
return HB_LineBreak_JT;
case U_LB_H2:
return HB_LineBreak_H2;
case U_LB_H3:
return HB_LineBreak_H3;
default:
return HB_LineBreak_AL;
}
}
int
HB_GetUnicodeCharCombiningClass(HB_UChar32 ch) {
return u_getCombiningClass(ch);
}
void
HB_GetUnicodeCharProperties(HB_UChar32 ch,
HB_CharCategory *category,
int *combiningClass) {
*category = hb_category_for_char(ch);
*combiningClass = u_getCombiningClass(ch);
}
HB_CharCategory
HB_GetUnicodeCharCategory(HB_UChar32 ch) {
return hb_category_for_char(ch);
}