blob: 3b72516324152af2362fffdce6e62e7a436edd54 [file] [log] [blame]
// Copyright 2014 PDFium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#ifndef CORE_FXCRT_FX_UCD_H_
#define CORE_FXCRT_FX_UCD_H_
#include "core/fxcrt/cfx_retain_ptr.h"
#include "core/fxcrt/fx_basic.h"
constexpr uint32_t FX_BIDICLASSBITS = 6;
constexpr uint32_t FX_BIDICLASSBITSMASK = 0x1F << FX_BIDICLASSBITS;
enum FX_BIDICLASS {
FX_BIDICLASS_ON = 0, // Other Neutral
FX_BIDICLASS_L = 1, // Left Letter
FX_BIDICLASS_R = 2, // Right Letter
FX_BIDICLASS_AN = 3, // Arabic Number
FX_BIDICLASS_EN = 4, // European Number
FX_BIDICLASS_AL = 5, // Arabic Letter
FX_BIDICLASS_NSM = 6, // Non-spacing Mark
FX_BIDICLASS_CS = 7, // Common Number Separator
FX_BIDICLASS_ES = 8, // European Separator
FX_BIDICLASS_ET = 9, // European Number Terminator
FX_BIDICLASS_BN = 10, // Boundary Neutral
FX_BIDICLASS_S = 11, // Segment Separator
FX_BIDICLASS_WS = 12, // Whitespace
FX_BIDICLASS_B = 13, // Paragraph Separator
FX_BIDICLASS_RLO = 14, // Right-to-Left Override
FX_BIDICLASS_RLE = 15, // Right-to-Left Embedding
FX_BIDICLASS_LRO = 16, // Left-to-Right Override
FX_BIDICLASS_LRE = 17, // Left-to-Right Embedding
FX_BIDICLASS_PDF = 18, // Pop Directional Format
FX_BIDICLASS_N = FX_BIDICLASS_ON,
};
extern const uint32_t kTextLayoutCodeProperties[];
extern const size_t kTextLayoutCodePropertiesSize;
extern const uint16_t kFXTextLayoutBidiMirror[];
extern const size_t kFXTextLayoutBidiMirrorSize;
uint32_t FX_GetUnicodeProperties(wchar_t wch);
wchar_t FX_GetMirrorChar(wchar_t wch);
#ifdef PDF_ENABLE_XFA
// As defined in http://www.unicode.org/reports/tr14/
enum FXCHAR_BREAKPROP {
FX_CBP_OP = 0, // Opening Punctuation
FX_CBP_CL = 1, // Closing Punctuation
FX_CBP_QU = 2, // Ambiguous Quotation
FX_CBP_GL = 3, // Non-breaking ("Glue")
FX_CBP_NS = 4, // Non Starter
FX_CBP_EX = 5, // Exclamation/Interrogation
FX_CBP_SY = 6, // Symbols Allowing Breaks
FX_CBP_IS = 7, // Infix Separator (Numeric)
FX_CBP_PR = 8, // Prefix (Numeric)
FX_CBP_PO = 9, // Postfix (Numeric)
FX_CBP_NU = 10, // Numeric
FX_CBP_AL = 11, // Ordinary Alphabetic and Symbol Characters
FX_CBP_ID = 12, // Ideographic
FX_CBP_IN = 13, // Inseparable
FX_CBP_HY = 14, // Hyphen
FX_CBP_BA = 15, // Break Opportunity After
FX_CBP_BB = 16, // Break Opportunity Before
FX_CBP_B2 = 17, // Break Opportunity Before and After
FX_CBP_ZW = 18, // Zero Width Space
FX_CBP_CM = 19, // Attached Characters and Combining Marks
FX_CBP_WJ = 20, // Word Joiner
FX_CBP_H2 = 21, // Hangul LV Syllable
FX_CBP_H3 = 22, // Hangul LVT Syllable
FX_CBP_JL = 23, // Hangul Leading Jamo
FX_CBP_JV = 24, // Hangul Vowel Jamo
FX_CBP_JT = 25, // Hangul Trailing Jamo
FX_CBP_BK = 26, // Mandatory Break
FX_CBP_CR = 27, // Carriage Return
FX_CBP_LF = 28, // Line Feed
FX_CBP_NL = 29, // Next Line
FX_CBP_SA = 30, // Complex Context (South East Asian)
FX_CBP_SG = 31, // Surrogate
FX_CBP_CB = 32, // Contingent Break Opportunity
FX_CBP_XX = 33, // Unknown
FX_CBP_AI = 34, // Ambiguous (Alphabetic or Ideographic)
FX_CBP_SP = 35, // Space
FX_CBP_NONE = 36,
FX_CBP_TB = 37, // ?
};
constexpr uint32_t FX_CHARTYPEBITS = 11;
constexpr uint32_t FX_CHARTYPEBITSMASK = 0xF << FX_CHARTYPEBITS;
enum FX_CHARTYPE {
FX_CHARTYPE_Unknown = 0,
FX_CHARTYPE_Tab = (1 << FX_CHARTYPEBITS),
FX_CHARTYPE_Space = (2 << FX_CHARTYPEBITS),
FX_CHARTYPE_Control = (3 << FX_CHARTYPEBITS),
FX_CHARTYPE_Combination = (4 << FX_CHARTYPEBITS),
FX_CHARTYPE_Numeric = (5 << FX_CHARTYPEBITS),
FX_CHARTYPE_Normal = (6 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicAlef = (7 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicSpecial = (8 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicDistortion = (9 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicNormal = (10 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicForm = (11 << FX_CHARTYPEBITS),
FX_CHARTYPE_Arabic = (12 << FX_CHARTYPEBITS),
};
inline FX_CHARTYPE GetCharTypeFromProp(uint32_t prop) {
return static_cast<FX_CHARTYPE>(prop & FX_CHARTYPEBITSMASK);
}
wchar_t FX_GetMirrorChar(wchar_t wch, uint32_t dwProps);
#endif // PDF_ENABLE_XFA
#endif // CORE_FXCRT_FX_UCD_H_