1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
|
// Copyright 2014 PDFium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#ifndef CORE_FXCRT_FX_UCD_H_
#define CORE_FXCRT_FX_UCD_H_
#include "core/fxcrt/cfx_retain_ptr.h"
#include "core/fxcrt/fx_basic.h"
#define FX_BIDICLASSBITS 6
#define FX_BIDICLASSBITSMASK (31 << FX_BIDICLASSBITS)
enum FX_BIDICLASS {
FX_BIDICLASS_ON = 0, // Other Neutral
FX_BIDICLASS_L = 1, // Left Letter
FX_BIDICLASS_R = 2, // Right Letter
FX_BIDICLASS_AN = 3, // Arabic Number
FX_BIDICLASS_EN = 4, // European Number
FX_BIDICLASS_AL = 5, // Arabic Letter
FX_BIDICLASS_NSM = 6, // Non-spacing Mark
FX_BIDICLASS_CS = 7, // Common Number Separator
FX_BIDICLASS_ES = 8, // European Separator
FX_BIDICLASS_ET = 9, // European Number Terminator
FX_BIDICLASS_BN = 10, // Boundary Neutral
FX_BIDICLASS_S = 11, // Segment Separator
FX_BIDICLASS_WS = 12, // Whitespace
FX_BIDICLASS_B = 13, // Paragraph Separator
FX_BIDICLASS_RLO = 14, // Right-to-Left Override
FX_BIDICLASS_RLE = 15, // Right-to-Left Embedding
FX_BIDICLASS_LRO = 16, // Left-to-Right Override
FX_BIDICLASS_LRE = 17, // Left-to-Right Embedding
FX_BIDICLASS_PDF = 18, // Pop Directional Format
FX_BIDICLASS_N = FX_BIDICLASS_ON,
};
extern const uint32_t kTextLayoutCodeProperties[];
extern const size_t kTextLayoutCodePropertiesSize;
extern const uint16_t kFXTextLayoutVerticalMirror[];
extern const size_t kFXTextLayoutVerticalMirrorSize;
extern const uint16_t kFXTextLayoutBidiMirror[];
extern const size_t kFXTextLayoutBidiMirrorSize;
uint32_t FX_GetUnicodeProperties(FX_WCHAR wch);
FX_WCHAR FX_GetMirrorChar(FX_WCHAR wch, bool bRTL, bool bVertical);
#ifdef PDF_ENABLE_XFA
// As defined in http://www.unicode.org/reports/tr14/
enum FX_CHARBREAKPROP {
FX_CBP_OP = 0, // Opening Punctuation
FX_CBP_CL = 1, // Closing Punctuation
FX_CBP_QU = 2, // Ambiguous Quotation
FX_CBP_GL = 3, // Non-breaking ("Glue")
FX_CBP_NS = 4, // Non Starter
FX_CBP_EX = 5, // Exclamation/Interrogation
FX_CBP_SY = 6, // Symbols Allowing Breaks
FX_CBP_IS = 7, // Infix Separator (Numeric)
FX_CBP_PR = 8, // Prefix (Numeric)
FX_CBP_PO = 9, // Postfix (Numeric)
FX_CBP_NU = 10, // Numeric
FX_CBP_AL = 11, // Ordinary Alphabetic and Symbol Characters
FX_CBP_ID = 12, // Ideographic
FX_CBP_IN = 13, // Inseparable
FX_CBP_HY = 14, // Hyphen
FX_CBP_BA = 15, // Break Opportunity After
FX_CBP_BB = 16, // Break Opportunity Before
FX_CBP_B2 = 17, // Break Opportunity Before and After
FX_CBP_ZW = 18, // Zero Width Space
FX_CBP_CM = 19, // Attached Characters and Combining Marks
FX_CBP_WJ = 20, // Word Joiner
FX_CBP_H2 = 21, // Hangul LV Syllable
FX_CBP_H3 = 22, // Hangul LVT Syllable
FX_CBP_JL = 23, // Hangul Leading Jamo
FX_CBP_JV = 24, // Hangul Vowel Jamo
FX_CBP_JT = 25, // Hangul Trailing Jamo
FX_CBP_BK = 26, // Mandatory Break
FX_CBP_CR = 27, // Carriage Return
FX_CBP_LF = 28, // Line Feed
FX_CBP_NL = 29, // Next Line
FX_CBP_SA = 30, // Complex Context (South East Asian)
FX_CBP_SG = 31, // Surrogate
FX_CBP_CB = 32, // Contingent Break Opportunity
FX_CBP_XX = 33, // Unknown
FX_CBP_AI = 34, // Ambiguous (Alphabetic or Ideographic)
FX_CBP_SP = 35, // Space
FX_CBP_NONE = 36,
FX_CBP_TB = 37, // ?
};
#define FX_CHARTYPEBITS 11
#define FX_CHARTYPEBITSMASK (15 << FX_CHARTYPEBITS)
enum FX_CHARTYPE {
FX_CHARTYPE_Unknown = 0,
FX_CHARTYPE_Tab = (1 << FX_CHARTYPEBITS),
FX_CHARTYPE_Space = (2 << FX_CHARTYPEBITS),
FX_CHARTYPE_Control = (3 << FX_CHARTYPEBITS),
FX_CHARTYPE_Combination = (4 << FX_CHARTYPEBITS),
FX_CHARTYPE_Numeric = (5 << FX_CHARTYPEBITS),
FX_CHARTYPE_Normal = (6 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicAlef = (7 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicSpecial = (8 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicDistortion = (9 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicNormal = (10 << FX_CHARTYPEBITS),
FX_CHARTYPE_ArabicForm = (11 << FX_CHARTYPEBITS),
FX_CHARTYPE_Arabic = (12 << FX_CHARTYPEBITS),
};
inline FX_CHARTYPE GetCharTypeFromProp(uint32_t prop) {
return static_cast<FX_CHARTYPE>(prop & FX_CHARTYPEBITSMASK);
}
FX_WCHAR FX_GetMirrorChar(FX_WCHAR wch,
uint32_t dwProps,
bool bRTL,
bool bVertical);
enum class CFX_BreakType { None = 0, Piece, Line, Paragraph, Page };
class CFX_Char {
public:
CFX_Char()
: m_dwStatus(CFX_BreakType::None),
m_wCharCode(0),
m_nBreakType(0),
m_dwCharProps(0),
m_iCharWidth(0),
m_iHorizontalScale(100),
m_iVerticalScale(100) {}
CFX_Char(uint16_t wCharCode, uint32_t dwCharProps)
: m_wCharCode(wCharCode),
m_nBreakType(0),
m_dwCharProps(dwCharProps),
m_iCharWidth(0),
m_iHorizontalScale(100),
m_iVerticalScale(100) {}
FX_CHARTYPE GetCharType() const { return GetCharTypeFromProp(m_dwCharProps); }
CFX_BreakType m_dwStatus;
uint16_t m_wCharCode;
uint8_t m_nBreakType;
uint32_t m_dwCharProps;
int32_t m_iCharWidth;
int32_t m_iHorizontalScale;
int32_t m_iVerticalScale;
};
class CFX_TxtChar : public CFX_Char {
public:
CFX_TxtChar()
: m_nRotation(0),
m_dwCharStyles(0),
m_iBidiClass(0),
m_iBidiLevel(0),
m_iBidiPos(0),
m_iBidiOrder(0) {}
int8_t m_nRotation;
uint32_t m_dwCharStyles;
int16_t m_iBidiClass;
int16_t m_iBidiLevel;
int16_t m_iBidiPos;
int16_t m_iBidiOrder;
};
class CFX_RTFChar : public CFX_Char {
public:
CFX_RTFChar();
CFX_RTFChar(const CFX_RTFChar& other);
~CFX_RTFChar();
int32_t m_iFontSize;
int32_t m_iFontHeight;
int16_t m_iBidiClass;
int16_t m_iBidiLevel;
int16_t m_iBidiPos;
int16_t m_iBidiOrder;
uint32_t m_dwIdentity;
CFX_RetainPtr<CFX_Retainable> m_pUserData;
};
inline CFX_RTFChar::CFX_RTFChar()
: m_iFontSize(0),
m_iFontHeight(0),
m_iBidiClass(0),
m_iBidiLevel(0),
m_iBidiPos(0),
m_dwIdentity(0),
m_pUserData(nullptr) {}
inline CFX_RTFChar::CFX_RTFChar(const CFX_RTFChar& other) = default;
inline CFX_RTFChar::~CFX_RTFChar() = default;
#endif // PDF_ENABLE_XFA
#endif // CORE_FXCRT_FX_UCD_H_
|