|  | // Copyright 2016 PDFium Authors. All rights reserved. | 
|  | // Use of this source code is governed by a BSD-style license that can be | 
|  | // found in the LICENSE file. | 
|  |  | 
|  | // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com | 
|  |  | 
|  | #include "core/fpdfapi/font/cpdf_cidfont.h" | 
|  |  | 
|  | #include <algorithm> | 
|  | #include <limits> | 
|  | #include <vector> | 
|  |  | 
|  | #include "build/build_config.h" | 
|  | #include "core/fpdfapi/cmaps/fpdf_cmaps.h" | 
|  | #include "core/fpdfapi/font/cfx_cttgsubtable.h" | 
|  | #include "core/fpdfapi/font/cpdf_cid2unicodemap.h" | 
|  | #include "core/fpdfapi/font/cpdf_cmap.h" | 
|  | #include "core/fpdfapi/font/cpdf_cmapparser.h" | 
|  | #include "core/fpdfapi/font/cpdf_fontencoding.h" | 
|  | #include "core/fpdfapi/font/cpdf_fontglobals.h" | 
|  | #include "core/fpdfapi/parser/cpdf_array.h" | 
|  | #include "core/fpdfapi/parser/cpdf_dictionary.h" | 
|  | #include "core/fpdfapi/parser/cpdf_stream_acc.h" | 
|  | #include "core/fxcrt/fx_safe_types.h" | 
|  | #include "core/fxge/fx_font.h" | 
|  | #include "third_party/base/ptr_util.h" | 
|  | #include "third_party/base/span.h" | 
|  | #include "third_party/base/stl_util.h" | 
|  |  | 
|  | namespace { | 
|  |  | 
|  | const uint16_t g_CharsetCPs[CIDSET_NUM_SETS] = {0, 936, 950, 932, 949, 1200}; | 
|  |  | 
|  | const struct CIDTransform { | 
|  | uint16_t cid; | 
|  | uint8_t a; | 
|  | uint8_t b; | 
|  | uint8_t c; | 
|  | uint8_t d; | 
|  | uint8_t e; | 
|  | uint8_t f; | 
|  | } g_Japan1_VertCIDs[] = { | 
|  | {97, 129, 0, 0, 127, 55, 0},     {7887, 127, 0, 0, 127, 76, 89}, | 
|  | {7888, 127, 0, 0, 127, 79, 94},  {7889, 0, 129, 127, 0, 17, 127}, | 
|  | {7890, 0, 129, 127, 0, 17, 127}, {7891, 0, 129, 127, 0, 17, 127}, | 
|  | {7892, 0, 129, 127, 0, 17, 127}, {7893, 0, 129, 127, 0, 17, 127}, | 
|  | {7894, 0, 129, 127, 0, 17, 127}, {7895, 0, 129, 127, 0, 17, 127}, | 
|  | {7896, 0, 129, 127, 0, 17, 127}, {7897, 0, 129, 127, 0, 17, 127}, | 
|  | {7898, 0, 129, 127, 0, 17, 127}, {7899, 0, 129, 127, 0, 17, 104}, | 
|  | {7900, 0, 129, 127, 0, 17, 127}, {7901, 0, 129, 127, 0, 17, 104}, | 
|  | {7902, 0, 129, 127, 0, 17, 127}, {7903, 0, 129, 127, 0, 17, 127}, | 
|  | {7904, 0, 129, 127, 0, 17, 127}, {7905, 0, 129, 127, 0, 17, 114}, | 
|  | {7906, 0, 129, 127, 0, 17, 127}, {7907, 0, 129, 127, 0, 17, 127}, | 
|  | {7908, 0, 129, 127, 0, 17, 127}, {7909, 0, 129, 127, 0, 17, 127}, | 
|  | {7910, 0, 129, 127, 0, 17, 127}, {7911, 0, 129, 127, 0, 17, 127}, | 
|  | {7912, 0, 129, 127, 0, 17, 127}, {7913, 0, 129, 127, 0, 17, 127}, | 
|  | {7914, 0, 129, 127, 0, 17, 127}, {7915, 0, 129, 127, 0, 17, 114}, | 
|  | {7916, 0, 129, 127, 0, 17, 127}, {7917, 0, 129, 127, 0, 17, 127}, | 
|  | {7918, 127, 0, 0, 127, 18, 25},  {7919, 127, 0, 0, 127, 18, 25}, | 
|  | {7920, 127, 0, 0, 127, 18, 25},  {7921, 127, 0, 0, 127, 18, 25}, | 
|  | {7922, 127, 0, 0, 127, 18, 25},  {7923, 127, 0, 0, 127, 18, 25}, | 
|  | {7924, 127, 0, 0, 127, 18, 25},  {7925, 127, 0, 0, 127, 18, 25}, | 
|  | {7926, 127, 0, 0, 127, 18, 25},  {7927, 127, 0, 0, 127, 18, 25}, | 
|  | {7928, 127, 0, 0, 127, 18, 25},  {7929, 127, 0, 0, 127, 18, 25}, | 
|  | {7930, 127, 0, 0, 127, 18, 25},  {7931, 127, 0, 0, 127, 18, 25}, | 
|  | {7932, 127, 0, 0, 127, 18, 25},  {7933, 127, 0, 0, 127, 18, 25}, | 
|  | {7934, 127, 0, 0, 127, 18, 25},  {7935, 127, 0, 0, 127, 18, 25}, | 
|  | {7936, 127, 0, 0, 127, 18, 25},  {7937, 127, 0, 0, 127, 18, 25}, | 
|  | {7938, 127, 0, 0, 127, 18, 25},  {7939, 127, 0, 0, 127, 18, 25}, | 
|  | {8720, 0, 129, 127, 0, 19, 102}, {8721, 0, 129, 127, 0, 13, 127}, | 
|  | {8722, 0, 129, 127, 0, 19, 108}, {8723, 0, 129, 127, 0, 19, 102}, | 
|  | {8724, 0, 129, 127, 0, 19, 102}, {8725, 0, 129, 127, 0, 19, 102}, | 
|  | {8726, 0, 129, 127, 0, 19, 102}, {8727, 0, 129, 127, 0, 19, 102}, | 
|  | {8728, 0, 129, 127, 0, 19, 114}, {8729, 0, 129, 127, 0, 19, 114}, | 
|  | {8730, 0, 129, 127, 0, 38, 108}, {8731, 0, 129, 127, 0, 13, 108}, | 
|  | {8732, 0, 129, 127, 0, 19, 108}, {8733, 0, 129, 127, 0, 19, 108}, | 
|  | {8734, 0, 129, 127, 0, 19, 108}, {8735, 0, 129, 127, 0, 19, 108}, | 
|  | {8736, 0, 129, 127, 0, 19, 102}, {8737, 0, 129, 127, 0, 19, 102}, | 
|  | {8738, 0, 129, 127, 0, 19, 102}, {8739, 0, 129, 127, 0, 19, 102}, | 
|  | {8740, 0, 129, 127, 0, 19, 102}, {8741, 0, 129, 127, 0, 19, 102}, | 
|  | {8742, 0, 129, 127, 0, 19, 102}, {8743, 0, 129, 127, 0, 19, 102}, | 
|  | {8744, 0, 129, 127, 0, 19, 102}, {8745, 0, 129, 127, 0, 19, 102}, | 
|  | {8746, 0, 129, 127, 0, 19, 114}, {8747, 0, 129, 127, 0, 19, 114}, | 
|  | {8748, 0, 129, 127, 0, 19, 102}, {8749, 0, 129, 127, 0, 19, 102}, | 
|  | {8750, 0, 129, 127, 0, 19, 102}, {8751, 0, 129, 127, 0, 19, 102}, | 
|  | {8752, 0, 129, 127, 0, 19, 102}, {8753, 0, 129, 127, 0, 19, 102}, | 
|  | {8754, 0, 129, 127, 0, 19, 102}, {8755, 0, 129, 127, 0, 19, 102}, | 
|  | {8756, 0, 129, 127, 0, 19, 102}, {8757, 0, 129, 127, 0, 19, 102}, | 
|  | {8758, 0, 129, 127, 0, 19, 102}, {8759, 0, 129, 127, 0, 19, 102}, | 
|  | {8760, 0, 129, 127, 0, 19, 102}, {8761, 0, 129, 127, 0, 19, 102}, | 
|  | {8762, 0, 129, 127, 0, 19, 102}, {8763, 0, 129, 127, 0, 19, 102}, | 
|  | {8764, 0, 129, 127, 0, 19, 102}, {8765, 0, 129, 127, 0, 19, 102}, | 
|  | {8766, 0, 129, 127, 0, 19, 102}, {8767, 0, 129, 127, 0, 19, 102}, | 
|  | {8768, 0, 129, 127, 0, 19, 102}, {8769, 0, 129, 127, 0, 19, 102}, | 
|  | {8770, 0, 129, 127, 0, 19, 102}, {8771, 0, 129, 127, 0, 19, 102}, | 
|  | {8772, 0, 129, 127, 0, 19, 102}, {8773, 0, 129, 127, 0, 19, 102}, | 
|  | {8774, 0, 129, 127, 0, 19, 102}, {8775, 0, 129, 127, 0, 19, 102}, | 
|  | {8776, 0, 129, 127, 0, 19, 102}, {8777, 0, 129, 127, 0, 19, 102}, | 
|  | {8778, 0, 129, 127, 0, 19, 102}, {8779, 0, 129, 127, 0, 19, 114}, | 
|  | {8780, 0, 129, 127, 0, 19, 108}, {8781, 0, 129, 127, 0, 19, 114}, | 
|  | {8782, 0, 129, 127, 0, 13, 114}, {8783, 0, 129, 127, 0, 19, 108}, | 
|  | {8784, 0, 129, 127, 0, 13, 114}, {8785, 0, 129, 127, 0, 19, 108}, | 
|  | {8786, 0, 129, 127, 0, 19, 108}, {8787, 0, 129, 127, 0, 19, 108}, | 
|  | {8788, 0, 129, 127, 0, 19, 108}, {8789, 0, 129, 127, 0, 19, 108}, | 
|  | {8790, 0, 129, 127, 0, 19, 108}, {8791, 0, 129, 127, 0, 19, 108}, | 
|  | {8792, 0, 129, 127, 0, 19, 108}, {8793, 0, 129, 127, 0, 19, 108}, | 
|  | {8794, 0, 129, 127, 0, 19, 108}, {8795, 0, 129, 127, 0, 19, 108}, | 
|  | {8796, 0, 129, 127, 0, 19, 108}, {8797, 0, 129, 127, 0, 19, 108}, | 
|  | {8798, 0, 129, 127, 0, 19, 108}, {8799, 0, 129, 127, 0, 19, 108}, | 
|  | {8800, 0, 129, 127, 0, 19, 108}, {8801, 0, 129, 127, 0, 19, 108}, | 
|  | {8802, 0, 129, 127, 0, 19, 108}, {8803, 0, 129, 127, 0, 19, 108}, | 
|  | {8804, 0, 129, 127, 0, 19, 108}, {8805, 0, 129, 127, 0, 19, 108}, | 
|  | {8806, 0, 129, 127, 0, 19, 108}, {8807, 0, 129, 127, 0, 19, 108}, | 
|  | {8808, 0, 129, 127, 0, 19, 108}, {8809, 0, 129, 127, 0, 19, 108}, | 
|  | {8810, 0, 129, 127, 0, 19, 108}, {8811, 0, 129, 127, 0, 19, 114}, | 
|  | {8812, 0, 129, 127, 0, 19, 102}, {8813, 0, 129, 127, 0, 19, 114}, | 
|  | {8814, 0, 129, 127, 0, 76, 102}, {8815, 0, 129, 127, 0, 13, 121}, | 
|  | {8816, 0, 129, 127, 0, 19, 114}, {8817, 0, 129, 127, 0, 19, 127}, | 
|  | {8818, 0, 129, 127, 0, 19, 114}, {8819, 0, 129, 127, 0, 218, 108}, | 
|  | }; | 
|  |  | 
|  | // Boundary values to avoid integer overflow when multiplied by 1000. | 
|  | constexpr long kMinCBox = -2147483; | 
|  | constexpr long kMaxCBox = 2147483; | 
|  |  | 
|  | // Boundary value to avoid integer overflow when adding 1/64th of the value. | 
|  | constexpr int kMaxRectTop = 2114445437; | 
|  |  | 
|  | #if !defined(OS_WIN) | 
|  |  | 
|  | bool IsValidEmbeddedCharcodeFromUnicodeCharset(CIDSet charset) { | 
|  | switch (charset) { | 
|  | case CIDSET_GB1: | 
|  | case CIDSET_CNS1: | 
|  | case CIDSET_JAPAN1: | 
|  | case CIDSET_KOREA1: | 
|  | return true; | 
|  |  | 
|  | default: | 
|  | return false; | 
|  | } | 
|  | } | 
|  |  | 
|  | wchar_t EmbeddedUnicodeFromCharcode(const FXCMAP_CMap* pEmbedMap, | 
|  | CIDSet charset, | 
|  | uint32_t charcode) { | 
|  | if (!IsValidEmbeddedCharcodeFromUnicodeCharset(charset)) | 
|  | return 0; | 
|  |  | 
|  | uint16_t cid = CIDFromCharCode(pEmbedMap, charcode); | 
|  | if (!cid) | 
|  | return 0; | 
|  |  | 
|  | pdfium::span<const uint16_t> map = | 
|  | CPDF_FontGlobals::GetInstance()->GetEmbeddedToUnicode(charset); | 
|  | return cid < map.size() ? map[cid] : 0; | 
|  | } | 
|  |  | 
|  | uint32_t EmbeddedCharcodeFromUnicode(const FXCMAP_CMap* pEmbedMap, | 
|  | CIDSet charset, | 
|  | wchar_t unicode) { | 
|  | if (!IsValidEmbeddedCharcodeFromUnicodeCharset(charset)) | 
|  | return 0; | 
|  |  | 
|  | pdfium::span<const uint16_t> map = | 
|  | CPDF_FontGlobals::GetInstance()->GetEmbeddedToUnicode(charset); | 
|  | for (uint32_t i = 0; i < map.size(); ++i) { | 
|  | if (map[i] == unicode) { | 
|  | uint32_t charCode = CharCodeFromCID(pEmbedMap, i); | 
|  | if (charCode) | 
|  | return charCode; | 
|  | } | 
|  | } | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | #endif  // !defined(OS_WIN) | 
|  |  | 
|  | void FT_UseCIDCharmap(FXFT_FaceRec* face, int coding) { | 
|  | int encoding; | 
|  | switch (coding) { | 
|  | case CIDCODING_GB: | 
|  | encoding = FT_ENCODING_GB2312; | 
|  | break; | 
|  | case CIDCODING_BIG5: | 
|  | encoding = FT_ENCODING_BIG5; | 
|  | break; | 
|  | case CIDCODING_JIS: | 
|  | encoding = FT_ENCODING_SJIS; | 
|  | break; | 
|  | case CIDCODING_KOREA: | 
|  | encoding = FT_ENCODING_JOHAB; | 
|  | break; | 
|  | default: | 
|  | encoding = FT_ENCODING_UNICODE; | 
|  | } | 
|  | int err = FXFT_Select_Charmap(face, encoding); | 
|  | if (err) | 
|  | err = FXFT_Select_Charmap(face, FT_ENCODING_UNICODE); | 
|  | if (err && FXFT_Get_Face_Charmaps(face)) | 
|  | FT_Set_Charmap(face, *FXFT_Get_Face_Charmaps(face)); | 
|  | } | 
|  |  | 
|  | bool IsMetricForCID(const uint32_t* pEntry, uint16_t CID) { | 
|  | return pEntry[0] <= CID && pEntry[1] >= CID; | 
|  | } | 
|  |  | 
|  | }  // namespace | 
|  |  | 
|  | CPDF_CIDFont::CPDF_CIDFont(CPDF_Document* pDocument, CPDF_Dictionary* pFontDict) | 
|  | : CPDF_Font(pDocument, pFontDict) { | 
|  | for (size_t i = 0; i < FX_ArraySize(m_CharBBox); ++i) | 
|  | m_CharBBox[i] = FX_RECT(-1, -1, -1, -1); | 
|  | } | 
|  |  | 
|  | CPDF_CIDFont::~CPDF_CIDFont() {} | 
|  |  | 
|  | bool CPDF_CIDFont::IsCIDFont() const { | 
|  | return true; | 
|  | } | 
|  |  | 
|  | const CPDF_CIDFont* CPDF_CIDFont::AsCIDFont() const { | 
|  | return this; | 
|  | } | 
|  |  | 
|  | CPDF_CIDFont* CPDF_CIDFont::AsCIDFont() { | 
|  | return this; | 
|  | } | 
|  |  | 
|  | uint16_t CPDF_CIDFont::CIDFromCharCode(uint32_t charcode) const { | 
|  | return m_pCMap ? m_pCMap->CIDFromCharCode(charcode) | 
|  | : static_cast<uint16_t>(charcode); | 
|  | } | 
|  |  | 
|  | bool CPDF_CIDFont::IsVertWriting() const { | 
|  | return m_pCMap && m_pCMap->IsVertWriting(); | 
|  | } | 
|  |  | 
|  | WideString CPDF_CIDFont::UnicodeFromCharCode(uint32_t charcode) const { | 
|  | WideString str = CPDF_Font::UnicodeFromCharCode(charcode); | 
|  | if (!str.IsEmpty()) | 
|  | return str; | 
|  | wchar_t ret = GetUnicodeFromCharCode(charcode); | 
|  | return ret ? ret : WideString(); | 
|  | } | 
|  |  | 
|  | wchar_t CPDF_CIDFont::GetUnicodeFromCharCode(uint32_t charcode) const { | 
|  | switch (m_pCMap->GetCoding()) { | 
|  | case CIDCODING_UCS2: | 
|  | case CIDCODING_UTF16: | 
|  | return static_cast<wchar_t>(charcode); | 
|  | case CIDCODING_CID: | 
|  | if (!m_pCID2UnicodeMap || !m_pCID2UnicodeMap->IsLoaded()) | 
|  | return 0; | 
|  | return m_pCID2UnicodeMap->UnicodeFromCID(static_cast<uint16_t>(charcode)); | 
|  | } | 
|  | if (m_pCID2UnicodeMap && m_pCID2UnicodeMap->IsLoaded() && m_pCMap->IsLoaded()) | 
|  | return m_pCID2UnicodeMap->UnicodeFromCID(CIDFromCharCode(charcode)); | 
|  |  | 
|  | #if defined(OS_WIN) | 
|  | wchar_t unicode; | 
|  | int charsize = 1; | 
|  | if (charcode > 255) { | 
|  | charcode = (charcode % 256) * 256 + (charcode / 256); | 
|  | charsize = 2; | 
|  | } | 
|  | int ret = FXSYS_MultiByteToWideChar(g_CharsetCPs[m_pCMap->GetCoding()], 0, | 
|  | reinterpret_cast<const char*>(&charcode), | 
|  | charsize, &unicode, 1); | 
|  | return ret == 1 ? unicode : 0; | 
|  | #else | 
|  | if (!m_pCMap->GetEmbedMap()) | 
|  | return 0; | 
|  | return EmbeddedUnicodeFromCharcode(m_pCMap->GetEmbedMap(), | 
|  | m_pCMap->GetCharset(), charcode); | 
|  | #endif | 
|  | } | 
|  |  | 
|  | uint32_t CPDF_CIDFont::CharCodeFromUnicode(wchar_t unicode) const { | 
|  | uint32_t charcode = CPDF_Font::CharCodeFromUnicode(unicode); | 
|  | if (charcode) | 
|  | return charcode; | 
|  | switch (m_pCMap->GetCoding()) { | 
|  | case CIDCODING_UNKNOWN: | 
|  | return 0; | 
|  | case CIDCODING_UCS2: | 
|  | case CIDCODING_UTF16: | 
|  | return unicode; | 
|  | case CIDCODING_CID: { | 
|  | if (!m_pCID2UnicodeMap || !m_pCID2UnicodeMap->IsLoaded()) | 
|  | return 0; | 
|  | uint32_t CID = 0; | 
|  | while (CID < 65536) { | 
|  | wchar_t this_unicode = | 
|  | m_pCID2UnicodeMap->UnicodeFromCID(static_cast<uint16_t>(CID)); | 
|  | if (this_unicode == unicode) | 
|  | return CID; | 
|  | CID++; | 
|  | } | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | if (unicode < 0x80) | 
|  | return static_cast<uint32_t>(unicode); | 
|  | if (m_pCMap->GetCoding() == CIDCODING_CID) | 
|  | return 0; | 
|  | #if defined(OS_WIN) | 
|  | uint8_t buffer[32]; | 
|  | int ret = FXSYS_WideCharToMultiByte( | 
|  | g_CharsetCPs[m_pCMap->GetCoding()], 0, &unicode, 1, | 
|  | reinterpret_cast<char*>(buffer), 4, nullptr, nullptr); | 
|  | if (ret == 1) | 
|  | return buffer[0]; | 
|  | if (ret == 2) | 
|  | return buffer[0] * 256 + buffer[1]; | 
|  | #else | 
|  | if (m_pCMap->GetEmbedMap()) { | 
|  | return EmbeddedCharcodeFromUnicode(m_pCMap->GetEmbedMap(), | 
|  | m_pCMap->GetCharset(), unicode); | 
|  | } | 
|  | #endif | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | bool CPDF_CIDFont::Load() { | 
|  | if (m_pFontDict->GetStringFor("Subtype") == "TrueType") { | 
|  | LoadGB2312(); | 
|  | return true; | 
|  | } | 
|  |  | 
|  | const CPDF_Array* pFonts = m_pFontDict->GetArrayFor("DescendantFonts"); | 
|  | if (!pFonts || pFonts->size() != 1) | 
|  | return false; | 
|  |  | 
|  | const CPDF_Dictionary* pCIDFontDict = pFonts->GetDictAt(0); | 
|  | if (!pCIDFontDict) | 
|  | return false; | 
|  |  | 
|  | m_BaseFontName = pCIDFontDict->GetStringFor("BaseFont"); | 
|  | if ((m_BaseFontName.Compare("CourierStd") == 0 || | 
|  | m_BaseFontName.Compare("CourierStd-Bold") == 0 || | 
|  | m_BaseFontName.Compare("CourierStd-BoldOblique") == 0 || | 
|  | m_BaseFontName.Compare("CourierStd-Oblique") == 0) && | 
|  | !IsEmbedded()) { | 
|  | m_bAdobeCourierStd = true; | 
|  | } | 
|  |  | 
|  | CPDF_Object* pEncoding = m_pFontDict->GetDirectObjectFor("Encoding"); | 
|  | if (!pEncoding) | 
|  | return false; | 
|  |  | 
|  | ByteString subtype = pCIDFontDict->GetStringFor("Subtype"); | 
|  | m_bType1 = (subtype == "CIDFontType0"); | 
|  |  | 
|  | CPDF_CMapManager* manager = CPDF_FontGlobals::GetInstance()->GetCMapManager(); | 
|  | if (pEncoding->IsName()) { | 
|  | ByteString cmap = pEncoding->GetString(); | 
|  | m_pCMap = manager->GetPredefinedCMap(cmap); | 
|  | } else if (CPDF_Stream* pStream = pEncoding->AsStream()) { | 
|  | auto pAcc = pdfium::MakeRetain<CPDF_StreamAcc>(pStream); | 
|  | pAcc->LoadAllDataFiltered(); | 
|  | pdfium::span<const uint8_t> span = pAcc->GetSpan(); | 
|  | m_pCMap = pdfium::MakeRetain<CPDF_CMap>(span); | 
|  | } else { | 
|  | return false; | 
|  | } | 
|  |  | 
|  | const CPDF_Dictionary* pFontDesc = pCIDFontDict->GetDictFor("FontDescriptor"); | 
|  | if (pFontDesc) | 
|  | LoadFontDescriptor(pFontDesc); | 
|  |  | 
|  | m_Charset = m_pCMap->GetCharset(); | 
|  | if (m_Charset == CIDSET_UNKNOWN) { | 
|  | const CPDF_Dictionary* pCIDInfo = pCIDFontDict->GetDictFor("CIDSystemInfo"); | 
|  | if (pCIDInfo) { | 
|  | m_Charset = CPDF_CMapParser::CharsetFromOrdering( | 
|  | pCIDInfo->GetStringFor("Ordering").AsStringView()); | 
|  | } | 
|  | } | 
|  | if (m_Charset != CIDSET_UNKNOWN) { | 
|  | m_pCID2UnicodeMap = manager->GetCID2UnicodeMap(m_Charset); | 
|  | } | 
|  | if (m_Font.GetFaceRec()) { | 
|  | if (m_bType1) | 
|  | FXFT_Select_Charmap(m_Font.GetFaceRec(), FT_ENCODING_UNICODE); | 
|  | else | 
|  | FT_UseCIDCharmap(m_Font.GetFaceRec(), m_pCMap->GetCoding()); | 
|  | } | 
|  | m_DefaultWidth = pCIDFontDict->GetIntegerFor("DW", 1000); | 
|  | const CPDF_Array* pWidthArray = pCIDFontDict->GetArrayFor("W"); | 
|  | if (pWidthArray) | 
|  | LoadMetricsArray(pWidthArray, &m_WidthList, 1); | 
|  | if (!IsEmbedded()) | 
|  | LoadSubstFont(); | 
|  |  | 
|  | const CPDF_Object* pmap = pCIDFontDict->GetDirectObjectFor("CIDToGIDMap"); | 
|  | if (pmap) { | 
|  | if (const CPDF_Stream* pStream = pmap->AsStream()) { | 
|  | m_pStreamAcc = pdfium::MakeRetain<CPDF_StreamAcc>(pStream); | 
|  | m_pStreamAcc->LoadAllDataFiltered(); | 
|  | } else if (m_pFontFile && pmap->GetString() == "Identity") { | 
|  | m_bCIDIsGID = true; | 
|  | } | 
|  | } | 
|  |  | 
|  | CheckFontMetrics(); | 
|  | if (IsVertWriting()) { | 
|  | pWidthArray = pCIDFontDict->GetArrayFor("W2"); | 
|  | if (pWidthArray) | 
|  | LoadMetricsArray(pWidthArray, &m_VertMetrics, 3); | 
|  | const CPDF_Array* pDefaultArray = pCIDFontDict->GetArrayFor("DW2"); | 
|  | if (pDefaultArray) { | 
|  | m_DefaultVY = pDefaultArray->GetIntegerAt(0); | 
|  | m_DefaultW1 = pDefaultArray->GetIntegerAt(1); | 
|  | } | 
|  | } | 
|  | return true; | 
|  | } | 
|  |  | 
|  | FX_RECT CPDF_CIDFont::GetCharBBox(uint32_t charcode) { | 
|  | if (charcode < 256 && m_CharBBox[charcode].right != -1) | 
|  | return m_CharBBox[charcode]; | 
|  |  | 
|  | FX_RECT rect; | 
|  | bool bVert = false; | 
|  | int glyph_index = GlyphFromCharCode(charcode, &bVert); | 
|  | FXFT_FaceRec* face = m_Font.GetFaceRec(); | 
|  | if (face) { | 
|  | if (FXFT_Is_Face_Tricky(face)) { | 
|  | int err = | 
|  | FT_Load_Glyph(face, glyph_index, FT_LOAD_IGNORE_GLOBAL_ADVANCE_WIDTH); | 
|  | if (!err) { | 
|  | FT_Glyph glyph; | 
|  | err = FT_Get_Glyph(face->glyph, &glyph); | 
|  | if (!err) { | 
|  | FT_BBox cbox; | 
|  | FT_Glyph_Get_CBox(glyph, FT_GLYPH_BBOX_PIXELS, &cbox); | 
|  | cbox.xMin = pdfium::clamp(cbox.xMin, kMinCBox, kMaxCBox); | 
|  | cbox.xMax = pdfium::clamp(cbox.xMax, kMinCBox, kMaxCBox); | 
|  | cbox.yMin = pdfium::clamp(cbox.yMin, kMinCBox, kMaxCBox); | 
|  | cbox.yMax = pdfium::clamp(cbox.yMax, kMinCBox, kMaxCBox); | 
|  | int pixel_size_x = face->size->metrics.x_ppem; | 
|  | int pixel_size_y = face->size->metrics.y_ppem; | 
|  | if (pixel_size_x == 0 || pixel_size_y == 0) { | 
|  | rect = FX_RECT(cbox.xMin, cbox.yMax, cbox.xMax, cbox.yMin); | 
|  | } else { | 
|  | rect = FX_RECT(cbox.xMin * 1000 / pixel_size_x, | 
|  | cbox.yMax * 1000 / pixel_size_y, | 
|  | cbox.xMax * 1000 / pixel_size_x, | 
|  | cbox.yMin * 1000 / pixel_size_y); | 
|  | } | 
|  | rect.top = std::min(rect.top, | 
|  | static_cast<int>(FXFT_Get_Face_Ascender(face))); | 
|  | rect.bottom = std::max( | 
|  | rect.bottom, static_cast<int>(FXFT_Get_Face_Descender(face))); | 
|  | FT_Done_Glyph(glyph); | 
|  | } | 
|  | } | 
|  | } else { | 
|  | int err = FT_Load_Glyph(face, glyph_index, FT_LOAD_NO_SCALE); | 
|  | if (err == 0) { | 
|  | rect = FX_RECT(TT2PDF(FXFT_Get_Glyph_HoriBearingX(face), face), | 
|  | TT2PDF(FXFT_Get_Glyph_HoriBearingY(face), face), | 
|  | TT2PDF(FXFT_Get_Glyph_HoriBearingX(face) + | 
|  | FXFT_Get_Glyph_Width(face), | 
|  | face), | 
|  | TT2PDF(FXFT_Get_Glyph_HoriBearingY(face) - | 
|  | FXFT_Get_Glyph_Height(face), | 
|  | face)); | 
|  | if (rect.top <= kMaxRectTop) | 
|  | rect.top += rect.top / 64; | 
|  | else | 
|  | rect.top = std::numeric_limits<int>::max(); | 
|  | } | 
|  | } | 
|  | } | 
|  | if (!m_pFontFile && m_Charset == CIDSET_JAPAN1) { | 
|  | uint16_t CID = CIDFromCharCode(charcode); | 
|  | const uint8_t* pTransform = GetCIDTransform(CID); | 
|  | if (pTransform && !bVert) { | 
|  | CFX_Matrix matrix(CIDTransformToFloat(pTransform[0]), | 
|  | CIDTransformToFloat(pTransform[1]), | 
|  | CIDTransformToFloat(pTransform[2]), | 
|  | CIDTransformToFloat(pTransform[3]), | 
|  | CIDTransformToFloat(pTransform[4]) * 1000, | 
|  | CIDTransformToFloat(pTransform[5]) * 1000); | 
|  | rect = matrix.TransformRect(CFX_FloatRect(rect)).GetOuterRect(); | 
|  | } | 
|  | } | 
|  | if (charcode < 256) | 
|  | m_CharBBox[charcode] = rect; | 
|  |  | 
|  | return rect; | 
|  | } | 
|  |  | 
|  | uint32_t CPDF_CIDFont::GetCharWidthF(uint32_t charcode) { | 
|  | if (charcode < 0x80 && m_bAnsiWidthsFixed) | 
|  | return (charcode >= 32 && charcode < 127) ? 500 : 0; | 
|  |  | 
|  | uint16_t cid = CIDFromCharCode(charcode); | 
|  | size_t size = m_WidthList.size(); | 
|  | const uint32_t* pList = m_WidthList.data(); | 
|  | for (size_t i = 0; i < size; i += 3) { | 
|  | const uint32_t* pEntry = pList + i; | 
|  | if (IsMetricForCID(pEntry, cid)) | 
|  | return pEntry[2]; | 
|  | } | 
|  | return m_DefaultWidth; | 
|  | } | 
|  |  | 
|  | short CPDF_CIDFont::GetVertWidth(uint16_t CID) const { | 
|  | size_t vertsize = m_VertMetrics.size() / 5; | 
|  | if (vertsize) { | 
|  | const uint32_t* pTable = m_VertMetrics.data(); | 
|  | for (size_t i = 0; i < vertsize; i++) { | 
|  | const uint32_t* pEntry = pTable + (i * 5); | 
|  | if (IsMetricForCID(pEntry, CID)) | 
|  | return static_cast<short>(pEntry[2]); | 
|  | } | 
|  | } | 
|  | return m_DefaultW1; | 
|  | } | 
|  |  | 
|  | void CPDF_CIDFont::GetVertOrigin(uint16_t CID, short& vx, short& vy) const { | 
|  | size_t vertsize = m_VertMetrics.size() / 5; | 
|  | if (vertsize) { | 
|  | const uint32_t* pTable = m_VertMetrics.data(); | 
|  | for (size_t i = 0; i < vertsize; i++) { | 
|  | const uint32_t* pEntry = pTable + (i * 5); | 
|  | if (IsMetricForCID(pEntry, CID)) { | 
|  | vx = static_cast<short>(pEntry[3]); | 
|  | vy = static_cast<short>(pEntry[4]); | 
|  | return; | 
|  | } | 
|  | } | 
|  | } | 
|  | uint32_t dwWidth = m_DefaultWidth; | 
|  | size_t size = m_WidthList.size(); | 
|  | const uint32_t* pList = m_WidthList.data(); | 
|  | for (size_t i = 0; i < size; i += 3) { | 
|  | const uint32_t* pEntry = pList + i; | 
|  | if (IsMetricForCID(pEntry, CID)) { | 
|  | dwWidth = pEntry[2]; | 
|  | break; | 
|  | } | 
|  | } | 
|  | vx = static_cast<short>(dwWidth) / 2; | 
|  | vy = m_DefaultVY; | 
|  | } | 
|  |  | 
|  | int CPDF_CIDFont::GetGlyphIndex(uint32_t unicode, bool* pVertGlyph) { | 
|  | if (pVertGlyph) | 
|  | *pVertGlyph = false; | 
|  |  | 
|  | FXFT_FaceRec* face = m_Font.GetFaceRec(); | 
|  | int index = FT_Get_Char_Index(face, unicode); | 
|  | if (unicode == 0x2502) | 
|  | return index; | 
|  |  | 
|  | if (!index || !IsVertWriting()) | 
|  | return index; | 
|  |  | 
|  | if (m_pTTGSUBTable) | 
|  | return GetVerticalGlyph(index, pVertGlyph); | 
|  |  | 
|  | if (!m_Font.GetSubData()) { | 
|  | unsigned long length = 0; | 
|  | int error = FT_Load_Sfnt_Table(face, FT_MAKE_TAG('G', 'S', 'U', 'B'), 0, | 
|  | nullptr, &length); | 
|  | if (!error) | 
|  | m_Font.SetSubData(FX_Alloc(uint8_t, length)); | 
|  | } | 
|  | int error = FT_Load_Sfnt_Table(face, FT_MAKE_TAG('G', 'S', 'U', 'B'), 0, | 
|  | m_Font.GetSubData(), nullptr); | 
|  | if (error || !m_Font.GetSubData()) | 
|  | return index; | 
|  |  | 
|  | m_pTTGSUBTable = pdfium::MakeUnique<CFX_CTTGSUBTable>(m_Font.GetSubData()); | 
|  | return GetVerticalGlyph(index, pVertGlyph); | 
|  | } | 
|  |  | 
|  | int CPDF_CIDFont::GetVerticalGlyph(int index, bool* pVertGlyph) { | 
|  | uint32_t vindex = m_pTTGSUBTable->GetVerticalGlyph(index); | 
|  | if (!vindex) | 
|  | return index; | 
|  |  | 
|  | index = vindex; | 
|  | if (pVertGlyph) | 
|  | *pVertGlyph = true; | 
|  | return index; | 
|  | } | 
|  |  | 
|  | int CPDF_CIDFont::GlyphFromCharCode(uint32_t charcode, bool* pVertGlyph) { | 
|  | if (pVertGlyph) | 
|  | *pVertGlyph = false; | 
|  |  | 
|  | if (!m_pFontFile && (!m_pStreamAcc || m_pCID2UnicodeMap)) { | 
|  | uint16_t cid = CIDFromCharCode(charcode); | 
|  | wchar_t unicode = 0; | 
|  | if (m_bCIDIsGID) { | 
|  | #if defined(OS_MACOSX) | 
|  | if (FontStyleIsSymbolic(m_Flags)) | 
|  | return cid; | 
|  |  | 
|  | WideString uni_str = UnicodeFromCharCode(charcode); | 
|  | if (uni_str.IsEmpty()) | 
|  | return cid; | 
|  |  | 
|  | unicode = uni_str[0]; | 
|  | #else | 
|  | return cid; | 
|  | #endif | 
|  | } else { | 
|  | if (cid && m_pCID2UnicodeMap && m_pCID2UnicodeMap->IsLoaded()) | 
|  | unicode = m_pCID2UnicodeMap->UnicodeFromCID(cid); | 
|  | if (unicode == 0) | 
|  | unicode = GetUnicodeFromCharCode(charcode); | 
|  | if (unicode == 0) { | 
|  | WideString unicode_str = UnicodeFromCharCode(charcode); | 
|  | if (!unicode_str.IsEmpty()) | 
|  | unicode = unicode_str[0]; | 
|  | } | 
|  | } | 
|  | FXFT_FaceRec* face = m_Font.GetFaceRec(); | 
|  | if (unicode == 0) { | 
|  | if (!m_bAdobeCourierStd) | 
|  | return charcode ? static_cast<int>(charcode) : -1; | 
|  |  | 
|  | charcode += 31; | 
|  | bool bMSUnicode = FT_UseTTCharmap(face, 3, 1); | 
|  | bool bMacRoman = !bMSUnicode && FT_UseTTCharmap(face, 1, 0); | 
|  | int iBaseEncoding = PDFFONT_ENCODING_STANDARD; | 
|  | if (bMSUnicode) | 
|  | iBaseEncoding = PDFFONT_ENCODING_WINANSI; | 
|  | else if (bMacRoman) | 
|  | iBaseEncoding = PDFFONT_ENCODING_MACROMAN; | 
|  | const char* name = | 
|  | GetAdobeCharName(iBaseEncoding, std::vector<ByteString>(), charcode); | 
|  | if (!name) | 
|  | return charcode ? static_cast<int>(charcode) : -1; | 
|  |  | 
|  | int index = 0; | 
|  | uint16_t name_unicode = PDF_UnicodeFromAdobeName(name); | 
|  | if (!name_unicode) | 
|  | return charcode ? static_cast<int>(charcode) : -1; | 
|  |  | 
|  | if (iBaseEncoding == PDFFONT_ENCODING_STANDARD) | 
|  | return FT_Get_Char_Index(face, name_unicode); | 
|  |  | 
|  | if (iBaseEncoding == PDFFONT_ENCODING_WINANSI) { | 
|  | index = FT_Get_Char_Index(face, name_unicode); | 
|  | } else { | 
|  | ASSERT(iBaseEncoding == PDFFONT_ENCODING_MACROMAN); | 
|  | uint32_t maccode = | 
|  | FT_CharCodeFromUnicode(FT_ENCODING_APPLE_ROMAN, name_unicode); | 
|  | index = maccode ? FT_Get_Char_Index(face, maccode) | 
|  | : FXFT_Get_Name_Index(face, name); | 
|  | } | 
|  | if (index == 0 || index == 0xffff) | 
|  | return charcode ? static_cast<int>(charcode) : -1; | 
|  | return index; | 
|  | } | 
|  | if (m_Charset == CIDSET_JAPAN1) { | 
|  | if (unicode == '\\') { | 
|  | unicode = '/'; | 
|  | #if !defined(OS_MACOSX) | 
|  | } else if (unicode == 0xa5) { | 
|  | unicode = 0x5c; | 
|  | #endif | 
|  | } | 
|  | } | 
|  | if (!face) | 
|  | return unicode; | 
|  |  | 
|  | int err = FXFT_Select_Charmap(face, FT_ENCODING_UNICODE); | 
|  | if (err) { | 
|  | int i; | 
|  | for (i = 0; i < FXFT_Get_Face_CharmapCount(face); i++) { | 
|  | uint32_t ret = FT_CharCodeFromUnicode( | 
|  | FXFT_Get_Charmap_Encoding(FXFT_Get_Face_Charmaps(face)[i]), | 
|  | static_cast<wchar_t>(charcode)); | 
|  | if (ret == 0) | 
|  | continue; | 
|  | FT_Set_Charmap(face, FXFT_Get_Face_Charmaps(face)[i]); | 
|  | unicode = static_cast<wchar_t>(ret); | 
|  | break; | 
|  | } | 
|  | if (i == FXFT_Get_Face_CharmapCount(face) && i) { | 
|  | FT_Set_Charmap(face, FXFT_Get_Face_Charmaps(face)[0]); | 
|  | unicode = static_cast<wchar_t>(charcode); | 
|  | } | 
|  | } | 
|  | if (FXFT_Get_Face_Charmap(face)) { | 
|  | int index = GetGlyphIndex(unicode, pVertGlyph); | 
|  | return index != 0 ? index : -1; | 
|  | } | 
|  | return unicode; | 
|  | } | 
|  |  | 
|  | if (!m_Font.GetFaceRec()) | 
|  | return -1; | 
|  |  | 
|  | uint16_t cid = CIDFromCharCode(charcode); | 
|  | if (!m_pStreamAcc) { | 
|  | if (m_bType1) | 
|  | return cid; | 
|  | if (m_pFontFile && m_pCMap->IsDirectCharcodeToCIDTableIsEmpty()) | 
|  | return cid; | 
|  | if (m_pCMap->GetCoding() == CIDCODING_UNKNOWN || | 
|  | !FXFT_Get_Face_Charmap(m_Font.GetFaceRec())) { | 
|  | return cid; | 
|  | } | 
|  | if (FXFT_Get_Charmap_Encoding(FXFT_Get_Face_Charmap(m_Font.GetFaceRec())) == | 
|  | FT_ENCODING_UNICODE) { | 
|  | WideString unicode_str = UnicodeFromCharCode(charcode); | 
|  | if (unicode_str.IsEmpty()) | 
|  | return -1; | 
|  |  | 
|  | charcode = unicode_str[0]; | 
|  | } | 
|  | return GetGlyphIndex(charcode, pVertGlyph); | 
|  | } | 
|  | uint32_t byte_pos = cid * 2; | 
|  | if (byte_pos + 2 > m_pStreamAcc->GetSize()) | 
|  | return -1; | 
|  |  | 
|  | const uint8_t* pdata = m_pStreamAcc->GetData() + byte_pos; | 
|  | return pdata[0] * 256 + pdata[1]; | 
|  | } | 
|  |  | 
|  | uint32_t CPDF_CIDFont::GetNextChar(ByteStringView pString, | 
|  | size_t* pOffset) const { | 
|  | return m_pCMap->GetNextChar(pString, pOffset); | 
|  | } | 
|  |  | 
|  | int CPDF_CIDFont::GetCharSize(uint32_t charcode) const { | 
|  | return m_pCMap->GetCharSize(charcode); | 
|  | } | 
|  |  | 
|  | size_t CPDF_CIDFont::CountChar(ByteStringView pString) const { | 
|  | return m_pCMap->CountChar(pString); | 
|  | } | 
|  |  | 
|  | int CPDF_CIDFont::AppendChar(char* str, uint32_t charcode) const { | 
|  | return m_pCMap->AppendChar(str, charcode); | 
|  | } | 
|  |  | 
|  | bool CPDF_CIDFont::IsUnicodeCompatible() const { | 
|  | if (m_pCID2UnicodeMap && m_pCID2UnicodeMap->IsLoaded() && m_pCMap->IsLoaded()) | 
|  | return true; | 
|  | return m_pCMap->GetCoding() != CIDCODING_UNKNOWN; | 
|  | } | 
|  |  | 
|  | void CPDF_CIDFont::LoadSubstFont() { | 
|  | FX_SAFE_INT32 safeStemV(m_StemV); | 
|  | safeStemV *= 5; | 
|  | m_Font.LoadSubst(m_BaseFontName, !m_bType1, m_Flags, | 
|  | safeStemV.ValueOrDefault(FXFONT_FW_NORMAL), m_ItalicAngle, | 
|  | g_CharsetCPs[m_Charset], IsVertWriting()); | 
|  | } | 
|  |  | 
|  | void CPDF_CIDFont::LoadMetricsArray(const CPDF_Array* pArray, | 
|  | std::vector<uint32_t>* result, | 
|  | int nElements) { | 
|  | int width_status = 0; | 
|  | int iCurElement = 0; | 
|  | uint32_t first_code = 0; | 
|  | uint32_t last_code = 0; | 
|  | for (size_t i = 0; i < pArray->size(); i++) { | 
|  | const CPDF_Object* pObj = pArray->GetDirectObjectAt(i); | 
|  | if (!pObj) | 
|  | continue; | 
|  |  | 
|  | if (const CPDF_Array* pObjArray = pObj->AsArray()) { | 
|  | if (width_status != 1) | 
|  | return; | 
|  | if (first_code > | 
|  | std::numeric_limits<uint32_t>::max() - pObjArray->size()) { | 
|  | width_status = 0; | 
|  | continue; | 
|  | } | 
|  |  | 
|  | for (size_t j = 0; j < pObjArray->size(); j += nElements) { | 
|  | result->push_back(first_code); | 
|  | result->push_back(first_code); | 
|  | for (int k = 0; k < nElements; k++) | 
|  | result->push_back(pObjArray->GetIntegerAt(j + k)); | 
|  | first_code++; | 
|  | } | 
|  | width_status = 0; | 
|  | } else { | 
|  | if (width_status == 0) { | 
|  | first_code = pObj->GetInteger(); | 
|  | width_status = 1; | 
|  | } else if (width_status == 1) { | 
|  | last_code = pObj->GetInteger(); | 
|  | width_status = 2; | 
|  | iCurElement = 0; | 
|  | } else { | 
|  | if (!iCurElement) { | 
|  | result->push_back(first_code); | 
|  | result->push_back(last_code); | 
|  | } | 
|  | result->push_back(pObj->GetInteger()); | 
|  | iCurElement++; | 
|  | if (iCurElement == nElements) | 
|  | width_status = 0; | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | // static | 
|  | float CPDF_CIDFont::CIDTransformToFloat(uint8_t ch) { | 
|  | return (ch < 128 ? ch : ch - 255) * (1.0f / 127); | 
|  | } | 
|  |  | 
|  | void CPDF_CIDFont::LoadGB2312() { | 
|  | m_BaseFontName = m_pFontDict->GetStringFor("BaseFont"); | 
|  | m_Charset = CIDSET_GB1; | 
|  |  | 
|  | CPDF_CMapManager* manager = CPDF_FontGlobals::GetInstance()->GetCMapManager(); | 
|  | m_pCMap = manager->GetPredefinedCMap("GBK-EUC-H"); | 
|  | m_pCID2UnicodeMap = manager->GetCID2UnicodeMap(m_Charset); | 
|  | const CPDF_Dictionary* pFontDesc = m_pFontDict->GetDictFor("FontDescriptor"); | 
|  | if (pFontDesc) | 
|  | LoadFontDescriptor(pFontDesc); | 
|  |  | 
|  | if (!IsEmbedded()) | 
|  | LoadSubstFont(); | 
|  | CheckFontMetrics(); | 
|  | m_bAnsiWidthsFixed = true; | 
|  | } | 
|  |  | 
|  | const uint8_t* CPDF_CIDFont::GetCIDTransform(uint16_t CID) const { | 
|  | if (m_Charset != CIDSET_JAPAN1 || m_pFontFile) | 
|  | return nullptr; | 
|  |  | 
|  | const auto* pEnd = g_Japan1_VertCIDs + FX_ArraySize(g_Japan1_VertCIDs); | 
|  | const auto* pTransform = std::lower_bound( | 
|  | g_Japan1_VertCIDs, pEnd, CID, | 
|  | [](const CIDTransform& entry, uint16_t cid) { return entry.cid < cid; }); | 
|  | return (pTransform < pEnd && CID == pTransform->cid) ? &pTransform->a | 
|  | : nullptr; | 
|  | } |