core/fpdfapi/fpdf_font/fpdf_font_cid.cpp - pdfium - Git at Google

 // Copyright 2014 PDFium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com

 #include "core/fpdfapi/fpdf_font/font_int.h"

 #include "core/fpdfapi/fpdf_cmaps/cmap_int.h"
 #include "core/fpdfapi/fpdf_font/ttgsubtable.h"
 #include "core/fpdfapi/fpdf_parser/include/cpdf_array.h"
 #include "core/fpdfapi/fpdf_parser/include/cpdf_dictionary.h"
 #include "core/fpdfapi/fpdf_parser/include/cpdf_simple_parser.h"
 #include "core/fpdfapi/include/cpdf_modulemgr.h"
 #include "core/fxcrt/include/fx_ext.h"
 #include "core/fxge/include/fx_freetype.h"
 #include "core/fxge/include/fx_ge.h"

 namespace {

 const FX_CHAR* const g_CharsetNames[CIDSET_NUM_SETS] = {
     nullptr, "GB1", "CNS1", "Japan1", "Korea1", "UCS"};


 class CPDF_PredefinedCMap {
  public:
   const FX_CHAR* m_pName;
   CIDSet m_Charset;
   CIDCoding m_Coding;
   CPDF_CMap::CodingScheme m_CodingScheme;
   uint8_t m_LeadingSegCount;
   uint8_t m_LeadingSegs[4];
 };

 const CPDF_PredefinedCMap g_PredefinedCMaps[] = {
     {"GB-EUC",
      CIDSET_GB1,
      CIDCODING_GB,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0xa1, 0xfe}},
     {"GBpc-EUC",
      CIDSET_GB1,
      CIDCODING_GB,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0xa1, 0xfc}},
     {"GBK-EUC",
      CIDSET_GB1,
      CIDCODING_GB,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0x81, 0xfe}},
     {"GBKp-EUC",
      CIDSET_GB1,
      CIDCODING_GB,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0x81, 0xfe}},
     {"GBK2K-EUC",
      CIDSET_GB1,
      CIDCODING_GB,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0x81, 0xfe}},
     {"GBK2K",
      CIDSET_GB1,
      CIDCODING_GB,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0x81, 0xfe}},
     {"UniGB-UCS2", CIDSET_GB1, CIDCODING_UCS2, CPDF_CMap::TwoBytes, 0, {}},
     {"UniGB-UTF16", CIDSET_GB1, CIDCODING_UTF16, CPDF_CMap::TwoBytes, 0, {}},
     {"B5pc",
      CIDSET_CNS1,
      CIDCODING_BIG5,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0xa1, 0xfc}},
     {"HKscs-B5",
      CIDSET_CNS1,
      CIDCODING_BIG5,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0x88, 0xfe}},
     {"ETen-B5",
      CIDSET_CNS1,
      CIDCODING_BIG5,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0xa1, 0xfe}},
     {"ETenms-B5",
      CIDSET_CNS1,
      CIDCODING_BIG5,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0xa1, 0xfe}},
     {"UniCNS-UCS2", CIDSET_CNS1, CIDCODING_UCS2, CPDF_CMap::TwoBytes, 0, {}},
     {"UniCNS-UTF16", CIDSET_CNS1, CIDCODING_UTF16, CPDF_CMap::TwoBytes, 0, {}},
     {"83pv-RKSJ",
      CIDSET_JAPAN1,
      CIDCODING_JIS,
      CPDF_CMap::MixedTwoBytes,
      2,
      {0x81, 0x9f, 0xe0, 0xfc}},
     {"90ms-RKSJ",
      CIDSET_JAPAN1,
      CIDCODING_JIS,
      CPDF_CMap::MixedTwoBytes,
      2,
      {0x81, 0x9f, 0xe0, 0xfc}},
     {"90msp-RKSJ",
      CIDSET_JAPAN1,
      CIDCODING_JIS,
      CPDF_CMap::MixedTwoBytes,
      2,
      {0x81, 0x9f, 0xe0, 0xfc}},
     {"90pv-RKSJ",
      CIDSET_JAPAN1,
      CIDCODING_JIS,
      CPDF_CMap::MixedTwoBytes,
      2,
      {0x81, 0x9f, 0xe0, 0xfc}},
     {"Add-RKSJ",
      CIDSET_JAPAN1,
      CIDCODING_JIS,
      CPDF_CMap::MixedTwoBytes,
      2,
      {0x81, 0x9f, 0xe0, 0xfc}},
     {"EUC",
      CIDSET_JAPAN1,
      CIDCODING_JIS,
      CPDF_CMap::MixedTwoBytes,
      2,
      {0x8e, 0x8e, 0xa1, 0xfe}},
     {"H", CIDSET_JAPAN1, CIDCODING_JIS, CPDF_CMap::TwoBytes, 1, {0x21, 0x7e}},
     {"V", CIDSET_JAPAN1, CIDCODING_JIS, CPDF_CMap::TwoBytes, 1, {0x21, 0x7e}},
     {"Ext-RKSJ",
      CIDSET_JAPAN1,
      CIDCODING_JIS,
      CPDF_CMap::MixedTwoBytes,
      2,
      {0x81, 0x9f, 0xe0, 0xfc}},
     {"UniJIS-UCS2", CIDSET_JAPAN1, CIDCODING_UCS2, CPDF_CMap::TwoBytes, 0, {}},
     {"UniJIS-UCS2-HW",
      CIDSET_JAPAN1,
      CIDCODING_UCS2,
      CPDF_CMap::TwoBytes,
      0,
      {}},
     {"UniJIS-UTF16",
      CIDSET_JAPAN1,
      CIDCODING_UTF16,
      CPDF_CMap::TwoBytes,
      0,
      {}},
     {"KSC-EUC",
      CIDSET_KOREA1,
      CIDCODING_KOREA,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0xa1, 0xfe}},
     {"KSCms-UHC",
      CIDSET_KOREA1,
      CIDCODING_KOREA,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0x81, 0xfe}},
     {"KSCms-UHC-HW",
      CIDSET_KOREA1,
      CIDCODING_KOREA,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0x81, 0xfe}},
     {"KSCpc-EUC",
      CIDSET_KOREA1,
      CIDCODING_KOREA,
      CPDF_CMap::MixedTwoBytes,
      1,
      {0xa1, 0xfd}},
     {"UniKS-UCS2", CIDSET_KOREA1, CIDCODING_UCS2, CPDF_CMap::TwoBytes, 0, {}},
     {"UniKS-UTF16", CIDSET_KOREA1, CIDCODING_UTF16, CPDF_CMap::TwoBytes, 0, {}},
 };

 CIDSet CIDSetFromSizeT(size_t index) {
   if (index >= CIDSET_NUM_SETS) {
     NOTREACHED();
     return CIDSET_UNKNOWN;
   }
   return static_cast<CIDSet>(index);
 }

 CFX_ByteStringC CMap_GetString(const CFX_ByteStringC& word) {
   if (word.GetLength() <= 2)
     return CFX_ByteStringC();
   return CFX_ByteStringC(&word[1], word.GetLength() - 2);
 }

 int CompareDWORD(const void* data1, const void* data2) {
   return (*(uint32_t*)data1) - (*(uint32_t*)data2);
 }

 int CompareCID(const void* key, const void* element) {
   if ((*(uint32_t*)key) < (*(uint32_t*)element)) {
     return -1;
   }
   if ((*(uint32_t*)key) >
       (*(uint32_t*)element) + ((uint32_t*)element)[1] / 65536) {
     return 1;
   }
   return 0;
 }

 int CheckCodeRange(uint8_t* codes,
                    int size,
                    CMap_CodeRange* pRanges,
                    int nRanges) {
   int iSeg = nRanges - 1;
   while (iSeg >= 0) {
     if (pRanges[iSeg].m_CharSize < size) {
       --iSeg;
       continue;
     }
     int iChar = 0;
     while (iChar < size) {
       if (codes[iChar] < pRanges[iSeg].m_Lower[iChar] ||
           codes[iChar] > pRanges[iSeg].m_Upper[iChar]) {
         break;
       }
       ++iChar;
     }
     if (iChar == pRanges[iSeg].m_CharSize)
       return 2;

     if (iChar)
       return (size == pRanges[iSeg].m_CharSize) ? 2 : 1;
     iSeg--;
   }
   return 0;
 }

 int GetCharSizeImpl(uint32_t charcode,
                     CMap_CodeRange* pRanges,
                     int iRangesSize) {
   if (!iRangesSize)
     return 1;

   uint8_t codes[4];
   codes[0] = codes[1] = 0x00;
   codes[2] = (uint8_t)(charcode >> 8 & 0xFF);
   codes[3] = (uint8_t)charcode;
   int offset = 0;
   int size = 4;
   for (int i = 0; i < 4; ++i) {
     int iSeg = iRangesSize - 1;
     while (iSeg >= 0) {
       if (pRanges[iSeg].m_CharSize < size) {
         --iSeg;
         continue;
       }
       int iChar = 0;
       while (iChar < size) {
         if (codes[offset + iChar] < pRanges[iSeg].m_Lower[iChar] ||
             codes[offset + iChar] > pRanges[iSeg].m_Upper[iChar]) {
           break;
         }
         ++iChar;
       }
       if (iChar == pRanges[iSeg].m_CharSize)
         return size;
       --iSeg;
     }
     --size;
     ++offset;
   }
   return 1;
 }

 }  // namespace

 CPDF_CMapManager::CPDF_CMapManager() {
   m_bPrompted = FALSE;
   FXSYS_memset(m_CID2UnicodeMaps, 0, sizeof m_CID2UnicodeMaps);
 }
 CPDF_CMapManager::~CPDF_CMapManager() {
   for (const auto& pair : m_CMaps) {
     delete pair.second;
   }
   m_CMaps.clear();
   for (size_t i = 0; i < FX_ArraySize(m_CID2UnicodeMaps); ++i) {
     delete m_CID2UnicodeMaps[i];
   }
 }
 CPDF_CMap* CPDF_CMapManager::GetPredefinedCMap(const CFX_ByteString& name,
                                                FX_BOOL bPromptCJK) {
   auto it = m_CMaps.find(name);
   if (it != m_CMaps.end()) {
     return it->second;
   }
   CPDF_CMap* pCMap = LoadPredefinedCMap(name, bPromptCJK);
   if (!name.IsEmpty()) {
     m_CMaps[name] = pCMap;
   }
   return pCMap;
 }
 CPDF_CMap* CPDF_CMapManager::LoadPredefinedCMap(const CFX_ByteString& name,
                                                 FX_BOOL bPromptCJK) {
   CPDF_CMap* pCMap = new CPDF_CMap;
   const FX_CHAR* pname = name.c_str();
   if (*pname == '/') {
     pname++;
   }
   pCMap->LoadPredefined(this, pname, bPromptCJK);
   return pCMap;
 }

 void CPDF_CMapManager::ReloadAll() {
   for (const auto& pair : m_CMaps) {
     CPDF_CMap* pCMap = pair.second;
     pCMap->LoadPredefined(this, pair.first.c_str(), FALSE);
   }
   for (size_t i = 0; i < FX_ArraySize(m_CID2UnicodeMaps); ++i) {
     if (CPDF_CID2UnicodeMap* pMap = m_CID2UnicodeMaps[i]) {
       pMap->Load(this, CIDSetFromSizeT(i), FALSE);
     }
   }
 }
 CPDF_CID2UnicodeMap* CPDF_CMapManager::GetCID2UnicodeMap(CIDSet charset,
                                                          FX_BOOL bPromptCJK) {
   if (!m_CID2UnicodeMaps[charset])
     m_CID2UnicodeMaps[charset] = LoadCID2UnicodeMap(charset, bPromptCJK);
   return m_CID2UnicodeMaps[charset];
 }
 CPDF_CID2UnicodeMap* CPDF_CMapManager::LoadCID2UnicodeMap(CIDSet charset,
                                                           FX_BOOL bPromptCJK) {
   CPDF_CID2UnicodeMap* pMap = new CPDF_CID2UnicodeMap();
   if (!pMap->Initialize()) {
     delete pMap;
     return NULL;
   }
   pMap->Load(this, charset, bPromptCJK);
   return pMap;
 }
 CPDF_CMapParser::CPDF_CMapParser() {
   m_pCMap = NULL;
   m_Status = 0;
   m_CodeSeq = 0;
 }
 FX_BOOL CPDF_CMapParser::Initialize(CPDF_CMap* pCMap) {
   m_pCMap = pCMap;
   m_Status = 0;
   m_CodeSeq = 0;
   m_AddMaps.EstimateSize(0, 10240);
   return TRUE;
 }

 void CPDF_CMapParser::ParseWord(const CFX_ByteStringC& word) {
   if (word.IsEmpty()) {
     return;
   }
   if (word == "begincidchar") {
     m_Status = 1;
     m_CodeSeq = 0;
   } else if (word == "begincidrange") {
     m_Status = 2;
     m_CodeSeq = 0;
   } else if (word == "endcidrange" || word == "endcidchar") {
     m_Status = 0;
   } else if (word == "/WMode") {
     m_Status = 6;
   } else if (word == "/Registry") {
     m_Status = 3;
   } else if (word == "/Ordering") {
     m_Status = 4;
   } else if (word == "/Supplement") {
     m_Status = 5;
   } else if (word == "begincodespacerange") {
     m_Status = 7;
     m_CodeSeq = 0;
   } else if (word == "usecmap") {
   } else if (m_Status == 1 || m_Status == 2) {
     m_CodePoints[m_CodeSeq] = CMap_GetCode(word);
     m_CodeSeq++;
     uint32_t StartCode, EndCode;
     uint16_t StartCID;
     if (m_Status == 1) {
       if (m_CodeSeq < 2) {
         return;
       }
       EndCode = StartCode = m_CodePoints[0];
       StartCID = (uint16_t)m_CodePoints[1];
     } else {
       if (m_CodeSeq < 3) {
         return;
       }
       StartCode = m_CodePoints[0];
       EndCode = m_CodePoints[1];
       StartCID = (uint16_t)m_CodePoints[2];
     }
     if (EndCode < 0x10000) {
       for (uint32_t code = StartCode; code <= EndCode; code++) {
         m_pCMap->m_pMapping[code] = (uint16_t)(StartCID + code - StartCode);
       }
     } else {
       uint32_t buf[2];
       buf[0] = StartCode;
       buf[1] = ((EndCode - StartCode) << 16) + StartCID;
       m_AddMaps.AppendBlock(buf, sizeof buf);
     }
     m_CodeSeq = 0;
   } else if (m_Status == 3) {
     m_Status = 0;
   } else if (m_Status == 4) {
     m_pCMap->m_Charset = CharsetFromOrdering(CMap_GetString(word));
     m_Status = 0;
   } else if (m_Status == 5) {
     m_Status = 0;
   } else if (m_Status == 6) {
     m_pCMap->m_bVertical = CMap_GetCode(word);
     m_Status = 0;
   } else if (m_Status == 7) {
     if (word == "endcodespacerange") {
       int nSegs = m_CodeRanges.GetSize();
       if (nSegs > 1) {
         m_pCMap->m_CodingScheme = CPDF_CMap::MixedFourBytes;
         m_pCMap->m_nCodeRanges = nSegs;
         m_pCMap->m_pLeadingBytes =
             FX_Alloc2D(uint8_t, nSegs, sizeof(CMap_CodeRange));
         FXSYS_memcpy(m_pCMap->m_pLeadingBytes, m_CodeRanges.GetData(),
                      nSegs * sizeof(CMap_CodeRange));
       } else if (nSegs == 1) {
         m_pCMap->m_CodingScheme = (m_CodeRanges[0].m_CharSize == 2)
                                       ? CPDF_CMap::TwoBytes
                                       : CPDF_CMap::OneByte;
       }
       m_Status = 0;
     } else {
       if (word.GetLength() == 0 || word.GetAt(0) != '<') {
         return;
       }
       if (m_CodeSeq % 2) {
         CMap_CodeRange range;
         if (CMap_GetCodeRange(range, m_LastWord.AsStringC(), word)) {
           m_CodeRanges.Add(range);
         }
       }
       m_CodeSeq++;
     }
   }
   m_LastWord = word;
 }

 // Static.
 uint32_t CPDF_CMapParser::CMap_GetCode(const CFX_ByteStringC& word) {
   int num = 0;
   if (word.GetAt(0) == '<') {
     for (int i = 1; i < word.GetLength() && std::isxdigit(word.GetAt(i)); ++i)
       num = num * 16 + FXSYS_toHexDigit(word.GetAt(i));
     return num;
   }

   for (int i = 0; i < word.GetLength() && std::isdigit(word.GetAt(i)); ++i)
     num = num * 10 + FXSYS_toDecimalDigit(static_cast<FX_WCHAR>(word.GetAt(i)));
   return num;
 }

 // Static.
 bool CPDF_CMapParser::CMap_GetCodeRange(CMap_CodeRange& range,
                                         const CFX_ByteStringC& first,
                                         const CFX_ByteStringC& second) {
   if (first.GetLength() == 0 || first.GetAt(0) != '<')
     return false;

   int i;
   for (i = 1; i < first.GetLength(); ++i) {
     if (first.GetAt(i) == '>') {
       break;
     }
   }
   range.m_CharSize = (i - 1) / 2;
   if (range.m_CharSize > 4)
     return false;

   for (i = 0; i < range.m_CharSize; ++i) {
     uint8_t digit1 = first.GetAt(i * 2 + 1);
     uint8_t digit2 = first.GetAt(i * 2 + 2);
     range.m_Lower[i] = FXSYS_toHexDigit(digit1) * 16 + FXSYS_toHexDigit(digit2);
   }

   uint32_t size = second.GetLength();
   for (i = 0; i < range.m_CharSize; ++i) {
     uint8_t digit1 = ((uint32_t)i * 2 + 1 < size)
                          ? second.GetAt((FX_STRSIZE)i * 2 + 1)
                          : '0';
     uint8_t digit2 = ((uint32_t)i * 2 + 2 < size)
                          ? second.GetAt((FX_STRSIZE)i * 2 + 2)
                          : '0';
     range.m_Upper[i] = FXSYS_toHexDigit(digit1) * 16 + FXSYS_toHexDigit(digit2);
   }
   return true;
 }

 CPDF_CMap::CPDF_CMap() {
   m_Charset = CIDSET_UNKNOWN;
   m_Coding = CIDCODING_UNKNOWN;
   m_CodingScheme = TwoBytes;
   m_bVertical = 0;
   m_bLoaded = FALSE;
   m_pMapping = NULL;
   m_pLeadingBytes = NULL;
   m_pAddMapping = NULL;
   m_pEmbedMap = NULL;
   m_pUseMap = NULL;
   m_nCodeRanges = 0;
 }
 CPDF_CMap::~CPDF_CMap() {
   FX_Free(m_pMapping);
   FX_Free(m_pAddMapping);
   FX_Free(m_pLeadingBytes);
   delete m_pUseMap;
 }
 void CPDF_CMap::Release() {
   if (m_PredefinedCMap.IsEmpty()) {
     delete this;
   }
 }

 FX_BOOL CPDF_CMap::LoadPredefined(CPDF_CMapManager* pMgr,
                                   const FX_CHAR* pName,
                                   FX_BOOL bPromptCJK) {
   m_PredefinedCMap = pName;
   if (m_PredefinedCMap == "Identity-H" || m_PredefinedCMap == "Identity-V") {
     m_Coding = CIDCODING_CID;
     m_bVertical = pName[9] == 'V';
     m_bLoaded = TRUE;
     return TRUE;
   }
   CFX_ByteString cmapid = m_PredefinedCMap;
   m_bVertical = cmapid.Right(1) == "V";
   if (cmapid.GetLength() > 2) {
     cmapid = cmapid.Left(cmapid.GetLength() - 2);
   }
   const CPDF_PredefinedCMap* map = nullptr;
   for (size_t i = 0; i < FX_ArraySize(g_PredefinedCMaps); ++i) {
     if (cmapid == CFX_ByteStringC(g_PredefinedCMaps[i].m_pName)) {
       map = &g_PredefinedCMaps[i];
       break;
     }
   }
   if (!map)
     return FALSE;

   m_Charset = map->m_Charset;
   m_Coding = map->m_Coding;
   m_CodingScheme = map->m_CodingScheme;
   if (m_CodingScheme == MixedTwoBytes) {
     m_pLeadingBytes = FX_Alloc(uint8_t, 256);
     for (uint32_t i = 0; i < map->m_LeadingSegCount; ++i) {
       const uint8_t* segs = map->m_LeadingSegs;
       for (int b = segs[i * 2]; b <= segs[i * 2 + 1]; ++b) {
         m_pLeadingBytes[b] = 1;
       }
     }
   }
   FPDFAPI_FindEmbeddedCMap(pName, m_Charset, m_Coding, m_pEmbedMap);
   if (m_pEmbedMap) {
     m_bLoaded = TRUE;
     return TRUE;
   }
   return FALSE;
 }
 FX_BOOL CPDF_CMap::LoadEmbedded(const uint8_t* pData, uint32_t size) {
   m_pMapping = FX_Alloc(uint16_t, 65536);
   CPDF_CMapParser parser;
   parser.Initialize(this);
   CPDF_SimpleParser syntax(pData, size);
   while (1) {
     CFX_ByteStringC word = syntax.GetWord();
     if (word.IsEmpty()) {
       break;
     }
     parser.ParseWord(word);
   }
   if (m_CodingScheme == MixedFourBytes && parser.m_AddMaps.GetSize()) {
     m_pAddMapping = FX_Alloc(uint8_t, parser.m_AddMaps.GetSize() + 4);
     *(uint32_t*)m_pAddMapping = parser.m_AddMaps.GetSize() / 8;
     FXSYS_memcpy(m_pAddMapping + 4, parser.m_AddMaps.GetBuffer(),
                  parser.m_AddMaps.GetSize());
     FXSYS_qsort(m_pAddMapping + 4, parser.m_AddMaps.GetSize() / 8, 8,
                 CompareDWORD);
   }
   return TRUE;
 }

 uint16_t CPDF_CMap::CIDFromCharCode(uint32_t charcode) const {
   if (m_Coding == CIDCODING_CID) {
     return (uint16_t)charcode;
   }
   if (m_pEmbedMap) {
     return FPDFAPI_CIDFromCharCode(m_pEmbedMap, charcode);
   }
   if (!m_pMapping) {
     return (uint16_t)charcode;
   }
   if (charcode >> 16) {
     if (m_pAddMapping) {
       void* found = FXSYS_bsearch(&charcode, m_pAddMapping + 4,
                                   *(uint32_t*)m_pAddMapping, 8, CompareCID);
       if (!found) {
         if (m_pUseMap) {
           return m_pUseMap->CIDFromCharCode(charcode);
         }
         return 0;
       }
       return (uint16_t)(((uint32_t*)found)[1] % 65536 + charcode -
                         *(uint32_t*)found);
     }
     if (m_pUseMap)
       return m_pUseMap->CIDFromCharCode(charcode);
     return 0;
   }
   uint32_t CID = m_pMapping[charcode];
   if (!CID && m_pUseMap)
     return m_pUseMap->CIDFromCharCode(charcode);
   return (uint16_t)CID;
 }

 uint32_t CPDF_CMap::GetNextChar(const FX_CHAR* pString,
                                 int nStrLen,
                                 int& offset) const {
   switch (m_CodingScheme) {
     case OneByte:
       return ((uint8_t*)pString)[offset++];
     case TwoBytes:
       offset += 2;
       return ((uint8_t*)pString)[offset - 2] * 256 +
              ((uint8_t*)pString)[offset - 1];
     case MixedTwoBytes: {
       uint8_t byte1 = ((uint8_t*)pString)[offset++];
       if (!m_pLeadingBytes[byte1]) {
         return byte1;
       }
       uint8_t byte2 = ((uint8_t*)pString)[offset++];
       return byte1 * 256 + byte2;
     }
     case MixedFourBytes: {
       uint8_t codes[4];
       int char_size = 1;
       codes[0] = ((uint8_t*)pString)[offset++];
       CMap_CodeRange* pRanges = (CMap_CodeRange*)m_pLeadingBytes;
       while (1) {
         int ret = CheckCodeRange(codes, char_size, pRanges, m_nCodeRanges);
         if (ret == 0) {
           return 0;
         }
         if (ret == 2) {
           uint32_t charcode = 0;
           for (int i = 0; i < char_size; i++) {
             charcode = (charcode << 8) + codes[i];
           }
           return charcode;
         }
         if (char_size == 4 || offset == nStrLen) {
           return 0;
         }
         codes[char_size++] = ((uint8_t*)pString)[offset++];
       }
       break;
     }
   }
   return 0;
 }
 int CPDF_CMap::GetCharSize(uint32_t charcode) const {
   switch (m_CodingScheme) {
     case OneByte:
       return 1;
     case TwoBytes:
       return 2;
     case MixedTwoBytes:
     case MixedFourBytes:
       if (charcode < 0x100) {
         return 1;
       }
       if (charcode < 0x10000) {
         return 2;
       }
       if (charcode < 0x1000000) {
         return 3;
       }
       return 4;
   }
   return 1;
 }
 int CPDF_CMap::CountChar(const FX_CHAR* pString, int size) const {
   switch (m_CodingScheme) {
     case OneByte:
       return size;
     case TwoBytes:
       return (size + 1) / 2;
     case MixedTwoBytes: {
       int count = 0;
       for (int i = 0; i < size; i++) {
         count++;
         if (m_pLeadingBytes[((uint8_t*)pString)[i]]) {
           i++;
         }
       }
       return count;
     }
     case MixedFourBytes: {
       int count = 0, offset = 0;
       while (offset < size) {
         GetNextChar(pString, size, offset);
         count++;
       }
       return count;
     }
   }
   return size;
 }

 int CPDF_CMap::AppendChar(FX_CHAR* str, uint32_t charcode) const {
   switch (m_CodingScheme) {
     case OneByte:
       str[0] = (uint8_t)charcode;
       return 1;
     case TwoBytes:
       str[0] = (uint8_t)(charcode / 256);
       str[1] = (uint8_t)(charcode % 256);
       return 2;
     case MixedTwoBytes:
     case MixedFourBytes:
       if (charcode < 0x100) {
         CMap_CodeRange* pRanges = (CMap_CodeRange*)m_pLeadingBytes;
         int iSize = GetCharSizeImpl(charcode, pRanges, m_nCodeRanges);
         if (iSize == 0) {
           iSize = 1;
         }
         if (iSize > 1) {
           FXSYS_memset(str, 0, sizeof(uint8_t) * iSize);
         }
         str[iSize - 1] = (uint8_t)charcode;
         return iSize;
       }
       if (charcode < 0x10000) {
         str[0] = (uint8_t)(charcode >> 8);
         str[1] = (uint8_t)charcode;
         return 2;
       }
       if (charcode < 0x1000000) {
         str[0] = (uint8_t)(charcode >> 16);
         str[1] = (uint8_t)(charcode >> 8);
         str[2] = (uint8_t)charcode;
         return 3;
       }
       str[0] = (uint8_t)(charcode >> 24);
       str[1] = (uint8_t)(charcode >> 16);
       str[2] = (uint8_t)(charcode >> 8);
       str[3] = (uint8_t)charcode;
       return 4;
   }
   return 0;
 }
 CPDF_CID2UnicodeMap::CPDF_CID2UnicodeMap() {
   m_EmbeddedCount = 0;
 }
 CPDF_CID2UnicodeMap::~CPDF_CID2UnicodeMap() {}
 FX_BOOL CPDF_CID2UnicodeMap::Initialize() {
   return TRUE;
 }
 FX_BOOL CPDF_CID2UnicodeMap::IsLoaded() {
   return m_EmbeddedCount != 0;
 }
 FX_WCHAR CPDF_CID2UnicodeMap::UnicodeFromCID(uint16_t CID) {
   if (m_Charset == CIDSET_UNICODE) {
     return CID;
   }
   if (CID < m_EmbeddedCount) {
     return m_pEmbeddedMap[CID];
   }
   return 0;
 }

 void CPDF_CID2UnicodeMap::Load(CPDF_CMapManager* pMgr,
                                CIDSet charset,
                                FX_BOOL bPromptCJK) {
   m_Charset = charset;
   FPDFAPI_LoadCID2UnicodeMap(charset, m_pEmbeddedMap, m_EmbeddedCount);
 }

 CIDSet CharsetFromOrdering(const CFX_ByteStringC& ordering) {
   for (size_t charset = 1; charset < FX_ArraySize(g_CharsetNames); ++charset) {
     if (ordering == g_CharsetNames[charset])
       return CIDSetFromSizeT(charset);
   }
   return CIDSET_UNKNOWN;
 }
	// Copyright 2014 PDFium Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com

	#include "core/fpdfapi/fpdf_font/font_int.h"

	#include "core/fpdfapi/fpdf_cmaps/cmap_int.h"
	#include "core/fpdfapi/fpdf_font/ttgsubtable.h"
	#include "core/fpdfapi/fpdf_parser/include/cpdf_array.h"
	#include "core/fpdfapi/fpdf_parser/include/cpdf_dictionary.h"
	#include "core/fpdfapi/fpdf_parser/include/cpdf_simple_parser.h"
	#include "core/fpdfapi/include/cpdf_modulemgr.h"
	#include "core/fxcrt/include/fx_ext.h"
	#include "core/fxge/include/fx_freetype.h"
	#include "core/fxge/include/fx_ge.h"

	namespace {

	const FX_CHAR* const g_CharsetNames[CIDSET_NUM_SETS] = {
	nullptr, "GB1", "CNS1", "Japan1", "Korea1", "UCS"};


	class CPDF_PredefinedCMap {
	public:
	const FX_CHAR* m_pName;
	CIDSet m_Charset;
	CIDCoding m_Coding;
	CPDF_CMap::CodingScheme m_CodingScheme;
	uint8_t m_LeadingSegCount;
	uint8_t m_LeadingSegs[4];
	};

	const CPDF_PredefinedCMap g_PredefinedCMaps[] = {
	{"GB-EUC",
	CIDSET_GB1,
	CIDCODING_GB,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0xa1, 0xfe}},
	{"GBpc-EUC",
	CIDSET_GB1,
	CIDCODING_GB,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0xa1, 0xfc}},
	{"GBK-EUC",
	CIDSET_GB1,
	CIDCODING_GB,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0x81, 0xfe}},
	{"GBKp-EUC",
	CIDSET_GB1,
	CIDCODING_GB,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0x81, 0xfe}},
	{"GBK2K-EUC",
	CIDSET_GB1,
	CIDCODING_GB,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0x81, 0xfe}},
	{"GBK2K",
	CIDSET_GB1,
	CIDCODING_GB,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0x81, 0xfe}},
	{"UniGB-UCS2", CIDSET_GB1, CIDCODING_UCS2, CPDF_CMap::TwoBytes, 0, {}},
	{"UniGB-UTF16", CIDSET_GB1, CIDCODING_UTF16, CPDF_CMap::TwoBytes, 0, {}},
	{"B5pc",
	CIDSET_CNS1,
	CIDCODING_BIG5,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0xa1, 0xfc}},
	{"HKscs-B5",
	CIDSET_CNS1,
	CIDCODING_BIG5,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0x88, 0xfe}},
	{"ETen-B5",
	CIDSET_CNS1,
	CIDCODING_BIG5,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0xa1, 0xfe}},
	{"ETenms-B5",
	CIDSET_CNS1,
	CIDCODING_BIG5,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0xa1, 0xfe}},
	{"UniCNS-UCS2", CIDSET_CNS1, CIDCODING_UCS2, CPDF_CMap::TwoBytes, 0, {}},
	{"UniCNS-UTF16", CIDSET_CNS1, CIDCODING_UTF16, CPDF_CMap::TwoBytes, 0, {}},
	{"83pv-RKSJ",
	CIDSET_JAPAN1,
	CIDCODING_JIS,
	CPDF_CMap::MixedTwoBytes,
	2,
	{0x81, 0x9f, 0xe0, 0xfc}},
	{"90ms-RKSJ",
	CIDSET_JAPAN1,
	CIDCODING_JIS,
	CPDF_CMap::MixedTwoBytes,
	2,
	{0x81, 0x9f, 0xe0, 0xfc}},
	{"90msp-RKSJ",
	CIDSET_JAPAN1,
	CIDCODING_JIS,
	CPDF_CMap::MixedTwoBytes,
	2,
	{0x81, 0x9f, 0xe0, 0xfc}},
	{"90pv-RKSJ",
	CIDSET_JAPAN1,
	CIDCODING_JIS,
	CPDF_CMap::MixedTwoBytes,
	2,
	{0x81, 0x9f, 0xe0, 0xfc}},
	{"Add-RKSJ",
	CIDSET_JAPAN1,
	CIDCODING_JIS,
	CPDF_CMap::MixedTwoBytes,
	2,
	{0x81, 0x9f, 0xe0, 0xfc}},
	{"EUC",
	CIDSET_JAPAN1,
	CIDCODING_JIS,
	CPDF_CMap::MixedTwoBytes,
	2,
	{0x8e, 0x8e, 0xa1, 0xfe}},
	{"H", CIDSET_JAPAN1, CIDCODING_JIS, CPDF_CMap::TwoBytes, 1, {0x21, 0x7e}},
	{"V", CIDSET_JAPAN1, CIDCODING_JIS, CPDF_CMap::TwoBytes, 1, {0x21, 0x7e}},
	{"Ext-RKSJ",
	CIDSET_JAPAN1,
	CIDCODING_JIS,
	CPDF_CMap::MixedTwoBytes,
	2,
	{0x81, 0x9f, 0xe0, 0xfc}},
	{"UniJIS-UCS2", CIDSET_JAPAN1, CIDCODING_UCS2, CPDF_CMap::TwoBytes, 0, {}},
	{"UniJIS-UCS2-HW",
	CIDSET_JAPAN1,
	CIDCODING_UCS2,
	CPDF_CMap::TwoBytes,
	0,
	{}},
	{"UniJIS-UTF16",
	CIDSET_JAPAN1,
	CIDCODING_UTF16,
	CPDF_CMap::TwoBytes,
	0,
	{}},
	{"KSC-EUC",
	CIDSET_KOREA1,
	CIDCODING_KOREA,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0xa1, 0xfe}},
	{"KSCms-UHC",
	CIDSET_KOREA1,
	CIDCODING_KOREA,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0x81, 0xfe}},
	{"KSCms-UHC-HW",
	CIDSET_KOREA1,
	CIDCODING_KOREA,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0x81, 0xfe}},
	{"KSCpc-EUC",
	CIDSET_KOREA1,
	CIDCODING_KOREA,
	CPDF_CMap::MixedTwoBytes,
	1,
	{0xa1, 0xfd}},
	{"UniKS-UCS2", CIDSET_KOREA1, CIDCODING_UCS2, CPDF_CMap::TwoBytes, 0, {}},
	{"UniKS-UTF16", CIDSET_KOREA1, CIDCODING_UTF16, CPDF_CMap::TwoBytes, 0, {}},
	};

	CIDSet CIDSetFromSizeT(size_t index) {
	if (index >= CIDSET_NUM_SETS) {
	NOTREACHED();
	return CIDSET_UNKNOWN;
	}
	return static_cast<CIDSet>(index);
	}

	CFX_ByteStringC CMap_GetString(const CFX_ByteStringC& word) {
	if (word.GetLength() <= 2)
	return CFX_ByteStringC();
	return CFX_ByteStringC(&word[1], word.GetLength() - 2);
	}

	int CompareDWORD(const void* data1, const void* data2) {
	return ((uint32_t)data1) - ((uint32_t)data2);
	}

	int CompareCID(const void* key, const void* element) {
	if (((uint32_t)key) < ((uint32_t)element)) {
	return -1;
	}
	if (((uint32_t)key) >
	((uint32_t)element) + ((uint32_t*)element)[1] / 65536) {
	return 1;
	}
	return 0;
	}

	int CheckCodeRange(uint8_t* codes,
	int size,
	CMap_CodeRange* pRanges,
	int nRanges) {
	int iSeg = nRanges - 1;
	while (iSeg >= 0) {
	if (pRanges[iSeg].m_CharSize < size) {
	--iSeg;
	continue;
	}
	int iChar = 0;
	while (iChar < size) {
	if (codes[iChar] < pRanges[iSeg].m_Lower[iChar] \|\|
	codes[iChar] > pRanges[iSeg].m_Upper[iChar]) {
	break;
	}
	++iChar;
	}
	if (iChar == pRanges[iSeg].m_CharSize)
	return 2;

	if (iChar)
	return (size == pRanges[iSeg].m_CharSize) ? 2 : 1;
	iSeg--;
	}
	return 0;
	}

	int GetCharSizeImpl(uint32_t charcode,
	CMap_CodeRange* pRanges,
	int iRangesSize) {
	if (!iRangesSize)
	return 1;

	uint8_t codes[4];
	codes[0] = codes[1] = 0x00;
	codes[2] = (uint8_t)(charcode >> 8 & 0xFF);
	codes[3] = (uint8_t)charcode;
	int offset = 0;
	int size = 4;
	for (int i = 0; i < 4; ++i) {
	int iSeg = iRangesSize - 1;
	while (iSeg >= 0) {
	if (pRanges[iSeg].m_CharSize < size) {
	--iSeg;
	continue;
	}
	int iChar = 0;
	while (iChar < size) {
	if (codes[offset + iChar] < pRanges[iSeg].m_Lower[iChar] \|\|
	codes[offset + iChar] > pRanges[iSeg].m_Upper[iChar]) {
	break;
	}
	++iChar;
	}
	if (iChar == pRanges[iSeg].m_CharSize)
	return size;
	--iSeg;
	}
	--size;
	++offset;
	}
	return 1;
	}

	} // namespace

	CPDF_CMapManager::CPDF_CMapManager() {
	m_bPrompted = FALSE;
	FXSYS_memset(m_CID2UnicodeMaps, 0, sizeof m_CID2UnicodeMaps);
	}
	CPDF_CMapManager::~CPDF_CMapManager() {
	for (const auto& pair : m_CMaps) {
	delete pair.second;
	}
	m_CMaps.clear();
	for (size_t i = 0; i < FX_ArraySize(m_CID2UnicodeMaps); ++i) {
	delete m_CID2UnicodeMaps[i];
	}
	}
	CPDF_CMap* CPDF_CMapManager::GetPredefinedCMap(const CFX_ByteString& name,
	FX_BOOL bPromptCJK) {
	auto it = m_CMaps.find(name);
	if (it != m_CMaps.end()) {
	return it->second;
	}
	CPDF_CMap* pCMap = LoadPredefinedCMap(name, bPromptCJK);
	if (!name.IsEmpty()) {
	m_CMaps[name] = pCMap;
	}
	return pCMap;
	}
	CPDF_CMap* CPDF_CMapManager::LoadPredefinedCMap(const CFX_ByteString& name,
	FX_BOOL bPromptCJK) {
	CPDF_CMap* pCMap = new CPDF_CMap;
	const FX_CHAR* pname = name.c_str();
	if (*pname == '/') {
	pname++;
	}
	pCMap->LoadPredefined(this, pname, bPromptCJK);
	return pCMap;
	}

	void CPDF_CMapManager::ReloadAll() {
	for (const auto& pair : m_CMaps) {
	CPDF_CMap* pCMap = pair.second;
	pCMap->LoadPredefined(this, pair.first.c_str(), FALSE);
	}
	for (size_t i = 0; i < FX_ArraySize(m_CID2UnicodeMaps); ++i) {
	if (CPDF_CID2UnicodeMap* pMap = m_CID2UnicodeMaps[i]) {
	pMap->Load(this, CIDSetFromSizeT(i), FALSE);
	}
	}
	}
	CPDF_CID2UnicodeMap* CPDF_CMapManager::GetCID2UnicodeMap(CIDSet charset,
	FX_BOOL bPromptCJK) {
	if (!m_CID2UnicodeMaps[charset])
	m_CID2UnicodeMaps[charset] = LoadCID2UnicodeMap(charset, bPromptCJK);
	return m_CID2UnicodeMaps[charset];
	}
	CPDF_CID2UnicodeMap* CPDF_CMapManager::LoadCID2UnicodeMap(CIDSet charset,
	FX_BOOL bPromptCJK) {
	CPDF_CID2UnicodeMap* pMap = new CPDF_CID2UnicodeMap();
	if (!pMap->Initialize()) {
	delete pMap;
	return NULL;
	}
	pMap->Load(this, charset, bPromptCJK);
	return pMap;
	}
	CPDF_CMapParser::CPDF_CMapParser() {
	m_pCMap = NULL;
	m_Status = 0;
	m_CodeSeq = 0;
	}
	FX_BOOL CPDF_CMapParser::Initialize(CPDF_CMap* pCMap) {
	m_pCMap = pCMap;
	m_Status = 0;
	m_CodeSeq = 0;
	m_AddMaps.EstimateSize(0, 10240);
	return TRUE;
	}

	void CPDF_CMapParser::ParseWord(const CFX_ByteStringC& word) {
	if (word.IsEmpty()) {
	return;
	}
	if (word == "begincidchar") {
	m_Status = 1;
	m_CodeSeq = 0;
	} else if (word == "begincidrange") {
	m_Status = 2;
	m_CodeSeq = 0;
	} else if (word == "endcidrange" \|\| word == "endcidchar") {
	m_Status = 0;
	} else if (word == "/WMode") {
	m_Status = 6;
	} else if (word == "/Registry") {
	m_Status = 3;
	} else if (word == "/Ordering") {
	m_Status = 4;
	} else if (word == "/Supplement") {
	m_Status = 5;
	} else if (word == "begincodespacerange") {
	m_Status = 7;
	m_CodeSeq = 0;
	} else if (word == "usecmap") {
	} else if (m_Status == 1 \|\| m_Status == 2) {
	m_CodePoints[m_CodeSeq] = CMap_GetCode(word);
	m_CodeSeq++;
	uint32_t StartCode, EndCode;
	uint16_t StartCID;
	if (m_Status == 1) {
	if (m_CodeSeq < 2) {
	return;
	}
	EndCode = StartCode = m_CodePoints[0];
	StartCID = (uint16_t)m_CodePoints[1];
	} else {
	if (m_CodeSeq < 3) {
	return;
	}
	StartCode = m_CodePoints[0];
	EndCode = m_CodePoints[1];
	StartCID = (uint16_t)m_CodePoints[2];
	}
	if (EndCode < 0x10000) {
	for (uint32_t code = StartCode; code <= EndCode; code++) {
	m_pCMap->m_pMapping[code] = (uint16_t)(StartCID + code - StartCode);
	}
	} else {
	uint32_t buf[2];
	buf[0] = StartCode;
	buf[1] = ((EndCode - StartCode) << 16) + StartCID;
	m_AddMaps.AppendBlock(buf, sizeof buf);
	}
	m_CodeSeq = 0;
	} else if (m_Status == 3) {
	m_Status = 0;
	} else if (m_Status == 4) {
	m_pCMap->m_Charset = CharsetFromOrdering(CMap_GetString(word));
	m_Status = 0;
	} else if (m_Status == 5) {
	m_Status = 0;
	} else if (m_Status == 6) {
	m_pCMap->m_bVertical = CMap_GetCode(word);
	m_Status = 0;
	} else if (m_Status == 7) {
	if (word == "endcodespacerange") {
	int nSegs = m_CodeRanges.GetSize();
	if (nSegs > 1) {
	m_pCMap->m_CodingScheme = CPDF_CMap::MixedFourBytes;
	m_pCMap->m_nCodeRanges = nSegs;
	m_pCMap->m_pLeadingBytes =
	FX_Alloc2D(uint8_t, nSegs, sizeof(CMap_CodeRange));
	FXSYS_memcpy(m_pCMap->m_pLeadingBytes, m_CodeRanges.GetData(),
	nSegs * sizeof(CMap_CodeRange));
	} else if (nSegs == 1) {
	m_pCMap->m_CodingScheme = (m_CodeRanges[0].m_CharSize == 2)
	? CPDF_CMap::TwoBytes
	: CPDF_CMap::OneByte;
	}
	m_Status = 0;
	} else {
	if (word.GetLength() == 0 \|\| word.GetAt(0) != '<') {
	return;
	}
	if (m_CodeSeq % 2) {
	CMap_CodeRange range;
	if (CMap_GetCodeRange(range, m_LastWord.AsStringC(), word)) {
	m_CodeRanges.Add(range);
	}
	}
	m_CodeSeq++;
	}
	}
	m_LastWord = word;
	}

	// Static.
	uint32_t CPDF_CMapParser::CMap_GetCode(const CFX_ByteStringC& word) {
	int num = 0;
	if (word.GetAt(0) == '<') {
	for (int i = 1; i < word.GetLength() && std::isxdigit(word.GetAt(i)); ++i)
	num = num * 16 + FXSYS_toHexDigit(word.GetAt(i));
	return num;
	}

	for (int i = 0; i < word.GetLength() && std::isdigit(word.GetAt(i)); ++i)
	num = num * 10 + FXSYS_toDecimalDigit(static_cast<FX_WCHAR>(word.GetAt(i)));
	return num;
	}

	// Static.
	bool CPDF_CMapParser::CMap_GetCodeRange(CMap_CodeRange& range,
	const CFX_ByteStringC& first,
	const CFX_ByteStringC& second) {
	if (first.GetLength() == 0 \|\| first.GetAt(0) != '<')
	return false;

	int i;
	for (i = 1; i < first.GetLength(); ++i) {
	if (first.GetAt(i) == '>') {
	break;
	}
	}
	range.m_CharSize = (i - 1) / 2;
	if (range.m_CharSize > 4)
	return false;

	for (i = 0; i < range.m_CharSize; ++i) {
	uint8_t digit1 = first.GetAt(i * 2 + 1);
	uint8_t digit2 = first.GetAt(i * 2 + 2);
	range.m_Lower[i] = FXSYS_toHexDigit(digit1) * 16 + FXSYS_toHexDigit(digit2);
	}

	uint32_t size = second.GetLength();
	for (i = 0; i < range.m_CharSize; ++i) {
	uint8_t digit1 = ((uint32_t)i * 2 + 1 < size)
	? second.GetAt((FX_STRSIZE)i * 2 + 1)
	: '0';
	uint8_t digit2 = ((uint32_t)i * 2 + 2 < size)
	? second.GetAt((FX_STRSIZE)i * 2 + 2)
	: '0';
	range.m_Upper[i] = FXSYS_toHexDigit(digit1) * 16 + FXSYS_toHexDigit(digit2);
	}
	return true;
	}

	CPDF_CMap::CPDF_CMap() {
	m_Charset = CIDSET_UNKNOWN;
	m_Coding = CIDCODING_UNKNOWN;
	m_CodingScheme = TwoBytes;
	m_bVertical = 0;
	m_bLoaded = FALSE;
	m_pMapping = NULL;
	m_pLeadingBytes = NULL;
	m_pAddMapping = NULL;
	m_pEmbedMap = NULL;
	m_pUseMap = NULL;
	m_nCodeRanges = 0;
	}
	CPDF_CMap::~CPDF_CMap() {
	FX_Free(m_pMapping);
	FX_Free(m_pAddMapping);
	FX_Free(m_pLeadingBytes);
	delete m_pUseMap;
	}
	void CPDF_CMap::Release() {
	if (m_PredefinedCMap.IsEmpty()) {
	delete this;
	}
	}

	FX_BOOL CPDF_CMap::LoadPredefined(CPDF_CMapManager* pMgr,
	const FX_CHAR* pName,
	FX_BOOL bPromptCJK) {
	m_PredefinedCMap = pName;
	if (m_PredefinedCMap == "Identity-H" \|\| m_PredefinedCMap == "Identity-V") {
	m_Coding = CIDCODING_CID;
	m_bVertical = pName[9] == 'V';
	m_bLoaded = TRUE;
	return TRUE;
	}
	CFX_ByteString cmapid = m_PredefinedCMap;
	m_bVertical = cmapid.Right(1) == "V";
	if (cmapid.GetLength() > 2) {
	cmapid = cmapid.Left(cmapid.GetLength() - 2);
	}
	const CPDF_PredefinedCMap* map = nullptr;
	for (size_t i = 0; i < FX_ArraySize(g_PredefinedCMaps); ++i) {
	if (cmapid == CFX_ByteStringC(g_PredefinedCMaps[i].m_pName)) {
	map = &g_PredefinedCMaps[i];
	break;
	}
	}
	if (!map)
	return FALSE;

	m_Charset = map->m_Charset;
	m_Coding = map->m_Coding;
	m_CodingScheme = map->m_CodingScheme;
	if (m_CodingScheme == MixedTwoBytes) {
	m_pLeadingBytes = FX_Alloc(uint8_t, 256);
	for (uint32_t i = 0; i < map->m_LeadingSegCount; ++i) {
	const uint8_t* segs = map->m_LeadingSegs;
	for (int b = segs[i * 2]; b <= segs[i * 2 + 1]; ++b) {
	m_pLeadingBytes[b] = 1;
	}
	}
	}
	FPDFAPI_FindEmbeddedCMap(pName, m_Charset, m_Coding, m_pEmbedMap);
	if (m_pEmbedMap) {
	m_bLoaded = TRUE;
	return TRUE;
	}
	return FALSE;
	}
	FX_BOOL CPDF_CMap::LoadEmbedded(const uint8_t* pData, uint32_t size) {
	m_pMapping = FX_Alloc(uint16_t, 65536);
	CPDF_CMapParser parser;
	parser.Initialize(this);
	CPDF_SimpleParser syntax(pData, size);
	while (1) {
	CFX_ByteStringC word = syntax.GetWord();
	if (word.IsEmpty()) {
	break;
	}
	parser.ParseWord(word);
	}
	if (m_CodingScheme == MixedFourBytes && parser.m_AddMaps.GetSize()) {
	m_pAddMapping = FX_Alloc(uint8_t, parser.m_AddMaps.GetSize() + 4);
	(uint32_t)m_pAddMapping = parser.m_AddMaps.GetSize() / 8;
	FXSYS_memcpy(m_pAddMapping + 4, parser.m_AddMaps.GetBuffer(),
	parser.m_AddMaps.GetSize());
	FXSYS_qsort(m_pAddMapping + 4, parser.m_AddMaps.GetSize() / 8, 8,
	CompareDWORD);
	}
	return TRUE;
	}

	uint16_t CPDF_CMap::CIDFromCharCode(uint32_t charcode) const {
	if (m_Coding == CIDCODING_CID) {
	return (uint16_t)charcode;
	}
	if (m_pEmbedMap) {
	return FPDFAPI_CIDFromCharCode(m_pEmbedMap, charcode);
	}
	if (!m_pMapping) {
	return (uint16_t)charcode;
	}
	if (charcode >> 16) {
	if (m_pAddMapping) {
	void* found = FXSYS_bsearch(&charcode, m_pAddMapping + 4,
	(uint32_t)m_pAddMapping, 8, CompareCID);
	if (!found) {
	if (m_pUseMap) {
	return m_pUseMap->CIDFromCharCode(charcode);
	}
	return 0;
	}
	return (uint16_t)(((uint32_t*)found)[1] % 65536 + charcode -
	(uint32_t)found);
	}
	if (m_pUseMap)
	return m_pUseMap->CIDFromCharCode(charcode);
	return 0;
	}
	uint32_t CID = m_pMapping[charcode];
	if (!CID && m_pUseMap)
	return m_pUseMap->CIDFromCharCode(charcode);
	return (uint16_t)CID;
	}

	uint32_t CPDF_CMap::GetNextChar(const FX_CHAR* pString,
	int nStrLen,
	int& offset) const {
	switch (m_CodingScheme) {
	case OneByte:
	return ((uint8_t*)pString)[offset++];
	case TwoBytes:
	offset += 2;
	return ((uint8_t)pString)[offset - 2] 256 +
	((uint8_t*)pString)[offset - 1];
	case MixedTwoBytes: {
	uint8_t byte1 = ((uint8_t*)pString)[offset++];
	if (!m_pLeadingBytes[byte1]) {
	return byte1;
	}
	uint8_t byte2 = ((uint8_t*)pString)[offset++];
	return byte1 * 256 + byte2;
	}
	case MixedFourBytes: {
	uint8_t codes[4];
	int char_size = 1;
	codes[0] = ((uint8_t*)pString)[offset++];
	CMap_CodeRange* pRanges = (CMap_CodeRange*)m_pLeadingBytes;
	while (1) {
	int ret = CheckCodeRange(codes, char_size, pRanges, m_nCodeRanges);
	if (ret == 0) {
	return 0;
	}
	if (ret == 2) {
	uint32_t charcode = 0;
	for (int i = 0; i < char_size; i++) {
	charcode = (charcode << 8) + codes[i];
	}
	return charcode;
	}
	if (char_size == 4 \|\| offset == nStrLen) {
	return 0;
	}
	codes[char_size++] = ((uint8_t*)pString)[offset++];
	}
	break;
	}
	}
	return 0;
	}
	int CPDF_CMap::GetCharSize(uint32_t charcode) const {
	switch (m_CodingScheme) {
	case OneByte:
	return 1;
	case TwoBytes:
	return 2;
	case MixedTwoBytes:
	case MixedFourBytes:
	if (charcode < 0x100) {
	return 1;
	}
	if (charcode < 0x10000) {
	return 2;
	}
	if (charcode < 0x1000000) {
	return 3;
	}
	return 4;
	}
	return 1;
	}
	int CPDF_CMap::CountChar(const FX_CHAR* pString, int size) const {
	switch (m_CodingScheme) {
	case OneByte:
	return size;
	case TwoBytes:
	return (size + 1) / 2;
	case MixedTwoBytes: {
	int count = 0;
	for (int i = 0; i < size; i++) {
	count++;
	if (m_pLeadingBytes[((uint8_t*)pString)[i]]) {
	i++;
	}
	}
	return count;
	}
	case MixedFourBytes: {
	int count = 0, offset = 0;
	while (offset < size) {
	GetNextChar(pString, size, offset);
	count++;
	}
	return count;
	}
	}
	return size;
	}

	int CPDF_CMap::AppendChar(FX_CHAR* str, uint32_t charcode) const {
	switch (m_CodingScheme) {
	case OneByte:
	str[0] = (uint8_t)charcode;
	return 1;
	case TwoBytes:
	str[0] = (uint8_t)(charcode / 256);
	str[1] = (uint8_t)(charcode % 256);
	return 2;
	case MixedTwoBytes:
	case MixedFourBytes:
	if (charcode < 0x100) {
	CMap_CodeRange* pRanges = (CMap_CodeRange*)m_pLeadingBytes;
	int iSize = GetCharSizeImpl(charcode, pRanges, m_nCodeRanges);
	if (iSize == 0) {
	iSize = 1;
	}
	if (iSize > 1) {
	FXSYS_memset(str, 0, sizeof(uint8_t) * iSize);
	}
	str[iSize - 1] = (uint8_t)charcode;
	return iSize;
	}
	if (charcode < 0x10000) {
	str[0] = (uint8_t)(charcode >> 8);
	str[1] = (uint8_t)charcode;
	return 2;
	}
	if (charcode < 0x1000000) {
	str[0] = (uint8_t)(charcode >> 16);
	str[1] = (uint8_t)(charcode >> 8);
	str[2] = (uint8_t)charcode;
	return 3;
	}
	str[0] = (uint8_t)(charcode >> 24);
	str[1] = (uint8_t)(charcode >> 16);
	str[2] = (uint8_t)(charcode >> 8);
	str[3] = (uint8_t)charcode;
	return 4;
	}
	return 0;
	}
	CPDF_CID2UnicodeMap::CPDF_CID2UnicodeMap() {
	m_EmbeddedCount = 0;
	}
	CPDF_CID2UnicodeMap::~CPDF_CID2UnicodeMap() {}
	FX_BOOL CPDF_CID2UnicodeMap::Initialize() {
	return TRUE;
	}
	FX_BOOL CPDF_CID2UnicodeMap::IsLoaded() {
	return m_EmbeddedCount != 0;
	}
	FX_WCHAR CPDF_CID2UnicodeMap::UnicodeFromCID(uint16_t CID) {
	if (m_Charset == CIDSET_UNICODE) {
	return CID;
	}
	if (CID < m_EmbeddedCount) {
	return m_pEmbeddedMap[CID];
	}
	return 0;
	}

	void CPDF_CID2UnicodeMap::Load(CPDF_CMapManager* pMgr,
	CIDSet charset,
	FX_BOOL bPromptCJK) {
	m_Charset = charset;
	FPDFAPI_LoadCID2UnicodeMap(charset, m_pEmbeddedMap, m_EmbeddedCount);
	}

	CIDSet CharsetFromOrdering(const CFX_ByteStringC& ordering) {
	for (size_t charset = 1; charset < FX_ArraySize(g_CharsetNames); ++charset) {
	if (ordering == g_CharsetNames[charset])
	return CIDSetFromSizeT(charset);
	}
	return CIDSET_UNKNOWN;
	}