| // Copyright 2017 The PDFium Authors |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com |
| |
| #ifndef CORE_FPDFAPI_FONT_CPDF_TOUNICODEMAP_H_ |
| #define CORE_FPDFAPI_FONT_CPDF_TOUNICODEMAP_H_ |
| |
| #include <map> |
| #include <optional> |
| #include <vector> |
| |
| #include "core/fxcrt/fx_string.h" |
| #include "core/fxcrt/retain_ptr.h" |
| #include "core/fxcrt/unowned_ptr.h" |
| |
| class CPDF_CID2UnicodeMap; |
| class CPDF_SimpleParser; |
| class CPDF_Stream; |
| |
| class CPDF_ToUnicodeMap { |
| public: |
| explicit CPDF_ToUnicodeMap(RetainPtr<const CPDF_Stream> pStream); |
| ~CPDF_ToUnicodeMap(); |
| |
| WideString Lookup(uint32_t charcode) const; |
| uint32_t ReverseLookup(wchar_t unicode) const; |
| |
| size_t GetUnicodeCountByCharcodeForTesting(uint32_t charcode) const; |
| |
| private: |
| friend class CPDFToUnicodeMapTest_StringToCode_Test; |
| friend class CPDFToUnicodeMapTest_StringToWideString_Test; |
| |
| static std::optional<uint32_t> StringToCode(ByteStringView str); |
| static WideString StringToWideString(ByteStringView str); |
| |
| void Load(RetainPtr<const CPDF_Stream> pStream); |
| |
| // `previous_word` is the most recent word that `parser` returned. |
| // Returns the last word `parser` encountered. |
| ByteStringView HandleBeginBFChar(CPDF_SimpleParser& parser, |
| ByteStringView previous_word); |
| ByteStringView HandleBeginBFRange(CPDF_SimpleParser& parser, |
| ByteStringView previous_word); |
| |
| uint32_t GetMultiCharIndexIndicator() const; |
| void SetCode(uint32_t srccode, WideString destcode); |
| |
| // Inserts a new entry into `map_` and `reverse_map_`. |
| void InsertIntoMaps(uint32_t code, uint32_t destcode); |
| |
| // Key: charcode |
| // Value: unicode |
| // If there are multiple entries with the same key, this stores the lowest |
| // value. |
| std::map<uint32_t, uint32_t> map_; |
| // Key: unicode |
| // Value: charcode |
| // Since `map_` may encounter entries with the same key but different values, |
| // that situation does not cause a conflict in `reverse_map_`. Thus |
| // `reverse_map_` may have a different number of entries compared to `map_`. |
| // Similar to `map_`, if there is a key collision, then this stores the lowest |
| // value. |
| std::map<uint32_t, uint32_t> reverse_map_; |
| |
| UnownedPtr<const CPDF_CID2UnicodeMap> base_map_; |
| std::vector<WideString> multi_char_vec_; |
| }; |
| |
| #endif // CORE_FPDFAPI_FONT_CPDF_TOUNICODEMAP_H_ |