fpdfsdk/fpdf_edittext.cpp - pdfium - Git at Google

 // Copyright 2017 The PDFium Authors
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include <map>
 #include <memory>
 #include <sstream>
 #include <utility>
 #include <vector>

 #include "core/fpdfapi/font/cpdf_cidfont.h"
 #include "core/fpdfapi/font/cpdf_font.h"
 #include "core/fpdfapi/page/cpdf_docpagedata.h"
 #include "core/fpdfapi/page/cpdf_textobject.h"
 #include "core/fpdfapi/page/cpdf_textstate.h"
 #include "core/fpdfapi/parser/cpdf_array.h"
 #include "core/fpdfapi/parser/cpdf_dictionary.h"
 #include "core/fpdfapi/parser/cpdf_document.h"
 #include "core/fpdfapi/parser/cpdf_name.h"
 #include "core/fpdfapi/parser/cpdf_number.h"
 #include "core/fpdfapi/parser/cpdf_reference.h"
 #include "core/fpdfapi/parser/cpdf_stream.h"
 #include "core/fpdfapi/parser/cpdf_string.h"
 #include "core/fpdfapi/render/charposlist.h"
 #include "core/fpdfapi/render/cpdf_pagerendercontext.h"
 #include "core/fpdfapi/render/cpdf_rendercontext.h"
 #include "core/fpdfapi/render/cpdf_renderstatus.h"
 #include "core/fpdfapi/render/cpdf_textrenderer.h"
 #include "core/fpdftext/cpdf_textpage.h"
 #include "core/fxcrt/check.h"
 #include "core/fxcrt/check_op.h"
 #include "core/fxcrt/compiler_specific.h"
 #include "core/fxcrt/containers/contains.h"
 #include "core/fxcrt/fx_extension.h"
 #include "core/fxcrt/fx_memcpy_wrappers.h"
 #include "core/fxcrt/fx_string_wrappers.h"
 #include "core/fxcrt/numerics/safe_conversions.h"
 #include "core/fxcrt/span_util.h"
 #include "core/fxcrt/stl_util.h"
 #include "core/fxcrt/utf16.h"
 #include "core/fxge/cfx_defaultrenderdevice.h"
 #include "core/fxge/cfx_fontmgr.h"
 #include "core/fxge/dib/cfx_dibitmap.h"
 #include "core/fxge/fx_font.h"
 #include "core/fxge/text_char_pos.h"
 #include "fpdfsdk/cpdfsdk_helpers.h"
 #include "public/fpdf_edit.h"

 // Compile-time checks that every core TextRenderingMode enumerator has the
 // same numeric value as its public FPDF_TEXTRENDERMODE_* counterpart.
 // These checks are here because core/ and public/ cannot depend on each other.
 // FPDFTextObj_GetTextRenderMode() and FPDFTextObj_SetTextRenderMode() in this
 // file convert between the two types with a plain static_cast, which is only
 // correct while these values stay in sync.
 static_assert(static_cast<int>(TextRenderingMode::MODE_UNKNOWN) ==
                   FPDF_TEXTRENDERMODE_UNKNOWN,
               "TextRenderingMode::MODE_UNKNOWN value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_FILL) ==
                   FPDF_TEXTRENDERMODE_FILL,
               "TextRenderingMode::MODE_FILL value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_STROKE) ==
                   FPDF_TEXTRENDERMODE_STROKE,
               "TextRenderingMode::MODE_STROKE value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_FILL_STROKE) ==
                   FPDF_TEXTRENDERMODE_FILL_STROKE,
               "TextRenderingMode::MODE_FILL_STROKE value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_INVISIBLE) ==
                   FPDF_TEXTRENDERMODE_INVISIBLE,
               "TextRenderingMode::MODE_INVISIBLE value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_FILL_CLIP) ==
                   FPDF_TEXTRENDERMODE_FILL_CLIP,
               "TextRenderingMode::MODE_FILL_CLIP value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_STROKE_CLIP) ==
                   FPDF_TEXTRENDERMODE_STROKE_CLIP,
               "TextRenderingMode::MODE_STROKE_CLIP value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_FILL_STROKE_CLIP) ==
                   FPDF_TEXTRENDERMODE_FILL_STROKE_CLIP,
               "TextRenderingMode::MODE_FILL_STROKE_CLIP value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_CLIP) ==
                   FPDF_TEXTRENDERMODE_CLIP,
               "TextRenderingMode::MODE_CLIP value mismatch");
 static_assert(static_cast<int>(TextRenderingMode::MODE_LAST) ==
                   FPDF_TEXTRENDERMODE_LAST,
               "TextRenderingMode::MODE_LAST value mismatch");

 namespace {

 // Chooses the name written as /BaseFont: the PostScript name when
 // `font_type` is FPDF_FONT_TYPE1, the base font name otherwise. When the
 // chosen name is empty, CFX_Font::kUntitledFontName is returned instead.
 ByteString BaseFontNameForType(const CFX_Font* font, int font_type) {
   ByteString base_name;
   if (font_type == FPDF_FONT_TYPE1) {
     base_name = font->GetPsName();
   } else {
     base_name = font->GetBaseFontName();
   }
   if (base_name.IsEmpty()) {
     return ByteString(CFX_Font::kUntitledFontName);
   }
   return base_name;
 }

 // Creates the indirect Type0 (composite) font dictionary in `doc` with
 // /Type, /Subtype, /Encoding and /BaseFont filled in. For Type1 fonts the
 // encoding name is appended to `name` to form /BaseFont. `font` is not used
 // by the current implementation.
 RetainPtr<CPDF_Dictionary> CreateCompositeFontDict(CPDF_Document* doc,
                                                    const CFX_Font* font,
                                                    int font_type,
                                                    const ByteString& name) {
   auto type0_dict = doc->NewIndirect<CPDF_Dictionary>();
   type0_dict->SetNewFor<CPDF_Name>("Type", "Font");
   type0_dict->SetNewFor<CPDF_Name>("Subtype", "Type0");

   // TODO(npm): Get the correct encoding, if it's not identity.
   const ByteString encoding = "Identity-H";
   type0_dict->SetNewFor<CPDF_Name>("Encoding", encoding);

   ByteString base_font = name;
   if (font_type == FPDF_FONT_TYPE1) {
     base_font = name + "-" + encoding;
   }
   type0_dict->SetNewFor<CPDF_Name>("BaseFont", base_font);
   return type0_dict;
 }

 // Creates the indirect CIDFont dictionary (the descendant font) in `doc`.
 // The subtype is CIDFontType0 for Type1 data and CIDFontType2 otherwise. A
 // separate indirect /CIDSystemInfo dictionary (Adobe / Identity / 0) is
 // created and referenced from the returned dictionary.
 RetainPtr<CPDF_Dictionary> CreateCidFontDict(CPDF_Document* doc,
                                              int font_type,
                                              const ByteString& name) {
   const char* const subtype =
       font_type == FPDF_FONT_TYPE1 ? "CIDFontType0" : "CIDFontType2";

   auto descendant_dict = doc->NewIndirect<CPDF_Dictionary>();
   descendant_dict->SetNewFor<CPDF_Name>("Type", "Font");
   descendant_dict->SetNewFor<CPDF_Name>("Subtype", subtype);
   descendant_dict->SetNewFor<CPDF_Name>("BaseFont", name);

   // TODO(npm): Maybe use FT_Get_CID_Registry_Ordering_Supplement to get the
   // CIDSystemInfo
   auto system_info = doc->NewIndirect<CPDF_Dictionary>();
   system_info->SetNewFor<CPDF_String>("Registry", "Adobe");
   system_info->SetNewFor<CPDF_String>("Ordering", "Identity");
   system_info->SetNewFor<CPDF_Number>("Supplement", 0);

   const auto system_info_obj_num = system_info->GetObjNum();
   descendant_dict->SetNewFor<CPDF_Reference>("CIDSystemInfo", doc,
                                              system_info_obj_num);
   return descendant_dict;
 }

 // Creates the indirect /FontDescriptor dictionary for `font` in `doc` and
 // embeds `font_data` as an indirect stream referenced from it.
 //
 // The font file is referenced through /FontFile for FPDF_FONT_TYPE1 and
 // through /FontFile2 otherwise; /Length1 is only written for
 // FPDF_FONT_TRUETYPE. Several metrics (italic angle, cap height, StemV) are
 // rough placeholders, as noted by the TODOs below.
 RetainPtr<CPDF_Dictionary> LoadFontDesc(CPDF_Document* doc,
                                         const ByteString& font_name,
                                         CFX_Font* font,
                                         pdfium::span<const uint8_t> font_data,
                                         int font_type) {
   auto descriptor = doc->NewIndirect<CPDF_Dictionary>();
   descriptor->SetNewFor<CPDF_Name>("Type", "FontDescriptor");
   descriptor->SetNewFor<CPDF_Name>("FontName", font_name);

   // Derive the descriptor flags from the face and from the font name.
   int descriptor_flags = 0;
   if (font->GetFace()->IsFixedWidth()) {
     descriptor_flags |= FXFONT_FIXED_PITCH;
   }
   if (font_name.Contains("Serif")) {
     descriptor_flags |= FXFONT_SERIF;
   }
   if (font->GetFace()->IsItalic()) {
     descriptor_flags |= FXFONT_ITALIC;
   }
   if (font->GetFace()->IsBold()) {
     descriptor_flags |= FXFONT_FORCE_BOLD;
   }
   // TODO(npm): How do I know if a font is symbolic, script, allcap, smallcap?
   descriptor_flags |= FXFONT_NONSYMBOLIC;
   descriptor->SetNewFor<CPDF_Number>("Flags", descriptor_flags);

   // A font without a bounding box gets a default-constructed rectangle.
   const FX_RECT font_bbox = font->GetBBox().value_or(FX_RECT());
   descriptor->SetRectFor("FontBBox", CFX_FloatRect(font_bbox));

   // TODO(npm): calculate italic angle correctly
   descriptor->SetNewFor<CPDF_Number>("ItalicAngle",
                                      font->IsItalic() ? -12 : 0);

   descriptor->SetNewFor<CPDF_Number>("Ascent", font->GetAscent());
   descriptor->SetNewFor<CPDF_Number>("Descent", font->GetDescent());

   // TODO(npm): calculate the capheight, stemV correctly
   descriptor->SetNewFor<CPDF_Number>("CapHeight", font->GetAscent());
   descriptor->SetNewFor<CPDF_Number>("StemV", font->IsBold() ? 120 : 70);

   auto font_stream = doc->NewIndirect<CPDF_Stream>(font_data);
   // TODO(npm): Lengths for Type1 fonts.
   if (font_type == FPDF_FONT_TRUETYPE) {
     const int data_length = pdfium::checked_cast<int>(font_data.size());
     font_stream->GetMutableDict()->SetNewFor<CPDF_Number>("Length1",
                                                           data_length);
   }

   ByteString font_file_key = "FontFile2";
   if (font_type == FPDF_FONT_TYPE1) {
     font_file_key = "FontFile";
   }
   descriptor->SetNewFor<CPDF_Reference>(font_file_key, doc,
                                         font_stream->GetObjNum());
   return descriptor;
 }

 // Builds the indirect /W (glyph widths) array of a CIDFont from `widths`,
 // which maps a CID to its width and is iterated in ascending CID order.
 //
 // Each group written to the array uses one of the two forms allowed for /W:
 //   c [w1 w2 ... wn]  - widths of the n *consecutive* CIDs c, c+1, ...
 //   c_first c_last w  - every CID in [c_first, c_last] has width w
 //
 // Both forms describe consecutive CIDs only, so a CID whose successor in
 // `widths` is not exactly CID + 1 is written on its own as `c [w]`. Without
 // that check a gap in the CIDs would silently assign the following widths to
 // the wrong CIDs.
 RetainPtr<CPDF_Array> CreateWidthsArray(
     CPDF_Document* doc,
     const std::map<uint32_t, uint32_t>& widths) {
   auto widths_array = doc->NewIndirect<CPDF_Array>();
   for (auto it = widths.begin(); it != widths.end(); ++it) {
     const uint32_t first_cid = it->first;
     const int first_width = static_cast<int>(it->second);

     auto next_it = std::next(it);
     if (next_it == widths.end() || next_it->first != first_cid + 1) {
       // Last entry, or the next CID is not adjacent: use format c [w].
       auto single_w_array = pdfium::MakeRetain<CPDF_Array>();
       single_w_array->AppendNew<CPDF_Number>(first_width);
       widths_array->AppendNew<CPDF_Number>(static_cast<int>(first_cid));
       widths_array->Append(std::move(single_w_array));
       continue;
     }

     // From here on `it` points at first_cid + 1.
     it = next_it;
     const int second_width = static_cast<int>(it->second);
     if (second_width == first_width) {
       // The array can have a group c_first c_last w: all CIDs in the range
       // from c_first to c_last will have width w. Extend the range while the
       // CIDs stay consecutive and the width stays the same.
       while (true) {
         next_it = std::next(it);
         if (next_it == widths.end() || next_it->first != it->first + 1 ||
             next_it->second != it->second) {
           break;
         }
         it = next_it;
       }
       widths_array->AppendNew<CPDF_Number>(static_cast<int>(first_cid));
       widths_array->AppendNew<CPDF_Number>(static_cast<int>(it->first));
       widths_array->AppendNew<CPDF_Number>(first_width);
       continue;
     }

     // Otherwise we can have a group of the form c [w1 w2 ...]: c has width
     // w1, c+1 has width w2, etc. Extend it while the CIDs stay consecutive.
     widths_array->AppendNew<CPDF_Number>(static_cast<int>(first_cid));
     auto current_width_array = pdfium::MakeRetain<CPDF_Array>();
     current_width_array->AppendNew<CPDF_Number>(first_width);
     current_width_array->AppendNew<CPDF_Number>(second_width);
     while (true) {
       next_it = std::next(it);
       if (next_it == widths.end() || next_it->first != it->first + 1) {
         break;
       }
       it = next_it;
       current_width_array->AppendNew<CPDF_Number>(
           static_cast<int>(it->second));
     }
     widths_array->Append(std::move(current_width_array));
   }
   return widths_array;
 }

 // Fixed prologue of the ToUnicode CMap stream generated by LoadUnicode().
 // It is written first, before the bfchar/bfrange sections, and declares a
 // single two-byte codespace range <0000>-<FFFF>.
 const char kToUnicodeStart[] =
     "/CIDInit /ProcSet findresource begin\n"
     "12 dict begin\n"
     "begincmap\n"
     "/CIDSystemInfo\n"
     "<</Registry (Adobe)\n"
     "/Ordering (Identity)\n"
     "/Supplement 0\n"
     ">> def\n"
     "/CMapName /Adobe-Identity-H def\n"
     "/CMapType 2 def\n"
     "1 begincodespacerange\n"
     "<0000> <FFFF>\n"
     "endcodespacerange\n";

 // Fixed epilogue of the ToUnicode CMap stream generated by LoadUnicode().
 // It is written last, after the bfrange section.
 const char kToUnicodeEnd[] =
     "endcmap\n"
     "CMapName currentdict /CMap defineresource pop\n"
     "end\n"
     "end\n";

 // Appends `number` to `buffer` as "<" + four characters produced by
 // FXSYS_IntToFourHexChars() + ">". `number` must not exceed 0xFFFF; this is
 // enforced with a CHECK.
 void AddCharcode(fxcrt::ostringstream& buffer, uint32_t number) {
   CHECK_LE(number, 0xFFFF);
   char hex_digits[4];
   FXSYS_IntToFourHexChars(number, hex_digits);
   buffer << "<";
   for (char digit : hex_digits) {
     buffer << digit;
   }
   buffer << ">";
 }

 // Appends `unicode` to `buffer` as "<" + the characters produced by
 // FXSYS_ToUTF16BE() + ">". A value that is itself a surrogate code unit is
 // written as 0 instead.
 // PDF spec 1.7 Section 5.9.2: "Unicode character sequences as expressed in
 // UTF-16BE encoding." See https://en.wikipedia.org/wiki/UTF-16#Description
 void AddUnicode(fxcrt::ostringstream& buffer, uint32_t unicode) {
   const bool is_surrogate =
       pdfium::IsHighSurrogate(unicode) || pdfium::IsLowSurrogate(unicode);
   if (is_surrogate) {
     unicode = 0;
   }

   char encoded[8];
   const size_t encoded_length = FXSYS_ToUTF16BE(unicode, encoded);
   buffer << "<";
   CHECK_LE(encoded_length, std::size(encoded));
   auto encoded_span = pdfium::make_span(encoded).first(encoded_length);
   for (char digit : encoded_span) {
     buffer << digit;
   }
   buffer << ">";
 }

 // Loads the charcode to unicode mapping into a new indirect stream holding a
 // ToUnicode CMap.
 //
 // `to_unicode` is walked in ascending charcode order and its entries are
 // grouped into three kinds of CMap lines:
 //   bfchar:               <code> <unicode>
 //   bfrange (array form): <first> <last> [<u1> <u2> ...]
 //   bfrange (incrementing form): <first> <last> <unicode of first>
 //
 // A bfrange never crosses a 256-charcode boundary. For the incrementing form
 // only the last byte of the destination is incremented by the reader, so a
 // run is also cut before that byte would carry past 0xFF; the PDF spec
 // leaves the result undefined otherwise. AddUnicode() writes UTF-16BE, whose
 // last byte equals the low byte of the Unicode value, so the low byte of the
 // value is what gets checked.
 RetainPtr<CPDF_Stream> LoadUnicode(
     CPDF_Document* doc,
     const std::multimap<uint32_t, uint32_t>& to_unicode) {
   // A map charcode->unicode
   std::map<uint32_t, uint32_t> char_to_uni;
   // A map <char_start, char_end> to vector v of unicode characters of size (end
   // - start + 1). This abbreviates: start->v[0], start+1->v[1], etc.
   std::map<std::pair<uint32_t, uint32_t>, std::vector<uint32_t>>
       map_range_vector;
   // A map <start, end> -> unicode
   // This abbreviates: start->unicode, start+1->unicode+1, etc.
   // PDF spec 1.7 Section 5.9.2 says that only the last byte of the unicode may
   // change.
   std::map<std::pair<uint32_t, uint32_t>, uint32_t> map_range;

   // Calculate the maps
   for (auto it = to_unicode.begin(); it != to_unicode.end(); ++it) {
     uint32_t first_charcode = it->first;
     uint32_t first_unicode = it->second;
     {
       // No adjacent charcode follows: emit a single bfchar entry.
       auto next_it = std::next(it);
       if (next_it == to_unicode.end() || first_charcode + 1 != next_it->first) {
         char_to_uni[first_charcode] = first_unicode;
         continue;
       }
     }
     ++it;
     uint32_t current_charcode = it->first;
     uint32_t current_unicode = it->second;
     if (current_charcode % 256 == 0) {
       // The pair straddles a 256-charcode boundary, so it cannot share a
       // range; emit both as single entries.
       char_to_uni[first_charcode] = first_unicode;
       char_to_uni[current_charcode] = current_unicode;
       continue;
     }
     // How many more charcodes fit before the charcode low byte wraps.
     const size_t max_extra = 255 - (current_charcode % 256);
     auto next_it = std::next(it);

     // The incrementing form is only usable when the step from
     // `first_unicode` to `current_unicode` is +1 and does not carry out of
     // the last byte of the destination.
     const bool can_increment =
         first_unicode + 1 == current_unicode && current_unicode % 256 != 0;
     if (!can_increment) {
       // Consecutive charcodes mapping to unicodes that must be listed
       // explicitly.
       std::vector<uint32_t> unicodes = {first_unicode, current_unicode};
       for (size_t i = 0; i < max_extra; ++i) {
         if (next_it == to_unicode.end() ||
             current_charcode + 1 != next_it->first) {
           break;
         }
         ++it;
         ++current_charcode;
         unicodes.push_back(it->second);
         next_it = std::next(it);
       }
       CHECK_EQ(it->first - first_charcode + 1, unicodes.size());
       map_range_vector[std::make_pair(first_charcode, it->first)] = unicodes;
       continue;
     }

     // Consecutive charcodes mapping to consecutive unicodes. Stop before
     // either the charcode low byte or the unicode low byte would wrap.
     const size_t max_unicode_extra = 255 - (current_unicode % 256);
     const size_t max_range_extra =
         max_unicode_extra < max_extra ? max_unicode_extra : max_extra;
     for (size_t i = 0; i < max_range_extra; ++i) {
       if (next_it == to_unicode.end() ||
           current_charcode + 1 != next_it->first ||
           current_unicode + 1 != next_it->second) {
         break;
       }
       ++it;
       ++current_charcode;
       ++current_unicode;
       next_it = std::next(it);
     }
     map_range[std::make_pair(first_charcode, current_charcode)] = first_unicode;
   }

   fxcrt::ostringstream buffer;
   buffer << kToUnicodeStart;
   // Add maps to buffer
   buffer << static_cast<uint32_t>(char_to_uni.size()) << " beginbfchar\n";
   for (const auto& it : char_to_uni) {
     AddCharcode(buffer, it.first);
     buffer << " ";
     AddUnicode(buffer, it.second);
     buffer << "\n";
   }
   // Both bfrange flavors share a single beginbfrange/endbfrange section.
   buffer << "endbfchar\n"
          << static_cast<uint32_t>(map_range_vector.size() + map_range.size())
          << " beginbfrange\n";
   for (const auto& it : map_range_vector) {
     const std::pair<uint32_t, uint32_t>& charcode_range = it.first;
     AddCharcode(buffer, charcode_range.first);
     buffer << " ";
     AddCharcode(buffer, charcode_range.second);
     buffer << " [";
     const std::vector<uint32_t>& unicodes = it.second;
     for (size_t i = 0; i < unicodes.size(); ++i) {
       AddUnicode(buffer, unicodes[i]);
       if (i != unicodes.size() - 1)
         buffer << " ";
     }
     buffer << "]\n";
   }
   for (const auto& it : map_range) {
     const std::pair<uint32_t, uint32_t>& charcode_range = it.first;
     AddCharcode(buffer, charcode_range.first);
     buffer << " ";
     AddCharcode(buffer, charcode_range.second);
     buffer << " ";
     AddUnicode(buffer, it.second);
     buffer << "\n";
   }
   buffer << "endbfrange\n";
   buffer << kToUnicodeEnd;
   auto stream = doc->NewIndirect<CPDF_Stream>(&buffer);
   return stream;
 }

 // Sets /DescendantFonts on `font_dict` to a new one-element array holding a
 // reference to the indirect object `cid_font_dict_obj_num` in `doc`.
 void CreateDescendantFontsArray(CPDF_Document* doc,
                                 CPDF_Dictionary* font_dict,
                                 uint32_t cid_font_dict_obj_num) {
   font_dict->SetNewFor<CPDF_Array>("DescendantFonts")
       ->AppendNew<CPDF_Reference>(doc, cid_font_dict_obj_num);
 }

 // Builds the font dictionary, /Widths array and font descriptor for a simple
 // (single-byte charcode) Type1 or TrueType font in `doc`, then returns the
 // CPDF_Font that the document's page data creates for that dictionary.
 //
 // Returns nullptr when the face has no glyphs or maps no charcode in
 // [0, 0xFF].
 //
 // /Widths is indexed by (charcode - FirstChar), so it needs exactly one
 // entry for every charcode from FirstChar to LastChar. Charcodes in that
 // range that the face does not map get a width of 0, written *before* the
 // width of the next mapped charcode so that every entry stays at its own
 // index.
 RetainPtr<CPDF_Font> LoadSimpleFont(CPDF_Document* doc,
                                     std::unique_ptr<CFX_Font> font,
                                     pdfium::span<const uint8_t> font_data,
                                     int font_type) {
   // If it doesn't have a single char, just fail.
   RetainPtr<CFX_Face> face = font->GetFace();
   if (face->GetGlyphCount() <= 0) {
     return nullptr;
   }

   // Simple fonts have 1-byte charcodes only.
   static constexpr uint32_t kMaxSimpleFontChar = 0xFF;
   auto char_codes_and_indices =
       face->GetCharCodesAndIndices(kMaxSimpleFontChar);
   if (char_codes_and_indices.empty()) {
     return nullptr;
   }

   auto font_dict = doc->NewIndirect<CPDF_Dictionary>();
   font_dict->SetNewFor<CPDF_Name>("Type", "Font");
   font_dict->SetNewFor<CPDF_Name>(
       "Subtype", font_type == FPDF_FONT_TYPE1 ? "Type1" : "TrueType");
   const ByteString name = BaseFontNameForType(font.get(), font_type);
   font_dict->SetNewFor<CPDF_Name>("BaseFont", name);

   font_dict->SetNewFor<CPDF_Number>(
       "FirstChar", static_cast<int>(char_codes_and_indices[0].char_code));
   auto widths_array = doc->NewIndirect<CPDF_Array>();
   // NOTE(review): assumes GetCharCodesAndIndices() returns its entries in
   // ascending char_code order - confirm against CFX_Face.
   for (size_t i = 0; i < char_codes_and_indices.size(); ++i) {
     if (i > 0) {
       // Pad the unmapped charcodes between the previous entry and this one.
       for (uint32_t j = char_codes_and_indices[i - 1].char_code + 1;
            j < char_codes_and_indices[i].char_code; ++j) {
         widths_array->AppendNew<CPDF_Number>(0);
       }
     }
     widths_array->AppendNew<CPDF_Number>(
         font->GetGlyphWidth(char_codes_and_indices[i].glyph_index));
   }
   font_dict->SetNewFor<CPDF_Number>(
       "LastChar", static_cast<int>(char_codes_and_indices.back().char_code));
   font_dict->SetNewFor<CPDF_Reference>("Widths", doc,
                                        widths_array->GetObjNum());
   RetainPtr<CPDF_Dictionary> font_descriptor_dict =
       LoadFontDesc(doc, name, font.get(), font_data, font_type);

   font_dict->SetNewFor<CPDF_Reference>("FontDescriptor", doc,
                                        font_descriptor_dict->GetObjNum());
   return CPDF_DocPageData::FromDocument(doc)->GetFont(std::move(font_dict));
 }

 // Builds a composite (Type0) font for `font` in `doc`: the Type0 dictionary,
 // its CIDFont descendant with descriptor and /W widths, and a generated
 // /ToUnicode stream. Charcodes are the glyph indices reported by the face.
 // Returns nullptr when the face has no glyphs or maps no character.
 RetainPtr<CPDF_Font> LoadCompositeFont(CPDF_Document* doc,
                                        std::unique_ptr<CFX_Font> font,
                                        pdfium::span<const uint8_t> font_data,
                                        int font_type) {
   // A face without any glyph cannot be used.
   RetainPtr<CFX_Face> face = font->GetFace();
   if (face->GetGlyphCount() <= 0) {
     return nullptr;
   }

   auto code_index_pairs =
       face->GetCharCodesAndIndices(pdfium::kMaximumSupplementaryCodePoint);
   if (code_index_pairs.empty()) {
     return nullptr;
   }

   const ByteString base_name = BaseFontNameForType(font.get(), font_type);
   RetainPtr<CPDF_Dictionary> type0_dict =
       CreateCompositeFontDict(doc, font.get(), font_type, base_name);
   RetainPtr<CPDF_Dictionary> descendant_dict =
       CreateCidFontDict(doc, font_type, base_name);
   RetainPtr<CPDF_Dictionary> descriptor_dict =
       LoadFontDesc(doc, base_name, font.get(), font_data, font_type);
   descendant_dict->SetNewFor<CPDF_Reference>("FontDescriptor", doc,
                                              descriptor_dict->GetObjNum());

   // Collect one width per glyph index, and every glyph index -> character
   // code pair for the ToUnicode map.
   std::multimap<uint32_t, uint32_t> glyph_to_unicode;
   std::map<uint32_t, uint32_t> glyph_widths;
   for (const auto& entry : code_index_pairs) {
     if (glyph_widths.find(entry.glyph_index) == glyph_widths.end()) {
       glyph_widths[entry.glyph_index] = font->GetGlyphWidth(entry.glyph_index);
     }
     glyph_to_unicode.emplace(entry.glyph_index, entry.char_code);
   }
   RetainPtr<CPDF_Array> w_array = CreateWidthsArray(doc, glyph_widths);
   descendant_dict->SetNewFor<CPDF_Reference>("W", doc, w_array->GetObjNum());

   // TODO(npm): Support vertical writing

   CreateDescendantFontsArray(doc, type0_dict.Get(),
                              descendant_dict->GetObjNum());

   RetainPtr<CPDF_Stream> unicode_stream = LoadUnicode(doc, glyph_to_unicode);
   type0_dict->SetNewFor<CPDF_Reference>("ToUnicode", doc,
                                         unicode_stream->GetObjNum());
   return CPDF_DocPageData::FromDocument(doc)->GetFont(type0_dict);
 }

 // Builds a composite TrueType (CIDFontType2) font for `font` in `doc` using
 // a caller-provided ToUnicode CMap (`to_unicode_cmap`) and CIDToGIDMap
 // (`cid_to_gid_map_span`); both are stored as new indirect streams.
 // Returns nullptr when the face has no glyphs or maps no character.
 RetainPtr<CPDF_Font> LoadCustomCompositeFont(
     CPDF_Document* doc,
     std::unique_ptr<CFX_Font> font,
     pdfium::span<const uint8_t> font_span,
     const char* to_unicode_cmap,
     pdfium::span<const uint8_t> cid_to_gid_map_span) {
   // A face without any glyph cannot be used.
   RetainPtr<CFX_Face> face = font->GetFace();
   if (face->GetGlyphCount() <= 0) {
     return nullptr;
   }

   auto code_index_pairs =
       face->GetCharCodesAndIndices(pdfium::kMaximumSupplementaryCodePoint);
   if (code_index_pairs.empty()) {
     return nullptr;
   }

   const ByteString base_name =
       BaseFontNameForType(font.get(), FPDF_FONT_TRUETYPE);
   RetainPtr<CPDF_Dictionary> type0_dict =
       CreateCompositeFontDict(doc, font.get(), FPDF_FONT_TRUETYPE, base_name);
   RetainPtr<CPDF_Dictionary> descendant_dict =
       CreateCidFontDict(doc, FPDF_FONT_TRUETYPE, base_name);
   RetainPtr<CPDF_Dictionary> descriptor_dict =
       LoadFontDesc(doc, base_name, font.get(), font_span, FPDF_FONT_TRUETYPE);
   descendant_dict->SetNewFor<CPDF_Reference>("FontDescriptor", doc,
                                              descriptor_dict->GetObjNum());

   // Collect one width per glyph index.
   std::map<uint32_t, uint32_t> glyph_widths;
   for (const auto& entry : code_index_pairs) {
     if (glyph_widths.find(entry.glyph_index) == glyph_widths.end()) {
       glyph_widths[entry.glyph_index] = font->GetGlyphWidth(entry.glyph_index);
     }
   }
   RetainPtr<CPDF_Array> w_array = CreateWidthsArray(doc, glyph_widths);
   descendant_dict->SetNewFor<CPDF_Reference>("W", doc, w_array->GetObjNum());

   auto gid_map_stream = doc->NewIndirect<CPDF_Stream>(cid_to_gid_map_span);
   descendant_dict->SetNewFor<CPDF_Reference>("CIDToGIDMap", doc,
                                              gid_map_stream->GetObjNum());

   CreateDescendantFontsArray(doc, type0_dict.Get(),
                              descendant_dict->GetObjNum());

   auto unicode_stream = doc->NewIndirect<CPDF_Stream>(
       ByteStringView(to_unicode_cmap).unsigned_span());
   type0_dict->SetNewFor<CPDF_Reference>("ToUnicode", doc,
                                         unicode_stream->GetObjNum());
   return CPDF_DocPageData::FromDocument(doc)->GetFont(type0_dict);
 }

 // Converts a public page-object handle to its text object via AsText().
 // Returns nullptr when the handle does not resolve to a page object.
 CPDF_TextObject* CPDFTextObjectFromFPDFPageObject(FPDF_PAGEOBJECT page_object) {
   auto* page_obj = CPDFPageObjectFromFPDFPageObject(page_object);
   if (!page_obj) {
     return nullptr;
   }
   return page_obj->AsText();
 }

 // Reinterprets an internal CFX_Path pointer as the opaque public
 // FPDF_GLYPHPATH handle. No object is created or copied.
 FPDF_GLYPHPATH FPDFGlyphPathFromCFXPath(const CFX_Path* path) {
   return reinterpret_cast<FPDF_GLYPHPATH>(path);
 }
 // Reinterprets an opaque public FPDF_GLYPHPATH handle as the internal
 // CFX_Path pointer; the inverse of FPDFGlyphPathFromCFXPath().
 const CFX_Path* CFXPathFromFPDFGlyphPath(FPDF_GLYPHPATH path) {
   return reinterpret_cast<const CFX_Path*>(path);
 }

 }  // namespace

 // Creates a new text object that uses the stock font named `font` at
 // `font_size`. Returns nullptr when `document` is invalid or no stock font
 // is found for that name. The caller owns the returned object.
 FPDF_EXPORT FPDF_PAGEOBJECT FPDF_CALLCONV
 FPDFPageObj_NewTextObj(FPDF_DOCUMENT document,
                        FPDF_BYTESTRING font,
                        float font_size) {
   CPDF_Document* doc = CPDFDocumentFromFPDFDocument(document);
   if (!doc) {
     return nullptr;
   }

   RetainPtr<CPDF_Font> stock_font =
       CPDF_Font::GetStockFont(doc, ByteStringView(font));
   if (!stock_font) {
     return nullptr;
   }

   auto text_obj = std::make_unique<CPDF_TextObject>();
   text_obj->mutable_text_state().SetFont(std::move(stock_font));
   text_obj->mutable_text_state().SetFontSize(font_size);
   text_obj->SetDefaultStates();

   // Ownership passes to the caller.
   CPDF_TextObject* released_obj = text_obj.release();
   return FPDFPageObjectFromCPDFPageObject(released_obj);
 }

 // Replaces the text of `text_object` with `text`. Each wide character is
 // converted to a charcode with the object's font and appended in the font's
 // own byte encoding. Returns false when `text_object` is not a text object.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV
 FPDFText_SetText(FPDF_PAGEOBJECT text_object, FPDF_WIDESTRING text) {
   CPDF_TextObject* text_obj = CPDFTextObjectFromFPDFPageObject(text_object);
   if (!text_obj) {
     return false;
   }
   // SAFETY: required from caller.
   WideString wide_text = UNSAFE_BUFFERS(WideStringFromFPDFWideString(text));
   ByteString encoded_bytes;
   for (wchar_t wide_char : wide_text) {
     const auto charcode = text_obj->GetFont()->CharCodeFromUnicode(wide_char);
     text_obj->GetFont()->AppendChar(&encoded_bytes, charcode);
   }
   text_obj->SetText(encoded_bytes);
   return true;
 }

 // Replaces the text of `text_object` with the `count` charcodes stored at
 // `charcodes`, appended in the font's own byte encoding. Returns false when
 // `text_object` is not a text object, or when `charcodes` is null while
 // `count` is non-zero. A null `charcodes` with a zero `count` sets empty
 // text.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV
 FPDFText_SetCharcodes(FPDF_PAGEOBJECT text_object,
                       const uint32_t* charcodes,
                       size_t count) {
   CPDF_TextObject* text_obj = CPDFTextObjectFromFPDFPageObject(text_object);
   if (!text_obj) {
     return false;
   }
   if (count != 0 && !charcodes) {
     return false;
   }

   // Nothing is read when `charcodes` is null.
   const size_t usable_count = charcodes ? count : 0;
   ByteString encoded_bytes;
   for (size_t index = 0; index < usable_count; ++index) {
     text_obj->GetFont()->AppendChar(&encoded_bytes,
                                     UNSAFE_TODO(charcodes[index]));
   }
   text_obj->SetText(encoded_bytes);
   return true;
 }

 // Loads the font program in `data` (`size` bytes) into `document`, as a
 // composite font when `cid` is set and as a simple font otherwise. Returns
 // nullptr for an invalid document, empty data, a `font_type` other than
 // FPDF_FONT_TYPE1 / FPDF_FONT_TRUETYPE, or when the font cannot be loaded.
 // The caller owns the returned font.
 FPDF_EXPORT FPDF_FONT FPDF_CALLCONV FPDFText_LoadFont(FPDF_DOCUMENT document,
                                                       const uint8_t* data,
                                                       uint32_t size,
                                                       int font_type,
                                                       FPDF_BOOL cid) {
   CPDF_Document* doc = CPDFDocumentFromFPDFDocument(document);
   const bool is_supported_type =
       font_type == FPDF_FONT_TYPE1 || font_type == FPDF_FONT_TRUETYPE;
   if (!doc || !data || size == 0 || !is_supported_type) {
     return nullptr;
   }
   // SAFETY: required from caller.
   auto data_span = UNSAFE_BUFFERS(pdfium::make_span(data, size));
   auto fx_font = std::make_unique<CFX_Font>();

   // TODO(npm): Maybe use FT_Get_X11_Font_Format to check format? Otherwise, we
   // are allowing giving any font that can be loaded on freetype and setting it
   // as any font type.
   if (!fx_font->LoadEmbedded(data_span, /*force_vertical=*/false,
                              /*object_tag=*/0)) {
     return nullptr;
   }

   RetainPtr<CPDF_Font> loaded_font;
   if (cid) {
     loaded_font =
         LoadCompositeFont(doc, std::move(fx_font), data_span, font_type);
   } else {
     loaded_font = LoadSimpleFont(doc, std::move(fx_font), data_span, font_type);
   }
   // Ownership passes to the caller.
   return FPDFFontFromCPDFFont(loaded_font.Leak());
 }

 // Returns the stock font named `font` for `document`, or nullptr when the
 // document is invalid or no such stock font is found. The caller owns the
 // returned font.
 FPDF_EXPORT FPDF_FONT FPDF_CALLCONV
 FPDFText_LoadStandardFont(FPDF_DOCUMENT document, FPDF_BYTESTRING font) {
   CPDF_Document* doc = CPDFDocumentFromFPDFDocument(document);
   if (!doc) {
     return nullptr;
   }

   RetainPtr<CPDF_Font> stock_font =
       CPDF_Font::GetStockFont(doc, ByteStringView(font));
   // Ownership passes to the caller.
   return FPDFFontFromCPDFFont(stock_font.Leak());
 }

 // Loads the TrueType font program in `font_data` into `document` as a
 // composite CID font that uses the caller-provided `to_unicode_cmap` and
 // CIDToGIDMap data. Returns nullptr when the document is invalid, any input
 // is null or empty, or the font cannot be loaded. The caller owns the
 // returned font.
 FPDF_EXPORT FPDF_FONT FPDF_CALLCONV
 FPDFText_LoadCidType2Font(FPDF_DOCUMENT document,
                           const uint8_t* font_data,
                           uint32_t font_data_size,
                           FPDF_BYTESTRING to_unicode_cmap,
                           const uint8_t* cid_to_gid_map_data,
                           uint32_t cid_to_gid_map_data_size) {
   CPDF_Document* doc = CPDFDocumentFromFPDFDocument(document);
   if (!doc) {
     return nullptr;
   }
   if (!font_data || font_data_size == 0) {
     return nullptr;
   }
   if (!to_unicode_cmap || strlen(to_unicode_cmap) == 0) {
     return nullptr;
   }
   if (!cid_to_gid_map_data || cid_to_gid_map_data_size == 0) {
     return nullptr;
   }

   // SAFETY: required from caller.
   auto font_span = UNSAFE_BUFFERS(pdfium::make_span(font_data, font_data_size));
   auto fx_font = std::make_unique<CFX_Font>();

   // TODO(thestig): Consider checking the font format. See similar comment in
   // FPDFText_LoadFont() above.
   const bool loaded = fx_font->LoadEmbedded(font_span, /*force_vertical=*/false,
                                             /*object_tag=*/0);
   if (!loaded) {
     return nullptr;
   }

   // SAFETY: caller ensures `cid_to_gid_map_data` points to at least
   // `cid_to_gid_map_data_size` entries.
   RetainPtr<CPDF_Font> cid_font = LoadCustomCompositeFont(
       doc, std::move(fx_font), font_span, to_unicode_cmap,
       UNSAFE_BUFFERS(
           pdfium::make_span(cid_to_gid_map_data, cid_to_gid_map_data_size)));
   // Ownership of the result passes to the caller.
   return FPDFFontFromCPDFFont(cid_font.Leak());
 }

 // Stores the font size of `text` in `*size`. Returns false, leaving `*size`
 // untouched, when `size` is null or `text` is not a text object.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV
 FPDFTextObj_GetFontSize(FPDF_PAGEOBJECT text, float* size) {
   CPDF_TextObject* text_obj =
       size ? CPDFTextObjectFromFPDFPageObject(text) : nullptr;
   if (!text_obj) {
     return false;
   }

   *size = text_obj->GetFontSize();
   return true;
 }

 // Looks up the text of `text_object` on `text_page` and passes it, together
 // with `buffer` / `length`, to Utf16EncodeMaybeCopyAndReturnLength(), whose
 // result is returned. Returns 0 when either handle is invalid.
 FPDF_EXPORT unsigned long FPDF_CALLCONV
 FPDFTextObj_GetText(FPDF_PAGEOBJECT text_object,
                     FPDF_TEXTPAGE text_page,
                     FPDF_WCHAR* buffer,
                     unsigned long length) {
   CPDF_TextObject* text_obj = CPDFTextObjectFromFPDFPageObject(text_object);
   CPDF_TextPage* page_text =
       text_obj ? CPDFTextPageFromFPDFTextPage(text_page) : nullptr;
   if (!page_text) {
     return 0;
   }

   // SAFETY: required from caller.
   return Utf16EncodeMaybeCopyAndReturnLength(
       page_text->GetTextByObject(text_obj),
       UNSAFE_BUFFERS(SpanFromFPDFApiArgs(buffer, length)));
 }

 // Renders the single text object `text_object` into a newly created ARGB
 // bitmap, scaled by `scale`, and returns that bitmap. The caller owns it.
 //
 // `page` is optional. When it is given it must belong to `document`; its
 // resources are then passed to the render context and the render context is
 // stored on the page for the duration of the call.
 //
 // Returns nullptr when `document` is invalid, `page` belongs to another
 // document, `text_object` is not a text object, `scale` is not positive, the
 // scaled bounds are empty, or the bitmap cannot be created.
 FPDF_EXPORT FPDF_BITMAP FPDF_CALLCONV
 FPDFTextObj_GetRenderedBitmap(FPDF_DOCUMENT document,
                               FPDF_PAGE page,
                               FPDF_PAGEOBJECT text_object,
                               float scale) {
   CPDF_Document* doc = CPDFDocumentFromFPDFDocument(document);
   if (!doc)
     return nullptr;

   // A null page is allowed; a page from a different document is not.
   CPDF_Page* optional_page = CPDFPageFromFPDFPage(page);
   if (optional_page && optional_page->GetDocument() != doc)
     return nullptr;

   CPDF_TextObject* text = CPDFTextObjectFromFPDFPageObject(text_object);
   if (!text)
     return nullptr;

   if (scale <= 0)
     return nullptr;

   const CFX_Matrix scale_matrix(scale, 0, 0, scale, 0, 0);
   const CFX_FloatRect& text_rect = text->GetRect();
   const CFX_FloatRect scaled_text_rect = scale_matrix.TransformRect(text_rect);

   // `rect` has to use integer values. Round up as needed.
   const FX_RECT rect = scaled_text_rect.GetOuterRect();
   if (rect.IsEmpty())
     return nullptr;

   auto result_bitmap = pdfium::MakeRetain<CFX_DIBitmap>();
   if (!result_bitmap->Create(rect.Width(), rect.Height(), FXDIB_Format::kArgb))
     return nullptr;

   // Keep a raw pointer to the render context: when a page was supplied,
   // ownership of the context is moved into the page just below.
   auto render_context = std::make_unique<CPDF_PageRenderContext>();
   CPDF_PageRenderContext* render_context_ptr = render_context.get();
   // NOTE(review): `clearer` presumably removes the render context from the
   // page when this function returns - confirm against CPDF_Page.
   CPDF_Page::RenderContextClearer clearer(optional_page);
   if (optional_page)
     optional_page->SetRenderContext(std::move(render_context));

   RetainPtr<CPDF_Dictionary> page_resources =
       optional_page ? optional_page->GetMutablePageResources() : nullptr;

   // Same pattern for the device: a raw pointer is kept because ownership is
   // moved into the render context.
   auto device = std::make_unique<CFX_DefaultRenderDevice>();
   CFX_DefaultRenderDevice* device_ptr = device.get();
   render_context_ptr->m_pDevice = std::move(device);
   render_context_ptr->m_pContext = std::make_unique<CPDF_RenderContext>(
       doc, std::move(page_resources), /*pPageCache=*/nullptr);

   device_ptr->Attach(result_bitmap);

   CFX_Matrix device_matrix(rect.Width(), 0, 0, rect.Height(), 0, 0);
   CPDF_RenderStatus status(render_context_ptr->m_pContext.get(), device_ptr);
   status.SetDeviceMatrix(device_matrix);
   status.Initialize(nullptr, nullptr);

   // Need to flip the rendering and also move it to fit within `result_bitmap`.
   CFX_Matrix render_matrix(1, 0, 0, -1, -text_rect.left, text_rect.top);
   render_matrix *= scale_matrix;
   status.RenderSingleObject(text, render_matrix);

   // Caller takes ownership.
   return FPDFBitmapFromCFXDIBitmap(result_bitmap.Leak());
 }

 // Gives up the caller's ownership of `font`: the pointer is adopted by a
 // local RetainPtr, which drops that reference when it goes out of scope.
 FPDF_EXPORT void FPDF_CALLCONV FPDFFont_Close(FPDF_FONT font) {
   RetainPtr<CPDF_Font> reclaimed_font;
   reclaimed_font.Unleak(CPDFFontFromFPDFFont(font));
 }

 // Creates a new text object that uses `font` at `font_size`. The font is
 // looked up again through the document's page data using the font's
 // dictionary. Returns nullptr when `document` or `font` is invalid. The
 // returned object is released to the caller.
 FPDF_EXPORT FPDF_PAGEOBJECT FPDF_CALLCONV
 FPDFPageObj_CreateTextObj(FPDF_DOCUMENT document,
                           FPDF_FONT font,
                           float font_size) {
   CPDF_Document* doc = CPDFDocumentFromFPDFDocument(document);
   CPDF_Font* source_font = CPDFFontFromFPDFFont(font);
   if (!doc || !source_font) {
     return nullptr;
   }

   auto text_obj = std::make_unique<CPDF_TextObject>();
   RetainPtr<CPDF_Font> doc_font =
       CPDF_DocPageData::FromDocument(doc)->GetFont(
           source_font->GetMutableFontDict());
   text_obj->mutable_text_state().SetFont(std::move(doc_font));
   text_obj->mutable_text_state().SetFontSize(font_size);
   text_obj->SetDefaultStates();

   CPDF_TextObject* released_obj = text_obj.release();
   return FPDFPageObjectFromCPDFPageObject(released_obj);
 }

 // Reports the text rendering mode of `text`, or FPDF_TEXTRENDERMODE_UNKNOWN
 // when `text` does not convert to a text object.
 FPDF_EXPORT FPDF_TEXT_RENDERMODE FPDF_CALLCONV
 FPDFTextObj_GetTextRenderMode(FPDF_PAGEOBJECT text) {
   CPDF_TextObject* text_object = CPDFTextObjectFromFPDFPageObject(text);
   if (text_object) {
     return static_cast<FPDF_TEXT_RENDERMODE>(
         text_object->GetTextRenderMode());
   }
   return FPDF_TEXTRENDERMODE_UNKNOWN;
 }

 // Applies `render_mode` to `text`.
 // Returns false when `render_mode` is FPDF_TEXTRENDERMODE_UNKNOWN or below,
 // is above FPDF_TEXTRENDERMODE_LAST, or when `text` does not convert to a
 // text object. Returns true otherwise.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV
 FPDFTextObj_SetTextRenderMode(FPDF_PAGEOBJECT text,
                               FPDF_TEXT_RENDERMODE render_mode) {
   const bool mode_in_range = render_mode > FPDF_TEXTRENDERMODE_UNKNOWN &&
                              render_mode <= FPDF_TEXTRENDERMODE_LAST;
   if (!mode_in_range) {
     return false;
   }

   if (CPDF_TextObject* text_object = CPDFTextObjectFromFPDFPageObject(text)) {
     text_object->SetTextRenderMode(
         static_cast<TextRenderingMode>(render_mode));
     return true;
   }
   return false;
 }

 // Returns the font handle of `text`, or nullptr when `text` does not convert
 // to a text object.
 FPDF_EXPORT FPDF_FONT FPDF_CALLCONV FPDFTextObj_GetFont(FPDF_PAGEOBJECT text) {
   if (CPDF_TextObject* text_object = CPDFTextObjectFromFPDFPageObject(text)) {
     // Unretained reference in public API. NOLINTNEXTLINE
     return FPDFFontFromCPDFFont(text_object->GetFont());
   }
   return nullptr;
 }

 // Attempts to copy the family name of `font`, including its terminator, into
 // `buffer` (described by `length`).
 // Returns the size of the name including the terminator, regardless of
 // whether the copy was performed, or 0 when `font` does not convert to a
 // font.
 FPDF_EXPORT unsigned long FPDF_CALLCONV
 FPDFFont_GetFontName(FPDF_FONT font, char* buffer, unsigned long length) {
   auto* cpdf_font = CPDFFontFromFPDFFont(font);
   if (!cpdf_font) {
     return 0;
   }

   // SAFETY: required from caller.
   auto destination = UNSAFE_BUFFERS(SpanFromFPDFApiArgs(buffer, length));
   ByteString family_name = cpdf_font->GetFont()->GetFamilyName();
   pdfium::span<const char> source = family_name.span_with_terminator();

   // The result of the copy attempt is deliberately not inspected; the
   // required size is reported either way.
   fxcrt::try_spancpy(destination, source);
   const auto required_size = static_cast<unsigned long>(source.size());
   return required_size;
 }

 // Attempts to copy the raw font data of `font` into `buffer` (described by
 // `buflen`) and stores the size of the font data in `*out_buflen`.
 // Returns false when `font` does not convert to a font or `out_buflen` is
 // null; returns true otherwise, whether or not the copy was performed.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetFontData(FPDF_FONT font,
                                                          uint8_t* buffer,
                                                          size_t buflen,
                                                          size_t* out_buflen) {
   auto* cpdf_font = CPDFFontFromFPDFFont(font);
   const bool args_ok = cpdf_font && out_buflen;
   if (!args_ok) {
     return false;
   }

   // SAFETY: required from caller.
   auto destination = UNSAFE_BUFFERS(
       SpanFromFPDFApiArgs(buffer, pdfium::checked_cast<unsigned long>(buflen)));
   pdfium::span<const uint8_t> font_bytes =
       cpdf_font->GetFont()->GetFontSpan();

   // The result of the copy attempt is not inspected; the size is always
   // reported.
   fxcrt::try_spancpy(destination, font_bytes);
   *out_buflen = font_bytes.size();
   return true;
 }

 // Returns 1 if `font` reports itself as embedded, 0 if not, and -1 when
 // `font` does not convert to a font.
 FPDF_EXPORT int FPDF_CALLCONV FPDFFont_GetIsEmbedded(FPDF_FONT font) {
   auto* cpdf_font = CPDFFontFromFPDFFont(font);
   if (cpdf_font) {
     if (cpdf_font->IsEmbedded()) {
       return 1;
     }
     return 0;
   }
   return -1;
 }

 // Returns the font flags of `font` masked down to the low 19 bits, or -1
 // when `font` does not convert to a font.
 FPDF_EXPORT int FPDF_CALLCONV FPDFFont_GetFlags(FPDF_FONT font) {
   // Return only flags from ISO 32000-1:2008, table 123.
   constexpr int kSpecFlagsMask = 0x7ffff;

   auto* cpdf_font = CPDFFontFromFPDFFont(font);
   if (cpdf_font) {
     return cpdf_font->GetFontFlags() & kSpecFlagsMask;
   }
   return -1;
 }

 // Returns the weight reported by `font`, or -1 when `font` does not convert
 // to a font.
 // The result is a numeric weight (or the -1 sentinel), not a truth value, so
 // the return type is spelled `int` like the other value-returning font
 // getters in this file rather than FPDF_BOOL.
 FPDF_EXPORT int FPDF_CALLCONV FPDFFont_GetWeight(FPDF_FONT font) {
   auto* pFont = CPDFFontFromFPDFFont(font);
   if (!pFont)
     return -1;

   return pFont->GetFontWeight();
 }

 // Stores the italic angle reported by `font` in `*angle`.
 // Returns false, leaving `*angle` untouched, when `font` does not convert to
 // a font or `angle` is null; returns true otherwise.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetItalicAngle(FPDF_FONT font,
                                                             int* angle) {
   auto* cpdf_font = CPDFFontFromFPDFFont(font);
   const bool args_ok = cpdf_font && angle;
   if (args_ok) {
     *angle = cpdf_font->GetItalicAngle();
     return true;
   }
   return false;
 }

 // Stores the ascent of `font`, scaled by `font_size` / 1000, in `*ascent`.
 // Returns false, leaving `*ascent` untouched, when `font` does not convert
 // to a font or `ascent` is null; returns true otherwise.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetAscent(FPDF_FONT font,
                                                        float font_size,
                                                        float* ascent) {
   auto* cpdf_font = CPDFFontFromFPDFFont(font);
   const bool args_ok = cpdf_font && ascent;
   if (!args_ok) {
     return false;
   }

   const float scaled_ascent =
       cpdf_font->GetTypeAscent() * font_size / 1000.f;
   *ascent = scaled_ascent;
   return true;
 }

 // Stores the descent of `font`, scaled by `font_size` / 1000, in `*descent`.
 // Returns false, leaving `*descent` untouched, when `font` does not convert
 // to a font or `descent` is null; returns true otherwise.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetDescent(FPDF_FONT font,
                                                         float font_size,
                                                         float* descent) {
   auto* cpdf_font = CPDFFontFromFPDFFont(font);
   const bool args_ok = cpdf_font && descent;
   if (!args_ok) {
     return false;
   }

   const float scaled_descent =
       cpdf_font->GetTypeDescent() * font_size / 1000.f;
   *descent = scaled_descent;
   return true;
 }

 // Stores the width of `glyph` in `font`, scaled by `font_size` / 1000, in
 // `*width`.
 //
 // `glyph` is converted to a `wchar_t` and mapped to a char code through
 // CharCodeFromUnicode(). For a CID font in vertical writing mode the
 // vertical width of the corresponding CID is used; otherwise the regular
 // char width is used.
 //
 // Returns false, leaving `*width` untouched, when `font` does not convert to
 // a font, `width` is null, or `glyph` cannot be represented as a `wchar_t`.
 // Returns true otherwise.
 FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetGlyphWidth(FPDF_FONT font,
                                                            uint32_t glyph,
                                                            float font_size,
                                                            float* width) {
   auto* pFont = CPDFFontFromFPDFFont(font);
   if (!pFont || !width)
     return false;

   // Reject values that do not fit in `wchar_t` instead of letting the cast
   // below silently truncate them and report the width of an unrelated
   // character. This mirrors the check in FPDFFont_GetGlyphPath().
   if (!pdfium::IsValueInRangeForNumericType<wchar_t>(glyph)) {
     return false;
   }

   uint32_t charcode = pFont->CharCodeFromUnicode(static_cast<wchar_t>(glyph));

   CPDF_CIDFont* pCIDFont = pFont->AsCIDFont();
   if (pCIDFont && pCIDFont->IsVertWriting()) {
     uint16_t cid = pCIDFont->CIDFromCharCode(charcode);
     *width = pCIDFont->GetVertWidth(cid) * font_size / 1000.f;
   } else {
     *width = pFont->GetCharWidthF(charcode) * font_size / 1000.f;
   }

   return true;
 }

 // Looks up the outline path of `glyph` in `font` at `font_size`.
 // Returns nullptr when `font` does not convert to a font, `glyph` cannot be
 // represented as a `wchar_t`, no char position is produced for it, or the
 // fallback font it refers to is unavailable.
 FPDF_EXPORT FPDF_GLYPHPATH FPDF_CALLCONV
 FPDFFont_GetGlyphPath(FPDF_FONT font, uint32_t glyph, float font_size) {
   auto* cpdf_font = CPDFFontFromFPDFFont(font);
   if (!cpdf_font) {
     return nullptr;
   }
   if (!pdfium::IsValueInRangeForNumericType<wchar_t>(glyph)) {
     return nullptr;
   }

   // Lay out the single char code so that the glyph index, char width and
   // fallback font position are resolved.
   uint32_t charcode =
       cpdf_font->CharCodeFromUnicode(static_cast<wchar_t>(glyph));
   std::vector<TextCharPos> char_positions =
       GetCharPosList(pdfium::span_from_ref(charcode),
                      pdfium::span<const float>(), cpdf_font, font_size);
   if (char_positions.empty()) {
     return nullptr;
   }
   const TextCharPos& first_pos = char_positions[0];

   // A fallback position of -1 selects the font's own CFX_Font; any other
   // value selects one of its fallback fonts, which may be missing.
   CFX_Font* glyph_font = nullptr;
   if (first_pos.m_FallbackFontPosition != -1) {
     glyph_font = cpdf_font->GetFontFallback(first_pos.m_FallbackFontPosition);
     if (!glyph_font) {
       return nullptr;
     }
   } else {
     glyph_font = cpdf_font->GetFont();
     DCHECK(glyph_font);  // Never null.
   }

   return FPDFGlyphPathFromCFXPath(glyph_font->LoadGlyphPath(
       first_pos.m_GlyphIndex, first_pos.m_FontCharWidth));
 }

 // Returns the number of points in `glyphpath`, or -1 when `glyphpath` does
 // not convert to a path.
 FPDF_EXPORT int FPDF_CALLCONV
 FPDFGlyphPath_CountGlyphSegments(FPDF_GLYPHPATH glyphpath) {
   auto* path = CFXPathFromFPDFGlyphPath(glyphpath);
   if (path) {
     return fxcrt::CollectionSize<int>(path->GetPoints());
   }
   return -1;
 }

 // Returns a handle to the point at `index` within `glyphpath`, or nullptr
 // when `glyphpath` does not convert to a path or `index` is out of bounds.
 FPDF_EXPORT FPDF_PATHSEGMENT FPDF_CALLCONV
 FPDFGlyphPath_GetGlyphPathSegment(FPDF_GLYPHPATH glyphpath, int index) {
   auto* path = CFXPathFromFPDFGlyphPath(glyphpath);
   if (!path) {
     return nullptr;
   }

   pdfium::span<const CFX_Path::Point> path_points = path->GetPoints();
   if (fxcrt::IndexInBounds(path_points, index)) {
     return FPDFPathSegmentFromFXPathPoint(&path_points[index]);
   }
   return nullptr;
 }