| // Copyright 2017 The PDFium Authors |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include <map> |
| #include <memory> |
| #include <sstream> |
| #include <utility> |
| #include <vector> |
| |
| #include "core/fpdfapi/font/cpdf_cidfont.h" |
| #include "core/fpdfapi/font/cpdf_font.h" |
| #include "core/fpdfapi/page/cpdf_docpagedata.h" |
| #include "core/fpdfapi/page/cpdf_textobject.h" |
| #include "core/fpdfapi/page/cpdf_textstate.h" |
| #include "core/fpdfapi/parser/cpdf_array.h" |
| #include "core/fpdfapi/parser/cpdf_dictionary.h" |
| #include "core/fpdfapi/parser/cpdf_document.h" |
| #include "core/fpdfapi/parser/cpdf_name.h" |
| #include "core/fpdfapi/parser/cpdf_number.h" |
| #include "core/fpdfapi/parser/cpdf_reference.h" |
| #include "core/fpdfapi/parser/cpdf_stream.h" |
| #include "core/fpdfapi/parser/cpdf_string.h" |
| #include "core/fpdfapi/render/charposlist.h" |
| #include "core/fpdfapi/render/cpdf_pagerendercontext.h" |
| #include "core/fpdfapi/render/cpdf_rendercontext.h" |
| #include "core/fpdfapi/render/cpdf_renderstatus.h" |
| #include "core/fpdfapi/render/cpdf_textrenderer.h" |
| #include "core/fpdftext/cpdf_textpage.h" |
| #include "core/fxcrt/check.h" |
| #include "core/fxcrt/check_op.h" |
| #include "core/fxcrt/compiler_specific.h" |
| #include "core/fxcrt/containers/contains.h" |
| #include "core/fxcrt/fx_extension.h" |
| #include "core/fxcrt/fx_memcpy_wrappers.h" |
| #include "core/fxcrt/fx_string_wrappers.h" |
| #include "core/fxcrt/numerics/safe_conversions.h" |
| #include "core/fxcrt/span_util.h" |
| #include "core/fxcrt/stl_util.h" |
| #include "core/fxcrt/utf16.h" |
| #include "core/fxge/cfx_defaultrenderdevice.h" |
| #include "core/fxge/cfx_fontmgr.h" |
| #include "core/fxge/dib/cfx_dibitmap.h" |
| #include "core/fxge/fx_font.h" |
| #include "core/fxge/text_char_pos.h" |
| #include "fpdfsdk/cpdfsdk_helpers.h" |
| #include "public/fpdf_edit.h" |
| |
| // These checks are here because core/ and public/ cannot depend on each other. |
| static_assert(static_cast<int>(TextRenderingMode::MODE_UNKNOWN) == |
| FPDF_TEXTRENDERMODE_UNKNOWN, |
| "TextRenderingMode::MODE_UNKNOWN value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_FILL) == |
| FPDF_TEXTRENDERMODE_FILL, |
| "TextRenderingMode::MODE_FILL value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_STROKE) == |
| FPDF_TEXTRENDERMODE_STROKE, |
| "TextRenderingMode::MODE_STROKE value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_FILL_STROKE) == |
| FPDF_TEXTRENDERMODE_FILL_STROKE, |
| "TextRenderingMode::MODE_FILL_STROKE value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_INVISIBLE) == |
| FPDF_TEXTRENDERMODE_INVISIBLE, |
| "TextRenderingMode::MODE_INVISIBLE value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_FILL_CLIP) == |
| FPDF_TEXTRENDERMODE_FILL_CLIP, |
| "TextRenderingMode::MODE_FILL_CLIP value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_STROKE_CLIP) == |
| FPDF_TEXTRENDERMODE_STROKE_CLIP, |
| "TextRenderingMode::MODE_STROKE_CLIP value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_FILL_STROKE_CLIP) == |
| FPDF_TEXTRENDERMODE_FILL_STROKE_CLIP, |
| "TextRenderingMode::MODE_FILL_STROKE_CLIP value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_CLIP) == |
| FPDF_TEXTRENDERMODE_CLIP, |
| "TextRenderingMode::MODE_CLIP value mismatch"); |
| static_assert(static_cast<int>(TextRenderingMode::MODE_LAST) == |
| FPDF_TEXTRENDERMODE_LAST, |
| "TextRenderingMode::MODE_LAST value mismatch"); |
| |
| namespace { |
| |
| ByteString BaseFontNameForType(const CFX_Font* font, int font_type) { |
| ByteString name = font_type == FPDF_FONT_TYPE1 ? font->GetPsName() |
| : font->GetBaseFontName(); |
| return name.IsEmpty() ? CFX_Font::kUntitledFontName : name; |
| } |
| |
| RetainPtr<CPDF_Dictionary> CreateCompositeFontDict(CPDF_Document* doc, |
| const CFX_Font* font, |
| int font_type, |
| const ByteString& name) { |
| auto font_dict = doc->NewIndirect<CPDF_Dictionary>(); |
| font_dict->SetNewFor<CPDF_Name>("Type", "Font"); |
| font_dict->SetNewFor<CPDF_Name>("Subtype", "Type0"); |
| // TODO(npm): Get the correct encoding, if it's not identity. |
| ByteString encoding = "Identity-H"; |
| font_dict->SetNewFor<CPDF_Name>("Encoding", encoding); |
| font_dict->SetNewFor<CPDF_Name>( |
| "BaseFont", font_type == FPDF_FONT_TYPE1 ? name + "-" + encoding : name); |
| return font_dict; |
| } |
| |
| RetainPtr<CPDF_Dictionary> CreateCidFontDict(CPDF_Document* doc, |
| int font_type, |
| const ByteString& name) { |
| auto cid_font_dict = doc->NewIndirect<CPDF_Dictionary>(); |
| cid_font_dict->SetNewFor<CPDF_Name>("Type", "Font"); |
| cid_font_dict->SetNewFor<CPDF_Name>("Subtype", font_type == FPDF_FONT_TYPE1 |
| ? "CIDFontType0" |
| : "CIDFontType2"); |
| cid_font_dict->SetNewFor<CPDF_Name>("BaseFont", name); |
| |
| // TODO(npm): Maybe use FT_Get_CID_Registry_Ordering_Supplement to get the |
| // CIDSystemInfo |
| auto cid_system_info_dict = doc->NewIndirect<CPDF_Dictionary>(); |
| cid_system_info_dict->SetNewFor<CPDF_String>("Registry", "Adobe"); |
| cid_system_info_dict->SetNewFor<CPDF_String>("Ordering", "Identity"); |
| cid_system_info_dict->SetNewFor<CPDF_Number>("Supplement", 0); |
| cid_font_dict->SetNewFor<CPDF_Reference>("CIDSystemInfo", doc, |
| cid_system_info_dict->GetObjNum()); |
| return cid_font_dict; |
| } |
| |
| RetainPtr<CPDF_Dictionary> LoadFontDesc(CPDF_Document* doc, |
| const ByteString& font_name, |
| CFX_Font* font, |
| pdfium::span<const uint8_t> font_data, |
| int font_type) { |
| auto font_descriptor_dict = doc->NewIndirect<CPDF_Dictionary>(); |
| font_descriptor_dict->SetNewFor<CPDF_Name>("Type", "FontDescriptor"); |
| font_descriptor_dict->SetNewFor<CPDF_Name>("FontName", font_name); |
| int flags = 0; |
| if (font->GetFace()->IsFixedWidth()) { |
| flags |= FXFONT_FIXED_PITCH; |
| } |
| if (font_name.Contains("Serif")) |
| flags |= FXFONT_SERIF; |
| if (font->GetFace()->IsItalic()) { |
| flags |= FXFONT_ITALIC; |
| } |
| if (font->GetFace()->IsBold()) { |
| flags |= FXFONT_FORCE_BOLD; |
| } |
| |
| // TODO(npm): How do I know if a font is symbolic, script, allcap, smallcap? |
| flags |= FXFONT_NONSYMBOLIC; |
| |
| font_descriptor_dict->SetNewFor<CPDF_Number>("Flags", flags); |
| FX_RECT bbox = font->GetBBox().value_or(FX_RECT()); |
| font_descriptor_dict->SetRectFor("FontBBox", CFX_FloatRect(bbox)); |
| |
| // TODO(npm): calculate italic angle correctly |
| font_descriptor_dict->SetNewFor<CPDF_Number>("ItalicAngle", |
| font->IsItalic() ? -12 : 0); |
| |
| font_descriptor_dict->SetNewFor<CPDF_Number>("Ascent", font->GetAscent()); |
| font_descriptor_dict->SetNewFor<CPDF_Number>("Descent", font->GetDescent()); |
| |
| // TODO(npm): calculate the capheight, stemV correctly |
| font_descriptor_dict->SetNewFor<CPDF_Number>("CapHeight", font->GetAscent()); |
| font_descriptor_dict->SetNewFor<CPDF_Number>("StemV", |
| font->IsBold() ? 120 : 70); |
| |
| auto stream = doc->NewIndirect<CPDF_Stream>(font_data); |
| // TODO(npm): Lengths for Type1 fonts. |
| if (font_type == FPDF_FONT_TRUETYPE) { |
| stream->GetMutableDict()->SetNewFor<CPDF_Number>( |
| "Length1", pdfium::checked_cast<int>(font_data.size())); |
| } |
| ByteString font_file_key = |
| font_type == FPDF_FONT_TYPE1 ? "FontFile" : "FontFile2"; |
| font_descriptor_dict->SetNewFor<CPDF_Reference>(font_file_key, doc, |
| stream->GetObjNum()); |
| return font_descriptor_dict; |
| } |
| |
| RetainPtr<CPDF_Array> CreateWidthsArray( |
| CPDF_Document* doc, |
| const std::map<uint32_t, uint32_t>& widths) { |
| auto widths_array = doc->NewIndirect<CPDF_Array>(); |
| for (auto it = widths.begin(); it != widths.end(); ++it) { |
| int ch = it->first; |
| int w = it->second; |
| if (std::next(it) == widths.end()) { |
| // Only one char left, use format c [w] |
| auto single_w_array = pdfium::MakeRetain<CPDF_Array>(); |
| single_w_array->AppendNew<CPDF_Number>(w); |
| widths_array->AppendNew<CPDF_Number>(ch); |
| widths_array->Append(std::move(single_w_array)); |
| break; |
| } |
| ++it; |
| int next_ch = it->first; |
| int next_w = it->second; |
| if (next_ch == ch + 1 && next_w == w) { |
| // The array can have a group c_first c_last w: all CIDs in the range from |
| // c_first to c_last will have width w |
| widths_array->AppendNew<CPDF_Number>(ch); |
| ch = next_ch; |
| while (true) { |
| auto next_it = std::next(it); |
| if (next_it == widths.end() || next_it->first != it->first + 1 || |
| next_it->second != it->second) { |
| break; |
| } |
| ++it; |
| ch = it->first; |
| } |
| widths_array->AppendNew<CPDF_Number>(ch); |
| widths_array->AppendNew<CPDF_Number>(w); |
| continue; |
| } |
| // Otherwise we can have a group of the form c [w1 w2 ...]: c has width |
| // w1, c+1 has width w2, etc. |
| widths_array->AppendNew<CPDF_Number>(ch); |
| auto current_width_array = pdfium::MakeRetain<CPDF_Array>(); |
| current_width_array->AppendNew<CPDF_Number>(w); |
| current_width_array->AppendNew<CPDF_Number>(next_w); |
| while (true) { |
| auto next_it = std::next(it); |
| if (next_it == widths.end() || next_it->first != it->first + 1) { |
| break; |
| } |
| ++it; |
| current_width_array->AppendNew<CPDF_Number>(static_cast<int>(it->second)); |
| } |
| widths_array->Append(std::move(current_width_array)); |
| } |
| return widths_array; |
| } |
| |
| const char kToUnicodeStart[] = |
| "/CIDInit /ProcSet findresource begin\n" |
| "12 dict begin\n" |
| "begincmap\n" |
| "/CIDSystemInfo\n" |
| "<</Registry (Adobe)\n" |
| "/Ordering (Identity)\n" |
| "/Supplement 0\n" |
| ">> def\n" |
| "/CMapName /Adobe-Identity-H def\n" |
| "/CMapType 2 def\n" |
| "1 begincodespacerange\n" |
| "<0000> <FFFF>\n" |
| "endcodespacerange\n"; |
| |
| const char kToUnicodeEnd[] = |
| "endcmap\n" |
| "CMapName currentdict /CMap defineresource pop\n" |
| "end\n" |
| "end\n"; |
| |
| void AddCharcode(fxcrt::ostringstream& buffer, uint32_t number) { |
| CHECK_LE(number, 0xFFFF); |
| buffer << "<"; |
| char ans[4]; |
| FXSYS_IntToFourHexChars(number, ans); |
| for (char c : ans) { |
| buffer << c; |
| } |
| buffer << ">"; |
| } |
| |
| // PDF spec 1.7 Section 5.9.2: "Unicode character sequences as expressed in |
| // UTF-16BE encoding." See https://en.wikipedia.org/wiki/UTF-16#Description |
| void AddUnicode(fxcrt::ostringstream& buffer, uint32_t unicode) { |
| if (pdfium::IsHighSurrogate(unicode) || pdfium::IsLowSurrogate(unicode)) { |
| unicode = 0; |
| } |
| |
| char ans[8]; |
| size_t char_count = FXSYS_ToUTF16BE(unicode, ans); |
| buffer << "<"; |
| CHECK_LE(char_count, std::size(ans)); |
| auto ans_span = pdfium::make_span(ans).first(char_count); |
| for (char c : ans_span) { |
| buffer << c; |
| } |
| buffer << ">"; |
| } |
| |
| // Loads the charcode to unicode mapping into a stream |
| RetainPtr<CPDF_Stream> LoadUnicode( |
| CPDF_Document* doc, |
| const std::multimap<uint32_t, uint32_t>& to_unicode) { |
| // A map charcode->unicode |
| std::map<uint32_t, uint32_t> char_to_uni; |
| // A map <char_start, char_end> to vector v of unicode characters of size (end |
| // - start + 1). This abbreviates: start->v[0], start+1->v[1], etc. PDF spec |
| // 1.7 Section 5.9.2 says that only the last byte of the unicode may change. |
| std::map<std::pair<uint32_t, uint32_t>, std::vector<uint32_t>> |
| map_range_vector; |
| // A map <start, end> -> unicode |
| // This abbreviates: start->unicode, start+1->unicode+1, etc. |
| // PDF spec 1.7 Section 5.9.2 says that only the last byte of the unicode may |
| // change. |
| std::map<std::pair<uint32_t, uint32_t>, uint32_t> map_range; |
| |
| // Calculate the maps |
| for (auto it = to_unicode.begin(); it != to_unicode.end(); ++it) { |
| uint32_t first_charcode = it->first; |
| uint32_t first_unicode = it->second; |
| { |
| auto next_it = std::next(it); |
| if (next_it == to_unicode.end() || first_charcode + 1 != next_it->first) { |
| char_to_uni[first_charcode] = first_unicode; |
| continue; |
| } |
| } |
| ++it; |
| uint32_t current_charcode = it->first; |
| uint32_t current_unicode = it->second; |
| if (current_charcode % 256 == 0) { |
| char_to_uni[first_charcode] = first_unicode; |
| char_to_uni[current_charcode] = current_unicode; |
| continue; |
| } |
| const size_t max_extra = 255 - (current_charcode % 256); |
| auto next_it = std::next(it); |
| if (first_unicode + 1 != current_unicode) { |
| // Consecutive charcodes mapping to non-consecutive unicodes |
| std::vector<uint32_t> unicodes = {first_unicode, current_unicode}; |
| for (size_t i = 0; i < max_extra; ++i) { |
| if (next_it == to_unicode.end() || |
| current_charcode + 1 != next_it->first) { |
| break; |
| } |
| ++it; |
| ++current_charcode; |
| unicodes.push_back(it->second); |
| next_it = std::next(it); |
| } |
| CHECK_EQ(it->first - first_charcode + 1, unicodes.size()); |
| map_range_vector[std::make_pair(first_charcode, it->first)] = unicodes; |
| continue; |
| } |
| // Consecutive charcodes mapping to consecutive unicodes |
| for (size_t i = 0; i < max_extra; ++i) { |
| if (next_it == to_unicode.end() || |
| current_charcode + 1 != next_it->first || |
| current_unicode + 1 != next_it->second) { |
| break; |
| } |
| ++it; |
| ++current_charcode; |
| ++current_unicode; |
| next_it = std::next(it); |
| } |
| map_range[std::make_pair(first_charcode, current_charcode)] = first_unicode; |
| } |
| |
| fxcrt::ostringstream buffer; |
| buffer << kToUnicodeStart; |
| // Add maps to buffer |
| buffer << static_cast<uint32_t>(char_to_uni.size()) << " beginbfchar\n"; |
| for (const auto& it : char_to_uni) { |
| AddCharcode(buffer, it.first); |
| buffer << " "; |
| AddUnicode(buffer, it.second); |
| buffer << "\n"; |
| } |
| buffer << "endbfchar\n" |
| << static_cast<uint32_t>(map_range_vector.size() + map_range.size()) |
| << " beginbfrange\n"; |
| for (const auto& it : map_range_vector) { |
| const std::pair<uint32_t, uint32_t>& charcode_range = it.first; |
| AddCharcode(buffer, charcode_range.first); |
| buffer << " "; |
| AddCharcode(buffer, charcode_range.second); |
| buffer << " ["; |
| const std::vector<uint32_t>& unicodes = it.second; |
| for (size_t i = 0; i < unicodes.size(); ++i) { |
| AddUnicode(buffer, unicodes[i]); |
| if (i != unicodes.size() - 1) |
| buffer << " "; |
| } |
| buffer << "]\n"; |
| } |
| for (const auto& it : map_range) { |
| const std::pair<uint32_t, uint32_t>& charcode_range = it.first; |
| AddCharcode(buffer, charcode_range.first); |
| buffer << " "; |
| AddCharcode(buffer, charcode_range.second); |
| buffer << " "; |
| AddUnicode(buffer, it.second); |
| buffer << "\n"; |
| } |
| buffer << "endbfrange\n"; |
| buffer << kToUnicodeEnd; |
| auto stream = doc->NewIndirect<CPDF_Stream>(&buffer); |
| return stream; |
| } |
| |
| void CreateDescendantFontsArray(CPDF_Document* doc, |
| CPDF_Dictionary* font_dict, |
| uint32_t cid_font_dict_obj_num) { |
| auto descendant_fonts_dict = |
| font_dict->SetNewFor<CPDF_Array>("DescendantFonts"); |
| descendant_fonts_dict->AppendNew<CPDF_Reference>(doc, cid_font_dict_obj_num); |
| } |
| |
| RetainPtr<CPDF_Font> LoadSimpleFont(CPDF_Document* doc, |
| std::unique_ptr<CFX_Font> font, |
| pdfium::span<const uint8_t> font_data, |
| int font_type) { |
| // If it doesn't have a single char, just fail. |
| RetainPtr<CFX_Face> face = font->GetFace(); |
| if (face->GetGlyphCount() <= 0) { |
| return nullptr; |
| } |
| |
| // Simple fonts have 1-byte charcodes only. |
| static constexpr uint32_t kMaxSimpleFontChar = 0xFF; |
| auto char_codes_and_indices = |
| face->GetCharCodesAndIndices(kMaxSimpleFontChar); |
| if (char_codes_and_indices.empty()) { |
| return nullptr; |
| } |
| |
| auto font_dict = doc->NewIndirect<CPDF_Dictionary>(); |
| font_dict->SetNewFor<CPDF_Name>("Type", "Font"); |
| font_dict->SetNewFor<CPDF_Name>( |
| "Subtype", font_type == FPDF_FONT_TYPE1 ? "Type1" : "TrueType"); |
| const ByteString name = BaseFontNameForType(font.get(), font_type); |
| font_dict->SetNewFor<CPDF_Name>("BaseFont", name); |
| |
| font_dict->SetNewFor<CPDF_Number>( |
| "FirstChar", static_cast<int>(char_codes_and_indices[0].char_code)); |
| auto widths_array = doc->NewIndirect<CPDF_Array>(); |
| for (size_t i = 0; i < char_codes_and_indices.size(); ++i) { |
| widths_array->AppendNew<CPDF_Number>( |
| font->GetGlyphWidth(char_codes_and_indices[i].glyph_index)); |
| if (i > 0 && i < char_codes_and_indices.size() - 1) { |
| for (uint32_t j = char_codes_and_indices[i - 1].char_code + 1; |
| j < char_codes_and_indices[i].char_code; ++j) { |
| widths_array->AppendNew<CPDF_Number>(0); |
| } |
| } |
| } |
| font_dict->SetNewFor<CPDF_Number>( |
| "LastChar", static_cast<int>(char_codes_and_indices.back().char_code)); |
| font_dict->SetNewFor<CPDF_Reference>("Widths", doc, |
| widths_array->GetObjNum()); |
| RetainPtr<CPDF_Dictionary> font_descriptor_dict = |
| LoadFontDesc(doc, name, font.get(), font_data, font_type); |
| |
| font_dict->SetNewFor<CPDF_Reference>("FontDescriptor", doc, |
| font_descriptor_dict->GetObjNum()); |
| return CPDF_DocPageData::FromDocument(doc)->GetFont(std::move(font_dict)); |
| } |
| |
| RetainPtr<CPDF_Font> LoadCompositeFont(CPDF_Document* doc, |
| std::unique_ptr<CFX_Font> font, |
| pdfium::span<const uint8_t> font_data, |
| int font_type) { |
| // If it doesn't have a single char, just fail. |
| RetainPtr<CFX_Face> face = font->GetFace(); |
| if (face->GetGlyphCount() <= 0) { |
| return nullptr; |
| } |
| |
| auto char_codes_and_indices = |
| face->GetCharCodesAndIndices(pdfium::kMaximumSupplementaryCodePoint); |
| if (char_codes_and_indices.empty()) { |
| return nullptr; |
| } |
| |
| const ByteString name = BaseFontNameForType(font.get(), font_type); |
| RetainPtr<CPDF_Dictionary> font_dict = |
| CreateCompositeFontDict(doc, font.get(), font_type, name); |
| |
| RetainPtr<CPDF_Dictionary> cid_font_dict = |
| CreateCidFontDict(doc, font_type, name); |
| |
| RetainPtr<CPDF_Dictionary> font_descriptor_dict = |
| LoadFontDesc(doc, name, font.get(), font_data, font_type); |
| cid_font_dict->SetNewFor<CPDF_Reference>("FontDescriptor", doc, |
| font_descriptor_dict->GetObjNum()); |
| |
| std::multimap<uint32_t, uint32_t> to_unicode; |
| std::map<uint32_t, uint32_t> widths; |
| for (const auto& item : char_codes_and_indices) { |
| if (!pdfium::Contains(widths, item.glyph_index)) { |
| widths[item.glyph_index] = font->GetGlyphWidth(item.glyph_index); |
| } |
| to_unicode.emplace(item.glyph_index, item.char_code); |
| } |
| RetainPtr<CPDF_Array> widths_array = CreateWidthsArray(doc, widths); |
| cid_font_dict->SetNewFor<CPDF_Reference>("W", doc, widths_array->GetObjNum()); |
| |
| // TODO(npm): Support vertical writing |
| |
| CreateDescendantFontsArray(doc, font_dict.Get(), cid_font_dict->GetObjNum()); |
| |
| RetainPtr<CPDF_Stream> to_unicode_stream = LoadUnicode(doc, to_unicode); |
| font_dict->SetNewFor<CPDF_Reference>("ToUnicode", doc, |
| to_unicode_stream->GetObjNum()); |
| return CPDF_DocPageData::FromDocument(doc)->GetFont(font_dict); |
| } |
| |
| RetainPtr<CPDF_Font> LoadCustomCompositeFont( |
| CPDF_Document* doc, |
| std::unique_ptr<CFX_Font> font, |
| pdfium::span<const uint8_t> font_span, |
| const char* to_unicode_cmap, |
| pdfium::span<const uint8_t> cid_to_gid_map_span) { |
| // If it doesn't have a single char, just fail. |
| RetainPtr<CFX_Face> face = font->GetFace(); |
| if (face->GetGlyphCount() <= 0) { |
| return nullptr; |
| } |
| |
| auto char_codes_and_indices = |
| face->GetCharCodesAndIndices(pdfium::kMaximumSupplementaryCodePoint); |
| if (char_codes_and_indices.empty()) { |
| return nullptr; |
| } |
| |
| const ByteString name = BaseFontNameForType(font.get(), FPDF_FONT_TRUETYPE); |
| RetainPtr<CPDF_Dictionary> font_dict = |
| CreateCompositeFontDict(doc, font.get(), FPDF_FONT_TRUETYPE, name); |
| |
| RetainPtr<CPDF_Dictionary> cid_font_dict = |
| CreateCidFontDict(doc, FPDF_FONT_TRUETYPE, name); |
| |
| RetainPtr<CPDF_Dictionary> font_descriptor = |
| LoadFontDesc(doc, name, font.get(), font_span, FPDF_FONT_TRUETYPE); |
| cid_font_dict->SetNewFor<CPDF_Reference>("FontDescriptor", doc, |
| font_descriptor->GetObjNum()); |
| |
| std::map<uint32_t, uint32_t> widths; |
| for (const auto& item : char_codes_and_indices) { |
| if (!pdfium::Contains(widths, item.glyph_index)) { |
| widths[item.glyph_index] = font->GetGlyphWidth(item.glyph_index); |
| } |
| } |
| RetainPtr<CPDF_Array> widths_array = CreateWidthsArray(doc, widths); |
| cid_font_dict->SetNewFor<CPDF_Reference>("W", doc, widths_array->GetObjNum()); |
| |
| auto cid_to_gid_map = doc->NewIndirect<CPDF_Stream>(cid_to_gid_map_span); |
| cid_font_dict->SetNewFor<CPDF_Reference>("CIDToGIDMap", doc, |
| cid_to_gid_map->GetObjNum()); |
| |
| CreateDescendantFontsArray(doc, font_dict, cid_font_dict->GetObjNum()); |
| |
| auto to_unicode_stream = doc->NewIndirect<CPDF_Stream>( |
| ByteStringView(to_unicode_cmap).unsigned_span()); |
| font_dict->SetNewFor<CPDF_Reference>("ToUnicode", doc, |
| to_unicode_stream->GetObjNum()); |
| return CPDF_DocPageData::FromDocument(doc)->GetFont(font_dict); |
| } |
| |
| CPDF_TextObject* CPDFTextObjectFromFPDFPageObject(FPDF_PAGEOBJECT page_object) { |
| auto* obj = CPDFPageObjectFromFPDFPageObject(page_object); |
| return obj ? obj->AsText() : nullptr; |
| } |
| |
| FPDF_GLYPHPATH FPDFGlyphPathFromCFXPath(const CFX_Path* path) { |
| return reinterpret_cast<FPDF_GLYPHPATH>(path); |
| } |
| const CFX_Path* CFXPathFromFPDFGlyphPath(FPDF_GLYPHPATH path) { |
| return reinterpret_cast<const CFX_Path*>(path); |
| } |
| |
| } // namespace |
| |
| FPDF_EXPORT FPDF_PAGEOBJECT FPDF_CALLCONV |
| FPDFPageObj_NewTextObj(FPDF_DOCUMENT document, |
| FPDF_BYTESTRING font, |
| float font_size) { |
| CPDF_Document* pDoc = CPDFDocumentFromFPDFDocument(document); |
| if (!pDoc) |
| return nullptr; |
| |
| RetainPtr<CPDF_Font> pFont = |
| CPDF_Font::GetStockFont(pDoc, ByteStringView(font)); |
| if (!pFont) |
| return nullptr; |
| |
| auto pTextObj = std::make_unique<CPDF_TextObject>(); |
| pTextObj->mutable_text_state().SetFont(std::move(pFont)); |
| pTextObj->mutable_text_state().SetFontSize(font_size); |
| pTextObj->SetDefaultStates(); |
| |
| // Caller takes ownership. |
| return FPDFPageObjectFromCPDFPageObject(pTextObj.release()); |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV |
| FPDFText_SetText(FPDF_PAGEOBJECT text_object, FPDF_WIDESTRING text) { |
| CPDF_TextObject* pTextObj = CPDFTextObjectFromFPDFPageObject(text_object); |
| if (!pTextObj) { |
| return false; |
| } |
| // SAFETY: required from caller. |
| WideString encodedText = UNSAFE_BUFFERS(WideStringFromFPDFWideString(text)); |
| ByteString byteText; |
| for (wchar_t wc : encodedText) { |
| pTextObj->GetFont()->AppendChar( |
| &byteText, pTextObj->GetFont()->CharCodeFromUnicode(wc)); |
| } |
| pTextObj->SetText(byteText); |
| return true; |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV |
| FPDFText_SetCharcodes(FPDF_PAGEOBJECT text_object, |
| const uint32_t* charcodes, |
| size_t count) { |
| CPDF_TextObject* pTextObj = CPDFTextObjectFromFPDFPageObject(text_object); |
| if (!pTextObj) |
| return false; |
| |
| if (!charcodes && count) |
| return false; |
| |
| ByteString byte_text; |
| if (charcodes) { |
| for (size_t i = 0; i < count; ++i) { |
| pTextObj->GetFont()->AppendChar(&byte_text, UNSAFE_TODO(charcodes[i])); |
| } |
| } |
| pTextObj->SetText(byte_text); |
| return true; |
| } |
| |
| FPDF_EXPORT FPDF_FONT FPDF_CALLCONV FPDFText_LoadFont(FPDF_DOCUMENT document, |
| const uint8_t* data, |
| uint32_t size, |
| int font_type, |
| FPDF_BOOL cid) { |
| CPDF_Document* pDoc = CPDFDocumentFromFPDFDocument(document); |
| if (!pDoc || !data || size == 0 || |
| (font_type != FPDF_FONT_TYPE1 && font_type != FPDF_FONT_TRUETYPE)) { |
| return nullptr; |
| } |
| // SAFETY: required from caller. |
| auto span = UNSAFE_BUFFERS(pdfium::make_span(data, size)); |
| auto pFont = std::make_unique<CFX_Font>(); |
| |
| // TODO(npm): Maybe use FT_Get_X11_Font_Format to check format? Otherwise, we |
| // are allowing giving any font that can be loaded on freetype and setting it |
| // as any font type. |
| if (!pFont->LoadEmbedded(span, /*force_vertical=*/false, /*object_tag=*/0)) |
| return nullptr; |
| |
| // Caller takes ownership. |
| return FPDFFontFromCPDFFont( |
| cid ? LoadCompositeFont(pDoc, std::move(pFont), span, font_type).Leak() |
| : LoadSimpleFont(pDoc, std::move(pFont), span, font_type).Leak()); |
| } |
| |
| FPDF_EXPORT FPDF_FONT FPDF_CALLCONV |
| FPDFText_LoadStandardFont(FPDF_DOCUMENT document, FPDF_BYTESTRING font) { |
| CPDF_Document* pDoc = CPDFDocumentFromFPDFDocument(document); |
| if (!pDoc) |
| return nullptr; |
| |
| // Caller takes ownership. |
| return FPDFFontFromCPDFFont( |
| CPDF_Font::GetStockFont(pDoc, ByteStringView(font)).Leak()); |
| } |
| |
| FPDF_EXPORT FPDF_FONT FPDF_CALLCONV |
| FPDFText_LoadCidType2Font(FPDF_DOCUMENT document, |
| const uint8_t* font_data, |
| uint32_t font_data_size, |
| FPDF_BYTESTRING to_unicode_cmap, |
| const uint8_t* cid_to_gid_map_data, |
| uint32_t cid_to_gid_map_data_size) { |
| CPDF_Document* doc = CPDFDocumentFromFPDFDocument(document); |
| if (!doc || !font_data || font_data_size == 0 || !to_unicode_cmap || |
| strlen(to_unicode_cmap) == 0 || !cid_to_gid_map_data || |
| cid_to_gid_map_data_size == 0) { |
| return nullptr; |
| } |
| // SAFETY: required from caller. |
| auto font_span = UNSAFE_BUFFERS(pdfium::make_span(font_data, font_data_size)); |
| auto font = std::make_unique<CFX_Font>(); |
| |
| // TODO(thestig): Consider checking the font format. See similar comment in |
| // FPDFText_LoadFont() above. |
| if (!font->LoadEmbedded(font_span, /*force_vertical=*/false, |
| /*object_tag=*/0)) { |
| return nullptr; |
| } |
| |
| // Caller takes ownership of result. |
| // SAFETY: caller ensures `cid_to_gid_map_data` points to at least |
| // `cid_to_gid_map_data_size` entries. |
| return FPDFFontFromCPDFFont( |
| LoadCustomCompositeFont( |
| doc, std::move(font), font_span, to_unicode_cmap, |
| UNSAFE_BUFFERS( |
| pdfium::make_span(cid_to_gid_map_data, cid_to_gid_map_data_size))) |
| .Leak()); |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV |
| FPDFTextObj_GetFontSize(FPDF_PAGEOBJECT text, float* size) { |
| if (!size) |
| return false; |
| |
| CPDF_TextObject* pTextObj = CPDFTextObjectFromFPDFPageObject(text); |
| if (!pTextObj) |
| return false; |
| |
| *size = pTextObj->GetFontSize(); |
| return true; |
| } |
| |
| FPDF_EXPORT unsigned long FPDF_CALLCONV |
| FPDFTextObj_GetText(FPDF_PAGEOBJECT text_object, |
| FPDF_TEXTPAGE text_page, |
| FPDF_WCHAR* buffer, |
| unsigned long length) { |
| CPDF_TextObject* pTextObj = CPDFTextObjectFromFPDFPageObject(text_object); |
| if (!pTextObj) |
| return 0; |
| |
| CPDF_TextPage* pTextPage = CPDFTextPageFromFPDFTextPage(text_page); |
| if (!pTextPage) |
| return 0; |
| |
| // SAFETY: required from caller. |
| return Utf16EncodeMaybeCopyAndReturnLength( |
| pTextPage->GetTextByObject(pTextObj), |
| UNSAFE_BUFFERS(SpanFromFPDFApiArgs(buffer, length))); |
| } |
| |
| FPDF_EXPORT FPDF_BITMAP FPDF_CALLCONV |
| FPDFTextObj_GetRenderedBitmap(FPDF_DOCUMENT document, |
| FPDF_PAGE page, |
| FPDF_PAGEOBJECT text_object, |
| float scale) { |
| CPDF_Document* doc = CPDFDocumentFromFPDFDocument(document); |
| if (!doc) |
| return nullptr; |
| |
| CPDF_Page* optional_page = CPDFPageFromFPDFPage(page); |
| if (optional_page && optional_page->GetDocument() != doc) |
| return nullptr; |
| |
| CPDF_TextObject* text = CPDFTextObjectFromFPDFPageObject(text_object); |
| if (!text) |
| return nullptr; |
| |
| if (scale <= 0) |
| return nullptr; |
| |
| const CFX_Matrix scale_matrix(scale, 0, 0, scale, 0, 0); |
| const CFX_FloatRect& text_rect = text->GetRect(); |
| const CFX_FloatRect scaled_text_rect = scale_matrix.TransformRect(text_rect); |
| |
| // `rect` has to use integer values. Round up as needed. |
| const FX_RECT rect = scaled_text_rect.GetOuterRect(); |
| if (rect.IsEmpty()) |
| return nullptr; |
| |
| auto result_bitmap = pdfium::MakeRetain<CFX_DIBitmap>(); |
| if (!result_bitmap->Create(rect.Width(), rect.Height(), FXDIB_Format::kArgb)) |
| return nullptr; |
| |
| auto render_context = std::make_unique<CPDF_PageRenderContext>(); |
| CPDF_PageRenderContext* render_context_ptr = render_context.get(); |
| CPDF_Page::RenderContextClearer clearer(optional_page); |
| if (optional_page) |
| optional_page->SetRenderContext(std::move(render_context)); |
| |
| RetainPtr<CPDF_Dictionary> page_resources = |
| optional_page ? optional_page->GetMutablePageResources() : nullptr; |
| |
| auto device = std::make_unique<CFX_DefaultRenderDevice>(); |
| CFX_DefaultRenderDevice* device_ptr = device.get(); |
| render_context_ptr->m_pDevice = std::move(device); |
| render_context_ptr->m_pContext = std::make_unique<CPDF_RenderContext>( |
| doc, std::move(page_resources), /*pPageCache=*/nullptr); |
| |
| device_ptr->Attach(result_bitmap); |
| |
| CFX_Matrix device_matrix(rect.Width(), 0, 0, rect.Height(), 0, 0); |
| CPDF_RenderStatus status(render_context_ptr->m_pContext.get(), device_ptr); |
| status.SetDeviceMatrix(device_matrix); |
| status.Initialize(nullptr, nullptr); |
| |
| // Need to flip the rendering and also move it to fit within `result_bitmap`. |
| CFX_Matrix render_matrix(1, 0, 0, -1, -text_rect.left, text_rect.top); |
| render_matrix *= scale_matrix; |
| status.RenderSingleObject(text, render_matrix); |
| |
| // Caller takes ownership. |
| return FPDFBitmapFromCFXDIBitmap(result_bitmap.Leak()); |
| } |
| |
| FPDF_EXPORT void FPDF_CALLCONV FPDFFont_Close(FPDF_FONT font) { |
| // Take back ownership from caller and release. |
| RetainPtr<CPDF_Font>().Unleak(CPDFFontFromFPDFFont(font)); |
| } |
| |
| FPDF_EXPORT FPDF_PAGEOBJECT FPDF_CALLCONV |
| FPDFPageObj_CreateTextObj(FPDF_DOCUMENT document, |
| FPDF_FONT font, |
| float font_size) { |
| CPDF_Document* pDoc = CPDFDocumentFromFPDFDocument(document); |
| CPDF_Font* pFont = CPDFFontFromFPDFFont(font); |
| if (!pDoc || !pFont) |
| return nullptr; |
| |
| auto pTextObj = std::make_unique<CPDF_TextObject>(); |
| pTextObj->mutable_text_state().SetFont( |
| CPDF_DocPageData::FromDocument(pDoc)->GetFont( |
| pFont->GetMutableFontDict())); |
| pTextObj->mutable_text_state().SetFontSize(font_size); |
| pTextObj->SetDefaultStates(); |
| return FPDFPageObjectFromCPDFPageObject(pTextObj.release()); |
| } |
| |
| FPDF_EXPORT FPDF_TEXT_RENDERMODE FPDF_CALLCONV |
| FPDFTextObj_GetTextRenderMode(FPDF_PAGEOBJECT text) { |
| CPDF_TextObject* pTextObj = CPDFTextObjectFromFPDFPageObject(text); |
| if (!pTextObj) |
| return FPDF_TEXTRENDERMODE_UNKNOWN; |
| return static_cast<FPDF_TEXT_RENDERMODE>(pTextObj->GetTextRenderMode()); |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV |
| FPDFTextObj_SetTextRenderMode(FPDF_PAGEOBJECT text, |
| FPDF_TEXT_RENDERMODE render_mode) { |
| if (render_mode <= FPDF_TEXTRENDERMODE_UNKNOWN || |
| render_mode > FPDF_TEXTRENDERMODE_LAST) { |
| return false; |
| } |
| |
| CPDF_TextObject* pTextObj = CPDFTextObjectFromFPDFPageObject(text); |
| if (!pTextObj) |
| return false; |
| |
| pTextObj->SetTextRenderMode(static_cast<TextRenderingMode>(render_mode)); |
| return true; |
| } |
| |
| FPDF_EXPORT FPDF_FONT FPDF_CALLCONV FPDFTextObj_GetFont(FPDF_PAGEOBJECT text) { |
| CPDF_TextObject* pTextObj = CPDFTextObjectFromFPDFPageObject(text); |
| if (!pTextObj) |
| return nullptr; |
| |
| // Unretained reference in public API. NOLINTNEXTLINE |
| return FPDFFontFromCPDFFont(pTextObj->GetFont()); |
| } |
| |
| FPDF_EXPORT unsigned long FPDF_CALLCONV |
| FPDFFont_GetFontName(FPDF_FONT font, char* buffer, unsigned long length) { |
| auto* pFont = CPDFFontFromFPDFFont(font); |
| if (!pFont) |
| return 0; |
| |
| // SAFETY: required from caller. |
| auto result_span = UNSAFE_BUFFERS(SpanFromFPDFApiArgs(buffer, length)); |
| ByteString name = pFont->GetFont()->GetFamilyName(); |
| pdfium::span<const char> name_span = name.span_with_terminator(); |
| fxcrt::try_spancpy(result_span, name_span); |
| return static_cast<unsigned long>(name_span.size()); |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetFontData(FPDF_FONT font, |
| uint8_t* buffer, |
| size_t buflen, |
| size_t* out_buflen) { |
| auto* cfont = CPDFFontFromFPDFFont(font); |
| if (!cfont || !out_buflen) |
| return false; |
| |
| // SAFETY: required from caller. |
| auto result_span = UNSAFE_BUFFERS( |
| SpanFromFPDFApiArgs(buffer, pdfium::checked_cast<unsigned long>(buflen))); |
| pdfium::span<const uint8_t> data = cfont->GetFont()->GetFontSpan(); |
| fxcrt::try_spancpy(result_span, data); |
| *out_buflen = data.size(); |
| return true; |
| } |
| |
| FPDF_EXPORT int FPDF_CALLCONV FPDFFont_GetIsEmbedded(FPDF_FONT font) { |
| auto* cfont = CPDFFontFromFPDFFont(font); |
| if (!cfont) |
| return -1; |
| return cfont->IsEmbedded() ? 1 : 0; |
| } |
| |
| FPDF_EXPORT int FPDF_CALLCONV FPDFFont_GetFlags(FPDF_FONT font) { |
| auto* pFont = CPDFFontFromFPDFFont(font); |
| if (!pFont) |
| return -1; |
| |
| // Return only flags from ISO 32000-1:2008, table 123. |
| return pFont->GetFontFlags() & 0x7ffff; |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetWeight(FPDF_FONT font) { |
| auto* pFont = CPDFFontFromFPDFFont(font); |
| return pFont ? pFont->GetFontWeight() : -1; |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetItalicAngle(FPDF_FONT font, |
| int* angle) { |
| auto* pFont = CPDFFontFromFPDFFont(font); |
| if (!pFont || !angle) |
| return false; |
| |
| *angle = pFont->GetItalicAngle(); |
| return true; |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetAscent(FPDF_FONT font, |
| float font_size, |
| float* ascent) { |
| auto* pFont = CPDFFontFromFPDFFont(font); |
| if (!pFont || !ascent) |
| return false; |
| |
| *ascent = pFont->GetTypeAscent() * font_size / 1000.f; |
| return true; |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetDescent(FPDF_FONT font, |
| float font_size, |
| float* descent) { |
| auto* pFont = CPDFFontFromFPDFFont(font); |
| if (!pFont || !descent) |
| return false; |
| |
| *descent = pFont->GetTypeDescent() * font_size / 1000.f; |
| return true; |
| } |
| |
| FPDF_EXPORT FPDF_BOOL FPDF_CALLCONV FPDFFont_GetGlyphWidth(FPDF_FONT font, |
| uint32_t glyph, |
| float font_size, |
| float* width) { |
| auto* pFont = CPDFFontFromFPDFFont(font); |
| if (!pFont || !width) |
| return false; |
| |
| uint32_t charcode = pFont->CharCodeFromUnicode(static_cast<wchar_t>(glyph)); |
| |
| CPDF_CIDFont* pCIDFont = pFont->AsCIDFont(); |
| if (pCIDFont && pCIDFont->IsVertWriting()) { |
| uint16_t cid = pCIDFont->CIDFromCharCode(charcode); |
| *width = pCIDFont->GetVertWidth(cid) * font_size / 1000.f; |
| } else { |
| *width = pFont->GetCharWidthF(charcode) * font_size / 1000.f; |
| } |
| |
| return true; |
| } |
| |
| FPDF_EXPORT FPDF_GLYPHPATH FPDF_CALLCONV |
| FPDFFont_GetGlyphPath(FPDF_FONT font, uint32_t glyph, float font_size) { |
| auto* pFont = CPDFFontFromFPDFFont(font); |
| if (!pFont) |
| return nullptr; |
| |
| if (!pdfium::IsValueInRangeForNumericType<wchar_t>(glyph)) { |
| return nullptr; |
| } |
| |
| uint32_t charcode = pFont->CharCodeFromUnicode(static_cast<wchar_t>(glyph)); |
| std::vector<TextCharPos> pos = |
| GetCharPosList(pdfium::span_from_ref(charcode), |
| pdfium::span<const float>(), pFont, font_size); |
| if (pos.empty()) |
| return nullptr; |
| |
| CFX_Font* pCfxFont; |
| if (pos[0].m_FallbackFontPosition == -1) { |
| pCfxFont = pFont->GetFont(); |
| DCHECK(pCfxFont); // Never null. |
| } else { |
| pCfxFont = pFont->GetFontFallback(pos[0].m_FallbackFontPosition); |
| if (!pCfxFont) |
| return nullptr; |
| } |
| |
| const CFX_Path* pPath = |
| pCfxFont->LoadGlyphPath(pos[0].m_GlyphIndex, pos[0].m_FontCharWidth); |
| |
| return FPDFGlyphPathFromCFXPath(pPath); |
| } |
| |
| FPDF_EXPORT int FPDF_CALLCONV |
| FPDFGlyphPath_CountGlyphSegments(FPDF_GLYPHPATH glyphpath) { |
| auto* pPath = CFXPathFromFPDFGlyphPath(glyphpath); |
| if (!pPath) |
| return -1; |
| |
| return fxcrt::CollectionSize<int>(pPath->GetPoints()); |
| } |
| |
| FPDF_EXPORT FPDF_PATHSEGMENT FPDF_CALLCONV |
| FPDFGlyphPath_GetGlyphPathSegment(FPDF_GLYPHPATH glyphpath, int index) { |
| auto* pPath = CFXPathFromFPDFGlyphPath(glyphpath); |
| if (!pPath) |
| return nullptr; |
| |
| pdfium::span<const CFX_Path::Point> points = pPath->GetPoints(); |
| if (!fxcrt::IndexInBounds(points, index)) |
| return nullptr; |
| |
| return FPDFPathSegmentFromFXPathPoint(&points[index]); |
| } |