blob: 14f0b86cdfaffb915ca66e97bdd24b088ea21b89 [file] [log] [blame] [edit]
// Copyright 2016 The PDFium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#include "core/fpdfapi/render/charposlist.h"
#include "build/build_config.h"
#include "core/fpdfapi/font/cpdf_cidfont.h"
#include "core/fpdfapi/font/cpdf_font.h"
#include "core/fpdfapi/parser/cpdf_stream.h"
#include "core/fxge/cfx_fontmapper.h"
#include "core/fxge/cfx_substfont.h"
#include "core/fxge/text_char_pos.h"
namespace {
bool ShouldUseExistingFont(const CPDF_Font* font,
uint32_t glyph_id,
bool has_to_unicode) {
// Check for invalid glyph ID.
if (glyph_id == static_cast<uint32_t>(-1))
return false;
if (!font->IsTrueTypeFont())
return true;
// For TrueType fonts, a glyph ID of 0 may be invalid.
//
// When a "ToUnicode" entry exists in the font dictionary, it indicates
// a "ToUnicode" mapping file is used to convert from CIDs (which
// begins at decimal 0) to Unicode code. (See ToUnicode Mapping File
// Tutorial - Adobe
// https://www.adobe.com/content/dam/acom/en/devnet/acrobat/pdfs/5411.ToUnicode.pdf
// and
// https://www.freetype.org/freetype2/docs/tutorial/step1.html#section-6)
return glyph_id != 0 || has_to_unicode;
}
// The following is not a perfect solution and can be further improved.
// For example, if `subst_font` is "Book" and the `base_font_name` is "Bookman",
// this function will return "true" even though the actual font "Bookman"
// is not loaded.
// An exact string match is not possible here, because `subst_font_name`
// will be the same value for different postscript names.
// For example: "Times New Roman" as `subst_font_name` for all of these
// `base_font_name` values: "TimesNewRoman,Bold", "TimesNewRomanPS-Bold",
// "TimesNewRomanBold" and "TimesNewRoman-Bold".
bool IsActualFontLoaded(const CFX_SubstFont* subst_font,
const ByteString& base_font_name) {
// Skip if we loaded the actual font.
// example: TimesNewRoman,Bold -> Times New Roman
ByteString subst_font_name = subst_font->m_Family;
subst_font_name.Remove(' ');
subst_font_name.MakeLower();
std::optional<size_t> find =
base_font_name.Find(subst_font_name.AsStringView());
return find.has_value() && find.value() == 0;
}
bool ApplyGlyphSpacingHeuristic(const CPDF_Font* font,
const CFX_Font* current_font,
bool is_vertical_writing) {
if (is_vertical_writing || font->IsEmbedded() || !font->HasFontWidths()) {
return false;
}
// Skip if we loaded a standard alternate font.
// example: Helvetica -> Arial
ByteString base_font_name = font->GetBaseFontName();
base_font_name.MakeLower();
auto standard_font_name =
CFX_FontMapper::GetStandardFontName(&base_font_name);
if (standard_font_name.has_value()) {
return false;
}
CFX_SubstFont* subst_font = current_font->GetSubstFont();
if (subst_font->IsBuiltInGenericFont()) {
return false;
}
return !IsActualFontLoaded(subst_font, base_font_name);
}
} // namespace
std::vector<TextCharPos> GetCharPosList(pdfium::span<const uint32_t> char_codes,
pdfium::span<const float> char_pos,
CPDF_Font* font,
float font_size) {
std::vector<TextCharPos> results;
results.reserve(char_codes.size());
CPDF_CIDFont* cid_font = font->AsCIDFont();
bool is_vertical_writing = cid_font && cid_font->IsVertWriting();
bool has_to_unicode = !!font->GetFontDict()->GetStreamFor("ToUnicode");
for (size_t i = 0; i < char_codes.size(); ++i) {
uint32_t char_code = char_codes[i];
if (char_code == static_cast<uint32_t>(-1))
continue;
bool is_vertical_glyph = false;
results.emplace_back();
TextCharPos& text_char_pos = results.back();
if (cid_font)
text_char_pos.m_bFontStyle = true;
WideString unicode = font->UnicodeFromCharCode(char_code);
text_char_pos.m_Unicode = !unicode.IsEmpty() ? unicode[0] : char_code;
text_char_pos.m_GlyphIndex =
font->GlyphFromCharCode(char_code, &is_vertical_glyph);
uint32_t glyph_id = text_char_pos.m_GlyphIndex;
#if BUILDFLAG(IS_APPLE)
text_char_pos.m_ExtGID = font->GlyphFromCharCodeExt(char_code);
glyph_id = text_char_pos.m_ExtGID != static_cast<uint32_t>(-1)
? text_char_pos.m_ExtGID
: text_char_pos.m_GlyphIndex;
#endif
CFX_Font* current_font;
if (ShouldUseExistingFont(font, glyph_id, has_to_unicode)) {
current_font = font->GetFont();
text_char_pos.m_FallbackFontPosition = -1;
} else {
int32_t fallback_position = font->FallbackFontFromCharcode(char_code);
current_font = font->GetFontFallback(fallback_position);
text_char_pos.m_FallbackFontPosition = fallback_position;
text_char_pos.m_GlyphIndex =
font->FallbackGlyphFromCharcode(fallback_position, char_code);
#if BUILDFLAG(IS_APPLE)
text_char_pos.m_ExtGID = text_char_pos.m_GlyphIndex;
#endif
}
if (!font->IsEmbedded() && !font->IsCIDFont())
text_char_pos.m_FontCharWidth = font->GetCharWidthF(char_code);
else
text_char_pos.m_FontCharWidth = 0;
text_char_pos.m_Origin = CFX_PointF(i > 0 ? char_pos[i - 1] : 0, 0);
text_char_pos.m_bGlyphAdjust = false;
float scaling_factor = 1.0f;
if (ApplyGlyphSpacingHeuristic(font, current_font, is_vertical_writing)) {
int pdf_glyph_width = font->GetCharWidthF(char_code);
int font_glyph_width =
current_font->GetGlyphWidth(text_char_pos.m_GlyphIndex);
if (font_glyph_width && pdf_glyph_width > font_glyph_width + 1) {
// Move the initial x position by half of the excess (transformed to
// text space coordinates).
text_char_pos.m_Origin.x +=
(pdf_glyph_width - font_glyph_width) * font_size / 2000.0f;
} else if (pdf_glyph_width && font_glyph_width &&
pdf_glyph_width < font_glyph_width) {
scaling_factor = static_cast<float>(pdf_glyph_width) / font_glyph_width;
text_char_pos.m_AdjustMatrix[0] = scaling_factor;
text_char_pos.m_AdjustMatrix[1] = 0.0f;
text_char_pos.m_AdjustMatrix[2] = 0.0f;
text_char_pos.m_AdjustMatrix[3] = 1.0f;
text_char_pos.m_bGlyphAdjust = true;
}
}
if (!cid_font)
continue;
uint16_t cid = cid_font->CIDFromCharCode(char_code);
if (is_vertical_writing) {
text_char_pos.m_Origin = CFX_PointF(0, text_char_pos.m_Origin.x);
CFX_Point16 vertical_origin = cid_font->GetVertOrigin(cid);
text_char_pos.m_Origin.x -= font_size * vertical_origin.x / 1000;
text_char_pos.m_Origin.y -= font_size * vertical_origin.y / 1000;
}
const CIDTransform* cid_transform = cid_font->GetCIDTransform(cid);
if (cid_transform && !is_vertical_glyph) {
text_char_pos.m_AdjustMatrix[0] =
cid_font->CIDTransformToFloat(cid_transform->a) * scaling_factor;
text_char_pos.m_AdjustMatrix[1] =
cid_font->CIDTransformToFloat(cid_transform->b) * scaling_factor;
text_char_pos.m_AdjustMatrix[2] =
cid_font->CIDTransformToFloat(cid_transform->c);
text_char_pos.m_AdjustMatrix[3] =
cid_font->CIDTransformToFloat(cid_transform->d);
text_char_pos.m_Origin.x +=
cid_font->CIDTransformToFloat(cid_transform->e) * font_size;
text_char_pos.m_Origin.y +=
cid_font->CIDTransformToFloat(cid_transform->f) * font_size;
text_char_pos.m_bGlyphAdjust = true;
}
}
return results;
}