blob: 6d2974e83cdec9a730a5b110c155a9a1357e45f2 [file] [log] [blame] [edit]
// Copyright 2014 The PDFium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#include "xfa/fgas/layout/cfgas_txtbreak.h"
#include <algorithm>
#include <array>
#include "build/build_config.h"
#include "core/fxcrt/check.h"
#include "core/fxcrt/compiler_specific.h"
#include "core/fxcrt/containers/adapters.h"
#include "core/fxcrt/fx_codepage.h"
#include "core/fxcrt/fx_extension.h"
#include "core/fxcrt/fx_safe_types.h"
#include "core/fxcrt/numerics/safe_conversions.h"
#include "core/fxcrt/stl_util.h"
#include "core/fxge/text_char_pos.h"
#include "xfa/fgas/font/cfgas_gefont.h"
#include "xfa/fgas/layout/cfgas_char.h"
#include "xfa/fgas/layout/fgas_arabic.h"
#include "xfa/fgas/layout/fgas_linebreak.h"
namespace {
struct FX_FORMCHAR {
uint16_t wch;
uint16_t wForm;
int32_t iWidth;
};
bool IsCtrlCode(wchar_t wch) {
FX_CHARTYPE dwRet = pdfium::unicode::GetCharType(wch);
return dwRet == FX_CHARTYPE::kTab || dwRet == FX_CHARTYPE::kControl;
}
} // namespace
// Constructs a text breaker whose CFGAS_Break base is initialized with
// LayoutStyle::kNone.
CFGAS_TxtBreak::CFGAS_TxtBreak() : CFGAS_Break(LayoutStyle::kNone) {}
// Defaulted destructor; defined out of line in this translation unit.
CFGAS_TxtBreak::~CFGAS_TxtBreak() = default;
// Stores the maximum line width. |fLineWidth| is multiplied by
// kConversionFactor and rounded to obtain the integer value kept in
// |line_width_|.
void CFGAS_TxtBreak::SetLineWidth(float fLineWidth) {
  const auto scaled_width = fLineWidth * kConversionFactor;
  line_width_ = FXSYS_roundf(scaled_width);
  // Debug-only check that the converted width is not below 20000.
  DCHECK(20000 <= line_width_);
}
// Stores the line alignment flags. In debug builds, |iAlignment| is checked to
// lie within [CFX_TxtLineAlignment_Left, CFX_TxtLineAlignment_Justified].
void CFGAS_TxtBreak::SetAlignment(int32_t iAlignment) {
  DCHECK(CFX_TxtLineAlignment_Left <= iAlignment);
  DCHECK(CFX_TxtLineAlignment_Justified >= iAlignment);
  alignment_ = iAlignment;
}
// Stores the comb cell width. |fCombWidth| is multiplied by kConversionFactor
// and rounded to obtain the integer value kept in |comb_width_|.
void CFGAS_TxtBreak::SetCombWidth(float fCombWidth) {
  const auto scaled_width = fCombWidth * kConversionFactor;
  comb_width_ = FXSYS_roundf(scaled_width);
}
// Computes the width of a combining character and stores it, negated, in
// |pCurChar->char_width_|.
//
// In comb-text mode the width is |comb_width_|. Otherwise the width comes from
// the font (0 when there is no font or no width for the character), scaled by
// |font_size_| and |horizontal_scale_| / 100. When the character and the
// preceding one form a pair found in the Arabic shadda table, both are flagged
// with FX_TXTCHARSTYLE_ArabicShadda, the preceding character's width is
// zeroed, and the table entry is used for the font width lookup.
// If the checked arithmetic overflows, 0 is stored.
void CFGAS_TxtBreak::AppendChar_Combination(CFGAS_Char* pCurChar) {
  // Written before GetLastChar() is called below and overwritten at the end.
  // NOTE(review): GetLastChar() may look at this entry - keep the ordering.
  pCurChar->char_width_ = -1;

  FX_SAFE_INT32 safe_width = comb_width_;
  if (!comb_text_) {
    wchar_t code = pCurChar->char_code();
    CFGAS_Char* const last_char = GetLastChar(0, false, false);
    const bool may_pair =
        last_char && !(last_char->char_styles_ & FX_TXTCHARSTYLE_ArabicShadda);
    if (may_pair) {
      const wchar_t last_code = last_char->char_code();
      std::optional<uint16_t> paired;
      if (code == pdfium::kArabicShadda) {
        paired = pdfium::GetArabicFromShaddaTable(last_code);
      } else if (last_code == pdfium::kArabicShadda) {
        paired = pdfium::GetArabicFromShaddaTable(code);
      }
      if (paired.has_value()) {
        code = paired.value();
        pCurChar->char_styles_ |= FX_TXTCHARSTYLE_ArabicShadda;
        last_char->char_styles_ |= FX_TXTCHARSTYLE_ArabicShadda;
        last_char->char_width_ = 0;
      }
    }

    std::optional<uint16_t> font_width;
    if (font_) {
      font_width = font_->GetCharWidth(code);
    }
    safe_width = font_width.value_or(0);
    safe_width *= font_size_;
    safe_width *= horizontal_scale_;
    safe_width /= 100;
  }

  // The width is stored with its sign flipped.
  safe_width *= -1;
  pCurChar->char_width_ = safe_width.ValueOrDefault(0);
}
// Handles a tab character: only records FX_CHARTYPE::kTab as the current
// character type. |pCurChar| is not read or modified here.
void CFGAS_TxtBreak::AppendChar_Tab(CFGAS_Char* pCurChar) {
char_type_ = FX_CHARTYPE::kTab;
}
// Handles a control character. Records FX_CHARTYPE::kControl as the current
// character type and, unless in single-line mode, maps the character to a
// break request:
//   - vertical tab or line separator      -> line break
//   - form feed                           -> page break
//   - paragraph separator or the
//     configured paragraph break char     -> paragraph break
// A recognized break is forwarded to EndBreak() and its result is returned;
// otherwise BreakType::kNone is returned.
CFGAS_Char::BreakType CFGAS_TxtBreak::AppendChar_Control(CFGAS_Char* pCurChar) {
  char_type_ = FX_CHARTYPE::kControl;
  if (single_line_) {
    return CFGAS_Char::BreakType::kNone;
  }

  const wchar_t code = pCurChar->char_code();
  CFGAS_Char::BreakType requested = CFGAS_Char::BreakType::kNone;
  if (code == L'\v' || code == pdfium::unicode::kLineSeparator) {
    requested = CFGAS_Char::BreakType::kLine;
  } else if (code == L'\f') {
    requested = CFGAS_Char::BreakType::kPage;
  } else if (code == pdfium::unicode::kParagraphSeparator ||
             code == w_paragraph_break_char_) {
    requested = CFGAS_Char::BreakType::kParagraph;
  }

  if (requested == CFGAS_Char::BreakType::kNone) {
    return requested;
  }
  return EndBreak(requested);
}
// Handles an Arabic character.
//
// When not in comb-text mode and the previously recorded character type lies
// in [kArabicAlef, kArabicDistortion], the previous character is re-measured:
// its contextual form is recomputed now that its successor is known, and the
// line width is adjusted for the new width. Then the current character's form
// and width are computed, the line width and Arabic character count are
// updated, and a line break is requested via EndBreak() if the line overflows
// (never in single-line mode). Returns the break status, or kNone.
CFGAS_Char::BreakType CFGAS_TxtBreak::AppendChar_Arabic(CFGAS_Char* pCurChar) {
  // Scales a raw width by the font size and the horizontal scale percentage.
  const auto apply_scale = [this](FX_SAFE_INT32 width) {
    width *= font_size_;
    width *= horizontal_scale_;
    width /= 100;
    return width;
  };

  const FX_CHARTYPE new_type = pCurChar->GetCharType();
  CFGAS_Char* prev_char = nullptr;
  bool prev_is_hidden_alef = false;

  const bool prev_type_in_range = char_type_ >= FX_CHARTYPE::kArabicAlef &&
                                  char_type_ <= FX_CHARTYPE::kArabicDistortion;
  if (!comb_text_ && prev_type_in_range) {
    prev_char = GetLastChar(1, true, false);
    if (prev_char) {
      // Remove the previous character's old contribution to the line width.
      if (prev_char->char_width_ > 0) {
        cur_line_->width_ -= prev_char->char_width_;
      }
      FX_SAFE_INT32 prev_width = prev_char->char_width_;

      CFGAS_Char* const before_prev = GetLastChar(2, true, false);
      const wchar_t prev_form =
          pdfium::GetArabicFormChar(prev_char, before_prev, pCurChar);
      const bool prev_form_is_zwnbsp =
          prev_form == pdfium::unicode::kZeroWidthNoBreakSpace;
      prev_is_hidden_alef =
          prev_form_is_zwnbsp &&
          prev_char->GetCharType() == FX_CHARTYPE::kArabicAlef;

      if (font_) {
        prev_width = font_->GetCharWidth(prev_form).value_or(0);
      }
      if (prev_form_is_zwnbsp) {
        prev_width = 0;
      }

      const int32_t new_prev_width = apply_scale(prev_width).ValueOrDefault(0);
      prev_char->char_width_ = new_prev_width;
      cur_line_->width_ += new_prev_width;
    }
  }

  char_type_ = new_type;

  // The previous character is ignored as context when it is a hidden alef.
  const wchar_t cur_form = pdfium::GetArabicFormChar(
      pCurChar, prev_is_hidden_alef ? nullptr : prev_char, nullptr);

  FX_SAFE_INT32 cur_width = 0;
  if (comb_text_) {
    cur_width = comb_width_;
  } else {
    if (font_ && cur_form != pdfium::unicode::kZeroWidthNoBreakSpace) {
      cur_width = font_->GetCharWidth(cur_form).value_or(0);
    }
    cur_width = apply_scale(cur_width);
  }

  const int32_t final_width = cur_width.ValueOrDefault(0);
  pCurChar->char_width_ = final_width;
  cur_line_->width_ += final_width;
  cur_line_->IncrementArabicCharCount();

  const bool overflows =
      !single_line_ && IsGreaterThanLineWidth(cur_line_->width_);
  return overflows ? EndBreak(CFGAS_Char::BreakType::kLine)
                   : CFGAS_Char::BreakType::kNone;
}
// Handles the character types dispatched here by AppendChar().
//
// The width is |comb_width_| in comb-text mode; otherwise, when a font is set,
// the font width (0 if unavailable) scaled by |font_size_| and
// |horizontal_scale_| / 100. |char_space_| is always added. The result (0 on
// arithmetic overflow) is stored on the character and added to the current
// line width. A line break is requested via EndBreak() if the line overflows,
// except in single-line mode or when the character is a space.
CFGAS_Char::BreakType CFGAS_TxtBreak::AppendChar_Others(CFGAS_Char* pCurChar) {
  const FX_CHARTYPE new_type = pCurChar->GetCharType();
  char_type_ = new_type;

  const wchar_t code = pCurChar->char_code();
  FX_SAFE_INT32 safe_width = 0;
  if (comb_text_) {
    safe_width = comb_width_;
  } else if (font_) {
    safe_width = font_->GetCharWidth(code).value_or(0);
    safe_width *= font_size_;
    safe_width *= horizontal_scale_;
    safe_width /= 100;
  }
  safe_width += char_space_;

  const int32_t final_width = safe_width.ValueOrDefault(0);
  pCurChar->char_width_ = final_width;
  cur_line_->width_ += final_width;

  const bool may_break = !single_line_ && new_type != FX_CHARTYPE::kSpace;
  if (may_break && IsGreaterThanLineWidth(cur_line_->width_)) {
    return EndBreak(CFGAS_Char::BreakType::kLine);
  }
  return CFGAS_Char::BreakType::kNone;
}
// Appends |wch| to the current line and dispatches to the per-type handler.
//
// Before dispatching, a line break is requested when the unified character
// type changes (for a non-combining character, with a known previous type),
// the line already exceeds the line width, the breaker is not in single-line
// mode, and the transition is not "space followed by control".
// Returns the larger of the status from that pre-dispatch break and the status
// from the handler.
CFGAS_Char::BreakType CFGAS_TxtBreak::AppendChar(wchar_t wch) {
  const FX_CHARTYPE new_type = pdfium::unicode::GetCharType(wch);

  cur_line_->line_chars_.emplace_back(wch, horizontal_scale_, vertical_scale_);
  CFGAS_Char* cur_char = &cur_line_->line_chars_.back();
  cur_char->char_styles_ = alignment_ | (1 << 8);

  CFGAS_Char::BreakType overflow_status = CFGAS_Char::BreakType::kNone;
  const bool type_run_ended =
      new_type != FX_CHARTYPE::kCombination &&
      GetUnifiedCharType(char_type_) != GetUnifiedCharType(new_type) &&
      char_type_ != FX_CHARTYPE::kUnknown;
  const bool space_then_control = char_type_ == FX_CHARTYPE::kSpace &&
                                  new_type == FX_CHARTYPE::kControl;
  if (type_run_ended && !single_line_ &&
      IsGreaterThanLineWidth(cur_line_->width_) && !space_then_control) {
    overflow_status = EndBreak(CFGAS_Char::BreakType::kLine);
    // EndBreak() may have switched |cur_line_|; re-fetch the last character
    // when the (possibly new) current line has one.
    if (!cur_line_->line_chars_.empty()) {
      cur_char = &cur_line_->line_chars_.back();
    }
  }

  CFGAS_Char::BreakType handler_status = CFGAS_Char::BreakType::kNone;
  if (wch == w_paragraph_break_char_) {
    // This is handled in AppendChar_Control, but it seems like \n and \r
    // don't get matched as control characters so we go into AppendChar_other
    // and never detect the new paragraph ...
    handler_status = CFGAS_Char::BreakType::kParagraph;
    EndBreak(handler_status);
  } else {
    switch (new_type) {
      case FX_CHARTYPE::kTab:
        AppendChar_Tab(cur_char);
        break;
      case FX_CHARTYPE::kControl:
        handler_status = AppendChar_Control(cur_char);
        break;
      case FX_CHARTYPE::kCombination:
        AppendChar_Combination(cur_char);
        break;
      case FX_CHARTYPE::kArabicAlef:
      case FX_CHARTYPE::kArabicSpecial:
      case FX_CHARTYPE::kArabicDistortion:
      case FX_CHARTYPE::kArabicNormal:
      case FX_CHARTYPE::kArabicForm:
      case FX_CHARTYPE::kArabic:
        handler_status = AppendChar_Arabic(cur_char);
        break;
      case FX_CHARTYPE::kUnknown:
      case FX_CHARTYPE::kSpace:
      case FX_CHARTYPE::kNumeric:
      case FX_CHARTYPE::kNormal:
        handler_status = AppendChar_Others(cur_char);
        break;
    }
  }
  return std::max(overflow_status, handler_status);
}
// First stage of EndBreak(): decides whether the current line must be split.
//
// When the line exceeds the line width (and the breaker is not in single-line
// mode) and its last character is not a tab, control or space character, the
// overflow is moved to |pNextLine| via SplitTextLine(). Otherwise, when
// |bAllChars| is set, GetBreakPos() is run in "only break" mode over the
// current line's characters.
void CFGAS_TxtBreak::EndBreakSplitLine(CFGAS_BreakLine* pNextLine,
                                       bool bAllChars) {
  if (!single_line_ && IsGreaterThanLineWidth(cur_line_->width_)) {
    const FX_CHARTYPE last_type = cur_line_->LastChar()->GetCharType();
    const bool ends_with_blank = last_type == FX_CHARTYPE::kTab ||
                                 last_type == FX_CHARTYPE::kControl ||
                                 last_type == FX_CHARTYPE::kSpace;
    if (!ends_with_blank) {
      SplitTextLine(cur_line_, pNextLine, bAllChars);
      return;
    }
  }

  if (!bAllChars) {
    return;
  }
  int32_t end_pos = cur_line_->width_;
  GetBreakPos(&cur_line_->line_chars_, bAllChars, true, &end_pos);
}
// Second stage of EndBreak(): cuts the current line into pieces, appends them
// to |cur_line_->line_pieces_|, and returns one TPO entry per piece.
//
// If the line has no Arabic characters, a single piece covering every
// character is emitted with status |dwStatus|. Otherwise bidi levels are
// resolved with CFGAS_Char::BidiLine(), a new piece is started whenever the
// bidi level changes or a character carries a status other than kNone, and
// the pieces are then given start positions in the order produced by sorting
// the TPO entries. The piece at the last index receives |dwStatus|.
std::deque<CFGAS_Break::TPO> CFGAS_TxtBreak::EndBreakBidiLine(
CFGAS_Char::BreakType dwStatus) {
CFGAS_BreakPiece tp;
std::deque<TPO> tpos;
CFGAS_Char* pTC;
std::vector<CFGAS_Char>& chars = cur_line_->line_chars_;
// Fast path: no Arabic characters, so the whole line is one piece.
if (!cur_line_->HasArabicChar()) {
tp.SetStatus(dwStatus);
tp.SetStartPos(cur_line_->start_);
tp.SetWidth(cur_line_->width_);
tp.SetStartChar(0);
tp.SetCharCount(fxcrt::CollectionSize<int32_t>(cur_line_->line_chars_));
tp.SetChars(&cur_line_->line_chars_);
// The piece takes its styles and scales from the first character.
// NOTE(review): indexes chars[0]; relies on the line being non-empty here.
pTC = &chars[0];
tp.SetCharStyles(pTC->char_styles_);
tp.SetHorizontalScale(pTC->horizonal_scale());
tp.SetVerticalScale(pTC->vertical_scale());
cur_line_->line_pieces_.push_back(tp);
tpos.push_back({0, 0});
return tpos;
}
// Record each character's position, force bidi level 1 on the first
// character, and remember the index of the last non-control character.
size_t iBidiNum = 0;
for (size_t i = 0; i < cur_line_->line_chars_.size(); ++i) {
pTC = &chars[i];
pTC->bidi_pos_ = static_cast<int32_t>(i);
if (pTC->GetCharType() != FX_CHARTYPE::kControl) {
iBidiNum = i;
}
if (i == 0) {
pTC->bidi_level_ = 1;
}
}
// Resolve bidi levels, passing the count up to the last non-control char.
CFGAS_Char::BidiLine(&chars, iBidiNum + 1);
tp.SetStatus(CFGAS_Char::BreakType::kPiece);
tp.SetStartPos(cur_line_->start_);
tp.SetChars(&cur_line_->line_chars_);
// iBidiLevel < 0 means "no piece is currently open".
int32_t iBidiLevel = -1;
int32_t iCharWidth;
int32_t i = 0;
// j is the index of the most recently emitted piece (-1 when none).
int32_t j = -1;
int32_t iCount = fxcrt::CollectionSize<int32_t>(cur_line_->line_chars_);
while (i < iCount) {
pTC = &chars[i];
if (iBidiLevel < 0) {
// Open a new piece, seeded from the character at its start.
iBidiLevel = pTC->bidi_level_;
tp.SetWidth(0);
tp.SetBidiLevel(iBidiLevel);
tp.SetBidiPos(pTC->bidi_order_);
tp.SetCharStyles(pTC->char_styles_);
tp.SetHorizontalScale(pTC->horizonal_scale());
tp.SetVerticalScale(pTC->vertical_scale());
tp.SetStatus(CFGAS_Char::BreakType::kPiece);
}
if (iBidiLevel != pTC->bidi_level_ ||
pTC->status_ != CFGAS_Char::BreakType::kNone) {
// Close the open piece. A character with a status at the same level is
// included in the piece being closed; a level change leaves the
// character for the next piece (i is not advanced).
if (iBidiLevel == pTC->bidi_level_) {
tp.SetStatus(pTC->status_);
iCharWidth = pTC->char_width_;
if (iCharWidth > 0) {
tp.IncrementWidth(iCharWidth);
}
i++;
}
tp.SetCharCount(i - tp.GetStartChar());
cur_line_->line_pieces_.push_back(tp);
tp.IncrementStartPos(tp.GetWidth());
tp.SetStartChar(i);
tpos.push_back({++j, tp.GetBidiPos()});
iBidiLevel = -1;
} else {
// Same level, no status: extend the open piece. Only positive widths
// contribute to the piece width.
iCharWidth = pTC->char_width_;
if (iCharWidth > 0) {
tp.IncrementWidth(iCharWidth);
}
i++;
}
}
// Flush the trailing piece, if any characters remain in it.
if (i > tp.GetStartChar()) {
tp.SetStatus(dwStatus);
tp.SetCharCount(i - tp.GetStartChar());
cur_line_->line_pieces_.push_back(tp);
tpos.push_back({++j, tp.GetBidiPos()});
}
if (j > -1) {
if (j > 0) {
// More than one piece: sort the TPO entries and lay the pieces out
// left to right in that order, starting from position 0.
std::sort(tpos.begin(), tpos.end());
int32_t iStartPos = 0;
for (i = 0; i <= j; i++) {
CFGAS_BreakPiece& ttp = cur_line_->line_pieces_[tpos[i].index];
ttp.SetStartPos(iStartPos);
iStartPos += ttp.GetWidth();
}
}
// The last emitted piece always carries the requested break status.
cur_line_->line_pieces_[j].SetStatus(dwStatus);
}
return tpos;
}
void CFGAS_TxtBreak::EndBreakAlignment(const std::deque<TPO>& tpos,
bool bAllChars,
CFGAS_Char::BreakType dwStatus) {
int32_t iNetWidth = cur_line_->width_;
int32_t iGapChars = 0;
bool bFind = false;
for (const TPO& pos : pdfium::Reversed(tpos)) {
const CFGAS_BreakPiece& ttp = cur_line_->line_pieces_[pos.index];
if (!bFind) {
iNetWidth = ttp.GetEndPos();
}
bool bArabic = FX_IsOdd(ttp.GetBidiLevel());
int32_t j = bArabic ? 0 : ttp.GetCharCount() - 1;
while (j > -1 && j < ttp.GetCharCount()) {
const CFGAS_Char* pTC = ttp.GetChar(j);
if (pTC->line_break_type_ == FX_LINEBREAKTYPE::kDIRECT_BRK) {
iGapChars++;
}
if (!bFind || !bAllChars) {
FX_CHARTYPE chartype = pTC->GetCharType();
if (chartype == FX_CHARTYPE::kSpace ||
chartype == FX_CHARTYPE::kControl) {
if (!bFind && bAllChars && pTC->char_width_ > 0) {
iNetWidth -= pTC->char_width_;
}
} else {
bFind = true;
if (!bAllChars) {
break;
}
}
}
j += bArabic ? 1 : -1;
}
if (!bAllChars && bFind) {
break;
}
}
int32_t iOffset = line_width_ - iNetWidth;
if (iGapChars > 0 && alignment_ & CFX_TxtLineAlignment_Justified &&
dwStatus != CFGAS_Char::BreakType::kParagraph) {
int32_t iStart = -1;
for (auto& tpo : tpos) {
CFGAS_BreakPiece& ttp = cur_line_->line_pieces_[tpo.index];
if (iStart < -1) {
iStart = ttp.GetStartPos();
} else {
ttp.SetStartPos(iStart);
}
for (int32_t j = 0; j < ttp.GetCharCount() && iGapChars > 0;
j++, iGapChars--) {
CFGAS_Char* pTC = ttp.GetChar(j);
if (pTC->line_break_type_ != FX_LINEBREAKTYPE::kDIRECT_BRK ||
pTC->char_width_ < 0) {
continue;
}
int32_t k = iOffset / iGapChars;
pTC->char_width_ += k;
ttp.IncrementWidth(k);
iOffset -= k;
}
iStart += ttp.GetWidth();
}
} else if (alignment_ & CFX_TxtLineAlignment_Center ||
alignment_ & CFX_TxtLineAlignment_Right) {
if (alignment_ & CFX_TxtLineAlignment_Center &&
!(alignment_ & CFX_TxtLineAlignment_Right)) {
iOffset /= 2;
}
if (iOffset > 0) {
for (auto& ttp : cur_line_->line_pieces_) {
ttp.IncrementStartPos(iOffset);
}
}
}
}
// Ends the current piece or line with |dwStatus| (which must not be kNone).
//
// If the current line already has pieces, or a finished line is pending, the
// status of that line's last piece is updated (unless |dwStatus| is kPiece)
// and returned; a pending line without pieces yields kNone. Otherwise the
// last character of the current line is tagged with |dwStatus|. For anything
// other than kPiece the line is then finalized: it is split if too wide, cut
// into pieces, aligned, and the other entry of |lines_| becomes the current
// line. Returns the resulting status, or kNone when there was nothing to end.
CFGAS_Char::BreakType CFGAS_TxtBreak::EndBreak(CFGAS_Char::BreakType dwStatus) {
  DCHECK(dwStatus != CFGAS_Char::BreakType::kNone);
  const bool is_piece_break = dwStatus == CFGAS_Char::BreakType::kPiece;

  // Case 1: the current line already has pieces.
  auto& current_pieces = cur_line_->line_pieces_;
  if (!current_pieces.empty()) {
    auto& last_piece = current_pieces.back();
    if (!is_piece_break) {
      last_piece.SetStatus(dwStatus);
    }
    return last_piece.GetStatus();
  }

  // Case 2: a finished line is waiting to be consumed.
  if (HasLine()) {
    auto& ready_pieces = lines_[ready_line_index_].line_pieces_;
    if (ready_pieces.empty()) {
      return CFGAS_Char::BreakType::kNone;
    }
    auto& last_piece = ready_pieces.back();
    if (!is_piece_break) {
      last_piece.SetStatus(dwStatus);
    }
    return last_piece.GetStatus();
  }

  // Case 3: tag the last pending character, then finalize the line.
  auto& pending_chars = cur_line_->line_chars_;
  if (pending_chars.empty()) {
    return CFGAS_Char::BreakType::kNone;
  }
  pending_chars.back().status_ = dwStatus;
  if (is_piece_break) {
    return dwStatus;
  }

  ready_line_index_ = cur_line_ == &lines_[0] ? 0 : 1;
  CFGAS_BreakLine* const next_line = &lines_[1 - ready_line_index_];
  const bool all_chars = alignment_ > CFX_TxtLineAlignment_Right;
  EndBreakSplitLine(next_line, all_chars);
  const std::deque<TPO> piece_order = EndBreakBidiLine(dwStatus);
  if (alignment_ > CFX_TxtLineAlignment_Left) {
    EndBreakAlignment(piece_order, all_chars, dwStatus);
  }

  // Continue on the other line, restoring the character type from whatever
  // was carried over to it.
  cur_line_ = next_line;
  CFGAS_Char* const carried_char = GetLastChar(0, false, false);
  char_type_ =
      carried_char ? carried_char->GetCharType() : FX_CHARTYPE::kUnknown;
  return dwStatus;
}
// Scans |pChars| from the last character backwards to find where the line can
// be broken, and returns the index of the character after which to break.
//
// |pEndPos| holds the line width on entry; positive character widths are
// subtracted from it as the scan moves backwards, and on return it holds the
// position associated with the chosen break. When |bAllChars| is set, every
// visited character's |line_break_type_| is updated along the way. When
// |bOnlyBrk| is set, only that annotation is performed and 0 is returned.
//
// With fewer than two characters, the last index (size - 1) is returned
// immediately. Otherwise the result is, in order of preference: the first
// direct break found, the first indirect break found, the first position that
// fits, or 0.
int32_t CFGAS_TxtBreak::GetBreakPos(std::vector<CFGAS_Char>* pChars,
bool bAllChars,
bool bOnlyBrk,
int32_t* pEndPos) {
std::vector<CFGAS_Char>& chars = *pChars;
// iLength is the index of the last character, not the character count.
int32_t iLength = fxcrt::CollectionSize<int32_t>(chars) - 1;
if (iLength < 1) {
return iLength;
}
int32_t iBreak = -1;
int32_t iBreakPos = -1;
int32_t iIndirect = -1;
int32_t iIndirectPos = -1;
int32_t iLast = -1;
int32_t iLastPos = -1;
// If the whole line already fits, breaking after the last character is
// acceptable; without |bAllChars| there is nothing more to do.
if (single_line_ || *pEndPos <= line_width_) {
if (!bAllChars) {
return iLength;
}
iBreak = iLength;
iBreakPos = *pEndPos;
}
FX_LINEBREAKTYPE eType;
FX_BREAKPROPERTY nCur;
FX_BREAKPROPERTY nNext;
// Start with the last character; it has no successor to pair with.
CFGAS_Char* pCur = &chars[iLength--];
if (bAllChars) {
pCur->line_break_type_ = FX_LINEBREAKTYPE::kUNKNOWN;
}
nNext = pdfium::unicode::GetBreakProperty(pCur->char_code());
int32_t iCharWidth = pCur->char_width_;
if (iCharWidth > 0) {
*pEndPos -= iCharWidth;
}
while (iLength >= 0) {
pCur = &chars[iLength];
nCur = pdfium::unicode::GetBreakProperty(pCur->char_code());
// No break is allowed before a character whose break property is kSP;
// otherwise the pair table decides.
if (nNext == FX_BREAKPROPERTY::kSP) {
eType = FX_LINEBREAKTYPE::kPROHIBITED_BRK;
} else {
eType = GetLineBreakTypeFromPair(nCur, nNext);
}
if (bAllChars) {
pCur->line_break_type_ = eType;
}
if (!bOnlyBrk) {
// A candidate is only recorded where the text up to here fits (or the
// current character has break property kSP). Each kind of candidate is
// recorded once, i.e. the one closest to the end of the line wins.
if (single_line_ || *pEndPos <= line_width_ ||
nCur == FX_BREAKPROPERTY::kSP) {
if (eType == FX_LINEBREAKTYPE::kDIRECT_BRK && iBreak < 0) {
iBreak = iLength;
iBreakPos = *pEndPos;
if (!bAllChars) {
return iLength;
}
} else if (eType == FX_LINEBREAKTYPE::kINDIRECT_BRK && iIndirect < 0) {
iIndirect = iLength;
iIndirectPos = *pEndPos;
}
if (iLast < 0) {
iLast = iLength;
iLastPos = *pEndPos;
}
}
// Only positive widths move the running end position.
iCharWidth = pCur->char_width_;
if (iCharWidth > 0) {
*pEndPos -= iCharWidth;
}
}
nNext = nCur;
iLength--;
}
if (bOnlyBrk) {
return 0;
}
// Pick the best candidate: direct break, then indirect break, then the
// last position that fit.
if (iBreak > -1) {
*pEndPos = iBreakPos;
return iBreak;
}
if (iIndirect > -1) {
*pEndPos = iIndirectPos;
return iIndirect;
}
if (iLast > -1) {
*pEndPos = iLastPos;
return iLast;
}
return 0;
}
// Splits |pCurLine| at the position chosen by GetBreakPos() and moves the
// characters after that position to |pNextLine|.
//
// Lines with fewer than two characters are left alone. If the break falls
// after the last character, |pNextLine| is cleared and nothing is moved. In
// both outcomes the last character kept on |pCurLine| gets its line break
// type reset to kUNKNOWN. For moved characters, the Arabic character counts
// of both lines are adjusted, the status is reset to kNone, and the sum of
// their non-negative widths becomes |pNextLine|'s width.
void CFGAS_TxtBreak::SplitTextLine(CFGAS_BreakLine* pCurLine,
                                   CFGAS_BreakLine* pNextLine,
                                   bool bAllChars) {
  DCHECK(pCurLine);
  DCHECK(pNextLine);

  std::vector<CFGAS_Char>& cur_chars = pCurLine->line_chars_;
  if (cur_chars.size() < 2) {
    return;
  }

  int32_t end_pos = pCurLine->width_;
  const int32_t break_index =
      GetBreakPos(&cur_chars, bAllChars, false, &end_pos);
  // Number of characters that stay on the current line (at least one).
  const int32_t keep_count = std::max(break_index, 0) + 1;

  if (keep_count >= fxcrt::CollectionSize<int32_t>(cur_chars)) {
    pNextLine->Clear();
    cur_chars[keep_count - 1].line_break_type_ = FX_LINEBREAKTYPE::kUNKNOWN;
    return;
  }

  const auto split_point = cur_chars.begin() + keep_count;
  pNextLine->line_chars_ =
      std::vector<CFGAS_Char>(split_point, cur_chars.end());
  cur_chars.erase(cur_chars.begin() + keep_count, cur_chars.end());
  pCurLine->width_ = end_pos;
  cur_chars[keep_count - 1].line_break_type_ = FX_LINEBREAKTYPE::kUNKNOWN;

  int32_t moved_width = 0;
  for (CFGAS_Char& moved : pNextLine->line_chars_) {
    if (moved.GetCharType() >= FX_CHARTYPE::kArabicAlef) {
      pCurLine->DecrementArabicCharCount();
      pNextLine->IncrementArabicCharCount();
    }
    moved_width += std::max(0, moved.char_width_);
    moved.status_ = CFGAS_Char::BreakType::kNone;
  }
  pNextLine->width_ = moved_width;
}
// Computes glyph positions for the characters of |run| and returns the number
// of glyph entries the run produces.
//
// When |pCharPos| is empty, nothing is written and only the count is
// computed. Otherwise one TextCharPos is filled in per emitted glyph, and the
// span is advanced past each entry written.
//
// Characters and their widths are read either from |run.pEdtEngine| (when set)
// or from |run.wsStr| / |run.pWidths|. Arabic characters are replaced by their
// contextual forms, some Arabic combining marks are merged using the shadda
// table, and other characters are mirrored in right-to-left pieces (digits,
// '.' and ',' excepted).
size_t CFGAS_TxtBreak::GetDisplayPos(const Run& run,
pdfium::span<TextCharPos> pCharPos) const {
if (run.iLength < 1) {
return 0;
}
Engine* pEngine = run.pEdtEngine;
WideStringView pStr = run.wsStr.AsStringView();
pdfium::span<int32_t> pWidths = run.pWidths;
// iLength is the index of the last character in the run, not the count.
int32_t iLength = run.iLength - 1;
RetainPtr<CFGAS_GEFont> pFont = run.pFont;
Mask<LayoutStyle> dwStyles = run.dwStyles;
CFX_RectF rtText(*run.pRect);
const bool bRTLPiece = (run.dwCharStyles & FX_TXTCHARSTYLE_OddBidiLevel) != 0;
const float fFontSize = run.fFontSize;
const int32_t iFontSize = FXSYS_roundf(fFontSize * 20.0f);
const int32_t iAscent = pFont->GetAscent();
const int32_t iDescent = pFont->GetDescent();
const int32_t iMaxHeight = iAscent - iDescent;
// Ascent in the same units as the font size; 0 when the font reports equal
// ascent and descent.
const float fAscent = iMaxHeight ? fFontSize * iAscent / iMaxHeight : 0;
int32_t iHorScale = run.iHorizontalScale;
int32_t iVerScale = run.iVerticalScale;
bool bSkipSpace = run.bSkipSpace;
// The font-size-tall box is centered vertically within the run rectangle.
const float fYBase = rtText.top + (rtText.height - fFontSize) / 2.0f;
// Right-to-left pieces are laid out starting from the right edge.
float fX = bRTLPiece ? rtText.right() : rtText.left;
float fY = fYBase + fAscent;
size_t szCount = 0;
int32_t iNext = 0;
wchar_t wPrev = pdfium::unicode::kZeroWidthNoBreakSpace;
wchar_t wNext = pdfium::unicode::kZeroWidthNoBreakSpace;
wchar_t wForm = pdfium::unicode::kZeroWidthNoBreakSpace;
wchar_t wLast = pdfium::unicode::kZeroWidthNoBreakSpace;
bool bShadda = false;
bool bLam = false;
for (int32_t i = 0; i <= iLength; i++) {
int32_t iAbsolute = i + run.iStart;
int32_t iWidth;
wchar_t wch;
// Fetch the character and its width, consuming one element from the
// string/width views when no engine is supplied.
if (pEngine) {
wch = pEngine->GetChar(iAbsolute);
iWidth = pEngine->GetWidthOfChar(iAbsolute);
} else {
wch = pStr.Front();
pStr = pStr.Substr(1);
iWidth = pWidths.front();
pWidths = pWidths.subspan(1);
}
FX_CHARTYPE chartype = pdfium::unicode::GetCharType(wch);
// A zero-width Arabic alef produces no glyph and resets the "previous
// character" context.
if (chartype == FX_CHARTYPE::kArabicAlef && iWidth == 0) {
wPrev = pdfium::unicode::kZeroWidthNoBreakSpace;
wLast = wch;
continue;
}
if (chartype >= FX_CHARTYPE::kArabicAlef) {
// Arabic: find the next non-combining character in the run (or use
// ZWNBSP when there is none) so the contextual form can be chosen.
if (i < iLength) {
if (pEngine) {
iNext = i + 1;
while (iNext <= iLength) {
int32_t iNextAbsolute = iNext + run.iStart;
wNext = pEngine->GetChar(iNextAbsolute);
if (pdfium::unicode::GetCharType(wNext) !=
FX_CHARTYPE::kCombination) {
break;
}
iNext++;
}
if (iNext > iLength) {
wNext = pdfium::unicode::kZeroWidthNoBreakSpace;
}
} else {
// |pStr| has already been advanced past the current character, so
// index 0 is the character following it.
int32_t j = -1;
do {
j++;
if (i + j >= iLength) {
break;
}
wNext = pStr[j];
} while (pdfium::unicode::GetCharType(wNext) ==
FX_CHARTYPE::kCombination);
if (i + j >= iLength) {
wNext = pdfium::unicode::kZeroWidthNoBreakSpace;
}
}
} else {
wNext = pdfium::unicode::kZeroWidthNoBreakSpace;
}
wForm = pdfium::GetArabicFormChar(wch, wPrev, wNext);
// Lam preceded by lam and followed by heh: two extra marks are emitted
// for this character further below.
bLam = (wPrev == pdfium::kArabicLetterLam &&
wch == pdfium::kArabicLetterLam &&
wNext == pdfium::kArabicLetterHeh);
} else if (chartype == FX_CHARTYPE::kCombination) {
wForm = wch;
// Marks in U+064C..U+0651 may pair up with an adjacent shadda.
if (wch >= 0x064C && wch <= 0x0651) {
if (bShadda) {
// Second half of a pair already merged on the previous mark.
wForm = pdfium::unicode::kZeroWidthNoBreakSpace;
bShadda = false;
} else {
wNext = pdfium::unicode::kZeroWidthNoBreakSpace;
if (pEngine) {
iNext = i + 1;
if (iNext <= iLength) {
int32_t iNextAbsolute = iNext + run.iStart;
wNext = pEngine->GetChar(iNextAbsolute);
}
} else if (i < iLength) {
wNext = pStr.Front();
}
std::optional<uint16_t> maybe_shadda;
if (wch == pdfium::kArabicShadda) {
maybe_shadda = pdfium::GetArabicFromShaddaTable(wNext);
} else if (wNext == pdfium::kArabicShadda) {
maybe_shadda = pdfium::GetArabicFromShaddaTable(wch);
}
if (maybe_shadda.has_value()) {
wForm = maybe_shadda.value();
bShadda = true;
}
}
} else {
bShadda = false;
}
} else if (chartype == FX_CHARTYPE::kNumeric) {
wForm = wch;
} else if (wch == L'.') {
wForm = wch;
} else if (wch == L',') {
wForm = wch;
} else if (bRTLPiece) {
wForm = pdfium::unicode::GetMirrorChar(wch);
} else {
wForm = wch;
}
if (chartype != FX_CHARTYPE::kCombination) {
bShadda = false;
}
if (chartype < FX_CHARTYPE::kArabicAlef) {
bLam = false;
}
// "Empty" characters are those typed kTab..kControl and those whose form
// is ZWNBSP; they are omitted from the output when |bSkipSpace| is set.
bool bEmptyChar =
(chartype >= FX_CHARTYPE::kTab && chartype <= FX_CHARTYPE::kControl);
if (wForm == pdfium::unicode::kZeroWidthNoBreakSpace) {
bEmptyChar = true;
}
int32_t iForms = bLam ? 3 : 1;
szCount += (bEmptyChar && bSkipSpace) ? 0 : iForms;
// Counting-only pass: no output buffer was supplied.
if (pCharPos.empty()) {
if (iWidth > 0) {
wPrev = wch;
}
wLast = wch;
continue;
}
int32_t iCharWidth = iWidth;
if (iCharWidth < 0) {
iCharWidth = -iCharWidth;
}
// NOTE(review): integer division by |iFontSize|, which is 0 when
// fFontSize * 20 rounds to 0 - confirm callers never pass such a size.
iCharWidth /= iFontSize;
std::array<FX_FORMCHAR, 3> form_chars;
form_chars[0].wch = wch;
form_chars[0].wForm = wForm;
form_chars[0].iWidth = iCharWidth;
if (bLam) {
// Extra marks for the lam case: a shadda and a superscript alef, each
// with the width reported by the font (0 if unavailable).
form_chars[1].wForm = pdfium::kArabicShadda;
form_chars[1].iWidth =
pFont->GetCharWidth(pdfium::kArabicShadda).value_or(0);
form_chars[2].wForm = pdfium::kArabicLetterSuperscriptAlef;
form_chars[2].iWidth =
pFont->GetCharWidth(pdfium::kArabicLetterSuperscriptAlef).value_or(0);
}
for (int32_t j = 0; j < iForms; j++) {
TextCharPos& front_ref = pCharPos.front();
wForm = (wchar_t)form_chars[j].wForm;
iCharWidth = form_chars[j].iWidth;
// The extra forms are treated as combining marks stacked on the
// preceding form.
if (j > 0) {
chartype = FX_CHARTYPE::kCombination;
wch = wForm;
wLast = (wchar_t)form_chars[j - 1].wForm;
}
if (!bEmptyChar || (bEmptyChar && !bSkipSpace)) {
front_ref.m_GlyphIndex = pFont->GetGlyphIndex(wForm);
#if BUILDFLAG(IS_APPLE)
front_ref.m_ExtGID = front_ref.m_GlyphIndex;
#endif
front_ref.m_FontCharWidth = iCharWidth;
}
const float fCharWidth = fFontSize * iCharWidth / 1000.0f;
// In right-to-left pieces the pen moves left before the glyph is placed;
// combining marks do not move the pen.
if (bRTLPiece && chartype != FX_CHARTYPE::kCombination) {
fX -= fCharWidth;
}
if (!bEmptyChar || (bEmptyChar && !bSkipSpace)) {
front_ref.m_Origin = CFX_PointF(fX, fY);
// Comb text: shift by half the difference between the stored width and
// the font's width for the form.
if (!!(dwStyles & LayoutStyle::kCombText)) {
int32_t iFormWidth = pFont->GetCharWidth(wForm).value_or(iCharWidth);
float fOffset = fFontSize * (iCharWidth - iFormWidth) / 2000.0f;
front_ref.m_Origin.x += fOffset;
}
if (chartype == FX_CHARTYPE::kCombination) {
// Combining marks get their vertical origin from their bounding box
// height, and are raised further by the height of a preceding
// combining mark.
std::optional<FX_RECT> rtBBox = pFont->GetCharBBox(wForm);
if (rtBBox.has_value()) {
front_ref.m_Origin.y =
fYBase + fFontSize -
fFontSize * rtBBox.value().Height() / iMaxHeight;
}
if (wForm == wch &&
wLast != pdfium::unicode::kZeroWidthNoBreakSpace) {
if (pdfium::unicode::GetCharType(wLast) ==
FX_CHARTYPE::kCombination) {
std::optional<FX_RECT> rtOtherBox = pFont->GetCharBBox(wLast);
if (rtOtherBox.has_value()) {
front_ref.m_Origin.y -=
fFontSize * rtOtherBox.value().Height() / iMaxHeight;
}
}
}
}
}
// In left-to-right pieces the pen moves right after the glyph is placed.
if (!bRTLPiece && chartype != FX_CHARTYPE::kCombination) {
fX += fCharWidth;
}
if (!bEmptyChar || (bEmptyChar && !bSkipSpace)) {
// Base adjust matrix is (-1, 0, 0, 1); the first two entries are scaled
// by the horizontal scale and the last two by the vertical scale.
front_ref.m_bGlyphAdjust = true;
front_ref.m_AdjustMatrix[0] = -1;
front_ref.m_AdjustMatrix[1] = 0;
front_ref.m_AdjustMatrix[2] = 0;
front_ref.m_AdjustMatrix[3] = 1;
if (iHorScale != 100 || iVerScale != 100) {
front_ref.m_AdjustMatrix[0] =
front_ref.m_AdjustMatrix[0] * iHorScale / 100.0f;
front_ref.m_AdjustMatrix[1] =
front_ref.m_AdjustMatrix[1] * iHorScale / 100.0f;
front_ref.m_AdjustMatrix[2] =
front_ref.m_AdjustMatrix[2] * iVerScale / 100.0f;
front_ref.m_AdjustMatrix[3] =
front_ref.m_AdjustMatrix[3] * iVerScale / 100.0f;
}
// This entry is complete; move on to the next output slot.
pCharPos = pCharPos.subspan(1);
}
}
// Only characters with a positive width become the "previous" context.
if (iWidth > 0) {
wPrev = static_cast<wchar_t>(form_chars[0].wch);
}
wLast = wch;
}
return szCount;
}
std::vector<CFX_RectF> CFGAS_TxtBreak::GetCharRects(const Run& run) const {
if (run.iLength < 1) {
return std::vector<CFX_RectF>();
}
Engine* pEngine = run.pEdtEngine;
WideStringView pStr = run.wsStr.AsStringView();
pdfium::span<int32_t> pWidths = run.pWidths;
int32_t iLength = run.iLength;
CFX_RectF rect(*run.pRect);
float fFontSize = run.fFontSize;
bool bRTLPiece = !!(run.dwCharStyles & FX_TXTCHARSTYLE_OddBidiLevel);
bool bSingleLine = !!(run.dwStyles & LayoutStyle::kSingleLine);
float fStart = bRTLPiece ? rect.right() : rect.left;
std::vector<CFX_RectF> rtArray(iLength);
for (int32_t i = 0; i < iLength; i++) {
wchar_t wch;
int32_t iCharSize;
if (pEngine) {
int32_t iAbsolute = i + run.iStart;
wch = pEngine->GetChar(iAbsolute);
iCharSize = pEngine->GetWidthOfChar(iAbsolute);
} else {
wch = pStr.Front();
pStr = pStr.Substr(1);
iCharSize = pWidths.front();
pWidths = pWidths.subspan(1);
}
float fCharSize = static_cast<float>(iCharSize) / kConversionFactor;
bool bRet = (!bSingleLine && IsCtrlCode(wch));
if (!(wch == L'\v' || wch == L'\f' ||
wch == pdfium::unicode::kLineSeparator ||
wch == pdfium::unicode::kParagraphSeparator || wch == L'\n')) {
bRet = false;
}
if (bRet) {
fCharSize = fFontSize / 2.0f;
}
rect.left = fStart;
if (bRTLPiece) {
rect.left -= fCharSize;
fStart -= fCharSize;
} else {
fStart += fCharSize;
}
rect.width = fCharSize;
rtArray[i] = rect;
}
return rtArray;
}
// Defaulted destructor for Engine; defined out of line in this translation
// unit.
CFGAS_TxtBreak::Engine::~Engine() = default;
// Defaulted default constructor for Run; defined out of line.
CFGAS_TxtBreak::Run::Run() = default;
// Defaulted destructor for Run; defined out of line.
CFGAS_TxtBreak::Run::~Run() = default;
// Defaulted copy constructor for Run (member-wise copy); defined out of line.
CFGAS_TxtBreak::Run::Run(const CFGAS_TxtBreak::Run& other) = default;