blob: b5f50022f197b9f8a38516d6b4def3382730cb9b [file] [log] [blame]
// Copyright 2014 PDFium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#include "../../include/pdfwindow/PDFWindow.h"
#include "../../include/pdfwindow/PWL_Wnd.h"
#include "../../include/pdfwindow/PWL_FontMap.h"
// Font name that CPWL_FontMap::Initial() falls back to when it is given an
// empty name.
#define DEFAULT_FONT_NAME "Helvetica"
/* ------------------------------ CPWL_FontMap ------------------------------ */
// Builds a font map bound to |pSystemHandler|.
// The private PDF document starts out NULL; GetDocument() creates it on demand.
CPWL_FontMap::CPWL_FontMap(IFX_SystemHandler* pSystemHandler)
    : m_pPDFDoc(NULL),
      m_pSystemHandler(pSystemHandler)
{
    // The handler is asserted to be non-NULL at construction time.
    ASSERT(pSystemHandler != NULL);
}
// Destroys the privately created document (if any) and releases every cached
// font entry via Empty().
CPWL_FontMap::~CPWL_FontMap()
{
    // delete on a NULL pointer is a no-op, so no explicit guard is needed.
    delete m_pPDFDoc;
    m_pPDFDoc = NULL;

    Empty();
}
// Replaces the system handler used for native font lookups.
// No NULL check is made here; GetNativeFont(), AddSystemFont() and
// CharSetFromUnicode() test the handler before dereferencing it.
void CPWL_FontMap::SetSystemHandler(IFX_SystemHandler* pSystemHandler)
{
    this->m_pSystemHandler = pSystemHandler;
}
// Returns the document that fonts are added to, creating a private one on the
// first call. Returns NULL when no document exists yet and
// CPDF_ModuleMgr::Get() yields NULL.
CPDF_Document* CPWL_FontMap::GetDocument()
{
    // Already created on an earlier call.
    if (m_pPDFDoc)
        return m_pPDFDoc;

    // Without a module manager no document is created.
    if (!CPDF_ModuleMgr::Get())
        return NULL;

    m_pPDFDoc = FX_NEW CPDF_Document;
    m_pPDFDoc->CreateNewDoc();
    return m_pPDFDoc;
}
// Returns the font stored at |nFontIndex|, or NULL when the index is out of
// range or the slot holds no entry.
CPDF_Font* CPWL_FontMap::GetPDFFont(FX_INT32 nFontIndex)
{
    if (nFontIndex < 0 || nFontIndex >= m_aData.GetSize())
        return NULL;

    CPWL_FontMap_Data* pEntry = m_aData.GetAt(nFontIndex);
    if (!pEntry)
        return NULL;

    return pEntry->pFont;
}
// Returns the alias recorded for the entry at |nFontIndex|, or an empty string
// when the index is out of range or the slot holds no entry.
CFX_ByteString CPWL_FontMap::GetPDFFontAlias(FX_INT32 nFontIndex)
{
    if (nFontIndex < 0 || nFontIndex >= m_aData.GetSize())
        return "";

    CPWL_FontMap_Data* pEntry = m_aData.GetAt(nFontIndex);
    if (!pEntry)
        return "";

    return pEntry->sFontName;
}
// Reports whether the font at |nFontIndex| can map |word| to a char code,
// i.e. whether CharCodeFromUnicode() yields a non-negative value.
// Returns FALSE for an out-of-range index or an empty slot.
FX_BOOL CPWL_FontMap::KnowWord(FX_INT32 nFontIndex, FX_WORD word)
{
    const FX_BOOL bValidIndex = nFontIndex >= 0 && nFontIndex < m_aData.GetSize();
    // Short-circuit keeps GetAt() from being called with an invalid index.
    if (!bValidIndex || !m_aData.GetAt(nFontIndex))
        return FALSE;

    return CharCodeFromUnicode(nFontIndex, word) >= 0;
}
// Picks a font index able to render |word|.
//   1. If |nFontIndex| > 0, that font is tried first. Otherwise entry 0 is
//      tried, provided its charset is compatible with |nCharset|.
//   2. Next, the native font for |nCharset| is looked up (or added) and tried.
//   3. Finally "Arial Unicode MS" is looked up (or added) and tried.
// Returns the first index whose font knows the word, or -1 if none does.
FX_INT32 CPWL_FontMap::GetWordFontIndex(FX_WORD word, FX_INT32 nCharset, FX_INT32 nFontIndex)
{
    if (nFontIndex > 0)
    {
        if (KnowWord(nFontIndex, word))
            return nFontIndex;
    }
    else if (const CPWL_FontMap_Data* pFirst = GetFontMapData(0))
    {
        // Entry 0 qualifies when the caller does not care about the charset,
        // when entry 0 is a symbol font, or when the charsets match.
        const FX_BOOL bCharsetOk = nCharset == DEFAULT_CHARSET ||
                                   pFirst->nCharset == SYMBOL_CHARSET ||
                                   nCharset == pFirst->nCharset;
        if (bCharsetOk && KnowWord(0, word))
            return 0;
    }

    // Fall back to the native font for the requested charset.
    const FX_INT32 nNative = this->GetFontIndex(GetNativeFontName(nCharset), nCharset, TRUE);
    if (nNative >= 0 && KnowWord(nNative, word))
        return nNative;

    // Last resort: a broad-coverage font.
    const FX_INT32 nFallback = this->GetFontIndex("Arial Unicode MS", DEFAULT_CHARSET, FALSE);
    if (nFallback >= 0 && KnowWord(nFallback, word))
        return nFallback;

    return -1;
}
// Maps the Unicode value |word| to a char code in the font at |nFontIndex|.
//
// Returns -1 when |nFontIndex| is out of range, when the slot or its font is
// NULL, or when the font is not Unicode compatible and |word| is not below
// 0xFF. For a Unicode-compatible font the result of
// CPDF_Font::CharCodeFromUnicode() is returned unchanged.
FX_INT32 CPWL_FontMap::CharCodeFromUnicode(FX_INT32 nFontIndex, FX_WORD word)
{
    // This method is callable directly, so validate the index here instead of
    // relying on callers such as KnowWord() to have done it.
    if (nFontIndex < 0 || nFontIndex >= m_aData.GetSize())
        return -1;

    CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex);
    if (!pData || !pData->pFont)
        return -1;

    if (pData->pFont->IsUnicodeCompatible())
    {
        int nCharCode = pData->pFont->CharCodeFromUnicode(word);
        // NOTE(review): the glyph lookup result is discarded; presumably the
        // call is kept for a side effect inside the font - confirm.
        pData->pFont->GlyphFromCharCode(nCharCode);
        return nCharCode;
    }

    // Non-Unicode fonts: values below 0xFF are used as char codes directly.
    if (word < 0xFF)
        return word;

    return -1;
}
// Returns the native font name for |nCharset|, consulting a per-map cache
// first because the native lookup is slow. A freshly resolved non-empty name
// is added to the cache; an empty result is returned without being cached.
CFX_ByteString CPWL_FontMap::GetNativeFontName(FX_INT32 nCharset)
{
    const FX_INT32 nCached = m_aNativeFont.GetSize();
    for (FX_INT32 idx = 0; idx < nCached; ++idx)
    {
        CPWL_FontMap_Native* pCached = m_aNativeFont.GetAt(idx);
        if (pCached && pCached->nCharset == nCharset)
            return pCached->sFontName;
    }

    CFX_ByteString sResolved = GetNativeFont(nCharset);
    if (sResolved.IsEmpty())
        return sResolved;

    // Remember the answer; the entry is freed in Empty().
    CPWL_FontMap_Native* pEntry = new CPWL_FontMap_Native;
    pEntry->nCharset = nCharset;
    pEntry->sFontName = sResolved;
    m_aNativeFont.Add(pEntry);
    return sResolved;
}
void CPWL_FontMap::Empty()
{
{
for (FX_INT32 i=0, sz=m_aData.GetSize(); i<sz; i++)
delete m_aData.GetAt(i);
m_aData.RemoveAll();
}
{
for (FX_INT32 i=0, sz=m_aNativeFont.GetSize(); i<sz; i++)
delete m_aNativeFont.GetAt(i);
m_aNativeFont.RemoveAll();
}
}
// Registers the initial font under ANSI_CHARSET. When |fontname| yields an
// empty string, DEFAULT_FONT_NAME is used instead.
void CPWL_FontMap::Initial(FX_LPCSTR fontname)
{
    CFX_ByteString sRequested = fontname;
    if (sRequested.IsEmpty())
        sRequested = DEFAULT_FONT_NAME;

    GetFontIndex(sRequested, ANSI_CHARSET, FALSE);
}
// Names treated as standard fonts by CPWL_FontMap::IsStandardFont():
//   Courier, Courier-Bold, Courier-BoldOblique, Courier-Oblique
//   Helvetica, Helvetica-Bold, Helvetica-BoldOblique, Helvetica-Oblique
//   Times-Roman, Times-Bold, Times-Italic, Times-BoldItalic
//   Symbol, ZapfDingbats
const char* g_sDEStandardFontName[] = {
    "Courier",
    "Courier-Bold",
    "Courier-BoldOblique",
    "Courier-Oblique",
    "Helvetica",
    "Helvetica-Bold",
    "Helvetica-BoldOblique",
    "Helvetica-Oblique",
    "Times-Roman",
    "Times-Bold",
    "Times-Italic",
    "Times-BoldItalic",
    "Symbol",
    "ZapfDingbats"
};
// Returns TRUE when |sFontName| exactly matches one of the names listed in
// g_sDEStandardFontName, FALSE otherwise.
FX_BOOL CPWL_FontMap::IsStandardFont(const CFX_ByteString& sFontName)
{
    // Entry count is derived from the table itself (14 names).
    const FX_INT32 nCount =
        static_cast<FX_INT32>(sizeof(g_sDEStandardFontName) / sizeof(g_sDEStandardFontName[0]));

    for (FX_INT32 idx = 0; idx < nCount; ++idx)
    {
        if (sFontName == g_sDEStandardFontName[idx])
            return TRUE;
    }
    return FALSE;
}
// Searches the registered entries for the first one matching both criteria:
//   - charset: |nCharset| is DEFAULT_CHARSET (matches any) or equals the
//     entry's charset;
//   - name: |sFontName| is empty (matches any) or equals the entry's alias.
// Returns the entry index, or -1 when nothing matches.
FX_INT32 CPWL_FontMap::FindFont(const CFX_ByteString& sFontName, FX_INT32 nCharset)
{
    const FX_INT32 nCount = m_aData.GetSize();
    for (FX_INT32 idx = 0; idx < nCount; ++idx)
    {
        CPWL_FontMap_Data* pEntry = m_aData.GetAt(idx);
        if (!pEntry)
            continue;

        if (nCharset != DEFAULT_CHARSET && nCharset != pEntry->nCharset)
            continue;

        if (sFontName.IsEmpty() || pEntry->sFontName == sFontName)
            return idx;
    }
    return -1;
}
// Returns the index of the entry for |sFontName| / |nCharset|, registering a
// new entry when none exists yet.
//
// When |bFind| is set, FindFontSameCharset() is asked first for an existing
// font (and its alias). If that yields nothing, the font is added to the
// document returned by GetDocument() and the alias is derived from the name.
// A new entry is appended even when no font could be obtained (pFont NULL).
FX_INT32 CPWL_FontMap::GetFontIndex(const CFX_ByteString& sFontName, FX_INT32 nCharset, FX_BOOL bFind)
{
    const FX_INT32 nExisting = FindFont(EncodeFontAlias(sFontName, nCharset), nCharset);
    if (nExisting >= 0)
        return nExisting;

    CFX_ByteString sAlias;
    CPDF_Font* pFont = NULL;
    if (bFind)
        pFont = FindFontSameCharset(sAlias, nCharset);

    if (!pFont)
    {
        // AddFontToDocument() takes the name by non-const reference and may
        // rewrite it (AddSystemFont() fills in an empty name), so the alias is
        // built from the possibly updated copy.
        CFX_ByteString sResolved = sFontName;
        pFont = AddFontToDocument(GetDocument(), sResolved, nCharset);
        sAlias = EncodeFontAlias(sResolved, nCharset);
    }

    AddedFont(pFont, sAlias);
    return AddFontData(pFont, sAlias, nCharset);
}
// Finds the first entry whose charset equals |nCharset| and registers its font
// again under a build-specific "Arial_*" alias. Returns the index of the new
// entry, or -1 when no entry with a font exists for that charset.
// |word| is not used by this implementation.
FX_INT32 CPWL_FontMap::GetPWLFontIndex(FX_WORD word, FX_INT32 nCharset)
{
    FX_INT32 nMatch = -1;
    const FX_INT32 nCount = m_aData.GetSize();
    for (FX_INT32 idx = 0; idx < nCount && nMatch < 0; ++idx)
    {
        CPWL_FontMap_Data* pEntry = m_aData.GetAt(idx);
        if (pEntry && pEntry->nCharset == nCharset)
            nMatch = idx;
    }

    // GetPDFFont() range-checks the index, so nMatch == -1 yields NULL here.
    CPDF_Font* pMatched = GetPDFFont(nMatch);
    if (!pMatched)
        return -1;

#ifdef FOXIT_CHROME_BUILD
    CFX_ByteString sAlias = EncodeFontAlias("Arial_Chrome", nCharset);
#else
    CFX_ByteString sAlias = EncodeFontAlias("Arial_Foxit", nCharset);
#endif

    AddedFont(pMatched, sAlias);
    return AddFontData(pMatched, sAlias, nCharset);
}
// Base implementation: never finds a font. It always returns NULL and leaves
// |sFontAlias| untouched.
// NOTE(review): presumably a hook for subclasses to override - confirm against
// the class declaration.
CPDF_Font* CPWL_FontMap::FindFontSameCharset(CFX_ByteString& sFontAlias,
                                             FX_INT32 nCharset)
{
    return NULL;
}
// Appends a new entry recording |pFont|, its alias and its charset, and
// returns the index of the last element after the append. The entry is
// heap-allocated and released in Empty().
FX_INT32 CPWL_FontMap::AddFontData(CPDF_Font* pFont, const CFX_ByteString& sFontAlias, FX_INT32 nCharset)
{
    CPWL_FontMap_Data* pEntry = new CPWL_FontMap_Data;
    pEntry->nCharset = nCharset;
    pEntry->sFontName = sFontAlias;
    pEntry->pFont = pFont;

    m_aData.Add(pEntry);
    return m_aData.GetSize() - 1;
}
// Called by GetFontIndex() and GetPWLFontIndex() just before a font entry is
// recorded. The base implementation intentionally does nothing.
void CPWL_FontMap::AddedFont(CPDF_Font* pFont,
                             const CFX_ByteString& sFontAlias)
{
}
// Returns the name stored in the entry at |nFontIndex| (the same field that
// GetPDFFontAlias() reports), or an empty string when the index is out of
// range or the slot holds no entry.
CFX_ByteString CPWL_FontMap::GetFontName(FX_INT32 nFontIndex)
{
    const FX_BOOL bInRange = nFontIndex >= 0 && nFontIndex < m_aData.GetSize();
    if (!bInRange)
        return "";

    CPWL_FontMap_Data* pEntry = m_aData.GetAt(nFontIndex);
    if (pEntry)
        return pEntry->sFontName;

    return "";
}
// Resolves a native font name for |nCharset| (DEFAULT_CHARSET is first
// replaced by GetNativeCharset()).
//
// The table default from GetDefaultFontByCharset() is preferred when the
// system handler confirms it via FindNativeTrueTypeFont(); otherwise the
// handler's own GetNativeTrueTypeFont() answer is returned. Without a handler
// the table default is returned as is.
CFX_ByteString CPWL_FontMap::GetNativeFont(FX_INT32 nCharset)
{
    if (nCharset == DEFAULT_CHARSET)
        nCharset = GetNativeCharset();

    CFX_ByteString sFontName;
    sFontName = GetDefaultFontByCharset(nCharset);

    if (!m_pSystemHandler)
        return sFontName;

    if (m_pSystemHandler->FindNativeTrueTypeFont(nCharset, sFontName))
        return sFontName;

    sFontName = m_pSystemHandler->GetNativeTrueTypeFont(nCharset);
    return sFontName;
}
// Adds |sFontName| to |pDoc|, using AddStandardFont() for names accepted by
// IsStandardFont() and AddSystemFont() for everything else.
// |sFontName| is passed on by reference and may be modified by AddSystemFont().
CPDF_Font* CPWL_FontMap::AddFontToDocument(CPDF_Document* pDoc, CFX_ByteString& sFontName, FX_BYTE nCharset)
{
    if (!IsStandardFont(sFontName))
        return AddSystemFont(pDoc, sFontName, nCharset);

    return AddStandardFont(pDoc, sFontName);
}
// Adds the standard font |sFontName| to |pDoc| and returns it.
// "ZapfDingbats" is added with no encoding; every other name is added with a
// PDFFONT_ENCODING_WINANSI encoding. Returns NULL when |pDoc| is NULL.
CPDF_Font* CPWL_FontMap::AddStandardFont(CPDF_Document* pDoc, CFX_ByteString& sFontName)
{
    if (!pDoc)
        return NULL;

    if (sFontName == "ZapfDingbats")
        return pDoc->AddStandardFont(sFontName, NULL);

    CPDF_FontEncoding encWinAnsi(PDFFONT_ENCODING_WINANSI);
    return pDoc->AddStandardFont(sFontName, &encWinAnsi);
}
// Adds a native TrueType font to |pDoc| through the system handler.
// An empty |sFontName| is replaced (in the caller's string) by the native font
// for |nCharset|; DEFAULT_CHARSET is replaced by GetNativeCharset().
// Returns NULL when |pDoc| is NULL or no system handler is set.
CPDF_Font* CPWL_FontMap::AddSystemFont(CPDF_Document* pDoc, CFX_ByteString& sFontName, FX_BYTE nCharset)
{
    if (!pDoc)
        return NULL;

    // The name is resolved before the charset is normalised, so
    // GetNativeFont() still sees the caller's original charset value.
    if (sFontName.IsEmpty())
        sFontName = GetNativeFont(nCharset);
    if (nCharset == DEFAULT_CHARSET)
        nCharset = GetNativeCharset();

    if (!m_pSystemHandler)
        return NULL;

    return m_pSystemHandler->AddNativeTrueTypeFontToPDF(pDoc, sFontName, nCharset);
}
// Builds the alias for a font/charset pair: the space-stripped font name
// followed by "_" and the charset formatted with "%02X".
CFX_ByteString CPWL_FontMap::EncodeFontAlias(const CFX_ByteString& sFontName, FX_INT32 nCharset)
{
    CFX_ByteString sSuffix;
    sSuffix.Format("_%02X", nCharset);

    const CFX_ByteString sBase = EncodeFontAlias(sFontName);
    return sBase + sSuffix;
}
// Returns a copy of |sFontName| after calling Remove(' ') on it, i.e. with
// space characters stripped.
CFX_ByteString CPWL_FontMap::EncodeFontAlias(const CFX_ByteString& sFontName)
{
    CFX_ByteString sStripped = sFontName;
    sStripped.Remove(' ');
    return sStripped;
}
// Returns the number of font entries currently registered in the map.
FX_INT32 CPWL_FontMap::GetFontMapCount() const
{
    return m_aData.GetSize();
}
// Returns the entry stored at |nIndex|, or NULL when the index is out of range.
const CPWL_FontMap_Data* CPWL_FontMap::GetFontMapData(FX_INT32 nIndex) const
{
    if (nIndex < 0 || nIndex >= m_aData.GetSize())
        return NULL;

    return m_aData.GetAt(nIndex);
}
// Maps the code page reported by FXSYS_GetACP() to a font charset constant.
// Code pages without an explicit case fall back to ANSI_CHARSET.
//
// Code page 950 (Traditional Chinese, Big5) maps to CHINESEBIG5_CHARSET. It
// was previously mapped to GB2312_CHARSET, the Simplified Chinese charset,
// which meant the CHINESEBIG5_CHARSET entry in defaultTTFMap could not be
// selected from the native charset.
FX_INT32 CPWL_FontMap::GetNativeCharset()
{
    FX_BYTE nCharset = ANSI_CHARSET;
    FX_INT32 iCodePage = FXSYS_GetACP();
    switch (iCodePage)
    {
    case 932:   // Japan
        nCharset = SHIFTJIS_CHARSET;
        break;
    case 936:   // Chinese (PRC, Singapore)
        nCharset = GB2312_CHARSET;
        break;
    case 950:   // Chinese (Taiwan; Hong Kong SAR, PRC)
        nCharset = CHINESEBIG5_CHARSET;
        break;
    case 1252:  // Windows 3.1 Latin 1 (US, Western Europe)
        nCharset = ANSI_CHARSET;
        break;
    case 874:   // Thai
        nCharset = THAI_CHARSET;
        break;
    case 949:   // Korean
        nCharset = HANGUL_CHARSET;
        break;
    case 1200:  // Unicode (BMP of ISO 10646)
        nCharset = ANSI_CHARSET;
        break;
    case 1250:  // Windows 3.1 Eastern European
        nCharset = EASTEUROPE_CHARSET;
        break;
    case 1251:  // Windows 3.1 Cyrillic
        nCharset = RUSSIAN_CHARSET;
        break;
    case 1253:  // Windows 3.1 Greek
        nCharset = GREEK_CHARSET;
        break;
    case 1254:  // Windows 3.1 Turkish
        nCharset = TURKISH_CHARSET;
        break;
    case 1255:  // Hebrew
        nCharset = HEBREW_CHARSET;
        break;
    case 1256:  // Arabic
        nCharset = ARABIC_CHARSET;
        break;
    case 1257:  // Baltic
        nCharset = BALTIC_CHARSET;
        break;
    case 1258:  // Vietnamese
        nCharset = VIETNAMESE_CHARSET;
        break;
    case 1361:  // Korean (Johab)
        nCharset = JOHAB_CHARSET;
        break;
    }
    return nCharset;
}
// Default font name per charset, consulted by GetDefaultFontByCharset().
// The table is terminated by an entry whose charset is -1.
const CPWL_FontMap::CharsetFontMap CPWL_FontMap::defaultTTFMap[] = {
    { ANSI_CHARSET,        "Helvetica" },
    { GB2312_CHARSET,      "SimSun"    },
    { CHINESEBIG5_CHARSET, "MingLiU"   },
    { SHIFTJIS_CHARSET,    "MS Gothic" },
    { HANGUL_CHARSET,      "Batang"    },
    { RUSSIAN_CHARSET,     "Arial"     },
    // The Eastern European default depends on the build platform.
#if _FXM_PLATFORM_ == _FXM_PLATFORM_LINUX_ || _FXM_PLATFORM_ == _FXM_PLATFORM_APPLE_
    { EASTEUROPE_CHARSET,  "Arial"     },
#else
    { EASTEUROPE_CHARSET,  "Tahoma"    },
#endif
    { ARABIC_CHARSET,      "Arial"     },
    { -1,                  NULL        }   // sentinel
};
// Looks |nCharset| up in defaultTTFMap and returns the associated font name,
// or an empty string when the charset has no entry.
CFX_ByteString CPWL_FontMap::GetDefaultFontByCharset(FX_INT32 nCharset)
{
    // Walk the table until the -1 sentinel entry.
    for (const CharsetFontMap* pEntry = defaultTTFMap; pEntry->charset != -1; ++pEntry)
    {
        if (pEntry->charset == nCharset)
            return pEntry->fontname;
    }
    return "";
}
// Returns true when |word| lies in the inclusive range [first, last].
static bool PWL_WordInRange(int word, int first, int last)
{
    return word >= first && word <= last;
}

// Chooses a charset for the Unicode value |word|.
//
// Precedence:
//   1. A charset forced by the system handler (GetCharSet() != -1).
//   2. ANSI_CHARSET for values below 0x7F, so CJK fonts are not used for ASCII.
//   3. |nOldCharset| when it is not DEFAULT_CHARSET.
//   4. A charset derived from the Unicode range containing |word|.
//   5. ANSI_CHARSET when no range matches.
FX_INT32 CPWL_FontMap::CharSetFromUnicode(FX_WORD word, FX_INT32 nOldCharset)
{
    if (m_pSystemHandler && (-1 != m_pSystemHandler->GetCharSet()))
        return m_pSystemHandler->GetCharSet();

    // Keep ASCII out of CJK fonts.
    if (word < 0x7F)
        return ANSI_CHARSET;

    // Stick with the charset already in use.
    if (nOldCharset != DEFAULT_CHARSET)
        return nOldCharset;

    // Otherwise derive the charset from the code point.
    if (PWL_WordInRange(word, 0x4E00, 0x9FA5) ||   // CJK unified ideographs
        PWL_WordInRange(word, 0xE7C7, 0xE7F3) ||   // private-use code points
        PWL_WordInRange(word, 0x3000, 0x303F) ||   // CJK symbols and punctuation
        PWL_WordInRange(word, 0x2000, 0x206F))     // general punctuation
    {
        return GB2312_CHARSET;
    }

    if (PWL_WordInRange(word, 0x3040, 0x309F) ||   // Hiragana
        PWL_WordInRange(word, 0x30A0, 0x30FF) ||   // Katakana
        PWL_WordInRange(word, 0x31F0, 0x31FF) ||   // Katakana phonetic extensions
        PWL_WordInRange(word, 0xFF00, 0xFFEF))     // halfwidth and fullwidth forms
    {
        return SHIFTJIS_CHARSET;
    }

    if (PWL_WordInRange(word, 0xAC00, 0xD7AF) ||   // Hangul syllables
        PWL_WordInRange(word, 0x1100, 0x11FF) ||   // Hangul Jamo
        PWL_WordInRange(word, 0x3130, 0x318F))     // Hangul compatibility Jamo
    {
        return HANGUL_CHARSET;
    }

    if (PWL_WordInRange(word, 0x0E00, 0x0E7F))
        return THAI_CHARSET;

    if (PWL_WordInRange(word, 0x0370, 0x03FF) ||
        PWL_WordInRange(word, 0x1F00, 0x1FFF))
        return GREEK_CHARSET;

    if (PWL_WordInRange(word, 0x0600, 0x06FF) ||
        PWL_WordInRange(word, 0xFB50, 0xFEFC))
        return ARABIC_CHARSET;

    if (PWL_WordInRange(word, 0x0590, 0x05FF))
        return HEBREW_CHARSET;

    if (PWL_WordInRange(word, 0x0400, 0x04FF))
        return RUSSIAN_CHARSET;

    if (PWL_WordInRange(word, 0x0100, 0x024F))
        return EASTEUROPE_CHARSET;

    if (PWL_WordInRange(word, 0x1E00, 0x1EFF))
        return VIETNAMESE_CHARSET;

    return ANSI_CHARSET;
}
/* ------------------------ CPWL_DocFontMap ------------------------ */
// Font map that adds fonts to an existing document (|pAttachedDoc|) instead
// of a privately created one. The pointer is stored as given.
CPWL_DocFontMap::CPWL_DocFontMap(IFX_SystemHandler* pSystemHandler,
                                 CPDF_Document* pAttachedDoc)
    : CPWL_FontMap(pSystemHandler),
      m_pAttachedDoc(pAttachedDoc)
{
}
// Nothing to release here: the attached document is not deleted by this class.
CPWL_DocFontMap::~CPWL_DocFontMap()
{
}
// Returns the document supplied at construction; no document is ever created
// here.
CPDF_Document* CPWL_DocFontMap::GetDocument()
{
    return this->m_pAttachedDoc;
}