// Copyright 2014 PDFium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com #include "../../include/pdfwindow/PDFWindow.h" #include "../../include/pdfwindow/PWL_Wnd.h" #include "../../include/pdfwindow/PWL_FontMap.h" #define DEFAULT_FONT_NAME "Helvetica" /* ------------------------------ CPWL_FontMap ------------------------------ */ CPWL_FontMap::CPWL_FontMap(IFX_SystemHandler* pSystemHandler) : m_pPDFDoc(NULL), m_pSystemHandler(pSystemHandler) { ASSERT(m_pSystemHandler != NULL); } CPWL_FontMap::~CPWL_FontMap() { if (m_pPDFDoc) { delete m_pPDFDoc; m_pPDFDoc = NULL; } Empty(); } void CPWL_FontMap::SetSystemHandler(IFX_SystemHandler* pSystemHandler) { m_pSystemHandler = pSystemHandler; } CPDF_Document* CPWL_FontMap::GetDocument() { if (!m_pPDFDoc) { if (CPDF_ModuleMgr::Get()) { m_pPDFDoc = FX_NEW CPDF_Document; m_pPDFDoc->CreateNewDoc(); } } return m_pPDFDoc; } CPDF_Font* CPWL_FontMap::GetPDFFont(FX_INT32 nFontIndex) { if (nFontIndex >=0 && nFontIndex < m_aData.GetSize()) { if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) { return pData->pFont; } } return NULL; } CFX_ByteString CPWL_FontMap::GetPDFFontAlias(FX_INT32 nFontIndex) { if (nFontIndex >=0 && nFontIndex < m_aData.GetSize()) { if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) { return pData->sFontName; } } return ""; } FX_BOOL CPWL_FontMap::KnowWord(FX_INT32 nFontIndex, FX_WORD word) { if (nFontIndex >=0 && nFontIndex < m_aData.GetSize()) { if (m_aData.GetAt(nFontIndex)) { return CharCodeFromUnicode(nFontIndex, word) >= 0; } } return FALSE; } FX_INT32 CPWL_FontMap::GetWordFontIndex(FX_WORD word, FX_INT32 nCharset, FX_INT32 nFontIndex) { if (nFontIndex > 0) { if (KnowWord(nFontIndex, word)) return nFontIndex; } else { if (const CPWL_FontMap_Data* pData = GetFontMapData(0)) { if (nCharset == DEFAULT_CHARSET || pData->nCharset == SYMBOL_CHARSET || nCharset == pData->nCharset) { if (KnowWord(0, word)) { return 0; } } } } FX_INT32 nNewFontIndex = -1; nNewFontIndex = this->GetFontIndex(GetNativeFontName(nCharset), nCharset, TRUE); if (nNewFontIndex >= 0) { if (KnowWord(nNewFontIndex, word)) return nNewFontIndex; } nNewFontIndex = this->GetFontIndex("Arial Unicode MS", DEFAULT_CHARSET, FALSE); if (nNewFontIndex >= 0) { if (KnowWord(nNewFontIndex, word)) return nNewFontIndex; } return -1; } FX_INT32 CPWL_FontMap::CharCodeFromUnicode(FX_INT32 nFontIndex, FX_WORD word) { if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) { if (pData->pFont) { if (pData->pFont->IsUnicodeCompatible()) { int nCharCode = pData->pFont->CharCodeFromUnicode(word); pData->pFont->GlyphFromCharCode(nCharCode); return nCharCode; } else { if (word < 0xFF) return word; } } } return -1; } CFX_ByteString CPWL_FontMap::GetNativeFontName(FX_INT32 nCharset) { //searching native font is slow, so we must save time for (FX_INT32 i=0,sz=m_aNativeFont.GetSize(); i<sz; i++) { if (CPWL_FontMap_Native* pData = m_aNativeFont.GetAt(i)) { if (pData->nCharset == nCharset) return pData->sFontName; } } CFX_ByteString sNew = GetNativeFont(nCharset); if (!sNew.IsEmpty()) { CPWL_FontMap_Native* pNewData = new CPWL_FontMap_Native; pNewData->nCharset = nCharset; pNewData->sFontName = sNew; m_aNativeFont.Add(pNewData); } return sNew; } void CPWL_FontMap::Empty() { { for (FX_INT32 i=0, sz=m_aData.GetSize(); i<sz; i++) delete m_aData.GetAt(i); m_aData.RemoveAll(); } { for (FX_INT32 i=0, sz=m_aNativeFont.GetSize(); i<sz; i++) delete m_aNativeFont.GetAt(i); m_aNativeFont.RemoveAll(); } } void CPWL_FontMap::Initial(FX_LPCSTR fontname) { CFX_ByteString sFontName = fontname; if (sFontName.IsEmpty()) sFontName = DEFAULT_FONT_NAME; GetFontIndex(sFontName, ANSI_CHARSET, FALSE); //GetFontIndex(this->GetNativeFontName(nCharset), nCharset); } /* List of currently supported standard fonts: Courier, Courier-Bold, Courier-BoldOblique, Courier-Oblique Helvetica, Helvetica-Bold, Helvetica-BoldOblique, Helvetica-Oblique Times-Roman, Times-Bold, Times-Italic, Times-BoldItalic Symbol, ZapfDingbats */ const char* g_sDEStandardFontName[] = {"Courier", "Courier-Bold", "Courier-BoldOblique", "Courier-Oblique", "Helvetica", "Helvetica-Bold", "Helvetica-BoldOblique", "Helvetica-Oblique", "Times-Roman", "Times-Bold", "Times-Italic", "Times-BoldItalic", "Symbol", "ZapfDingbats"}; FX_BOOL CPWL_FontMap::IsStandardFont(const CFX_ByteString& sFontName) { for (FX_INT32 i=0; i<14; i++) { if (sFontName == g_sDEStandardFontName[i]) return TRUE; } return FALSE; } FX_INT32 CPWL_FontMap::FindFont(const CFX_ByteString& sFontName, FX_INT32 nCharset) { for (FX_INT32 i=0,sz=m_aData.GetSize(); i<sz; i++) { if (CPWL_FontMap_Data* pData = m_aData.GetAt(i)) { if (nCharset == DEFAULT_CHARSET || nCharset == pData->nCharset) { if (sFontName.IsEmpty() || pData->sFontName == sFontName) return i; } } } return -1; } FX_INT32 CPWL_FontMap::GetFontIndex(const CFX_ByteString& sFontName, FX_INT32 nCharset, FX_BOOL bFind) { FX_INT32 nFontIndex = FindFont(EncodeFontAlias(sFontName, nCharset), nCharset); if (nFontIndex >= 0) return nFontIndex; // nFontIndex = FindFont("", nCharset); // if (nFontIndex >= 0) return nFontIndex; CFX_ByteString sAlias; CPDF_Font* pFont = NULL; if (bFind) pFont = FindFontSameCharset(sAlias, nCharset); if (!pFont) { CFX_ByteString sTemp = sFontName; pFont = AddFontToDocument(GetDocument(), sTemp, nCharset); /* if (FindFont(sAlias)) { sAlias = EncodeFontAlias(sTemp, nCharset); } else */ { sAlias = EncodeFontAlias(sTemp, nCharset); } } AddedFont(pFont, sAlias); return AddFontData(pFont, sAlias, nCharset); } FX_INT32 CPWL_FontMap::GetPWLFontIndex(FX_WORD word, FX_INT32 nCharset) { FX_INT32 nFind = -1; for (FX_INT32 i=0,sz=m_aData.GetSize(); i<sz; i++) { if (CPWL_FontMap_Data* pData = m_aData.GetAt(i)) { if (pData->nCharset == nCharset) { nFind = i; break; } } } CPDF_Font* pNewFont = GetPDFFont(nFind); if (!pNewFont) return -1; /* if (CPDF_Font* pFont = GetPDFFont(nFind)) { PWLFont.AddWordToFontDict(pFontDict, word); } */ #ifdef FOXIT_CHROME_BUILD CFX_ByteString sAlias = EncodeFontAlias("Arial_Chrome", nCharset); #else CFX_ByteString sAlias = EncodeFontAlias("Arial_Foxit", nCharset); #endif AddedFont(pNewFont, sAlias); return AddFontData(pNewFont, sAlias, nCharset); } CPDF_Font* CPWL_FontMap::FindFontSameCharset(CFX_ByteString& sFontAlias, FX_INT32 nCharset) { return NULL; } FX_INT32 CPWL_FontMap::AddFontData(CPDF_Font* pFont, const CFX_ByteString& sFontAlias, FX_INT32 nCharset) { CPWL_FontMap_Data* pNewData = new CPWL_FontMap_Data; pNewData->pFont = pFont; pNewData->sFontName = sFontAlias; pNewData->nCharset = nCharset; m_aData.Add(pNewData); return m_aData.GetSize() -1; } void CPWL_FontMap::AddedFont(CPDF_Font* pFont, const CFX_ByteString& sFontAlias) { } CFX_ByteString CPWL_FontMap::GetFontName(FX_INT32 nFontIndex) { if (nFontIndex >=0 && nFontIndex < m_aData.GetSize()) { if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) { return pData->sFontName; } } return ""; } CFX_ByteString CPWL_FontMap::GetNativeFont(FX_INT32 nCharset) { CFX_ByteString sFontName; if (nCharset == DEFAULT_CHARSET) nCharset = GetNativeCharset(); sFontName = GetDefaultFontByCharset(nCharset); if (m_pSystemHandler) { if (m_pSystemHandler->FindNativeTrueTypeFont(nCharset, sFontName)) return sFontName; sFontName = m_pSystemHandler->GetNativeTrueTypeFont(nCharset); } return sFontName; } CPDF_Font* CPWL_FontMap::AddFontToDocument(CPDF_Document* pDoc, CFX_ByteString& sFontName, FX_BYTE nCharset) { if (IsStandardFont(sFontName)) return AddStandardFont(pDoc, sFontName); else return AddSystemFont(pDoc, sFontName, nCharset); } CPDF_Font* CPWL_FontMap::AddStandardFont(CPDF_Document* pDoc, CFX_ByteString& sFontName) { if (!pDoc) return NULL; CPDF_Font* pFont = NULL; if (sFontName == "ZapfDingbats") pFont = pDoc->AddStandardFont(sFontName, NULL); else { CPDF_FontEncoding fe(PDFFONT_ENCODING_WINANSI); pFont = pDoc->AddStandardFont(sFontName, &fe); } return pFont; } CPDF_Font* CPWL_FontMap::AddSystemFont(CPDF_Document* pDoc, CFX_ByteString& sFontName, FX_BYTE nCharset) { if (!pDoc) return NULL; if (sFontName.IsEmpty()) sFontName = GetNativeFont(nCharset); if (nCharset == DEFAULT_CHARSET) nCharset = GetNativeCharset(); if (m_pSystemHandler) return m_pSystemHandler->AddNativeTrueTypeFontToPDF(pDoc, sFontName, nCharset); return NULL; } CFX_ByteString CPWL_FontMap::EncodeFontAlias(const CFX_ByteString& sFontName, FX_INT32 nCharset) { CFX_ByteString sPostfix; sPostfix.Format("_%02X", nCharset); return EncodeFontAlias(sFontName) + sPostfix; } CFX_ByteString CPWL_FontMap::EncodeFontAlias(const CFX_ByteString& sFontName) { CFX_ByteString sRet = sFontName; sRet.Remove(' '); return sRet; } FX_INT32 CPWL_FontMap::GetFontMapCount() const { return m_aData.GetSize(); } const CPWL_FontMap_Data* CPWL_FontMap::GetFontMapData(FX_INT32 nIndex) const { if (nIndex >=0 && nIndex < m_aData.GetSize()) { return m_aData.GetAt(nIndex); } return NULL; } FX_INT32 CPWL_FontMap::GetNativeCharset() { FX_BYTE nCharset = ANSI_CHARSET; FX_INT32 iCodePage = FXSYS_GetACP(); switch (iCodePage) { case 932://Japan nCharset = SHIFTJIS_CHARSET; break; case 936://Chinese (PRC, Singapore) nCharset = GB2312_CHARSET; break; case 950://Chinese (Taiwan; Hong Kong SAR, PRC) nCharset = GB2312_CHARSET; break; case 1252://Windows 3.1 Latin 1 (US, Western Europe) nCharset = ANSI_CHARSET; break; case 874://Thai nCharset = THAI_CHARSET; break; case 949://Korean nCharset = HANGUL_CHARSET; break; case 1200://Unicode (BMP of ISO 10646) nCharset = ANSI_CHARSET; break; case 1250://Windows 3.1 Eastern European nCharset = EASTEUROPE_CHARSET; break; case 1251://Windows 3.1 Cyrillic nCharset = RUSSIAN_CHARSET; break; case 1253://Windows 3.1 Greek nCharset = GREEK_CHARSET; break; case 1254://Windows 3.1 Turkish nCharset = TURKISH_CHARSET; break; case 1255://Hebrew nCharset = HEBREW_CHARSET; break; case 1256://Arabic nCharset = ARABIC_CHARSET; break; case 1257://Baltic nCharset = BALTIC_CHARSET; break; case 1258://Vietnamese nCharset = VIETNAMESE_CHARSET; break; case 1361://Korean(Johab) nCharset = JOHAB_CHARSET; break; } return nCharset; } const CPWL_FontMap::CharsetFontMap CPWL_FontMap::defaultTTFMap[] = { { ANSI_CHARSET, "Helvetica" }, { GB2312_CHARSET, "SimSun" }, { CHINESEBIG5_CHARSET, "MingLiU" }, { SHIFTJIS_CHARSET, "MS Gothic" }, { HANGUL_CHARSET, "Batang" }, { RUSSIAN_CHARSET, "Arial" }, #if _FXM_PLATFORM_ == _FXM_PLATFORM_LINUX_ || _FXM_PLATFORM_ == _FXM_PLATFORM_APPLE_ { EASTEUROPE_CHARSET, "Arial" }, #else { EASTEUROPE_CHARSET, "Tahoma" }, #endif { ARABIC_CHARSET, "Arial" }, { -1, NULL } }; CFX_ByteString CPWL_FontMap::GetDefaultFontByCharset(FX_INT32 nCharset) { int i = 0; while (defaultTTFMap[i].charset != -1) { if (nCharset == defaultTTFMap[i].charset) return defaultTTFMap[i].fontname; ++i; } return ""; } FX_INT32 CPWL_FontMap::CharSetFromUnicode(FX_WORD word, FX_INT32 nOldCharset) { if(m_pSystemHandler && (-1 != m_pSystemHandler->GetCharSet())) return m_pSystemHandler->GetCharSet(); //to avoid CJK Font to show ASCII if (word < 0x7F) return ANSI_CHARSET; //follow the old charset if (nOldCharset != DEFAULT_CHARSET) return nOldCharset; //find new charset if ((word >= 0x4E00 && word <= 0x9FA5) || (word >= 0xE7C7 && word <= 0xE7F3) || (word >= 0x3000 && word <= 0x303F) || //��"��" "��" "��" "��" (word >= 0x2000 && word <= 0x206F)) { return GB2312_CHARSET; } if (((word >= 0x3040) && (word <= 0x309F)) || ((word >= 0x30A0) && (word <= 0x30FF)) || ((word >= 0x31F0) && (word <= 0x31FF)) || ((word >= 0xFF00) && (word <= 0xFFEF)) ) { return SHIFTJIS_CHARSET; } if (((word >= 0xAC00) && (word <= 0xD7AF)) || ((word >= 0x1100) && (word <= 0x11FF)) || ((word >= 0x3130) && (word <= 0x318F))) { return HANGUL_CHARSET; } if (word >= 0x0E00 && word <= 0x0E7F) return THAI_CHARSET; if ((word >= 0x0370 && word <= 0x03FF) || (word >= 0x1F00 && word <= 0x1FFF)) return GREEK_CHARSET; if ((word >= 0x0600 && word <= 0x06FF) || (word >= 0xFB50 && word <= 0xFEFC)) return ARABIC_CHARSET; if (word >= 0x0590 && word <= 0x05FF) return HEBREW_CHARSET; if (word >= 0x0400 && word <= 0x04FF) return RUSSIAN_CHARSET; if (word >= 0x0100 && word <= 0x024F) return EASTEUROPE_CHARSET; if (word >= 0x1E00 && word <= 0x1EFF) return VIETNAMESE_CHARSET; return ANSI_CHARSET; } /* ------------------------ CPWL_DocFontMap ------------------------ */ CPWL_DocFontMap::CPWL_DocFontMap(IFX_SystemHandler* pSystemHandler, CPDF_Document* pAttachedDoc) : CPWL_FontMap(pSystemHandler), m_pAttachedDoc(pAttachedDoc) { } CPWL_DocFontMap::~CPWL_DocFontMap() { } CPDF_Document* CPWL_DocFontMap::GetDocument() { return m_pAttachedDoc; }