blob: 6b719606a744cfb13d84d0592b1f9d94c25f0f76 [file] [log] [blame]
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -07001// Copyright 2014 PDFium Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
Lei Zhang60f507b2015-06-13 00:41:00 -07004
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -07005// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
6
dan sinclair89e904b2016-03-23 19:29:15 -04007#include "fpdfsdk/pdfwindow/PWL_FontMap.h"
Lei Zhangc2fb35f2016-01-05 16:46:58 -08008
dsinclair39c62fd2016-09-29 12:49:17 -07009#include "core/fpdfapi/cpdf_modulemgr.h"
dsinclair166bc162016-09-29 11:58:38 -070010#include "core/fpdfapi/fpdf_font/cpdf_font.h"
11#include "core/fpdfapi/fpdf_font/cpdf_fontencoding.h"
dsinclairc6c425a2016-09-29 12:01:30 -070012#include "core/fpdfapi/fpdf_parser/cpdf_document.h"
13#include "core/fpdfapi/fpdf_parser/cpdf_parser.h"
dsinclairc7a73492016-04-05 12:01:42 -070014#include "core/fpdfdoc/include/ipvt_fontmap.h"
dan sinclair89e904b2016-03-23 19:29:15 -040015#include "fpdfsdk/pdfwindow/PWL_Wnd.h"
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070016
Lei Zhang1b976642016-01-08 14:24:37 -080017namespace {
18
19const char kDefaultFontName[] = "Helvetica";
20
21const char* const g_sDEStandardFontName[] = {"Courier",
22 "Courier-Bold",
23 "Courier-BoldOblique",
24 "Courier-Oblique",
25 "Helvetica",
26 "Helvetica-Bold",
27 "Helvetica-BoldOblique",
28 "Helvetica-Oblique",
29 "Times-Roman",
30 "Times-Bold",
31 "Times-Italic",
32 "Times-BoldItalic",
33 "Symbol",
34 "ZapfDingbats"};
35
36} // namespace
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070037
dsinclairb9590102016-04-27 06:38:59 -070038CPWL_FontMap::CPWL_FontMap(CFX_SystemHandler* pSystemHandler)
weili2d5b0202016-08-03 11:06:49 -070039 : m_pSystemHandler(pSystemHandler) {
Lei Zhang96660d62015-12-14 18:27:25 -080040 ASSERT(m_pSystemHandler);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070041}
42
Nico Weber9d8ec5a2015-08-04 13:00:21 -070043CPWL_FontMap::~CPWL_FontMap() {
Nico Weber9d8ec5a2015-08-04 13:00:21 -070044 Empty();
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070045}
46
Nico Weber9d8ec5a2015-08-04 13:00:21 -070047CPDF_Document* CPWL_FontMap::GetDocument() {
48 if (!m_pPDFDoc) {
49 if (CPDF_ModuleMgr::Get()) {
thestigd4c34f22016-09-28 17:04:51 -070050 m_pPDFDoc = WrapUnique(new CPDF_Document(std::unique_ptr<CPDF_Parser>()));
Nico Weber9d8ec5a2015-08-04 13:00:21 -070051 m_pPDFDoc->CreateNewDoc();
52 }
53 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070054
weili2d5b0202016-08-03 11:06:49 -070055 return m_pPDFDoc.get();
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070056}
57
Nico Weber9d8ec5a2015-08-04 13:00:21 -070058CPDF_Font* CPWL_FontMap::GetPDFFont(int32_t nFontIndex) {
59 if (nFontIndex >= 0 && nFontIndex < m_aData.GetSize()) {
60 if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) {
61 return pData->pFont;
Tom Sepez2f2ffec2015-07-23 14:42:09 -070062 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -070063 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070064
thestig1cd352e2016-06-07 17:53:06 -070065 return nullptr;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070066}
67
Nico Weber9d8ec5a2015-08-04 13:00:21 -070068CFX_ByteString CPWL_FontMap::GetPDFFontAlias(int32_t nFontIndex) {
69 if (nFontIndex >= 0 && nFontIndex < m_aData.GetSize()) {
70 if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) {
71 return pData->sFontName;
Tom Sepez2f2ffec2015-07-23 14:42:09 -070072 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -070073 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070074
Nico Weber9d8ec5a2015-08-04 13:00:21 -070075 return "";
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070076}
77
Tom Sepez62a70f92016-03-21 15:00:20 -070078FX_BOOL CPWL_FontMap::KnowWord(int32_t nFontIndex, uint16_t word) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -070079 if (nFontIndex >= 0 && nFontIndex < m_aData.GetSize()) {
80 if (m_aData.GetAt(nFontIndex)) {
81 return CharCodeFromUnicode(nFontIndex, word) >= 0;
Tom Sepez2f2ffec2015-07-23 14:42:09 -070082 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -070083 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070084
Nico Weber9d8ec5a2015-08-04 13:00:21 -070085 return FALSE;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070086}
87
Tom Sepez62a70f92016-03-21 15:00:20 -070088int32_t CPWL_FontMap::GetWordFontIndex(uint16_t word,
Nico Weber9d8ec5a2015-08-04 13:00:21 -070089 int32_t nCharset,
90 int32_t nFontIndex) {
91 if (nFontIndex > 0) {
92 if (KnowWord(nFontIndex, word))
93 return nFontIndex;
94 } else {
95 if (const CPWL_FontMap_Data* pData = GetFontMapData(0)) {
npmea3c3be2016-09-19 07:24:33 -070096 if (nCharset == FXFONT_DEFAULT_CHARSET ||
97 pData->nCharset == FXFONT_SYMBOL_CHARSET ||
Nico Weber9d8ec5a2015-08-04 13:00:21 -070098 nCharset == pData->nCharset) {
99 if (KnowWord(0, word))
100 return 0;
101 }
Tom Sepez2f2ffec2015-07-23 14:42:09 -0700102 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700103 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700104
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700105 int32_t nNewFontIndex =
106 GetFontIndex(GetNativeFontName(nCharset), nCharset, TRUE);
107 if (nNewFontIndex >= 0) {
108 if (KnowWord(nNewFontIndex, word))
109 return nNewFontIndex;
110 }
npmea3c3be2016-09-19 07:24:33 -0700111 nNewFontIndex =
112 GetFontIndex("Arial Unicode MS", FXFONT_DEFAULT_CHARSET, FALSE);
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700113 if (nNewFontIndex >= 0) {
114 if (KnowWord(nNewFontIndex, word))
115 return nNewFontIndex;
116 }
117 return -1;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700118}
119
Tom Sepez62a70f92016-03-21 15:00:20 -0700120int32_t CPWL_FontMap::CharCodeFromUnicode(int32_t nFontIndex, uint16_t word) {
thestig8ea3f512016-06-27 11:55:24 -0700121 CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex);
122 if (!pData)
123 return -1;
124
125 if (!pData->pFont)
126 return -1;
127
128 if (pData->pFont->IsUnicodeCompatible())
129 return pData->pFont->CharCodeFromUnicode(word);
130
131 return word < 0xFF ? word : -1;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700132}
133
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700134CFX_ByteString CPWL_FontMap::GetNativeFontName(int32_t nCharset) {
135 // searching native font is slow, so we must save time
136 for (int32_t i = 0, sz = m_aNativeFont.GetSize(); i < sz; i++) {
137 if (CPWL_FontMap_Native* pData = m_aNativeFont.GetAt(i)) {
138 if (pData->nCharset == nCharset)
139 return pData->sFontName;
Tom Sepez2f2ffec2015-07-23 14:42:09 -0700140 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700141 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700142
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700143 CFX_ByteString sNew = GetNativeFont(nCharset);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700144
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700145 if (!sNew.IsEmpty()) {
146 CPWL_FontMap_Native* pNewData = new CPWL_FontMap_Native;
147 pNewData->nCharset = nCharset;
148 pNewData->sFontName = sNew;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700149
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700150 m_aNativeFont.Add(pNewData);
151 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700152
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700153 return sNew;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700154}
155
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700156void CPWL_FontMap::Empty() {
157 {
158 for (int32_t i = 0, sz = m_aData.GetSize(); i < sz; i++)
159 delete m_aData.GetAt(i);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700160
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700161 m_aData.RemoveAll();
162 }
163 {
164 for (int32_t i = 0, sz = m_aNativeFont.GetSize(); i < sz; i++)
165 delete m_aNativeFont.GetAt(i);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700166
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700167 m_aNativeFont.RemoveAll();
168 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700169}
170
Lei Zhangfcfa3b82015-12-24 21:07:28 -0800171void CPWL_FontMap::Initialize() {
npmea3c3be2016-09-19 07:24:33 -0700172 GetFontIndex(kDefaultFontName, FXFONT_ANSI_CHARSET, FALSE);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700173}
Lei Zhang60f507b2015-06-13 00:41:00 -0700174
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700175FX_BOOL CPWL_FontMap::IsStandardFont(const CFX_ByteString& sFontName) {
Wei Li89409932016-03-28 10:33:33 -0700176 for (size_t i = 0; i < FX_ArraySize(g_sDEStandardFontName); ++i) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700177 if (sFontName == g_sDEStandardFontName[i])
178 return TRUE;
179 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700180
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700181 return FALSE;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700182}
183
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700184int32_t CPWL_FontMap::FindFont(const CFX_ByteString& sFontName,
185 int32_t nCharset) {
186 for (int32_t i = 0, sz = m_aData.GetSize(); i < sz; i++) {
187 if (CPWL_FontMap_Data* pData = m_aData.GetAt(i)) {
npmea3c3be2016-09-19 07:24:33 -0700188 if (nCharset == FXFONT_DEFAULT_CHARSET || nCharset == pData->nCharset) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700189 if (sFontName.IsEmpty() || pData->sFontName == sFontName)
190 return i;
191 }
Tom Sepez2f2ffec2015-07-23 14:42:09 -0700192 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700193 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700194
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700195 return -1;
196}
197
198int32_t CPWL_FontMap::GetFontIndex(const CFX_ByteString& sFontName,
199 int32_t nCharset,
200 FX_BOOL bFind) {
201 int32_t nFontIndex = FindFont(EncodeFontAlias(sFontName, nCharset), nCharset);
202 if (nFontIndex >= 0)
203 return nFontIndex;
204
205 CFX_ByteString sAlias;
thestig1cd352e2016-06-07 17:53:06 -0700206 CPDF_Font* pFont = nullptr;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700207 if (bFind)
208 pFont = FindFontSameCharset(sAlias, nCharset);
209
210 if (!pFont) {
211 CFX_ByteString sTemp = sFontName;
212 pFont = AddFontToDocument(GetDocument(), sTemp, nCharset);
213 sAlias = EncodeFontAlias(sTemp, nCharset);
214 }
215 AddedFont(pFont, sAlias);
216 return AddFontData(pFont, sAlias, nCharset);
217}
218
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700219CPDF_Font* CPWL_FontMap::FindFontSameCharset(CFX_ByteString& sFontAlias,
220 int32_t nCharset) {
thestig1cd352e2016-06-07 17:53:06 -0700221 return nullptr;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700222}
223
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700224int32_t CPWL_FontMap::AddFontData(CPDF_Font* pFont,
225 const CFX_ByteString& sFontAlias,
226 int32_t nCharset) {
227 CPWL_FontMap_Data* pNewData = new CPWL_FontMap_Data;
228 pNewData->pFont = pFont;
229 pNewData->sFontName = sFontAlias;
230 pNewData->nCharset = nCharset;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700231
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700232 m_aData.Add(pNewData);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700233
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700234 return m_aData.GetSize() - 1;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700235}
236
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700237void CPWL_FontMap::AddedFont(CPDF_Font* pFont,
238 const CFX_ByteString& sFontAlias) {}
239
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700240CFX_ByteString CPWL_FontMap::GetNativeFont(int32_t nCharset) {
npmea3c3be2016-09-19 07:24:33 -0700241 if (nCharset == FXFONT_DEFAULT_CHARSET)
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700242 nCharset = GetNativeCharset();
243
244 CFX_ByteString sFontName = GetDefaultFontByCharset(nCharset);
dsinclair0e3e8902016-08-24 11:39:24 -0700245 if (m_pSystemHandler->FindNativeTrueTypeFont(sFontName))
246 return sFontName;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700247
dsinclair0e3e8902016-08-24 11:39:24 -0700248 sFontName.clear();
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700249 return sFontName;
250}
251
252CPDF_Font* CPWL_FontMap::AddFontToDocument(CPDF_Document* pDoc,
253 CFX_ByteString& sFontName,
254 uint8_t nCharset) {
255 if (IsStandardFont(sFontName))
256 return AddStandardFont(pDoc, sFontName);
257
258 return AddSystemFont(pDoc, sFontName, nCharset);
259}
260
261CPDF_Font* CPWL_FontMap::AddStandardFont(CPDF_Document* pDoc,
262 CFX_ByteString& sFontName) {
263 if (!pDoc)
thestig1cd352e2016-06-07 17:53:06 -0700264 return nullptr;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700265
thestig1cd352e2016-06-07 17:53:06 -0700266 CPDF_Font* pFont = nullptr;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700267
Lei Zhangc2fb35f2016-01-05 16:46:58 -0800268 if (sFontName == "ZapfDingbats") {
thestig1cd352e2016-06-07 17:53:06 -0700269 pFont = pDoc->AddStandardFont(sFontName.c_str(), nullptr);
Lei Zhangc2fb35f2016-01-05 16:46:58 -0800270 } else {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700271 CPDF_FontEncoding fe(PDFFONT_ENCODING_WINANSI);
tsepezb4c9f3f2016-04-13 15:41:21 -0700272 pFont = pDoc->AddStandardFont(sFontName.c_str(), &fe);
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700273 }
274
275 return pFont;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700276}
277
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700278CPDF_Font* CPWL_FontMap::AddSystemFont(CPDF_Document* pDoc,
279 CFX_ByteString& sFontName,
280 uint8_t nCharset) {
281 if (!pDoc)
thestig1cd352e2016-06-07 17:53:06 -0700282 return nullptr;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700283
284 if (sFontName.IsEmpty())
285 sFontName = GetNativeFont(nCharset);
npmea3c3be2016-09-19 07:24:33 -0700286 if (nCharset == FXFONT_DEFAULT_CHARSET)
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700287 nCharset = GetNativeCharset();
288
dsinclair0e3e8902016-08-24 11:39:24 -0700289 return m_pSystemHandler->AddNativeTrueTypeFontToPDF(pDoc, sFontName,
290 nCharset);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700291}
292
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700293CFX_ByteString CPWL_FontMap::EncodeFontAlias(const CFX_ByteString& sFontName,
294 int32_t nCharset) {
295 CFX_ByteString sPostfix;
296 sPostfix.Format("_%02X", nCharset);
297 return EncodeFontAlias(sFontName) + sPostfix;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700298}
299
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700300CFX_ByteString CPWL_FontMap::EncodeFontAlias(const CFX_ByteString& sFontName) {
301 CFX_ByteString sRet = sFontName;
302 sRet.Remove(' ');
303 return sRet;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700304}
305
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700306const CPWL_FontMap_Data* CPWL_FontMap::GetFontMapData(int32_t nIndex) const {
307 if (nIndex >= 0 && nIndex < m_aData.GetSize()) {
308 return m_aData.GetAt(nIndex);
309 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700310
thestig1cd352e2016-06-07 17:53:06 -0700311 return nullptr;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700312}
313
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700314int32_t CPWL_FontMap::GetNativeCharset() {
npmea3c3be2016-09-19 07:24:33 -0700315 uint8_t nCharset = FXFONT_ANSI_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700316 int32_t iCodePage = FXSYS_GetACP();
317 switch (iCodePage) {
318 case 932: // Japan
npmea3c3be2016-09-19 07:24:33 -0700319 nCharset = FXFONT_SHIFTJIS_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700320 break;
321 case 936: // Chinese (PRC, Singapore)
npmea3c3be2016-09-19 07:24:33 -0700322 nCharset = FXFONT_GB2312_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700323 break;
324 case 950: // Chinese (Taiwan; Hong Kong SAR, PRC)
npmea3c3be2016-09-19 07:24:33 -0700325 nCharset = FXFONT_GB2312_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700326 break;
327 case 1252: // Windows 3.1 Latin 1 (US, Western Europe)
npmea3c3be2016-09-19 07:24:33 -0700328 nCharset = FXFONT_ANSI_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700329 break;
330 case 874: // Thai
npmea3c3be2016-09-19 07:24:33 -0700331 nCharset = FXFONT_THAI_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700332 break;
333 case 949: // Korean
npmea3c3be2016-09-19 07:24:33 -0700334 nCharset = FXFONT_HANGUL_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700335 break;
336 case 1200: // Unicode (BMP of ISO 10646)
npmea3c3be2016-09-19 07:24:33 -0700337 nCharset = FXFONT_ANSI_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700338 break;
339 case 1250: // Windows 3.1 Eastern European
npmea3c3be2016-09-19 07:24:33 -0700340 nCharset = FXFONT_EASTEUROPE_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700341 break;
342 case 1251: // Windows 3.1 Cyrillic
npmea3c3be2016-09-19 07:24:33 -0700343 nCharset = FXFONT_RUSSIAN_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700344 break;
345 case 1253: // Windows 3.1 Greek
npmea3c3be2016-09-19 07:24:33 -0700346 nCharset = FXFONT_GREEK_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700347 break;
348 case 1254: // Windows 3.1 Turkish
npmea3c3be2016-09-19 07:24:33 -0700349 nCharset = FXFONT_TURKISH_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700350 break;
351 case 1255: // Hebrew
npmea3c3be2016-09-19 07:24:33 -0700352 nCharset = FXFONT_HEBREW_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700353 break;
354 case 1256: // Arabic
npmea3c3be2016-09-19 07:24:33 -0700355 nCharset = FXFONT_ARABIC_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700356 break;
357 case 1257: // Baltic
npmea3c3be2016-09-19 07:24:33 -0700358 nCharset = FXFONT_BALTIC_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700359 break;
360 case 1258: // Vietnamese
npmea3c3be2016-09-19 07:24:33 -0700361 nCharset = FXFONT_VIETNAMESE_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700362 break;
363 case 1361: // Korean(Johab)
npmea3c3be2016-09-19 07:24:33 -0700364 nCharset = FXFONT_JOHAB_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700365 break;
366 }
367 return nCharset;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700368}
369
weili2d5b0202016-08-03 11:06:49 -0700370const FPDF_CharsetFontMap CPWL_FontMap::defaultTTFMap[] = {
npmea3c3be2016-09-19 07:24:33 -0700371 {FXFONT_ANSI_CHARSET, "Helvetica"},
372 {FXFONT_GB2312_CHARSET, "SimSun"},
373 {FXFONT_CHINESEBIG5_CHARSET, "MingLiU"},
374 {FXFONT_SHIFTJIS_CHARSET, "MS Gothic"},
375 {FXFONT_HANGUL_CHARSET, "Batang"},
376 {FXFONT_RUSSIAN_CHARSET, "Arial"},
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700377#if _FXM_PLATFORM_ == _FXM_PLATFORM_LINUX_ || \
378 _FXM_PLATFORM_ == _FXM_PLATFORM_APPLE_
npmea3c3be2016-09-19 07:24:33 -0700379 {FXFONT_EASTEUROPE_CHARSET, "Arial"},
Bo Xudbd4c062014-05-29 11:32:56 -0700380#else
npmea3c3be2016-09-19 07:24:33 -0700381 {FXFONT_EASTEUROPE_CHARSET, "Tahoma"},
Bo Xudbd4c062014-05-29 11:32:56 -0700382#endif
npmea3c3be2016-09-19 07:24:33 -0700383 {FXFONT_ARABIC_CHARSET, "Arial"},
384 {-1, nullptr}};
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700385
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700386CFX_ByteString CPWL_FontMap::GetDefaultFontByCharset(int32_t nCharset) {
387 int i = 0;
388 while (defaultTTFMap[i].charset != -1) {
389 if (nCharset == defaultTTFMap[i].charset)
390 return defaultTTFMap[i].fontname;
391 ++i;
392 }
393 return "";
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700394}
395
Tom Sepez62a70f92016-03-21 15:00:20 -0700396int32_t CPWL_FontMap::CharSetFromUnicode(uint16_t word, int32_t nOldCharset) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700397 // to avoid CJK Font to show ASCII
398 if (word < 0x7F)
npmea3c3be2016-09-19 07:24:33 -0700399 return FXFONT_ANSI_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700400 // follow the old charset
npmea3c3be2016-09-19 07:24:33 -0700401 if (nOldCharset != FXFONT_DEFAULT_CHARSET)
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700402 return nOldCharset;
403
404 // find new charset
405 if ((word >= 0x4E00 && word <= 0x9FA5) ||
406 (word >= 0xE7C7 && word <= 0xE7F3) ||
407 (word >= 0x3000 && word <= 0x303F) ||
408 (word >= 0x2000 && word <= 0x206F)) {
npmea3c3be2016-09-19 07:24:33 -0700409 return FXFONT_GB2312_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700410 }
411
412 if (((word >= 0x3040) && (word <= 0x309F)) ||
413 ((word >= 0x30A0) && (word <= 0x30FF)) ||
414 ((word >= 0x31F0) && (word <= 0x31FF)) ||
415 ((word >= 0xFF00) && (word <= 0xFFEF))) {
npmea3c3be2016-09-19 07:24:33 -0700416 return FXFONT_SHIFTJIS_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700417 }
418
419 if (((word >= 0xAC00) && (word <= 0xD7AF)) ||
420 ((word >= 0x1100) && (word <= 0x11FF)) ||
421 ((word >= 0x3130) && (word <= 0x318F))) {
npmea3c3be2016-09-19 07:24:33 -0700422 return FXFONT_HANGUL_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700423 }
424
425 if (word >= 0x0E00 && word <= 0x0E7F)
npmea3c3be2016-09-19 07:24:33 -0700426 return FXFONT_THAI_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700427
428 if ((word >= 0x0370 && word <= 0x03FF) || (word >= 0x1F00 && word <= 0x1FFF))
npmea3c3be2016-09-19 07:24:33 -0700429 return FXFONT_GREEK_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700430
431 if ((word >= 0x0600 && word <= 0x06FF) || (word >= 0xFB50 && word <= 0xFEFC))
npmea3c3be2016-09-19 07:24:33 -0700432 return FXFONT_ARABIC_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700433
434 if (word >= 0x0590 && word <= 0x05FF)
npmea3c3be2016-09-19 07:24:33 -0700435 return FXFONT_HEBREW_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700436
437 if (word >= 0x0400 && word <= 0x04FF)
npmea3c3be2016-09-19 07:24:33 -0700438 return FXFONT_RUSSIAN_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700439
440 if (word >= 0x0100 && word <= 0x024F)
npmea3c3be2016-09-19 07:24:33 -0700441 return FXFONT_EASTEUROPE_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700442
443 if (word >= 0x1E00 && word <= 0x1EFF)
npmea3c3be2016-09-19 07:24:33 -0700444 return FXFONT_VIETNAMESE_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700445
npmea3c3be2016-09-19 07:24:33 -0700446 return FXFONT_ANSI_CHARSET;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700447}