blob: 131334ac22b0e401a7069e98b58317d074d0b562 [file] [log] [blame]
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -07001// Copyright 2014 PDFium Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
Lei Zhang60f507b2015-06-13 00:41:00 -07004
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -07005// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
6
dan sinclair89e904b2016-03-23 19:29:15 -04007#include "fpdfsdk/pdfwindow/PWL_FontMap.h"
Lei Zhangc2fb35f2016-01-05 16:46:58 -08008
dan sinclair61b2fc72016-03-23 19:21:44 -04009#include "core/fpdfapi/fpdf_font/include/cpdf_font.h"
10#include "core/fpdfapi/fpdf_font/include/cpdf_fontencoding.h"
Dan Sinclairaa403d32016-03-15 14:57:22 -040011#include "core/fpdfapi/fpdf_parser/include/cpdf_document.h"
dsinclaircedaa552016-08-24 11:12:19 -070012#include "core/fpdfapi/fpdf_parser/include/cpdf_parser.h"
Dan Sinclairaa403d32016-03-15 14:57:22 -040013#include "core/fpdfapi/include/cpdf_modulemgr.h"
dsinclairc7a73492016-04-05 12:01:42 -070014#include "core/fpdfdoc/include/ipvt_fontmap.h"
dan sinclair89e904b2016-03-23 19:29:15 -040015#include "fpdfsdk/pdfwindow/PWL_Wnd.h"
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070016
Lei Zhang1b976642016-01-08 14:24:37 -080017namespace {
18
19const char kDefaultFontName[] = "Helvetica";
20
21const char* const g_sDEStandardFontName[] = {"Courier",
22 "Courier-Bold",
23 "Courier-BoldOblique",
24 "Courier-Oblique",
25 "Helvetica",
26 "Helvetica-Bold",
27 "Helvetica-BoldOblique",
28 "Helvetica-Oblique",
29 "Times-Roman",
30 "Times-Bold",
31 "Times-Italic",
32 "Times-BoldItalic",
33 "Symbol",
34 "ZapfDingbats"};
35
36} // namespace
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070037
dsinclairb9590102016-04-27 06:38:59 -070038CPWL_FontMap::CPWL_FontMap(CFX_SystemHandler* pSystemHandler)
weili2d5b0202016-08-03 11:06:49 -070039 : m_pSystemHandler(pSystemHandler) {
Lei Zhang96660d62015-12-14 18:27:25 -080040 ASSERT(m_pSystemHandler);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070041}
42
Nico Weber9d8ec5a2015-08-04 13:00:21 -070043CPWL_FontMap::~CPWL_FontMap() {
Nico Weber9d8ec5a2015-08-04 13:00:21 -070044 Empty();
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070045}
46
dsinclairb9590102016-04-27 06:38:59 -070047void CPWL_FontMap::SetSystemHandler(CFX_SystemHandler* pSystemHandler) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -070048 m_pSystemHandler = pSystemHandler;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070049}
50
Nico Weber9d8ec5a2015-08-04 13:00:21 -070051CPDF_Document* CPWL_FontMap::GetDocument() {
52 if (!m_pPDFDoc) {
53 if (CPDF_ModuleMgr::Get()) {
dsinclaircedaa552016-08-24 11:12:19 -070054 m_pPDFDoc.reset(new CPDF_Document(std::unique_ptr<CPDF_Parser>()));
Nico Weber9d8ec5a2015-08-04 13:00:21 -070055 m_pPDFDoc->CreateNewDoc();
56 }
57 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070058
weili2d5b0202016-08-03 11:06:49 -070059 return m_pPDFDoc.get();
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070060}
61
Nico Weber9d8ec5a2015-08-04 13:00:21 -070062CPDF_Font* CPWL_FontMap::GetPDFFont(int32_t nFontIndex) {
63 if (nFontIndex >= 0 && nFontIndex < m_aData.GetSize()) {
64 if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) {
65 return pData->pFont;
Tom Sepez2f2ffec2015-07-23 14:42:09 -070066 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -070067 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070068
thestig1cd352e2016-06-07 17:53:06 -070069 return nullptr;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070070}
71
Nico Weber9d8ec5a2015-08-04 13:00:21 -070072CFX_ByteString CPWL_FontMap::GetPDFFontAlias(int32_t nFontIndex) {
73 if (nFontIndex >= 0 && nFontIndex < m_aData.GetSize()) {
74 if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) {
75 return pData->sFontName;
Tom Sepez2f2ffec2015-07-23 14:42:09 -070076 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -070077 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070078
Nico Weber9d8ec5a2015-08-04 13:00:21 -070079 return "";
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070080}
81
Tom Sepez62a70f92016-03-21 15:00:20 -070082FX_BOOL CPWL_FontMap::KnowWord(int32_t nFontIndex, uint16_t word) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -070083 if (nFontIndex >= 0 && nFontIndex < m_aData.GetSize()) {
84 if (m_aData.GetAt(nFontIndex)) {
85 return CharCodeFromUnicode(nFontIndex, word) >= 0;
Tom Sepez2f2ffec2015-07-23 14:42:09 -070086 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -070087 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070088
Nico Weber9d8ec5a2015-08-04 13:00:21 -070089 return FALSE;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -070090}
91
Tom Sepez62a70f92016-03-21 15:00:20 -070092int32_t CPWL_FontMap::GetWordFontIndex(uint16_t word,
Nico Weber9d8ec5a2015-08-04 13:00:21 -070093 int32_t nCharset,
94 int32_t nFontIndex) {
95 if (nFontIndex > 0) {
96 if (KnowWord(nFontIndex, word))
97 return nFontIndex;
98 } else {
99 if (const CPWL_FontMap_Data* pData = GetFontMapData(0)) {
100 if (nCharset == DEFAULT_CHARSET || pData->nCharset == SYMBOL_CHARSET ||
101 nCharset == pData->nCharset) {
102 if (KnowWord(0, word))
103 return 0;
104 }
Tom Sepez2f2ffec2015-07-23 14:42:09 -0700105 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700106 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700107
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700108 int32_t nNewFontIndex =
109 GetFontIndex(GetNativeFontName(nCharset), nCharset, TRUE);
110 if (nNewFontIndex >= 0) {
111 if (KnowWord(nNewFontIndex, word))
112 return nNewFontIndex;
113 }
114 nNewFontIndex = GetFontIndex("Arial Unicode MS", DEFAULT_CHARSET, FALSE);
115 if (nNewFontIndex >= 0) {
116 if (KnowWord(nNewFontIndex, word))
117 return nNewFontIndex;
118 }
119 return -1;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700120}
121
Tom Sepez62a70f92016-03-21 15:00:20 -0700122int32_t CPWL_FontMap::CharCodeFromUnicode(int32_t nFontIndex, uint16_t word) {
thestig8ea3f512016-06-27 11:55:24 -0700123 CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex);
124 if (!pData)
125 return -1;
126
127 if (!pData->pFont)
128 return -1;
129
130 if (pData->pFont->IsUnicodeCompatible())
131 return pData->pFont->CharCodeFromUnicode(word);
132
133 return word < 0xFF ? word : -1;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700134}
135
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700136CFX_ByteString CPWL_FontMap::GetNativeFontName(int32_t nCharset) {
137 // searching native font is slow, so we must save time
138 for (int32_t i = 0, sz = m_aNativeFont.GetSize(); i < sz; i++) {
139 if (CPWL_FontMap_Native* pData = m_aNativeFont.GetAt(i)) {
140 if (pData->nCharset == nCharset)
141 return pData->sFontName;
Tom Sepez2f2ffec2015-07-23 14:42:09 -0700142 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700143 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700144
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700145 CFX_ByteString sNew = GetNativeFont(nCharset);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700146
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700147 if (!sNew.IsEmpty()) {
148 CPWL_FontMap_Native* pNewData = new CPWL_FontMap_Native;
149 pNewData->nCharset = nCharset;
150 pNewData->sFontName = sNew;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700151
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700152 m_aNativeFont.Add(pNewData);
153 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700154
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700155 return sNew;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700156}
157
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700158void CPWL_FontMap::Empty() {
159 {
160 for (int32_t i = 0, sz = m_aData.GetSize(); i < sz; i++)
161 delete m_aData.GetAt(i);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700162
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700163 m_aData.RemoveAll();
164 }
165 {
166 for (int32_t i = 0, sz = m_aNativeFont.GetSize(); i < sz; i++)
167 delete m_aNativeFont.GetAt(i);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700168
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700169 m_aNativeFont.RemoveAll();
170 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700171}
172
Lei Zhangfcfa3b82015-12-24 21:07:28 -0800173void CPWL_FontMap::Initialize() {
Lei Zhang1b976642016-01-08 14:24:37 -0800174 GetFontIndex(kDefaultFontName, ANSI_CHARSET, FALSE);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700175}
Lei Zhang60f507b2015-06-13 00:41:00 -0700176
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700177FX_BOOL CPWL_FontMap::IsStandardFont(const CFX_ByteString& sFontName) {
Wei Li89409932016-03-28 10:33:33 -0700178 for (size_t i = 0; i < FX_ArraySize(g_sDEStandardFontName); ++i) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700179 if (sFontName == g_sDEStandardFontName[i])
180 return TRUE;
181 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700182
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700183 return FALSE;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700184}
185
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700186int32_t CPWL_FontMap::FindFont(const CFX_ByteString& sFontName,
187 int32_t nCharset) {
188 for (int32_t i = 0, sz = m_aData.GetSize(); i < sz; i++) {
189 if (CPWL_FontMap_Data* pData = m_aData.GetAt(i)) {
190 if (nCharset == DEFAULT_CHARSET || nCharset == pData->nCharset) {
191 if (sFontName.IsEmpty() || pData->sFontName == sFontName)
192 return i;
193 }
Tom Sepez2f2ffec2015-07-23 14:42:09 -0700194 }
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700195 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700196
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700197 return -1;
198}
199
200int32_t CPWL_FontMap::GetFontIndex(const CFX_ByteString& sFontName,
201 int32_t nCharset,
202 FX_BOOL bFind) {
203 int32_t nFontIndex = FindFont(EncodeFontAlias(sFontName, nCharset), nCharset);
204 if (nFontIndex >= 0)
205 return nFontIndex;
206
207 CFX_ByteString sAlias;
thestig1cd352e2016-06-07 17:53:06 -0700208 CPDF_Font* pFont = nullptr;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700209 if (bFind)
210 pFont = FindFontSameCharset(sAlias, nCharset);
211
212 if (!pFont) {
213 CFX_ByteString sTemp = sFontName;
214 pFont = AddFontToDocument(GetDocument(), sTemp, nCharset);
215 sAlias = EncodeFontAlias(sTemp, nCharset);
216 }
217 AddedFont(pFont, sAlias);
218 return AddFontData(pFont, sAlias, nCharset);
219}
220
Tom Sepez62a70f92016-03-21 15:00:20 -0700221int32_t CPWL_FontMap::GetPWLFontIndex(uint16_t word, int32_t nCharset) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700222 int32_t nFind = -1;
223
224 for (int32_t i = 0, sz = m_aData.GetSize(); i < sz; i++) {
225 if (CPWL_FontMap_Data* pData = m_aData.GetAt(i)) {
226 if (pData->nCharset == nCharset) {
227 nFind = i;
228 break;
229 }
230 }
231 }
232
233 CPDF_Font* pNewFont = GetPDFFont(nFind);
234
235 if (!pNewFont)
Tom Sepez2f2ffec2015-07-23 14:42:09 -0700236 return -1;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700237
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700238 CFX_ByteString sAlias = EncodeFontAlias("Arial_Chrome", nCharset);
239 AddedFont(pNewFont, sAlias);
240
241 return AddFontData(pNewFont, sAlias, nCharset);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700242}
243
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700244CPDF_Font* CPWL_FontMap::FindFontSameCharset(CFX_ByteString& sFontAlias,
245 int32_t nCharset) {
thestig1cd352e2016-06-07 17:53:06 -0700246 return nullptr;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700247}
248
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700249int32_t CPWL_FontMap::AddFontData(CPDF_Font* pFont,
250 const CFX_ByteString& sFontAlias,
251 int32_t nCharset) {
252 CPWL_FontMap_Data* pNewData = new CPWL_FontMap_Data;
253 pNewData->pFont = pFont;
254 pNewData->sFontName = sFontAlias;
255 pNewData->nCharset = nCharset;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700256
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700257 m_aData.Add(pNewData);
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700258
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700259 return m_aData.GetSize() - 1;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700260}
261
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700262void CPWL_FontMap::AddedFont(CPDF_Font* pFont,
263 const CFX_ByteString& sFontAlias) {}
264
265CFX_ByteString CPWL_FontMap::GetFontName(int32_t nFontIndex) {
266 if (nFontIndex >= 0 && nFontIndex < m_aData.GetSize()) {
267 if (CPWL_FontMap_Data* pData = m_aData.GetAt(nFontIndex)) {
268 return pData->sFontName;
269 }
270 }
271
272 return "";
273}
274
275CFX_ByteString CPWL_FontMap::GetNativeFont(int32_t nCharset) {
276 if (nCharset == DEFAULT_CHARSET)
277 nCharset = GetNativeCharset();
278
279 CFX_ByteString sFontName = GetDefaultFontByCharset(nCharset);
280 if (m_pSystemHandler) {
thestig907a5222016-06-21 14:38:27 -0700281 if (m_pSystemHandler->FindNativeTrueTypeFont(sFontName))
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700282 return sFontName;
283
thestig907a5222016-06-21 14:38:27 -0700284 sFontName.clear();
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700285 }
286 return sFontName;
287}
288
289CPDF_Font* CPWL_FontMap::AddFontToDocument(CPDF_Document* pDoc,
290 CFX_ByteString& sFontName,
291 uint8_t nCharset) {
292 if (IsStandardFont(sFontName))
293 return AddStandardFont(pDoc, sFontName);
294
295 return AddSystemFont(pDoc, sFontName, nCharset);
296}
297
298CPDF_Font* CPWL_FontMap::AddStandardFont(CPDF_Document* pDoc,
299 CFX_ByteString& sFontName) {
300 if (!pDoc)
thestig1cd352e2016-06-07 17:53:06 -0700301 return nullptr;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700302
thestig1cd352e2016-06-07 17:53:06 -0700303 CPDF_Font* pFont = nullptr;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700304
Lei Zhangc2fb35f2016-01-05 16:46:58 -0800305 if (sFontName == "ZapfDingbats") {
thestig1cd352e2016-06-07 17:53:06 -0700306 pFont = pDoc->AddStandardFont(sFontName.c_str(), nullptr);
Lei Zhangc2fb35f2016-01-05 16:46:58 -0800307 } else {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700308 CPDF_FontEncoding fe(PDFFONT_ENCODING_WINANSI);
tsepezb4c9f3f2016-04-13 15:41:21 -0700309 pFont = pDoc->AddStandardFont(sFontName.c_str(), &fe);
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700310 }
311
312 return pFont;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700313}
314
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700315CPDF_Font* CPWL_FontMap::AddSystemFont(CPDF_Document* pDoc,
316 CFX_ByteString& sFontName,
317 uint8_t nCharset) {
318 if (!pDoc)
thestig1cd352e2016-06-07 17:53:06 -0700319 return nullptr;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700320
321 if (sFontName.IsEmpty())
322 sFontName = GetNativeFont(nCharset);
323 if (nCharset == DEFAULT_CHARSET)
324 nCharset = GetNativeCharset();
325
326 if (m_pSystemHandler)
327 return m_pSystemHandler->AddNativeTrueTypeFontToPDF(pDoc, sFontName,
328 nCharset);
329
thestig1cd352e2016-06-07 17:53:06 -0700330 return nullptr;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700331}
332
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700333CFX_ByteString CPWL_FontMap::EncodeFontAlias(const CFX_ByteString& sFontName,
334 int32_t nCharset) {
335 CFX_ByteString sPostfix;
336 sPostfix.Format("_%02X", nCharset);
337 return EncodeFontAlias(sFontName) + sPostfix;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700338}
339
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700340CFX_ByteString CPWL_FontMap::EncodeFontAlias(const CFX_ByteString& sFontName) {
341 CFX_ByteString sRet = sFontName;
342 sRet.Remove(' ');
343 return sRet;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700344}
345
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700346int32_t CPWL_FontMap::GetFontMapCount() const {
347 return m_aData.GetSize();
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700348}
349
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700350const CPWL_FontMap_Data* CPWL_FontMap::GetFontMapData(int32_t nIndex) const {
351 if (nIndex >= 0 && nIndex < m_aData.GetSize()) {
352 return m_aData.GetAt(nIndex);
353 }
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700354
thestig1cd352e2016-06-07 17:53:06 -0700355 return nullptr;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700356}
357
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700358int32_t CPWL_FontMap::GetNativeCharset() {
359 uint8_t nCharset = ANSI_CHARSET;
360 int32_t iCodePage = FXSYS_GetACP();
361 switch (iCodePage) {
362 case 932: // Japan
363 nCharset = SHIFTJIS_CHARSET;
364 break;
365 case 936: // Chinese (PRC, Singapore)
366 nCharset = GB2312_CHARSET;
367 break;
368 case 950: // Chinese (Taiwan; Hong Kong SAR, PRC)
369 nCharset = GB2312_CHARSET;
370 break;
371 case 1252: // Windows 3.1 Latin 1 (US, Western Europe)
372 nCharset = ANSI_CHARSET;
373 break;
374 case 874: // Thai
375 nCharset = THAI_CHARSET;
376 break;
377 case 949: // Korean
378 nCharset = HANGUL_CHARSET;
379 break;
380 case 1200: // Unicode (BMP of ISO 10646)
381 nCharset = ANSI_CHARSET;
382 break;
383 case 1250: // Windows 3.1 Eastern European
384 nCharset = EASTEUROPE_CHARSET;
385 break;
386 case 1251: // Windows 3.1 Cyrillic
387 nCharset = RUSSIAN_CHARSET;
388 break;
389 case 1253: // Windows 3.1 Greek
390 nCharset = GREEK_CHARSET;
391 break;
392 case 1254: // Windows 3.1 Turkish
393 nCharset = TURKISH_CHARSET;
394 break;
395 case 1255: // Hebrew
396 nCharset = HEBREW_CHARSET;
397 break;
398 case 1256: // Arabic
399 nCharset = ARABIC_CHARSET;
400 break;
401 case 1257: // Baltic
402 nCharset = BALTIC_CHARSET;
403 break;
404 case 1258: // Vietnamese
405 nCharset = VIETNAMESE_CHARSET;
406 break;
407 case 1361: // Korean(Johab)
408 nCharset = JOHAB_CHARSET;
409 break;
410 }
411 return nCharset;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700412}
413
weili2d5b0202016-08-03 11:06:49 -0700414const FPDF_CharsetFontMap CPWL_FontMap::defaultTTFMap[] = {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700415 {ANSI_CHARSET, "Helvetica"}, {GB2312_CHARSET, "SimSun"},
416 {CHINESEBIG5_CHARSET, "MingLiU"}, {SHIFTJIS_CHARSET, "MS Gothic"},
417 {HANGUL_CHARSET, "Batang"}, {RUSSIAN_CHARSET, "Arial"},
418#if _FXM_PLATFORM_ == _FXM_PLATFORM_LINUX_ || \
419 _FXM_PLATFORM_ == _FXM_PLATFORM_APPLE_
420 {EASTEUROPE_CHARSET, "Arial"},
Bo Xudbd4c062014-05-29 11:32:56 -0700421#else
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700422 {EASTEUROPE_CHARSET, "Tahoma"},
Bo Xudbd4c062014-05-29 11:32:56 -0700423#endif
thestig1cd352e2016-06-07 17:53:06 -0700424 {ARABIC_CHARSET, "Arial"}, {-1, nullptr}};
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700425
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700426CFX_ByteString CPWL_FontMap::GetDefaultFontByCharset(int32_t nCharset) {
427 int i = 0;
428 while (defaultTTFMap[i].charset != -1) {
429 if (nCharset == defaultTTFMap[i].charset)
430 return defaultTTFMap[i].fontname;
431 ++i;
432 }
433 return "";
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700434}
435
Tom Sepez62a70f92016-03-21 15:00:20 -0700436int32_t CPWL_FontMap::CharSetFromUnicode(uint16_t word, int32_t nOldCharset) {
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700437 // to avoid CJK Font to show ASCII
438 if (word < 0x7F)
Tom Sepez2f2ffec2015-07-23 14:42:09 -0700439 return ANSI_CHARSET;
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700440 // follow the old charset
441 if (nOldCharset != DEFAULT_CHARSET)
442 return nOldCharset;
443
444 // find new charset
445 if ((word >= 0x4E00 && word <= 0x9FA5) ||
446 (word >= 0xE7C7 && word <= 0xE7F3) ||
447 (word >= 0x3000 && word <= 0x303F) ||
448 (word >= 0x2000 && word <= 0x206F)) {
449 return GB2312_CHARSET;
450 }
451
452 if (((word >= 0x3040) && (word <= 0x309F)) ||
453 ((word >= 0x30A0) && (word <= 0x30FF)) ||
454 ((word >= 0x31F0) && (word <= 0x31FF)) ||
455 ((word >= 0xFF00) && (word <= 0xFFEF))) {
456 return SHIFTJIS_CHARSET;
457 }
458
459 if (((word >= 0xAC00) && (word <= 0xD7AF)) ||
460 ((word >= 0x1100) && (word <= 0x11FF)) ||
461 ((word >= 0x3130) && (word <= 0x318F))) {
462 return HANGUL_CHARSET;
463 }
464
465 if (word >= 0x0E00 && word <= 0x0E7F)
466 return THAI_CHARSET;
467
468 if ((word >= 0x0370 && word <= 0x03FF) || (word >= 0x1F00 && word <= 0x1FFF))
469 return GREEK_CHARSET;
470
471 if ((word >= 0x0600 && word <= 0x06FF) || (word >= 0xFB50 && word <= 0xFEFC))
472 return ARABIC_CHARSET;
473
474 if (word >= 0x0590 && word <= 0x05FF)
475 return HEBREW_CHARSET;
476
477 if (word >= 0x0400 && word <= 0x04FF)
478 return RUSSIAN_CHARSET;
479
480 if (word >= 0x0100 && word <= 0x024F)
481 return EASTEUROPE_CHARSET;
482
483 if (word >= 0x1E00 && word <= 0x1EFF)
484 return VIETNAMESE_CHARSET;
485
486 return ANSI_CHARSET;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700487}
488
dsinclairb9590102016-04-27 06:38:59 -0700489CPWL_DocFontMap::CPWL_DocFontMap(CFX_SystemHandler* pSystemHandler,
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700490 CPDF_Document* pAttachedDoc)
491 : CPWL_FontMap(pSystemHandler), m_pAttachedDoc(pAttachedDoc) {}
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700492
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700493CPWL_DocFontMap::~CPWL_DocFontMap() {}
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700494
Nico Weber9d8ec5a2015-08-04 13:00:21 -0700495CPDF_Document* CPWL_DocFontMap::GetDocument() {
496 return m_pAttachedDoc;
John Abd-El-Malek3f3b45c2014-05-23 17:28:10 -0700497}