blob: c53e60729f54f3f62c75346a5035b1d2fea4ef58 [file] [log] [blame]
Selim Gurun30d4e1f2013-08-15 12:46:15 -07001/*
2 * Copyright 2011 Google Inc. All Rights Reserved.
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "subsetter_impl.h"
18
19#include <string.h>
20
21#include <algorithm>
22#include <iterator>
23#include <map>
24#include <set>
25
26#include "sfntly/table/bitmap/eblc_table.h"
27#include "sfntly/table/bitmap/ebdt_table.h"
28#include "sfntly/table/bitmap/index_sub_table.h"
29#include "sfntly/table/bitmap/index_sub_table_format1.h"
30#include "sfntly/table/bitmap/index_sub_table_format2.h"
31#include "sfntly/table/bitmap/index_sub_table_format3.h"
32#include "sfntly/table/bitmap/index_sub_table_format4.h"
33#include "sfntly/table/bitmap/index_sub_table_format5.h"
34#include "sfntly/table/core/name_table.h"
35#include "sfntly/tag.h"
36#include "sfntly/data/memory_byte_array.h"
37#include "sfntly/port/memory_input_stream.h"
38#include "sfntly/port/memory_output_stream.h"
39
40#if defined U_USING_ICU_NAMESPACE
41 U_NAMESPACE_USE
42#endif
43
44namespace {
45
46using namespace sfntly;
47
// Bitmap subsetting is only attempted when the combined size of the bitmap
// data and location tables is at least this many bytes (16KB).
static const int BITMAP_SIZE_THRESHOLD = 16 * 1024;
50
51void ConstructName(UChar* name_part, UnicodeString* name, int32_t name_id) {
52 switch (name_id) {
53 case NameId::kFullFontName:
54 *name = name_part;
55 break;
56 case NameId::kFontFamilyName:
57 case NameId::kPreferredFamily:
58 case NameId::kWWSFamilyName: {
59 UnicodeString original = *name;
60 *name = name_part;
61 *name += original;
62 break;
63 }
64 case NameId::kFontSubfamilyName:
65 case NameId::kPreferredSubfamily:
66 case NameId::kWWSSubfamilyName:
67 *name += name_part;
68 break;
69 default:
70 // This name part is not used to construct font name (e.g. copyright).
71 // Simply ignore it.
72 break;
73 }
74}
75
76int32_t HashCode(int32_t platform_id, int32_t encoding_id, int32_t language_id,
77 int32_t name_id) {
78 int32_t result = platform_id << 24 | encoding_id << 16 | language_id << 8;
79 if (name_id == NameId::kFullFontName) {
80 result |= 0xff;
81 } else if (name_id == NameId::kPreferredFamily ||
82 name_id == NameId::kPreferredSubfamily) {
83 result |= 0xf;
84 } else if (name_id == NameId::kWWSFamilyName ||
85 name_id == NameId::kWWSSubfamilyName) {
86 result |= 1;
87 }
88 return result;
89}
90
91bool HasName(const char* font_name, Font* font) {
92 UnicodeString font_string = UnicodeString::fromUTF8(font_name);
93 if (font_string.isEmpty())
94 return false;
95 UnicodeString regular_suffix = UnicodeString::fromUTF8(" Regular");
96 UnicodeString alt_font_string = font_string;
97 alt_font_string += regular_suffix;
98
99 typedef std::map<int32_t, UnicodeString> NameMap;
100 NameMap names;
101 NameTablePtr name_table = down_cast<NameTable*>(font->GetTable(Tag::name));
102 if (name_table == NULL) {
103 return false;
104 }
105
106 for (int32_t i = 0; i < name_table->NameCount(); ++i) {
107 switch (name_table->NameId(i)) {
108 case NameId::kFontFamilyName:
109 case NameId::kFontSubfamilyName:
110 case NameId::kFullFontName:
111 case NameId::kPreferredFamily:
112 case NameId::kPreferredSubfamily:
113 case NameId::kWWSFamilyName:
114 case NameId::kWWSSubfamilyName: {
115 UChar* name_part = name_table->Name(i);
116 if (name_part == NULL) {
117 continue;
118 }
119 int32_t hash_code = HashCode(name_table->PlatformId(i),
120 name_table->EncodingId(i),
121 name_table->LanguageId(i),
122 name_table->NameId(i));
123 ConstructName(name_part, &(names[hash_code]), name_table->NameId(i));
124 delete[] name_part;
125 break;
126 }
127 default:
128 break;
129 }
130 }
131
132 if (!names.empty()) {
133 for (NameMap::iterator i = names.begin(), e = names.end(); i != e; ++i) {
134 if (i->second.caseCompare(font_string, 0) == 0 ||
135 i->second.caseCompare(alt_font_string, 0) == 0) {
136 return true;
137 }
138 }
139 }
140 return false;
141}
142
143Font* FindFont(const char* font_name, const FontArray& font_array) {
144 if (font_array.empty() || font_array[0] == NULL) {
145 return NULL;
146 }
147
148 if (font_name && strlen(font_name)) {
149 for (FontArray::const_iterator i = font_array.begin(), e = font_array.end();
150 i != e; ++i) {
151 if (HasName(font_name, i->p_)) {
152 return i->p_;
153 }
154 }
155 }
156
157 return font_array[0].p_;
158}
159
160bool ResolveCompositeGlyphs(GlyphTable* glyph_table,
161 LocaTable* loca_table,
162 const unsigned int* glyph_ids,
163 size_t glyph_count,
164 IntegerSet* glyph_id_processed) {
165 if (glyph_table == NULL || loca_table == NULL ||
166 glyph_ids == NULL || glyph_count == 0 || glyph_id_processed == NULL) {
167 return false;
168 }
169
170 // Sort and uniquify glyph ids.
171 IntegerSet glyph_id_remaining;
172 glyph_id_remaining.insert(0); // Always include glyph id 0.
173 for (size_t i = 0; i < glyph_count; ++i) {
174 glyph_id_remaining.insert(glyph_ids[i]);
175 }
176
177 // Identify if any given glyph id maps to a composite glyph. If so, include
178 // the glyphs referenced by that composite glyph.
179 while (!glyph_id_remaining.empty()) {
180 IntegerSet comp_glyph_id;
181 for (IntegerSet::iterator i = glyph_id_remaining.begin(),
182 e = glyph_id_remaining.end(); i != e; ++i) {
183 if (*i < 0 || *i >= loca_table->num_glyphs()) {
184 // Invalid glyph id, ignore.
185 continue;
186 }
187
188 int32_t length = loca_table->GlyphLength(*i);
189 if (length == 0) {
190 // Empty glyph, ignore.
191 continue;
192 }
193 int32_t offset = loca_table->GlyphOffset(*i);
194
195 GlyphPtr glyph;
196 glyph.Attach(glyph_table->GetGlyph(offset, length));
197 if (glyph == NULL) {
198 // Error finding glyph, ignore.
199 continue;
200 }
201
202 if (glyph->GlyphType() == GlyphType::kComposite) {
203 Ptr<GlyphTable::CompositeGlyph> comp_glyph =
204 down_cast<GlyphTable::CompositeGlyph*>(glyph.p_);
205 for (int32_t j = 0; j < comp_glyph->NumGlyphs(); ++j) {
206 int32_t glyph_id = comp_glyph->GlyphIndex(j);
207 if (glyph_id_processed->find(glyph_id) == glyph_id_processed->end() &&
208 glyph_id_remaining.find(glyph_id) == glyph_id_remaining.end()) {
209 comp_glyph_id.insert(comp_glyph->GlyphIndex(j));
210 }
211 }
212 }
213
214 glyph_id_processed->insert(*i);
215 }
216
217 glyph_id_remaining.clear();
218 glyph_id_remaining = comp_glyph_id;
219 }
220
221 return true;
222}
223
224bool SetupGlyfBuilders(Font::Builder* font_builder,
225 GlyphTable* glyph_table,
226 LocaTable* loca_table,
227 const IntegerSet& glyph_ids) {
228 if (!font_builder || !glyph_table || !loca_table) {
229 return false;
230 }
231
232 GlyphTableBuilderPtr glyph_table_builder =
233 down_cast<GlyphTable::Builder*>(font_builder->NewTableBuilder(Tag::glyf));
234 LocaTableBuilderPtr loca_table_builder =
235 down_cast<LocaTable::Builder*>(font_builder->NewTableBuilder(Tag::loca));
236 if (glyph_table_builder == NULL || loca_table_builder == NULL) {
237 // Out of memory.
238 return false;
239 }
240
241 // Extract glyphs and setup loca list.
242 IntegerList loca_list;
243 loca_list.resize(loca_table->num_glyphs());
244 loca_list.push_back(0);
245 int32_t last_glyph_id = 0;
246 int32_t last_offset = 0;
247 GlyphTable::GlyphBuilderList* glyph_builders =
248 glyph_table_builder->GlyphBuilders();
249 for (IntegerSet::const_iterator i = glyph_ids.begin(), e = glyph_ids.end();
250 i != e; ++i) {
251 int32_t length = loca_table->GlyphLength(*i);
252 int32_t offset = loca_table->GlyphOffset(*i);
253
254 GlyphPtr glyph;
255 glyph.Attach(glyph_table->GetGlyph(offset, length));
256
257 // Add glyph to new glyf table.
258 ReadableFontDataPtr data = glyph->ReadFontData();
259 WritableFontDataPtr copy_data;
260 copy_data.Attach(WritableFontData::CreateWritableFontData(data->Length()));
261 data->CopyTo(copy_data);
262 GlyphBuilderPtr glyph_builder;
263 glyph_builder.Attach(glyph_table_builder->GlyphBuilder(copy_data));
264 glyph_builders->push_back(glyph_builder);
265
266 // Configure loca list.
267 for (int32_t j = last_glyph_id + 1; j <= *i; ++j) {
268 loca_list[j] = last_offset;
269 }
270 last_offset += length;
271 loca_list[*i + 1] = last_offset;
272 last_glyph_id = *i;
273 }
274 for (int32_t j = last_glyph_id + 1; j <= loca_table->num_glyphs(); ++j) {
275 loca_list[j] = last_offset;
276 }
277 loca_table_builder->SetLocaList(&loca_list);
278
279 return true;
280}
281
282bool HasOverlap(int32_t range_begin, int32_t range_end,
283 const IntegerSet& glyph_ids) {
284 if (range_begin == range_end) {
285 return glyph_ids.find(range_begin) != glyph_ids.end();
286 } else if (range_end > range_begin) {
287 IntegerSet::const_iterator left = glyph_ids.lower_bound(range_begin);
288 IntegerSet::const_iterator right = glyph_ids.lower_bound(range_end);
289 return right != left;
290 }
291 return false;
292}
293
294// Initialize builder, returns false if glyph_id subset is not covered.
295// Not thread-safe, caller to ensure object life-time.
296bool InitializeBitmapBuilder(EbdtTable::Builder* ebdt, EblcTable::Builder* eblc,
297 const IntegerSet& glyph_ids) {
298 BitmapLocaList loca_list;
299 BitmapSizeTableBuilderList* strikes = eblc->BitmapSizeBuilders();
300
301 // Note: Do not call eblc_builder->GenerateLocaList(&loca_list) and then
302 // ebdt_builder->SetLoca(loca_list). For fonts like SimSun, there are
303 // >28K glyphs inside, where a typical usage will be <1K glyphs. Doing
304 // the calls improperly will result in creation of >100K objects that
305 // will be destroyed immediately, inducing significant slowness.
306 IntegerList removed_strikes;
307 for (size_t i = 0; i < strikes->size(); i++) {
308 if (!HasOverlap((*strikes)[i]->StartGlyphIndex(),
309 (*strikes)[i]->EndGlyphIndex(), glyph_ids)) {
310 removed_strikes.push_back(i);
311 continue;
312 }
313
314 IndexSubTableBuilderList* index_builders =
315 (*strikes)[i]->IndexSubTableBuilders();
316 IntegerList removed_indexes;
317 BitmapGlyphInfoMap info_map;
318 for (size_t j = 0; j < index_builders->size(); ++j) {
319 if ((*index_builders)[j] == NULL) {
320 // Subtable is malformed, let's just skip it.
321 removed_indexes.push_back(j);
322 continue;
323 }
324 int32_t first_glyph_id = (*index_builders)[j]->first_glyph_index();
325 int32_t last_glyph_id = (*index_builders)[j]->last_glyph_index();
326 if (!HasOverlap(first_glyph_id, last_glyph_id, glyph_ids)) {
327 removed_indexes.push_back(j);
328 continue;
329 }
330 for (IntegerSet::const_iterator gid = glyph_ids.begin(),
331 gid_end = glyph_ids.end();
332 gid != gid_end; gid++) {
333 if (*gid < first_glyph_id) {
334 continue;
335 }
336 if (*gid > last_glyph_id) {
337 break;
338 }
339 BitmapGlyphInfoPtr info;
340 info.Attach((*index_builders)[j]->GlyphInfo(*gid));
341 if (info && info->length()) { // Do not include gid without bitmap
342 info_map[*gid] = info;
343 }
344 }
345 }
346 if (!info_map.empty()) {
347 loca_list.push_back(info_map);
348 } else {
349 removed_strikes.push_back(i); // Detected null entries.
350 }
351
352 // Remove unused index sub tables
353 for (IntegerList::reverse_iterator j = removed_indexes.rbegin(),
354 e = removed_indexes.rend();
355 j != e; j++) {
356 index_builders->erase(index_builders->begin() + *j);
357 }
358 }
359 if (removed_strikes.size() == strikes->size() || loca_list.empty()) {
360 return false;
361 }
362
363 for (IntegerList::reverse_iterator i = removed_strikes.rbegin(),
364 e = removed_strikes.rend(); i != e; i++) {
365 strikes->erase(strikes->begin() + *i);
366 }
367
368 if (strikes->empty()) { // no glyph covered, can safely drop the builders.
369 return false;
370 }
371
372 ebdt->SetLoca(&loca_list);
373 ebdt->GlyphBuilders(); // Initialize the builder.
374 return true;
375}
376
377void CopyBigGlyphMetrics(BigGlyphMetrics::Builder* source,
378 BigGlyphMetrics::Builder* target) {
379 target->SetHeight(static_cast<byte_t>(source->Height()));
380 target->SetWidth(static_cast<byte_t>(source->Width()));
381 target->SetHoriBearingX(static_cast<byte_t>(source->HoriBearingX()));
382 target->SetHoriBearingY(static_cast<byte_t>(source->HoriBearingY()));
383 target->SetHoriAdvance(static_cast<byte_t>(source->HoriAdvance()));
384 target->SetVertBearingX(static_cast<byte_t>(source->VertBearingX()));
385 target->SetVertBearingY(static_cast<byte_t>(source->VertBearingY()));
386 target->SetVertAdvance(static_cast<byte_t>(source->VertAdvance()));
387}
388
389CALLER_ATTACH IndexSubTable::Builder*
390ConstructIndexFormat4(IndexSubTable::Builder* b, const BitmapGlyphInfoMap& loca,
391 int32_t* image_data_offset) {
392 IndexSubTableFormat4BuilderPtr builder4;
393 builder4.Attach(IndexSubTableFormat4::Builder::CreateBuilder());
394 CodeOffsetPairBuilderList offset_pairs;
395
396 size_t offset = 0;
397 int32_t lower_bound = b->first_glyph_index();
398 int32_t upper_bound = b->last_glyph_index();
399 int32_t last_gid = -1;
400 BitmapGlyphInfoMap::const_iterator i = loca.lower_bound(lower_bound);
401 BitmapGlyphInfoMap::const_iterator end = loca.end();
402 if (i != end) {
403 last_gid = i->first;
404 builder4->set_first_glyph_index(last_gid);
405 builder4->set_image_format(b->image_format());
406 builder4->set_image_data_offset(*image_data_offset);
407 }
408 for (; i != end; i++) {
409 int32_t gid = i->first;
410 if (gid > upper_bound) {
411 break;
412 }
413 offset_pairs.push_back(
414 IndexSubTableFormat4::CodeOffsetPairBuilder(gid, offset));
415 offset += i->second->length();
416 last_gid = gid;
417 }
418 offset_pairs.push_back(
419 IndexSubTableFormat4::CodeOffsetPairBuilder(-1, offset));
420 builder4->set_last_glyph_index(last_gid);
421 *image_data_offset += offset;
422 builder4->SetOffsetArray(offset_pairs);
423
424 return builder4.Detach();
425}
426
427CALLER_ATTACH IndexSubTable::Builder*
428ConstructIndexFormat5(IndexSubTable::Builder* b, const BitmapGlyphInfoMap& loca,
429 int32_t* image_data_offset) {
430 IndexSubTableFormat5BuilderPtr new_builder;
431 new_builder.Attach(IndexSubTableFormat5::Builder::CreateBuilder());
432
433 // Copy BigMetrics
434 int32_t image_size = 0;
435 if (b->index_format() == IndexSubTable::Format::FORMAT_2) {
436 IndexSubTableFormat2BuilderPtr builder2 =
437 down_cast<IndexSubTableFormat2::Builder*>(b);
438 CopyBigGlyphMetrics(builder2->BigMetrics(), new_builder->BigMetrics());
439 image_size = builder2->ImageSize();
440 } else {
441 IndexSubTableFormat5BuilderPtr builder5 =
442 down_cast<IndexSubTableFormat5::Builder*>(b);
443 BigGlyphMetricsBuilderPtr metrics_builder;
444 CopyBigGlyphMetrics(builder5->BigMetrics(), new_builder->BigMetrics());
445 image_size = builder5->ImageSize();
446 }
447
448 IntegerList* glyph_array = new_builder->GlyphArray();
449 size_t offset = 0;
450 int32_t lower_bound = b->first_glyph_index();
451 int32_t upper_bound = b->last_glyph_index();
452 int32_t last_gid = -1;
453 BitmapGlyphInfoMap::const_iterator i = loca.lower_bound(lower_bound);
454 BitmapGlyphInfoMap::const_iterator end = loca.end();
455 if (i != end) {
456 last_gid = i->first;
457 new_builder->set_first_glyph_index(last_gid);
458 new_builder->set_image_format(b->image_format());
459 new_builder->set_image_data_offset(*image_data_offset);
460 new_builder->SetImageSize(image_size);
461 }
462 for (; i != end; i++) {
463 int32_t gid = i->first;
464 if (gid > upper_bound) {
465 break;
466 }
467 glyph_array->push_back(gid);
468 offset += i->second->length();
469 last_gid = gid;
470 }
471 new_builder->set_last_glyph_index(last_gid);
472 *image_data_offset += offset;
473 return new_builder.Detach();
474}
475
476CALLER_ATTACH IndexSubTable::Builder*
477SubsetIndexSubTable(IndexSubTable::Builder* builder,
478 const BitmapGlyphInfoMap& loca,
479 int32_t* image_data_offset) {
480 switch (builder->index_format()) {
481 case IndexSubTable::Format::FORMAT_1:
482 case IndexSubTable::Format::FORMAT_3:
483 case IndexSubTable::Format::FORMAT_4:
484 return ConstructIndexFormat4(builder, loca, image_data_offset);
485 case IndexSubTable::Format::FORMAT_2:
486 case IndexSubTable::Format::FORMAT_5:
487 return ConstructIndexFormat5(builder, loca, image_data_offset);
488 default:
489 assert(false);
490 break;
491 }
492 return NULL;
493}
494
495}
496
497namespace sfntly {
498
499// Not thread-safe, caller to ensure object life-time.
500void SubsetEBLC(EblcTable::Builder* eblc, const BitmapLocaList& new_loca) {
501 BitmapSizeTableBuilderList* size_builders = eblc->BitmapSizeBuilders();
502 if (size_builders == NULL) {
503 return;
504 }
505
506 int32_t image_data_offset = EbdtTable::Offset::kHeaderLength;
507 for (size_t strike = 0; strike < size_builders->size(); ++strike) {
508 IndexSubTableBuilderList* index_builders =
509 (*size_builders)[strike]->IndexSubTableBuilders();
510 for (size_t index = 0; index < index_builders->size(); ++index) {
511 IndexSubTable::Builder* new_builder_raw =
512 SubsetIndexSubTable((*index_builders)[index], new_loca[strike],
513 &image_data_offset);
514 if (NULL != new_builder_raw) {
515 (*index_builders)[index].Attach(new_builder_raw);
516 }
517 }
518 }
519}
520
521// EBLC structure (from stuartg)
522// header
523// bitmapSizeTable[]
524// one per strike
525// holds strike metrics - sbitLineMetrics
526// holds info about indexSubTableArray
527// indexSubTableArray[][]
528// one per strike and then one per indexSubTable for that strike
529// holds info about the indexSubTable
530// the indexSubTable entries pointed to can be of different formats
531// indexSubTable
532// one per indexSubTableArray entry
533// tells how to get the glyphs
534// may hold the glyph metrics if they are uniform for all the glyphs in range
535// Please note that the structure can also be
536// {indexSubTableArray[], indexSubTables[]}[]
537// This way is also legal and in fact how Microsoft fonts are laid out.
538//
539// There is nothing that says that the indexSubTableArray entries and/or the
540// indexSubTable items need to be unique. They may be shared between strikes.
541//
542// EBDT structure:
543// header
544// glyphs
545// amorphous blob of data
546// different glyphs that are only able to be figured out from the EBLC table
547// may hold metrics - depends on the EBLC entry that pointed to them
548
549// Subsetting EBLC table (from arthurhsu)
// Most pages use only a fraction (hundreds or fewer) of the glyphs in a given
// font (which can have >20K glyphs for CJK). It's safe to assume that the
// subset font will have sparse bitmap glyphs, so we reconstruct the EBLC table
// as format 4 or 5 here.
554
// Result of SetupBitmapBuilders(): which groups of bitmap tables Subset()
// must leave out of the tables it copies from the original font.
enum BuildersToRemove {
  kRemoveNone = 0,         // Copy every bitmap table.
  kRemoveBDAT = 1,         // Leave out bdat, bloc and bhed.
  kRemoveBDATAndEBDT = 2,  // Leave out both table groups.
  kRemoveEBDT = 3          // Leave out EBDT, EBLC and EBSC.
};
561
562int SetupBitmapBuilders(Font* font, Font::Builder* font_builder,
563 const IntegerSet& glyph_ids) {
564 if (!font || !font_builder) {
565 return false;
566 }
567
568 // Check if bitmap table exists.
569 EbdtTablePtr ebdt_table = down_cast<EbdtTable*>(font->GetTable(Tag::EBDT));
570 EblcTablePtr eblc_table = down_cast<EblcTable*>(font->GetTable(Tag::EBLC));
571 bool use_ebdt = (ebdt_table != NULL && eblc_table != NULL);
572 if (!use_ebdt) {
573 ebdt_table = down_cast<EbdtTable*>(font->GetTable(Tag::bdat));
574 eblc_table = down_cast<EblcTable*>(font->GetTable(Tag::bloc));
575 if (ebdt_table == NULL || eblc_table == NULL) {
576 return kRemoveNone;
577 }
578 }
579
580 // If the bitmap table's size is too small, skip subsetting.
581 if (ebdt_table->DataLength() + eblc_table->DataLength() <
582 BITMAP_SIZE_THRESHOLD) {
583 return use_ebdt ? kRemoveBDAT : kRemoveNone;
584 }
585
586 // Get the builders.
587 EbdtTableBuilderPtr ebdt_table_builder = down_cast<EbdtTable::Builder*>(
588 font_builder->NewTableBuilder(use_ebdt ? Tag::EBDT : Tag::bdat,
589 ebdt_table->ReadFontData()));
590 EblcTableBuilderPtr eblc_table_builder = down_cast<EblcTable::Builder*>(
591 font_builder->NewTableBuilder(use_ebdt ? Tag::EBLC : Tag::bloc,
592 eblc_table->ReadFontData()));
593 if (ebdt_table_builder == NULL || eblc_table_builder == NULL) {
594 // Out of memory.
595 return use_ebdt ? kRemoveBDAT : kRemoveNone;
596 }
597
598 if (!InitializeBitmapBuilder(ebdt_table_builder, eblc_table_builder,
599 glyph_ids)) {
600 // Bitmap tables do not cover the glyphs in our subset.
601 font_builder->RemoveTableBuilder(use_ebdt ? Tag::EBLC : Tag::bloc);
602 font_builder->RemoveTableBuilder(use_ebdt ? Tag::EBDT : Tag::bdat);
603 return use_ebdt ? kRemoveBDATAndEBDT : kRemoveEBDT;
604 }
605
606 BitmapLocaList new_loca;
607 ebdt_table_builder->GenerateLocaList(&new_loca);
608 SubsetEBLC(eblc_table_builder, new_loca);
609
610 return use_ebdt ? kRemoveBDAT : kRemoveNone;
611}
612
613SubsetterImpl::SubsetterImpl() {
614}
615
616SubsetterImpl::~SubsetterImpl() {
617}
618
Colin Cross13a82432017-04-07 10:50:33 -0700619bool SubsetterImpl::LoadFont(int font_index,
620 const unsigned char* original_font,
621 size_t font_size) {
622 MemoryInputStream mis;
623 mis.Attach(original_font, font_size);
624 if (factory_ == NULL) {
625 factory_.Attach(FontFactory::GetInstance());
626 }
627
628 FontArray font_array;
629 factory_->LoadFonts(&mis, &font_array);
630 if (font_index < 0 || (size_t)font_index >= font_array.size()) {
631 return false;
632 }
633 font_ = font_array[font_index].p_;
634 return font_ != NULL;
635}
636
Selim Gurun30d4e1f2013-08-15 12:46:15 -0700637bool SubsetterImpl::LoadFont(const char* font_name,
638 const unsigned char* original_font,
639 size_t font_size) {
640 MemoryInputStream mis;
641 mis.Attach(original_font, font_size);
642 if (factory_ == NULL) {
643 factory_.Attach(FontFactory::GetInstance());
644 }
645
646 FontArray font_array;
647 factory_->LoadFonts(&mis, &font_array);
648 font_ = FindFont(font_name, font_array);
649 if (font_ == NULL) {
650 return false;
651 }
652
653 return true;
654}
655
656int SubsetterImpl::SubsetFont(const unsigned int* glyph_ids,
657 size_t glyph_count,
658 unsigned char** output_buffer) {
659 if (factory_ == NULL || font_ == NULL) {
660 return -1;
661 }
662
663 // Find glyf and loca table.
664 GlyphTablePtr glyph_table =
665 down_cast<GlyphTable*>(font_->GetTable(Tag::glyf));
666 LocaTablePtr loca_table = down_cast<LocaTable*>(font_->GetTable(Tag::loca));
667 if (glyph_table == NULL || loca_table == NULL) {
668 // We are not able to subset the font.
669 return 0;
670 }
671
672 IntegerSet glyph_id_processed;
673 if (!ResolveCompositeGlyphs(glyph_table, loca_table,
674 glyph_ids, glyph_count, &glyph_id_processed) ||
675 glyph_id_processed.empty()) {
676 return 0;
677 }
678
679 FontPtr new_font;
680 new_font.Attach(Subset(glyph_id_processed, glyph_table, loca_table));
681 if (new_font == NULL) {
682 return 0;
683 }
684
685 MemoryOutputStream output_stream;
686 factory_->SerializeFont(new_font, &output_stream);
687 int length = static_cast<int>(output_stream.Size());
688 if (length > 0) {
689 *output_buffer = new unsigned char[length];
690 memcpy(*output_buffer, output_stream.Get(), length);
691 }
692
693 return length;
694}
695
696// Long comments regarding TTF tables and PDF (from stuartg)
697//
698// According to PDF spec 1.4 (section 5.8), the following tables must be
699// present:
700// head, hhea, loca, maxp, cvt, prep, glyf, hmtx, fpgm
701// cmap if font is used with a simple font dict and not a CIDFont dict
702//
703// Other tables we need to keep for PDF rendering to support zoom in/out:
704// bdat, bloc, ebdt, eblc, ebsc, gasp
705//
706// Special table:
707// CFF - if you have this table then you shouldn't have a glyf table and this
708// is the table with all the glyphs. Shall skip subsetting completely
709// since sfntly is not capable of subsetting it for now.
710// post - extra info here for printing on PostScript printers but maybe not
711// enough to outweigh the space taken by the names
712//
713// Tables to break apart:
714// name - could throw away all but one language and one platform strings/ might
715// throw away some of the name entries
716// cmap - could strip out non-needed cmap subtables
717// - format 4 subtable can be subsetted as well using sfntly
718//
719// Graphite tables:
720// silf, glat, gloc, feat - should be okay to strip out
721//
722// Tables that can be discarded:
723// OS/2 - everything here is for layout and description of the font that is
724// elsewhere (some in the PDF objects)
725// BASE, GDEF, GSUB, GPOS, JSTF - all used for layout
726// kern - old style layout
727// DSIG - this will be invalid after subsetting
728// hdmx - layout
729// PCLT - metadata that's not needed
730// vmtx - layout
731// vhea - layout
732// VDMX
733// VORG - not used by TT/OT - used by CFF
734// hsty - would be surprised to see one of these - used on the Newton
735// AAT tables - mort, morx, feat, acnt, bsin, just, lcar, fdsc, fmtx, prop,
736// Zapf, opbd, trak, fvar, gvar, avar, cvar
737// - these are all layout tables and once layout happens are not
738// needed anymore
739// LTSH - layout
740
741CALLER_ATTACH
742Font* SubsetterImpl::Subset(const IntegerSet& glyph_ids, GlyphTable* glyf,
743 LocaTable* loca) {
744 // The const is initialized here to workaround VC bug of rendering all Tag::*
745 // as 0. These tags represents the TTF tables that we will embed in subset
746 // font.
747 const int32_t TABLES_IN_SUBSET[] = {
748 Tag::head, Tag::hhea, Tag::loca, Tag::maxp, Tag::cvt,
749 Tag::prep, Tag::glyf, Tag::hmtx, Tag::fpgm, Tag::EBDT,
750 Tag::EBLC, Tag::EBSC, Tag::bdat, Tag::bloc, Tag::bhed,
751 Tag::cmap, // Keep here for future tagged PDF development.
752 Tag::name, // Keep here due to legal concerns: copyright info inside.
753 };
754
755 // Setup font builders we need.
756 FontBuilderPtr font_builder;
757 font_builder.Attach(factory_->NewFontBuilder());
758 IntegerSet remove_tags;
759
760 if (SetupGlyfBuilders(font_builder, glyf, loca, glyph_ids)) {
761 remove_tags.insert(Tag::glyf);
762 remove_tags.insert(Tag::loca);
763 }
764
765 // For old Apple bitmap fonts, they have only bdats and bhed is identical
766 // to head. As a result, we can't remove bdat tables for those fonts.
767 int setup_result = SetupBitmapBuilders(font_, font_builder, glyph_ids);
768 if (setup_result == kRemoveBDATAndEBDT || setup_result == kRemoveEBDT) {
769 remove_tags.insert(Tag::EBDT);
770 remove_tags.insert(Tag::EBLC);
771 remove_tags.insert(Tag::EBSC);
772 }
773
774 if (setup_result == kRemoveBDAT || setup_result == kRemoveBDATAndEBDT) {
775 remove_tags.insert(Tag::bdat);
776 remove_tags.insert(Tag::bloc);
777 remove_tags.insert(Tag::bhed);
778 }
779
780 IntegerSet allowed_tags;
781 for (size_t i = 0; i < sizeof(TABLES_IN_SUBSET) / sizeof(int32_t); ++i) {
782 allowed_tags.insert(TABLES_IN_SUBSET[i]);
783 }
784
785 IntegerSet result;
786 std::set_difference(allowed_tags.begin(), allowed_tags.end(),
787 remove_tags.begin(), remove_tags.end(),
788 std::inserter(result, result.end()));
789 allowed_tags = result;
790
791 // Setup remaining builders.
792 for (IntegerSet::iterator i = allowed_tags.begin(), e = allowed_tags.end();
793 i != e; ++i) {
794 Table* table = font_->GetTable(*i);
795 if (table) {
796 font_builder->NewTableBuilder(*i, table->ReadFontData());
797 }
798 }
799
800 return font_builder->Build();
801}
802
803} // namespace sfntly