blob: febd8f00a5926aacfb8b047a4fc2f2f2f3403d26 [file] [log] [blame]
Ben Wagnera25fbef2017-08-30 13:56:19 -04001/*
2 * Copyright 2016 Google Inc.
3 *
4 * Use of this source code is governed by a BSD-style license that can be
5 * found in the LICENSE file.
6 */
7
Ben Wagner17774242018-08-07 14:31:33 -04008#include "SkFontArguments.h"
Ben Wagner67e3a302017-09-05 14:46:19 -04009#include "SkFontMgr.h"
Ben Wagner17774242018-08-07 14:31:33 -040010#include "SkMalloc.h"
Hal Canary0e07ad72018-02-08 13:06:56 -050011#include "SkOnce.h"
Hal Canary2a1848d2018-11-26 17:23:24 -050012#include "SkFont.h"
Mike Reed77f94ea2019-01-22 16:30:40 -050013#include "SkFontMetrics.h"
Ben Wagner17774242018-08-07 14:31:33 -040014#include "SkPoint.h"
15#include "SkRefCnt.h"
16#include "SkScalar.h"
Ben Wagnera25fbef2017-08-30 13:56:19 -040017#include "SkShaper.h"
18#include "SkStream.h"
Ben Wagner17774242018-08-07 14:31:33 -040019#include "SkString.h"
20#include "SkTArray.h"
Ben Wagner8d45a382017-11-16 10:08:28 -050021#include "SkTDPQueue.h"
Ben Wagner17774242018-08-07 14:31:33 -040022#include "SkTFitsIn.h"
Ben Wagner8d45a382017-11-16 10:08:28 -050023#include "SkTLazy.h"
Ben Wagnere0001732017-08-31 16:26:26 -040024#include "SkTemplates.h"
Hal Canaryc640d0d2018-06-13 09:59:02 -040025#include "SkTo.h"
Ben Wagnera25fbef2017-08-30 13:56:19 -040026#include "SkTypeface.h"
Ben Wagner17774242018-08-07 14:31:33 -040027#include "SkTypes.h"
28#include "SkUTF.h"
29
30#include <hb.h>
31#include <hb-ot.h>
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050032#include <unicode/ubrk.h>
Ben Wagner17774242018-08-07 14:31:33 -040033#include <unicode/ubidi.h>
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050034#include <unicode/ustring.h>
Ben Wagner17774242018-08-07 14:31:33 -040035#include <unicode/urename.h>
36#include <unicode/utext.h>
37#include <unicode/utypes.h>
38
Ben Wagner0ec8ec22018-09-04 18:17:13 -040039#include <cstring>
40#include <locale>
Ben Wagner17774242018-08-07 14:31:33 -040041#include <memory>
42#include <utility>
Ben Wagnera25fbef2017-08-30 13:56:19 -040043
Hal Canary32498f02019-02-04 15:36:31 -050044#ifdef SK_USING_THIRD_PARTY_ICU
45#include "SkLoadICU.h"
46#else
// No-op stand-in for SkLoadICU() when SK_USING_THIRD_PARTY_ICU is not defined.
static inline void SkLoadICU() {}
48#endif // SK_USING_THIRD_PARTY_ICU
49
Ben Wagnera25fbef2017-08-30 13:56:19 -040050namespace {
51template <class T, void(*P)(T*)> using resource = std::unique_ptr<T, SkFunctionWrapper<void, T, P>>;
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050052using HBBlob = resource<hb_blob_t , hb_blob_destroy >;
53using HBFace = resource<hb_face_t , hb_face_destroy >;
54using HBFont = resource<hb_font_t , hb_font_destroy >;
55using HBBuffer = resource<hb_buffer_t , hb_buffer_destroy>;
56using ICUBiDi = resource<UBiDi , ubidi_close >;
Ben Wagner0ec8ec22018-09-04 18:17:13 -040057using ICUBrk = resource<UBreakIterator, ubrk_close >;
Ben Wagnera25fbef2017-08-30 13:56:19 -040058
59HBBlob stream_to_blob(std::unique_ptr<SkStreamAsset> asset) {
60 size_t size = asset->getLength();
61 HBBlob blob;
62 if (const void* base = asset->getMemoryBase()) {
63 blob.reset(hb_blob_create((char*)base, SkToUInt(size),
64 HB_MEMORY_MODE_READONLY, asset.release(),
65 [](void* p) { delete (SkStreamAsset*)p; }));
66 } else {
67 // SkDebugf("Extra SkStreamAsset copy\n");
68 void* ptr = size ? sk_malloc_throw(size) : nullptr;
69 asset->read(ptr, size);
70 blob.reset(hb_blob_create((char*)ptr, SkToUInt(size),
71 HB_MEMORY_MODE_READONLY, ptr, sk_free));
72 }
73 SkASSERT(blob);
74 hb_blob_make_immutable(blob.get());
75 return blob;
76}
Ben Wagnera25fbef2017-08-30 13:56:19 -040077
Ben Wagner8d45a382017-11-16 10:08:28 -050078HBFont create_hb_font(SkTypeface* tf) {
Hal Canary0dfa2082018-10-31 13:02:49 -040079 if (!tf) {
80 return nullptr;
81 }
Ben Wagnera25fbef2017-08-30 13:56:19 -040082 int index;
Hal Canaryddef43f2018-11-16 10:53:51 -050083 std::unique_ptr<SkStreamAsset> typefaceAsset(tf->openStream(&index));
84 if (!typefaceAsset) {
85 SkString name;
86 tf->getFamilyName(&name);
87 SkDebugf("Typeface '%s' has no data :(\n", name.c_str());
88 return nullptr;
89 }
90 HBBlob blob(stream_to_blob(std::move(typefaceAsset)));
Ben Wagnera25fbef2017-08-30 13:56:19 -040091 HBFace face(hb_face_create(blob.get(), (unsigned)index));
92 SkASSERT(face);
93 if (!face) {
Ben Wagnere0001732017-08-31 16:26:26 -040094 return nullptr;
Ben Wagnera25fbef2017-08-30 13:56:19 -040095 }
96 hb_face_set_index(face.get(), (unsigned)index);
Ben Wagnere0001732017-08-31 16:26:26 -040097 hb_face_set_upem(face.get(), tf->getUnitsPerEm());
Ben Wagnera25fbef2017-08-30 13:56:19 -040098
Ben Wagnere0001732017-08-31 16:26:26 -040099 HBFont font(hb_font_create(face.get()));
100 SkASSERT(font);
101 if (!font) {
102 return nullptr;
103 }
Ben Wagnere0001732017-08-31 16:26:26 -0400104 hb_ot_font_set_funcs(font.get());
105 int axis_count = tf->getVariationDesignPosition(nullptr, 0);
106 if (axis_count > 0) {
107 SkAutoSTMalloc<4, SkFontArguments::VariationPosition::Coordinate> axis_values(axis_count);
108 if (tf->getVariationDesignPosition(axis_values, axis_count) == axis_count) {
109 hb_font_set_variations(font.get(),
110 reinterpret_cast<hb_variation_t*>(axis_values.get()),
111 axis_count);
112 }
113 }
114 return font;
115}
116
Hal Canaryf107a2f2018-07-25 16:52:48 -0400117/** this version replaces invalid utf-8 sequences with code point U+FFFD. */
118static inline SkUnichar utf8_next(const char** ptr, const char* end) {
119 SkUnichar val = SkUTF::NextUTF8(ptr, end);
120 if (val < 0) {
121 return 0xFFFD; // REPLACEMENT CHARACTER
122 }
123 return val;
124}
125
/** Interface for something that partitions a utf8 text into consecutive runs. */
class RunIterator {
public:
    virtual ~RunIterator() = default;

    /** Moves on to the next run. */
    virtual void consume() = 0;

    /** Pointer one past the last (utf8) element in the current run. */
    virtual const char* endOfCurrentRun() const = 0;

    /** True once there are no further runs to consume. */
    virtual bool atEnd() const = 0;

    /** Orders iterators by where their current run ends. */
    bool operator<(const RunIterator& that) const {
        const char* const mine = this->endOfCurrentRun();
        const char* const theirs = that.endOfCurrentRun();
        return mine < theirs;
    }
};
137
138class BiDiRunIterator : public RunIterator {
139public:
140 static SkTLazy<BiDiRunIterator> Make(const char* utf8, size_t utf8Bytes, UBiDiLevel level) {
141 SkTLazy<BiDiRunIterator> ret;
142
143 // ubidi only accepts utf16 (though internally it basically works on utf32 chars).
144 // We want an ubidi_setPara(UBiDi*, UText*, UBiDiLevel, UBiDiLevel*, UErrorCode*);
145 if (!SkTFitsIn<int32_t>(utf8Bytes)) {
146 SkDebugf("Bidi error: text too long");
147 return ret;
148 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500149
150 UErrorCode status = U_ZERO_ERROR;
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -0500151
152 // Getting the length like this seems to always set U_BUFFER_OVERFLOW_ERROR
153 int32_t utf16Units;
154 u_strFromUTF8(nullptr, 0, &utf16Units, utf8, utf8Bytes, &status);
155 status = U_ZERO_ERROR;
156 std::unique_ptr<UChar[]> utf16(new UChar[utf16Units]);
157 u_strFromUTF8(utf16.get(), utf16Units, nullptr, utf8, utf8Bytes, &status);
158 if (U_FAILURE(status)) {
159 SkDebugf("Invalid utf8 input: %s", u_errorName(status));
160 return ret;
161 }
162
163 ICUBiDi bidi(ubidi_openSized(utf16Units, 0, &status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500164 if (U_FAILURE(status)) {
165 SkDebugf("Bidi error: %s", u_errorName(status));
166 return ret;
167 }
168 SkASSERT(bidi);
169
170 // The required lifetime of utf16 isn't well documented.
171 // It appears it isn't used after ubidi_setPara except through ubidi_getText.
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -0500172 ubidi_setPara(bidi.get(), utf16.get(), utf16Units, level, nullptr, &status);
Ben Wagner8d45a382017-11-16 10:08:28 -0500173 if (U_FAILURE(status)) {
174 SkDebugf("Bidi error: %s", u_errorName(status));
175 return ret;
176 }
177
Hal Canary4014ba62018-07-24 11:33:21 -0400178 ret.init(utf8, utf8 + utf8Bytes, std::move(bidi));
Ben Wagner8d45a382017-11-16 10:08:28 -0500179 return ret;
180 }
Hal Canary4014ba62018-07-24 11:33:21 -0400181 BiDiRunIterator(const char* utf8, const char* end, ICUBiDi bidi)
Ben Wagner8d45a382017-11-16 10:08:28 -0500182 : fBidi(std::move(bidi))
183 , fEndOfCurrentRun(utf8)
Hal Canary4014ba62018-07-24 11:33:21 -0400184 , fEndOfAllRuns(end)
Ben Wagner8d45a382017-11-16 10:08:28 -0500185 , fUTF16LogicalPosition(0)
186 , fLevel(UBIDI_DEFAULT_LTR)
187 {}
188 void consume() override {
189 SkASSERT(fUTF16LogicalPosition < ubidi_getLength(fBidi.get()));
190 int32_t endPosition = ubidi_getLength(fBidi.get());
191 fLevel = ubidi_getLevelAt(fBidi.get(), fUTF16LogicalPosition);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400192 SkUnichar u = utf8_next(&fEndOfCurrentRun, fEndOfAllRuns);
193 fUTF16LogicalPosition += SkUTF::ToUTF16(u);
Ben Wagner8d45a382017-11-16 10:08:28 -0500194 UBiDiLevel level;
195 while (fUTF16LogicalPosition < endPosition) {
196 level = ubidi_getLevelAt(fBidi.get(), fUTF16LogicalPosition);
197 if (level != fLevel) {
198 break;
199 }
Hal Canaryf107a2f2018-07-25 16:52:48 -0400200 u = utf8_next(&fEndOfCurrentRun, fEndOfAllRuns);
201 fUTF16LogicalPosition += SkUTF::ToUTF16(u);
Ben Wagner8d45a382017-11-16 10:08:28 -0500202 }
203 }
204 const char* endOfCurrentRun() const override {
205 return fEndOfCurrentRun;
206 }
207 bool atEnd() const override {
208 return fUTF16LogicalPosition == ubidi_getLength(fBidi.get());
209 }
210
211 UBiDiLevel currentLevel() const {
212 return fLevel;
213 }
214private:
215 ICUBiDi fBidi;
216 const char* fEndOfCurrentRun;
Hal Canary4014ba62018-07-24 11:33:21 -0400217 const char* fEndOfAllRuns;
Ben Wagner8d45a382017-11-16 10:08:28 -0500218 int32_t fUTF16LogicalPosition;
219 UBiDiLevel fLevel;
220};
221
222class ScriptRunIterator : public RunIterator {
223public:
224 static SkTLazy<ScriptRunIterator> Make(const char* utf8, size_t utf8Bytes,
225 hb_unicode_funcs_t* hbUnicode)
226 {
227 SkTLazy<ScriptRunIterator> ret;
228 ret.init(utf8, utf8Bytes, hbUnicode);
229 return ret;
230 }
231 ScriptRunIterator(const char* utf8, size_t utf8Bytes, hb_unicode_funcs_t* hbUnicode)
232 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
233 , fHBUnicode(hbUnicode)
234 , fCurrentScript(HB_SCRIPT_UNKNOWN)
235 {}
236 void consume() override {
237 SkASSERT(fCurrent < fEnd);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400238 SkUnichar u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500239 fCurrentScript = hb_unicode_script(fHBUnicode, u);
240 while (fCurrent < fEnd) {
241 const char* prev = fCurrent;
Hal Canaryf107a2f2018-07-25 16:52:48 -0400242 u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500243 const hb_script_t script = hb_unicode_script(fHBUnicode, u);
244 if (script != fCurrentScript) {
245 if (fCurrentScript == HB_SCRIPT_INHERITED || fCurrentScript == HB_SCRIPT_COMMON) {
246 fCurrentScript = script;
247 } else if (script == HB_SCRIPT_INHERITED || script == HB_SCRIPT_COMMON) {
248 continue;
249 } else {
250 fCurrent = prev;
251 break;
252 }
253 }
254 }
255 if (fCurrentScript == HB_SCRIPT_INHERITED) {
256 fCurrentScript = HB_SCRIPT_COMMON;
257 }
258 }
259 const char* endOfCurrentRun() const override {
260 return fCurrent;
261 }
262 bool atEnd() const override {
263 return fCurrent == fEnd;
264 }
265
266 hb_script_t currentScript() const {
267 return fCurrentScript;
268 }
269private:
270 const char* fCurrent;
271 const char* fEnd;
272 hb_unicode_funcs_t* fHBUnicode;
273 hb_script_t fCurrentScript;
274};
275
276class FontRunIterator : public RunIterator {
277public:
278 static SkTLazy<FontRunIterator> Make(const char* utf8, size_t utf8Bytes,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400279 SkFont font,
Ben Wagner8d45a382017-11-16 10:08:28 -0500280 sk_sp<SkFontMgr> fallbackMgr)
281 {
282 SkTLazy<FontRunIterator> ret;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400283 font.setTypeface(font.refTypefaceOrDefault());
284 HBFont hbFont = create_hb_font(font.getTypeface());
285 if (!hbFont) {
286 SkDebugf("create_hb_font failed!\n");
287 return ret;
288 }
289 ret.init(utf8, utf8Bytes, std::move(font), std::move(hbFont), std::move(fallbackMgr));
Ben Wagner8d45a382017-11-16 10:08:28 -0500290 return ret;
291 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400292 FontRunIterator(const char* utf8, size_t utf8Bytes, SkFont font,
293 HBFont hbFont, sk_sp<SkFontMgr> fallbackMgr)
Ben Wagner8d45a382017-11-16 10:08:28 -0500294 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
295 , fFallbackMgr(std::move(fallbackMgr))
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400296 , fHBFont(std::move(hbFont)), fFont(std::move(font))
297 , fFallbackHBFont(nullptr), fFallbackFont(fFont)
298 , fCurrentHBFont(fHBFont.get()), fCurrentFont(&fFont)
299 {
300 fFallbackFont.setTypeface(nullptr);
301 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500302 void consume() override {
303 SkASSERT(fCurrent < fEnd);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400304 SkUnichar u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500305 // If the starting typeface can handle this character, use it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400306 if (fFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1)) {
307 fCurrentFont = &fFont;
308 fCurrentHBFont = fHBFont.get();
Ben Wagnera900ad52018-08-31 17:48:19 -0400309 // If the current fallback can handle this character, use it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400310 } else if (fFallbackFont.getTypeface() &&
311 fFallbackFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1))
Ben Wagnera900ad52018-08-31 17:48:19 -0400312 {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400313 fCurrentFont = &fFallbackFont;
Ben Wagnera900ad52018-08-31 17:48:19 -0400314 fCurrentHBFont = fFallbackHBFont.get();
Ben Wagner8d45a382017-11-16 10:08:28 -0500315 // If not, try to find a fallback typeface
316 } else {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400317 fFallbackFont.setTypeface(sk_ref_sp(fFallbackMgr->matchFamilyStyleCharacter(
318 nullptr, fFont.getTypeface()->fontStyle(), nullptr, 0, u)));
319 fFallbackHBFont = create_hb_font(fFallbackFont.getTypeface());
320 fCurrentFont = &fFallbackFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500321 fCurrentHBFont = fFallbackHBFont.get();
Ben Wagner8d45a382017-11-16 10:08:28 -0500322 }
323
324 while (fCurrent < fEnd) {
325 const char* prev = fCurrent;
Hal Canaryf107a2f2018-07-25 16:52:48 -0400326 u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500327
Ben Wagnera900ad52018-08-31 17:48:19 -0400328 // If not using initial typeface and initial typeface has this character, stop fallback.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400329 if (fCurrentFont->getTypeface() != fFont.getTypeface() &&
330 fFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1))
Ben Wagner8d45a382017-11-16 10:08:28 -0500331 {
332 fCurrent = prev;
333 return;
334 }
335 // If the current typeface cannot handle this character, stop using it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400336 if (!fCurrentFont->getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1)) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500337 fCurrent = prev;
338 return;
339 }
340 }
341 }
342 const char* endOfCurrentRun() const override {
343 return fCurrent;
344 }
345 bool atEnd() const override {
346 return fCurrent == fEnd;
347 }
348
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400349 SkFont* currentFont() const {
350 return fCurrentFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500351 }
352 hb_font_t* currentHBFont() const {
353 return fCurrentHBFont;
354 }
355private:
356 const char* fCurrent;
357 const char* fEnd;
358 sk_sp<SkFontMgr> fFallbackMgr;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400359 HBFont fHBFont;
360 SkFont fFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500361 HBFont fFallbackHBFont;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400362 SkFont fFallbackFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500363 hb_font_t* fCurrentHBFont;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400364 SkFont* fCurrentFont;
365};
366
367class LanguageRunIterator : public RunIterator {
368public:
369 static SkTLazy<LanguageRunIterator> Make(const char* utf8, size_t utf8Bytes) {
370 SkTLazy<LanguageRunIterator> ret;
371 ret.init(utf8, utf8Bytes);
372 return ret;
373 }
374 LanguageRunIterator(const char* utf8, size_t utf8Bytes)
375 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
376 , fLanguage(hb_language_from_string(std::locale().name().c_str(), -1))
377 { }
378 void consume() override {
379 // Ideally something like cld2/3 could be used, or user signals.
380 SkASSERT(fCurrent < fEnd);
381 fCurrent = fEnd;
382 }
383 const char* endOfCurrentRun() const override {
384 return fCurrent;
385 }
386 bool atEnd() const override {
387 return fCurrent == fEnd;
388 }
389
390 hb_language_t currentLanguage() const {
391 return fLanguage;
392 }
393private:
394 const char* fCurrent;
395 const char* fEnd;
396 hb_language_t fLanguage;
Ben Wagner8d45a382017-11-16 10:08:28 -0500397};
398
399class RunIteratorQueue {
400public:
401 void insert(RunIterator* runIterator) {
402 fRunIterators.insert(runIterator);
403 }
404
405 bool advanceRuns() {
406 const RunIterator* leastRun = fRunIterators.peek();
407 if (leastRun->atEnd()) {
408 SkASSERT(this->allRunsAreAtEnd());
409 return false;
410 }
411 const char* leastEnd = leastRun->endOfCurrentRun();
412 RunIterator* currentRun = nullptr;
413 SkDEBUGCODE(const char* previousEndOfCurrentRun);
414 while ((currentRun = fRunIterators.peek())->endOfCurrentRun() <= leastEnd) {
415 fRunIterators.pop();
416 SkDEBUGCODE(previousEndOfCurrentRun = currentRun->endOfCurrentRun());
417 currentRun->consume();
418 SkASSERT(previousEndOfCurrentRun < currentRun->endOfCurrentRun());
419 fRunIterators.insert(currentRun);
420 }
421 return true;
422 }
423
424 const char* endOfCurrentRun() const {
425 return fRunIterators.peek()->endOfCurrentRun();
426 }
427
428private:
429 bool allRunsAreAtEnd() const {
430 for (int i = 0; i < fRunIterators.count(); ++i) {
431 if (!fRunIterators.at(i)->atEnd()) {
432 return false;
433 }
434 }
435 return true;
436 }
437
438 static bool CompareRunIterator(RunIterator* const& a, RunIterator* const& b) {
439 return *a < *b;
440 }
441 SkTDPQueue<RunIterator*, CompareRunIterator> fRunIterators;
442};
443
444struct ShapedGlyph {
445 SkGlyphID fID;
446 uint32_t fCluster;
447 SkPoint fOffset;
448 SkVector fAdvance;
449 bool fMayLineBreakBefore;
450 bool fMustLineBreakBefore;
451 bool fHasVisual;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400452 bool fGraphemeBreakBefore;
453 bool fUnsafeToBreak;
Ben Wagner8d45a382017-11-16 10:08:28 -0500454};
455struct ShapedRun {
Mike Reed6d595682018-12-05 17:28:14 -0500456 ShapedRun(const char* utf8Start, const char* utf8End, int numGlyphs, const SkFont& font,
Ben Wagner8d45a382017-11-16 10:08:28 -0500457 UBiDiLevel level, std::unique_ptr<ShapedGlyph[]> glyphs)
Mike Reed6d595682018-12-05 17:28:14 -0500458 : fUtf8Start(utf8Start), fUtf8End(utf8End), fNumGlyphs(numGlyphs), fFont(font)
Ben Wagner8d45a382017-11-16 10:08:28 -0500459 , fLevel(level), fGlyphs(std::move(glyphs))
460 {}
461
462 const char* fUtf8Start;
463 const char* fUtf8End;
464 int fNumGlyphs;
Mike Reed6d595682018-12-05 17:28:14 -0500465 SkFont fFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500466 UBiDiLevel fLevel;
467 std::unique_ptr<ShapedGlyph[]> fGlyphs;
Florin Malita950243d2019-01-11 11:08:35 -0500468 SkVector fAdvance = { 0, 0 };
Ben Wagner8d45a382017-11-16 10:08:28 -0500469};
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400470struct ShapedLine {
471 SkTArray<ShapedRun> runs;
472 SkVector fAdvance = { 0, 0 };
473};
Ben Wagner8d45a382017-11-16 10:08:28 -0500474
475static constexpr bool is_LTR(UBiDiLevel level) {
476 return (level & 1) == 0;
477}
478
Florin Malita950243d2019-01-11 11:08:35 -0500479static void append(SkShaper::RunHandler* handler, const SkShaper::RunHandler::RunInfo& runInfo,
480 const ShapedRun& run, int start, int end,
Florin Malita9867f612018-12-12 10:54:49 -0500481 SkPoint* p) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500482 unsigned len = end - start;
Florin Malita9867f612018-12-12 10:54:49 -0500483
Florin Malita950243d2019-01-11 11:08:35 -0500484 const auto buffer = handler->newRunBuffer(runInfo, run.fFont, len, run.fUtf8End - run.fUtf8Start);
Florin Malita9867f612018-12-12 10:54:49 -0500485 SkASSERT(buffer.glyphs);
486 SkASSERT(buffer.positions);
487
488 if (buffer.utf8text) {
489 memcpy(buffer.utf8text, run.fUtf8Start, run.fUtf8End - run.fUtf8Start);
490 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500491
492 for (unsigned i = 0; i < len; i++) {
493 // Glyphs are in logical order, but output ltr since PDF readers seem to expect that.
494 const ShapedGlyph& glyph = run.fGlyphs[is_LTR(run.fLevel) ? start + i : end - 1 - i];
Florin Malita9867f612018-12-12 10:54:49 -0500495 buffer.glyphs[i] = glyph.fID;
496 buffer.positions[i] = SkPoint::Make(p->fX + glyph.fOffset.fX, p->fY - glyph.fOffset.fY);
497 if (buffer.clusters) {
498 buffer.clusters[i] = glyph.fCluster;
499 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500500 p->fX += glyph.fAdvance.fX;
501 p->fY += glyph.fAdvance.fY;
502 }
503}
504
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400505static void emit(const ShapedLine& line, SkShaper::RunHandler* handler,
506 SkPoint point, SkPoint& currentPoint, size_t& lineIndex)
507{
508 // Reorder the runs and glyphs per line and write them out.
509 SkScalar maxAscent = 0;
510 SkScalar maxDescent = 0;
511 SkScalar maxLeading = 0;
512 for (const ShapedRun& run : line.runs) {
513 SkFontMetrics metrics;
514 run.fFont.getMetrics(&metrics);
515 maxAscent = SkTMin(maxAscent, metrics.fAscent);
516 maxDescent = SkTMax(maxDescent, metrics.fDescent);
517 maxLeading = SkTMax(maxLeading, metrics.fLeading);
518 }
519
520 int numRuns = line.runs.size();
521 SkAutoSTMalloc<4, UBiDiLevel> runLevels(numRuns);
522 for (int i = 0; i < numRuns; ++i) {
523 runLevels[i] = line.runs[i].fLevel;
524 }
525 SkAutoSTMalloc<4, int32_t> logicalFromVisual(numRuns);
526 ubidi_reorderVisual(runLevels, numRuns, logicalFromVisual);
527
528 currentPoint.fY -= maxAscent;
529
530 for (int i = 0; i < numRuns; ++i) {
531 int logicalIndex = logicalFromVisual[i];
532
533 const auto& run = line.runs[logicalIndex];
534 const SkShaper::RunHandler::RunInfo info = {
535 lineIndex,
536 run.fAdvance,
537 maxAscent,
538 maxDescent,
539 maxLeading,
540 };
541 append(handler, info, run, 0, run.fNumGlyphs, &currentPoint);
542 }
543
544 currentPoint.fY += maxDescent + maxLeading;
545 currentPoint.fX = point.fX;
546
547 lineIndex++;
548}
549
Ben Wagner8d45a382017-11-16 10:08:28 -0500550struct ShapedRunGlyphIterator {
551 ShapedRunGlyphIterator(const SkTArray<ShapedRun>& origRuns)
552 : fRuns(&origRuns), fRunIndex(0), fGlyphIndex(0)
553 { }
554
555 ShapedRunGlyphIterator(const ShapedRunGlyphIterator& that) = default;
556 ShapedRunGlyphIterator& operator=(const ShapedRunGlyphIterator& that) = default;
557 bool operator==(const ShapedRunGlyphIterator& that) const {
558 return fRuns == that.fRuns &&
559 fRunIndex == that.fRunIndex &&
560 fGlyphIndex == that.fGlyphIndex;
561 }
562 bool operator!=(const ShapedRunGlyphIterator& that) const {
563 return fRuns != that.fRuns ||
564 fRunIndex != that.fRunIndex ||
565 fGlyphIndex != that.fGlyphIndex;
566 }
567
568 ShapedGlyph* next() {
569 const SkTArray<ShapedRun>& runs = *fRuns;
570 SkASSERT(fRunIndex < runs.count());
571 SkASSERT(fGlyphIndex < runs[fRunIndex].fNumGlyphs);
572
573 ++fGlyphIndex;
574 if (fGlyphIndex == runs[fRunIndex].fNumGlyphs) {
575 fGlyphIndex = 0;
576 ++fRunIndex;
577 if (fRunIndex >= runs.count()) {
578 return nullptr;
579 }
580 }
581 return &runs[fRunIndex].fGlyphs[fGlyphIndex];
582 }
583
584 ShapedGlyph* current() {
585 const SkTArray<ShapedRun>& runs = *fRuns;
586 if (fRunIndex >= runs.count()) {
587 return nullptr;
588 }
589 return &runs[fRunIndex].fGlyphs[fGlyphIndex];
590 }
591
592 const SkTArray<ShapedRun>* fRuns;
593 int fRunIndex;
594 int fGlyphIndex;
595};
596
597} // namespace
598
599struct SkShaper::Impl {
600 HBFont fHarfBuzzFont;
601 HBBuffer fBuffer;
602 sk_sp<SkTypeface> fTypeface;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400603 ICUBrk fLineBreakIterator;
604 ICUBrk fGraphemeBreakIterator;
605
606 SkPoint shapeCorrect(RunHandler* handler,
607 const char* utf8,
608 size_t utf8Bytes,
609 SkPoint point,
610 SkScalar width,
611 RunIteratorQueue& runSegmenter,
612 const BiDiRunIterator* bidi,
613 const LanguageRunIterator* language,
614 const ScriptRunIterator* script,
615 const FontRunIterator* font) const;
616
617 SkPoint shapeOk(RunHandler* handler,
618 const char* utf8,
619 size_t utf8Bytes,
620 SkPoint point,
621 SkScalar width,
622 RunIteratorQueue& runSegmenter,
623 const BiDiRunIterator* bidi,
624 const LanguageRunIterator* language,
625 const ScriptRunIterator* script,
626 const FontRunIterator* font) const;
627
628 ShapedRun shape(const char* utf8,
629 size_t utf8Bytes,
630 const char* utf8Start,
631 const char* utf8End,
632 const BiDiRunIterator* bidi,
633 const LanguageRunIterator* language,
634 const ScriptRunIterator* script,
635 const FontRunIterator* font) const;
Ben Wagner8d45a382017-11-16 10:08:28 -0500636};
637
Ben Wagnere0001732017-08-31 16:26:26 -0400638SkShaper::SkShaper(sk_sp<SkTypeface> tf) : fImpl(new Impl) {
Hal Canary0e07ad72018-02-08 13:06:56 -0500639 SkOnce once;
640 once([] { SkLoadICU(); });
641
Ben Wagnere0001732017-08-31 16:26:26 -0400642 fImpl->fTypeface = tf ? std::move(tf) : SkTypeface::MakeDefault();
643 fImpl->fHarfBuzzFont = create_hb_font(fImpl->fTypeface.get());
Florin Malitaa4e1a632019-01-22 16:27:01 -0500644 if (!fImpl->fHarfBuzzFont) {
645 SkDebugf("create_hb_font failed!\n");
646 }
Ben Wagnera25fbef2017-08-30 13:56:19 -0400647 fImpl->fBuffer.reset(hb_buffer_create());
Ben Wagner8d45a382017-11-16 10:08:28 -0500648 SkASSERT(fImpl->fBuffer);
649
Ben Wagner8d45a382017-11-16 10:08:28 -0500650 UErrorCode status = U_ZERO_ERROR;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400651 fImpl->fLineBreakIterator.reset(ubrk_open(UBRK_LINE, "th", nullptr, 0, &status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500652 if (U_FAILURE(status)) {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400653 SkDebugf("Could not create line break iterator: %s", u_errorName(status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500654 SK_ABORT("");
655 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400656
657 fImpl->fGraphemeBreakIterator.reset(ubrk_open(UBRK_CHARACTER, "th", nullptr, 0, &status));
658 if (U_FAILURE(status)) {
659 SkDebugf("Could not create grapheme break iterator: %s", u_errorName(status));
660 SK_ABORT("");
661 }
662
Ben Wagnera25fbef2017-08-30 13:56:19 -0400663}
664
665SkShaper::~SkShaper() {}
666
Ben Wagner8d45a382017-11-16 10:08:28 -0500667bool SkShaper::good() const {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400668 return fImpl->fBuffer &&
669 fImpl->fLineBreakIterator &&
670 fImpl->fGraphemeBreakIterator;
Ben Wagner8d45a382017-11-16 10:08:28 -0500671}
Ben Wagnera25fbef2017-08-30 13:56:19 -0400672
Florin Malita950243d2019-01-11 11:08:35 -0500673SkPoint SkShaper::shape(RunHandler* handler,
Kevin Lubick57abfe92019-01-28 13:15:51 -0500674 const SkFont& srcFont,
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500675 const char* utf8,
676 size_t utf8Bytes,
677 bool leftToRight,
678 SkPoint point,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400679 SkScalar width) const
Ben Wagner8d45a382017-11-16 10:08:28 -0500680{
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400681 SkASSERT(handler);
682 sk_sp<SkFontMgr> fontMgr = SkFontMgr::RefDefault();
683 UBiDiLevel defaultLevel = leftToRight ? UBIDI_DEFAULT_LTR : UBIDI_DEFAULT_RTL;
684
Ben Wagner8d45a382017-11-16 10:08:28 -0500685 RunIteratorQueue runSegmenter;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400686
Ben Wagner8d45a382017-11-16 10:08:28 -0500687 SkTLazy<BiDiRunIterator> maybeBidi(BiDiRunIterator::Make(utf8, utf8Bytes, defaultLevel));
688 BiDiRunIterator* bidi = maybeBidi.getMaybeNull();
689 if (!bidi) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500690 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400691 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500692 runSegmenter.insert(bidi);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400693
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400694 SkTLazy<LanguageRunIterator> maybeLanguage(LanguageRunIterator::Make(utf8, utf8Bytes));
695 LanguageRunIterator* language = maybeLanguage.getMaybeNull();
696 if (!language) {
697 return point;
698 }
699 runSegmenter.insert(language);
700
Ben Wagner8d45a382017-11-16 10:08:28 -0500701 hb_unicode_funcs_t* hbUnicode = hb_buffer_get_unicode_funcs(fImpl->fBuffer.get());
702 SkTLazy<ScriptRunIterator> maybeScript(ScriptRunIterator::Make(utf8, utf8Bytes, hbUnicode));
703 ScriptRunIterator* script = maybeScript.getMaybeNull();
704 if (!script) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500705 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400706 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500707 runSegmenter.insert(script);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400708
Ben Wagner8d45a382017-11-16 10:08:28 -0500709 SkTLazy<FontRunIterator> maybeFont(FontRunIterator::Make(utf8, utf8Bytes,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400710 srcFont, std::move(fontMgr)));
Ben Wagner8d45a382017-11-16 10:08:28 -0500711 FontRunIterator* font = maybeFont.getMaybeNull();
712 if (!font) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500713 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400714 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500715 runSegmenter.insert(font);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400716
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400717 if (true) {
718 return fImpl->shapeCorrect(handler, utf8, utf8Bytes, point, width,
719 runSegmenter, bidi, language, script, font);
720 } else {
721 return fImpl->shapeOk(handler, utf8, utf8Bytes, point, width,
722 runSegmenter, bidi, language, script, font);
723 }
724}
725
726SkPoint SkShaper::Impl::shapeCorrect(RunHandler* handler,
727 const char* utf8,
728 size_t utf8Bytes,
729 SkPoint point,
730 SkScalar width,
731 RunIteratorQueue& runSegmenter,
732 const BiDiRunIterator* bidi,
733 const LanguageRunIterator* language,
734 const ScriptRunIterator* script,
735 const FontRunIterator* font) const
736{
737 ShapedLine line;
738 size_t lineIndex = 0;
739 SkPoint currentPoint = point;
740
741 const char* utf8Start = nullptr;
742 const char* utf8End = utf8;
743 while (runSegmenter.advanceRuns()) { // For each item
744 utf8Start = utf8End;
745 utf8End = runSegmenter.endOfCurrentRun();
746
747 ShapedRun model(nullptr, nullptr, 0, SkFont(), 0, nullptr);
748 bool modelNeedsRegenerated = true;
749 int modelOffset = 0;
750
751 struct TextProps {
752 int glyphLen = 0;
753 SkVector advance = {0, 0};
754 };
755 // map from character position to [safe to break, glyph position, advance]
756 std::unique_ptr<TextProps[]> modelText;
757 int modelTextOffset = 0;
758 SkVector modelTextAdvanceOffset = {0, 0};
759
760 while (utf8Start < utf8End) { // While there are still code points left in this item
761 size_t utf8runLength = utf8End - utf8Start;
762 if (modelNeedsRegenerated) {
763 model = shape(utf8, utf8Bytes,
764 utf8Start, utf8End,
765 bidi, language, script, font);
766 modelOffset = 0;
767
768 SkVector advance = {0, 0};
769 modelText.reset(new TextProps[utf8runLength + 1]());
770 for (int i = 0; i < model.fNumGlyphs; ++i) {
771 SkASSERT(model.fGlyphs[i].fCluster < utf8runLength);
772 if (!model.fGlyphs[i].fUnsafeToBreak) {
773 modelText[model.fGlyphs[i].fCluster].glyphLen = i;
774 modelText[model.fGlyphs[i].fCluster].advance = advance;
775 }
776 advance += model.fGlyphs[i].fAdvance;
777 }
778 // Assume it is always safe to break after the end of an item
779 modelText[utf8runLength].glyphLen = model.fNumGlyphs;
780 modelText[utf8runLength].advance = model.fAdvance;
781 modelTextOffset = 0;
782 modelTextAdvanceOffset = {0, 0};
783 modelNeedsRegenerated = false;
784 }
785
786 // TODO: break iterator per item, but just reset position if needed?
787 // Maybe break iterator with model?
788 UBreakIterator& breakIterator = *fLineBreakIterator;
789 {
790 UErrorCode status = U_ZERO_ERROR;
791 UText utf8UText = UTEXT_INITIALIZER;
792 utext_openUTF8(&utf8UText, utf8Start, utf8runLength, &status);
793 std::unique_ptr<UText, SkFunctionWrapper<UText*, UText, utext_close>> autoClose(&utf8UText);
794 if (U_FAILURE(status)) {
795 SkDebugf("Could not create utf8UText: %s", u_errorName(status));
796 return point;
797 }
798 ubrk_setUText(&breakIterator, &utf8UText, &status);
799 if (U_FAILURE(status)) {
800 SkDebugf("Could not setText on break iterator: %s", u_errorName(status));
801 return point;
802 }
803 }
804
805 ShapedRun best(nullptr, nullptr, 0, SkFont(), 0, nullptr);
806 best.fAdvance = { SK_ScalarNegativeInfinity, SK_ScalarNegativeInfinity };
807 SkScalar widthLeft = width - line.fAdvance.fX;
808
809 for (int32_t breakIteratorCurrent = ubrk_next(&breakIterator);
810 breakIteratorCurrent != UBRK_DONE;
811 breakIteratorCurrent = ubrk_next(&breakIterator))
812 {
813 // TODO: if past a safe to break, future safe to break will be at least as long
814
815 // TODO: adjust breakIteratorCurrent by ignorable whitespace
816 ShapedRun candidate = modelText[breakIteratorCurrent + modelTextOffset].glyphLen
817 ? ShapedRun(utf8Start, utf8Start + breakIteratorCurrent,
818 modelText[breakIteratorCurrent + modelTextOffset].glyphLen - modelOffset,
819 *font->currentFont(),
820 bidi->currentLevel(),
821 std::unique_ptr<ShapedGlyph[]>())
822 : shape(utf8, utf8Bytes,
823 utf8Start, utf8Start + breakIteratorCurrent,
824 bidi, language, script, font);
825 if (!candidate.fUtf8Start) {
826 //report error
827 return point;
828 }
829 if (!candidate.fGlyphs) {
830 candidate.fAdvance = modelText[breakIteratorCurrent + modelTextOffset].advance - modelTextAdvanceOffset;
831 }
832 auto score = [widthLeft](const ShapedRun& run) -> SkScalar {
833 if (run.fAdvance.fX < widthLeft) {
834 if (run.fUtf8Start == nullptr) {
835 return SK_ScalarNegativeInfinity;
836 } else {
837 return run.fUtf8End - run.fUtf8Start;
838 }
839 } else {
840 return widthLeft - run.fAdvance.fX;
841 }
842 };
843 if (score(best) < score(candidate)) {
844 best = std::move(candidate);
845 }
846 }
847
848 // If nothing fit (best score is negative) and the line is not empty
849 if (width < line.fAdvance.fX + best.fAdvance.fX && !line.runs.empty()) {
850 emit(line, handler, point, currentPoint, lineIndex);
851 line.runs.reset();
852 line.fAdvance = {0, 0};
853 } else {
854 if (!best.fGlyphs) {
855 best.fGlyphs.reset(new ShapedGlyph[best.fNumGlyphs]);
856 memcpy(best.fGlyphs.get(), model.fGlyphs.get() + modelOffset,
857 best.fNumGlyphs * sizeof(ShapedGlyph));
858 modelOffset += best.fNumGlyphs;
859 modelTextOffset += best.fUtf8End - best.fUtf8Start;
860 modelTextAdvanceOffset += best.fAdvance;
861 } else {
862 modelNeedsRegenerated = true;
863 }
864 utf8Start = best.fUtf8End;
865 line.fAdvance += best.fAdvance;
866 line.runs.emplace_back(std::move(best));
867
868 // If item broken, emit line (prevent remainder from accidentally fitting)
869 if (utf8Start != utf8End) {
870 emit(line, handler, point, currentPoint, lineIndex);
871 line.runs.reset();
872 line.fAdvance = {0, 0};
873 }
874 }
875 }
876 }
877 emit(line, handler, point, currentPoint, lineIndex);
878 return currentPoint;
879}
880
881SkPoint SkShaper::Impl::shapeOk(RunHandler* handler,
882 const char* utf8,
883 size_t utf8Bytes,
884 SkPoint point,
885 SkScalar width,
886 RunIteratorQueue& runSegmenter,
887 const BiDiRunIterator* bidi,
888 const LanguageRunIterator* language,
889 const ScriptRunIterator* script,
890 const FontRunIterator* font) const
891{
892 SkTArray<ShapedRun> runs;
893{
894 UBreakIterator& lineBreakIterator = *fLineBreakIterator;
895 UBreakIterator& graphemeBreakIterator = *fGraphemeBreakIterator;
Ben Wagner8d45a382017-11-16 10:08:28 -0500896 {
897 UErrorCode status = U_ZERO_ERROR;
898 UText utf8UText = UTEXT_INITIALIZER;
899 utext_openUTF8(&utf8UText, utf8, utf8Bytes, &status);
900 std::unique_ptr<UText, SkFunctionWrapper<UText*, UText, utext_close>> autoClose(&utf8UText);
901 if (U_FAILURE(status)) {
902 SkDebugf("Could not create utf8UText: %s", u_errorName(status));
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500903 return point;
Ben Wagner8d45a382017-11-16 10:08:28 -0500904 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400905
906 ubrk_setUText(&lineBreakIterator, &utf8UText, &status);
Ben Wagner8d45a382017-11-16 10:08:28 -0500907 if (U_FAILURE(status)) {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400908 SkDebugf("Could not setText on line break iterator: %s", u_errorName(status));
909 return point;
910 }
911 ubrk_setUText(&graphemeBreakIterator, &utf8UText, &status);
912 if (U_FAILURE(status)) {
913 SkDebugf("Could not setText on grapheme break iterator: %s", u_errorName(status));
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500914 return point;
Ben Wagner8d45a382017-11-16 10:08:28 -0500915 }
Ben Wagnera25fbef2017-08-30 13:56:19 -0400916 }
917
Ben Wagner8d45a382017-11-16 10:08:28 -0500918 const char* utf8Start = nullptr;
919 const char* utf8End = utf8;
920 while (runSegmenter.advanceRuns()) {
921 utf8Start = utf8End;
922 utf8End = runSegmenter.endOfCurrentRun();
923
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400924 runs.emplace_back(shape(utf8, utf8Bytes,
925 utf8Start, utf8End,
926 bidi, language, script, font));
927 ShapedRun& run = runs.back();
Ben Wagnera25fbef2017-08-30 13:56:19 -0400928
Ben Wagner8d45a382017-11-16 10:08:28 -0500929 int32_t clusterOffset = utf8Start - utf8;
930 uint32_t previousCluster = 0xFFFFFFFF;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400931 for (int i = 0; i < run.fNumGlyphs; ++i) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500932 ShapedGlyph& glyph = run.fGlyphs[i];
933 int32_t glyphCluster = glyph.fCluster + clusterOffset;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400934
935 int32_t lineBreakIteratorCurrent = ubrk_current(&lineBreakIterator);
936 while (lineBreakIteratorCurrent != UBRK_DONE &&
937 lineBreakIteratorCurrent < glyphCluster)
Ben Wagner8d45a382017-11-16 10:08:28 -0500938 {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400939 lineBreakIteratorCurrent = ubrk_next(&lineBreakIterator);
Ben Wagner2868b782017-08-31 14:12:27 -0400940 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500941 glyph.fMayLineBreakBefore = glyph.fCluster != previousCluster &&
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400942 lineBreakIteratorCurrent == glyphCluster;
943
944 int32_t graphemeBreakIteratorCurrent = ubrk_current(&graphemeBreakIterator);
945 while (graphemeBreakIteratorCurrent != UBRK_DONE &&
946 graphemeBreakIteratorCurrent < glyphCluster)
947 {
948 graphemeBreakIteratorCurrent = ubrk_next(&graphemeBreakIterator);
949 }
950 glyph.fGraphemeBreakBefore = glyph.fCluster != previousCluster &&
951 graphemeBreakIteratorCurrent == glyphCluster;
952
Ben Wagner8d45a382017-11-16 10:08:28 -0500953 previousCluster = glyph.fCluster;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400954 }
955 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500956}
957
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400958// Iterate over the glyphs in logical order to find potential line lengths.
Ben Wagner8d45a382017-11-16 10:08:28 -0500959{
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400960 /** The position of the beginning of the line. */
961 ShapedRunGlyphIterator beginning(runs);
962
963 /** The position of the candidate line break. */
964 ShapedRunGlyphIterator candidateLineBreak(runs);
965 SkScalar candidateLineBreakWidth = 0;
966
967 /** The position of the candidate grapheme break. */
968 ShapedRunGlyphIterator candidateGraphemeBreak(runs);
969 SkScalar candidateGraphemeBreakWidth = 0;
970
971 /** The position of the current location. */
972 ShapedRunGlyphIterator current(runs);
973 SkScalar currentWidth = 0;
974 while (ShapedGlyph* glyph = current.current()) {
975 // 'Break' at graphemes until a line boundary, then only at line boundaries.
976 // Only break at graphemes if no line boundary is valid.
977 if (current != beginning) {
978 if (glyph->fGraphemeBreakBefore || glyph->fMayLineBreakBefore) {
979 // TODO: preserve line breaks <= grapheme breaks
980 // and prevent line breaks inside graphemes
981 candidateGraphemeBreak = current;
982 candidateGraphemeBreakWidth = currentWidth;
983 if (glyph->fMayLineBreakBefore) {
984 candidateLineBreak = current;
985 candidateLineBreakWidth = currentWidth;
986 }
987 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500988 }
989
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400990 SkScalar glyphWidth = glyph->fAdvance.fX;
991 // Break when overwidth, the glyph has a visual representation, and some space is used.
992 if (width < currentWidth + glyphWidth && glyph->fHasVisual && candidateGraphemeBreakWidth > 0){
993 if (candidateLineBreak != beginning) {
994 beginning = candidateLineBreak;
995 currentWidth -= candidateLineBreakWidth;
996 candidateGraphemeBreakWidth -= candidateLineBreakWidth;
997 candidateLineBreakWidth = 0;
998 } else if (candidateGraphemeBreak != beginning) {
999 beginning = candidateGraphemeBreak;
1000 candidateLineBreak = beginning;
1001 currentWidth -= candidateGraphemeBreakWidth;
1002 candidateGraphemeBreakWidth = 0;
1003 candidateLineBreakWidth = 0;
1004 } else {
1005 SK_ABORT("");
1006 }
1007
1008 if (width < currentWidth) {
1009 if (width < candidateGraphemeBreakWidth) {
1010 candidateGraphemeBreak = candidateLineBreak;
1011 candidateGraphemeBreakWidth = candidateLineBreakWidth;
1012 }
1013 current = candidateGraphemeBreak;
1014 currentWidth = candidateGraphemeBreakWidth;
1015 }
1016
1017 glyph = beginning.current();
1018 if (glyph) {
1019 glyph->fMustLineBreakBefore = true;
1020 }
1021
1022 } else {
1023 current.next();
1024 currentWidth += glyphWidth;
Ben Wagner8d45a382017-11-16 10:08:28 -05001025 }
Ben Wagner8d45a382017-11-16 10:08:28 -05001026 }
1027}
1028
1029// Reorder the runs and glyphs per line and write them out.
Ben Wagner5d4dd8b2018-01-25 14:37:17 -05001030 SkPoint currentPoint = point;
Ben Wagner8d45a382017-11-16 10:08:28 -05001031{
1032 ShapedRunGlyphIterator previousBreak(runs);
1033 ShapedRunGlyphIterator glyphIterator(runs);
1034 SkScalar maxAscent = 0;
1035 SkScalar maxDescent = 0;
1036 SkScalar maxLeading = 0;
1037 int previousRunIndex = -1;
Florin Malita950243d2019-01-11 11:08:35 -05001038 size_t lineIndex = 0;
Ben Wagner8d45a382017-11-16 10:08:28 -05001039 while (glyphIterator.current()) {
1040 int runIndex = glyphIterator.fRunIndex;
1041 int glyphIndex = glyphIterator.fGlyphIndex;
1042 ShapedGlyph* nextGlyph = glyphIterator.next();
1043
1044 if (previousRunIndex != runIndex) {
Mike Reedb5784ac2018-11-12 09:35:15 -05001045 SkFontMetrics metrics;
Mike Reed6d595682018-12-05 17:28:14 -05001046 runs[runIndex].fFont.getMetrics(&metrics);
Ben Wagner8d45a382017-11-16 10:08:28 -05001047 maxAscent = SkTMin(maxAscent, metrics.fAscent);
1048 maxDescent = SkTMax(maxDescent, metrics.fDescent);
1049 maxLeading = SkTMax(maxLeading, metrics.fLeading);
1050 previousRunIndex = runIndex;
1051 }
1052
1053 // Nothing can be written until the baseline is known.
1054 if (!(nextGlyph == nullptr || nextGlyph->fMustLineBreakBefore)) {
1055 continue;
1056 }
1057
1058 currentPoint.fY -= maxAscent;
1059
1060 int numRuns = runIndex - previousBreak.fRunIndex + 1;
1061 SkAutoSTMalloc<4, UBiDiLevel> runLevels(numRuns);
1062 for (int i = 0; i < numRuns; ++i) {
1063 runLevels[i] = runs[previousBreak.fRunIndex + i].fLevel;
1064 }
1065 SkAutoSTMalloc<4, int32_t> logicalFromVisual(numRuns);
1066 ubidi_reorderVisual(runLevels, numRuns, logicalFromVisual);
1067
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001068 // step through the runs in reverse visual order and the glyphs in reverse logical order
1069 // until a visible glyph is found and force them to the end of the visual line.
1070
Ben Wagner8d45a382017-11-16 10:08:28 -05001071 for (int i = 0; i < numRuns; ++i) {
1072 int logicalIndex = previousBreak.fRunIndex + logicalFromVisual[i];
1073
1074 int startGlyphIndex = (logicalIndex == previousBreak.fRunIndex)
1075 ? previousBreak.fGlyphIndex
1076 : 0;
1077 int endGlyphIndex = (logicalIndex == runIndex)
1078 ? glyphIndex + 1
1079 : runs[logicalIndex].fNumGlyphs;
Florin Malita950243d2019-01-11 11:08:35 -05001080
1081 const auto& run = runs[logicalIndex];
1082 const RunHandler::RunInfo info = {
1083 lineIndex,
1084 run.fAdvance,
1085 maxAscent,
1086 maxDescent,
1087 maxLeading,
1088 };
1089 append(handler, info, run, startGlyphIndex, endGlyphIndex, &currentPoint);
Ben Wagner8d45a382017-11-16 10:08:28 -05001090 }
1091
1092 currentPoint.fY += maxDescent + maxLeading;
1093 currentPoint.fX = point.fX;
1094 maxAscent = 0;
1095 maxDescent = 0;
1096 maxLeading = 0;
1097 previousRunIndex = -1;
Florin Malita950243d2019-01-11 11:08:35 -05001098 ++lineIndex;
Ben Wagner8d45a382017-11-16 10:08:28 -05001099 previousBreak = glyphIterator;
1100 }
1101}
1102
Ben Wagner5d4dd8b2018-01-25 14:37:17 -05001103 return currentPoint;
Ben Wagnera25fbef2017-08-30 13:56:19 -04001104}
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001105
1106
1107ShapedRun SkShaper::Impl::shape(const char* utf8,
1108 size_t utf8Bytes,
1109 const char* utf8Start,
1110 const char* utf8End,
1111 const BiDiRunIterator* bidi,
1112 const LanguageRunIterator* language,
1113 const ScriptRunIterator* script,
1114 const FontRunIterator* font) const
1115{
1116 ShapedRun run(nullptr, nullptr, 0, SkFont(), 0, nullptr);
1117
1118 hb_buffer_t* buffer = fBuffer.get();
1119 SkAutoTCallVProc<hb_buffer_t, hb_buffer_clear_contents> autoClearBuffer(buffer);
1120 hb_buffer_set_content_type(buffer, HB_BUFFER_CONTENT_TYPE_UNICODE);
1121 hb_buffer_set_cluster_level(buffer, HB_BUFFER_CLUSTER_LEVEL_MONOTONE_CHARACTERS);
1122
1123 // Add precontext.
1124 hb_buffer_add_utf8(buffer, utf8, utf8Start - utf8, utf8Start - utf8, 0);
1125
1126 // Populate the hb_buffer directly with utf8 cluster indexes.
1127 const char* utf8Current = utf8Start;
1128 while (utf8Current < utf8End) {
1129 unsigned int cluster = utf8Current - utf8Start;
1130 hb_codepoint_t u = utf8_next(&utf8Current, utf8End);
1131 hb_buffer_add(buffer, u, cluster);
1132 }
1133
1134 // Add postcontext.
1135 hb_buffer_add_utf8(buffer, utf8Current, utf8 + utf8Bytes - utf8Current, 0, 0);
1136
1137 size_t utf8runLength = utf8End - utf8Start;
1138 if (!SkTFitsIn<int>(utf8runLength)) {
1139 SkDebugf("Shaping error: utf8 too long");
1140 return run;
1141 }
1142 hb_direction_t direction = is_LTR(bidi->currentLevel()) ? HB_DIRECTION_LTR:HB_DIRECTION_RTL;
1143 hb_buffer_set_direction(buffer, direction);
1144 hb_buffer_set_script(buffer, script->currentScript());
1145 hb_buffer_set_language(buffer, language->currentLanguage());
1146 hb_buffer_guess_segment_properties(buffer);
1147 // TODO: features
1148 if (!font->currentHBFont()) {
1149 return run;
1150 }
1151 hb_shape(font->currentHBFont(), buffer, nullptr, 0);
1152 unsigned len = hb_buffer_get_length(buffer);
1153 if (len == 0) {
1154 // TODO: this isn't an error, make it look different
1155 return run;
1156 }
1157
1158 if (direction == HB_DIRECTION_RTL) {
1159 // Put the clusters back in logical order.
1160 // Note that the advances remain ltr.
1161 hb_buffer_reverse(buffer);
1162 }
1163 hb_glyph_info_t* info = hb_buffer_get_glyph_infos(buffer, nullptr);
1164 hb_glyph_position_t* pos = hb_buffer_get_glyph_positions(buffer, nullptr);
1165
1166 if (!SkTFitsIn<int>(len)) {
1167 SkDebugf("Shaping error: too many glyphs");
1168 return run;
1169 }
1170
1171 run = ShapedRun(utf8Start, utf8End, len, *font->currentFont(),
1172 bidi->currentLevel(),
1173 std::unique_ptr<ShapedGlyph[]>(new ShapedGlyph[len]));
1174 int scaleX, scaleY;
1175 hb_font_get_scale(font->currentHBFont(), &scaleX, &scaleY);
1176 double textSizeY = run.fFont.getSize() / scaleY;
1177 double textSizeX = run.fFont.getSize() / scaleX * run.fFont.getScaleX();
1178 SkVector runAdvance = { 0, 0 };
1179 for (unsigned i = 0; i < len; i++) {
1180 ShapedGlyph& glyph = run.fGlyphs[i];
1181 glyph.fID = info[i].codepoint;
1182 glyph.fCluster = info[i].cluster;
1183 glyph.fOffset.fX = pos[i].x_offset * textSizeX;
1184 glyph.fOffset.fY = pos[i].y_offset * textSizeY;
1185 glyph.fAdvance.fX = pos[i].x_advance * textSizeX;
1186 glyph.fAdvance.fY = pos[i].y_advance * textSizeY;
1187
1188 SkRect bounds;
1189 SkScalar advance;
1190 SkPaint p;
1191 run.fFont.getWidthsBounds(&glyph.fID, 1, &advance, &bounds, &p);
1192 glyph.fHasVisual = !bounds.isEmpty(); //!font->currentTypeface()->glyphBoundsAreZero(glyph.fID);
1193 glyph.fUnsafeToBreak = info[i].mask & HB_GLYPH_FLAG_UNSAFE_TO_BREAK;
1194 glyph.fMustLineBreakBefore = false;
1195
1196 runAdvance += glyph.fAdvance;
1197 }
1198 run.fAdvance = runAdvance;
1199
1200 return run;
1201}