blob: a74d0c07af931817afc0434208c77cd12e67ceed [file] [log] [blame]
Ben Wagnera25fbef2017-08-30 13:56:19 -04001/*
2 * Copyright 2016 Google Inc.
3 *
4 * Use of this source code is governed by a BSD-style license that can be
5 * found in the LICENSE file.
6 */
7
Ben Wagner2fc14742019-02-06 16:37:44 -05008#include "SkBitmaskEnum.h"
Hal Canary61021922019-02-06 12:29:11 -05009#include "SkFont.h"
Ben Wagner17774242018-08-07 14:31:33 -040010#include "SkFontArguments.h"
Hal Canary61021922019-02-06 12:29:11 -050011#include "SkFontMetrics.h"
Ben Wagner67e3a302017-09-05 14:46:19 -040012#include "SkFontMgr.h"
Ben Wagner17774242018-08-07 14:31:33 -040013#include "SkMalloc.h"
Ben Wagner17774242018-08-07 14:31:33 -040014#include "SkPoint.h"
15#include "SkRefCnt.h"
16#include "SkScalar.h"
Ben Wagnera25fbef2017-08-30 13:56:19 -040017#include "SkShaper.h"
18#include "SkStream.h"
Ben Wagner17774242018-08-07 14:31:33 -040019#include "SkString.h"
20#include "SkTArray.h"
Ben Wagner8d45a382017-11-16 10:08:28 -050021#include "SkTDPQueue.h"
Ben Wagner17774242018-08-07 14:31:33 -040022#include "SkTFitsIn.h"
Ben Wagner8d45a382017-11-16 10:08:28 -050023#include "SkTLazy.h"
Ben Wagnere0001732017-08-31 16:26:26 -040024#include "SkTemplates.h"
Hal Canaryc640d0d2018-06-13 09:59:02 -040025#include "SkTo.h"
Ben Wagnera25fbef2017-08-30 13:56:19 -040026#include "SkTypeface.h"
Ben Wagner17774242018-08-07 14:31:33 -040027#include "SkTypes.h"
28#include "SkUTF.h"
29
30#include <hb.h>
31#include <hb-ot.h>
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050032#include <unicode/ubrk.h>
Ben Wagner17774242018-08-07 14:31:33 -040033#include <unicode/ubidi.h>
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050034#include <unicode/ustring.h>
Ben Wagner17774242018-08-07 14:31:33 -040035#include <unicode/urename.h>
36#include <unicode/utext.h>
37#include <unicode/utypes.h>
38
Ben Wagner0ec8ec22018-09-04 18:17:13 -040039#include <cstring>
40#include <locale>
Ben Wagner17774242018-08-07 14:31:33 -040041#include <memory>
42#include <utility>
Ben Wagnera25fbef2017-08-30 13:56:19 -040043
Hal Canary61021922019-02-06 12:29:11 -050044#if defined(SK_USING_THIRD_PARTY_ICU)
Hal Canary32498f02019-02-04 15:36:31 -050045#include "SkLoadICU.h"
Hal Canary61021922019-02-06 12:29:11 -050046#endif
Hal Canary32498f02019-02-04 15:36:31 -050047
Ben Wagner2fc14742019-02-06 16:37:44 -050048namespace skstd {
49template <> struct is_bitmask_enum<hb_buffer_flags_t> : std::true_type {};
50}
51
Ben Wagnera25fbef2017-08-30 13:56:19 -040052namespace {
53template <class T, void(*P)(T*)> using resource = std::unique_ptr<T, SkFunctionWrapper<void, T, P>>;
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050054using HBBlob = resource<hb_blob_t , hb_blob_destroy >;
55using HBFace = resource<hb_face_t , hb_face_destroy >;
56using HBFont = resource<hb_font_t , hb_font_destroy >;
57using HBBuffer = resource<hb_buffer_t , hb_buffer_destroy>;
58using ICUBiDi = resource<UBiDi , ubidi_close >;
Ben Wagner0ec8ec22018-09-04 18:17:13 -040059using ICUBrk = resource<UBreakIterator, ubrk_close >;
Ben Wagnera25fbef2017-08-30 13:56:19 -040060
61HBBlob stream_to_blob(std::unique_ptr<SkStreamAsset> asset) {
62 size_t size = asset->getLength();
63 HBBlob blob;
64 if (const void* base = asset->getMemoryBase()) {
65 blob.reset(hb_blob_create((char*)base, SkToUInt(size),
66 HB_MEMORY_MODE_READONLY, asset.release(),
67 [](void* p) { delete (SkStreamAsset*)p; }));
68 } else {
69 // SkDebugf("Extra SkStreamAsset copy\n");
70 void* ptr = size ? sk_malloc_throw(size) : nullptr;
71 asset->read(ptr, size);
72 blob.reset(hb_blob_create((char*)ptr, SkToUInt(size),
73 HB_MEMORY_MODE_READONLY, ptr, sk_free));
74 }
75 SkASSERT(blob);
76 hb_blob_make_immutable(blob.get());
77 return blob;
78}
Ben Wagnera25fbef2017-08-30 13:56:19 -040079
Ben Wagner8d45a382017-11-16 10:08:28 -050080HBFont create_hb_font(SkTypeface* tf) {
Hal Canary0dfa2082018-10-31 13:02:49 -040081 if (!tf) {
82 return nullptr;
83 }
Ben Wagnera25fbef2017-08-30 13:56:19 -040084 int index;
Hal Canaryddef43f2018-11-16 10:53:51 -050085 std::unique_ptr<SkStreamAsset> typefaceAsset(tf->openStream(&index));
86 if (!typefaceAsset) {
87 SkString name;
88 tf->getFamilyName(&name);
89 SkDebugf("Typeface '%s' has no data :(\n", name.c_str());
90 return nullptr;
91 }
92 HBBlob blob(stream_to_blob(std::move(typefaceAsset)));
Ben Wagnera25fbef2017-08-30 13:56:19 -040093 HBFace face(hb_face_create(blob.get(), (unsigned)index));
94 SkASSERT(face);
95 if (!face) {
Ben Wagnere0001732017-08-31 16:26:26 -040096 return nullptr;
Ben Wagnera25fbef2017-08-30 13:56:19 -040097 }
98 hb_face_set_index(face.get(), (unsigned)index);
Ben Wagnere0001732017-08-31 16:26:26 -040099 hb_face_set_upem(face.get(), tf->getUnitsPerEm());
Ben Wagnera25fbef2017-08-30 13:56:19 -0400100
Ben Wagnere0001732017-08-31 16:26:26 -0400101 HBFont font(hb_font_create(face.get()));
102 SkASSERT(font);
103 if (!font) {
104 return nullptr;
105 }
Ben Wagnere0001732017-08-31 16:26:26 -0400106 hb_ot_font_set_funcs(font.get());
107 int axis_count = tf->getVariationDesignPosition(nullptr, 0);
108 if (axis_count > 0) {
109 SkAutoSTMalloc<4, SkFontArguments::VariationPosition::Coordinate> axis_values(axis_count);
110 if (tf->getVariationDesignPosition(axis_values, axis_count) == axis_count) {
111 hb_font_set_variations(font.get(),
112 reinterpret_cast<hb_variation_t*>(axis_values.get()),
113 axis_count);
114 }
115 }
116 return font;
117}
118
Hal Canaryf107a2f2018-07-25 16:52:48 -0400119/** this version replaces invalid utf-8 sequences with code point U+FFFD. */
120static inline SkUnichar utf8_next(const char** ptr, const char* end) {
121 SkUnichar val = SkUTF::NextUTF8(ptr, end);
122 if (val < 0) {
123 return 0xFFFD; // REPLACEMENT CHARACTER
124 }
125 return val;
126}
127
/**
 *  Interface for an object that walks utf8 text one run at a time.
 *  Iterators are ordered by where their current run ends.
 */
class RunIterator {
public:
    virtual ~RunIterator() = default;

    /** Moves on to the next run. */
    virtual void consume() = 0;

    /** Pointer one past the last (utf8) element in the current run. */
    virtual const char* endOfCurrentRun() const = 0;

    /** True once the iterator has no further runs to produce. */
    virtual bool atEnd() const = 0;

    /** Orders iterators by the end of their current run. */
    bool operator<(const RunIterator& that) const {
        const char* const mine = this->endOfCurrentRun();
        const char* const theirs = that.endOfCurrentRun();
        return mine < theirs;
    }
};
139
140class BiDiRunIterator : public RunIterator {
141public:
142 static SkTLazy<BiDiRunIterator> Make(const char* utf8, size_t utf8Bytes, UBiDiLevel level) {
143 SkTLazy<BiDiRunIterator> ret;
144
145 // ubidi only accepts utf16 (though internally it basically works on utf32 chars).
146 // We want an ubidi_setPara(UBiDi*, UText*, UBiDiLevel, UBiDiLevel*, UErrorCode*);
147 if (!SkTFitsIn<int32_t>(utf8Bytes)) {
148 SkDebugf("Bidi error: text too long");
149 return ret;
150 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500151
152 UErrorCode status = U_ZERO_ERROR;
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -0500153
154 // Getting the length like this seems to always set U_BUFFER_OVERFLOW_ERROR
155 int32_t utf16Units;
156 u_strFromUTF8(nullptr, 0, &utf16Units, utf8, utf8Bytes, &status);
157 status = U_ZERO_ERROR;
158 std::unique_ptr<UChar[]> utf16(new UChar[utf16Units]);
159 u_strFromUTF8(utf16.get(), utf16Units, nullptr, utf8, utf8Bytes, &status);
160 if (U_FAILURE(status)) {
161 SkDebugf("Invalid utf8 input: %s", u_errorName(status));
162 return ret;
163 }
164
165 ICUBiDi bidi(ubidi_openSized(utf16Units, 0, &status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500166 if (U_FAILURE(status)) {
167 SkDebugf("Bidi error: %s", u_errorName(status));
168 return ret;
169 }
170 SkASSERT(bidi);
171
172 // The required lifetime of utf16 isn't well documented.
173 // It appears it isn't used after ubidi_setPara except through ubidi_getText.
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -0500174 ubidi_setPara(bidi.get(), utf16.get(), utf16Units, level, nullptr, &status);
Ben Wagner8d45a382017-11-16 10:08:28 -0500175 if (U_FAILURE(status)) {
176 SkDebugf("Bidi error: %s", u_errorName(status));
177 return ret;
178 }
179
Hal Canary4014ba62018-07-24 11:33:21 -0400180 ret.init(utf8, utf8 + utf8Bytes, std::move(bidi));
Ben Wagner8d45a382017-11-16 10:08:28 -0500181 return ret;
182 }
Hal Canary4014ba62018-07-24 11:33:21 -0400183 BiDiRunIterator(const char* utf8, const char* end, ICUBiDi bidi)
Ben Wagner8d45a382017-11-16 10:08:28 -0500184 : fBidi(std::move(bidi))
185 , fEndOfCurrentRun(utf8)
Hal Canary4014ba62018-07-24 11:33:21 -0400186 , fEndOfAllRuns(end)
Ben Wagner8d45a382017-11-16 10:08:28 -0500187 , fUTF16LogicalPosition(0)
188 , fLevel(UBIDI_DEFAULT_LTR)
189 {}
190 void consume() override {
191 SkASSERT(fUTF16LogicalPosition < ubidi_getLength(fBidi.get()));
192 int32_t endPosition = ubidi_getLength(fBidi.get());
193 fLevel = ubidi_getLevelAt(fBidi.get(), fUTF16LogicalPosition);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400194 SkUnichar u = utf8_next(&fEndOfCurrentRun, fEndOfAllRuns);
195 fUTF16LogicalPosition += SkUTF::ToUTF16(u);
Ben Wagner8d45a382017-11-16 10:08:28 -0500196 UBiDiLevel level;
197 while (fUTF16LogicalPosition < endPosition) {
198 level = ubidi_getLevelAt(fBidi.get(), fUTF16LogicalPosition);
199 if (level != fLevel) {
200 break;
201 }
Hal Canaryf107a2f2018-07-25 16:52:48 -0400202 u = utf8_next(&fEndOfCurrentRun, fEndOfAllRuns);
203 fUTF16LogicalPosition += SkUTF::ToUTF16(u);
Ben Wagner8d45a382017-11-16 10:08:28 -0500204 }
205 }
206 const char* endOfCurrentRun() const override {
207 return fEndOfCurrentRun;
208 }
209 bool atEnd() const override {
210 return fUTF16LogicalPosition == ubidi_getLength(fBidi.get());
211 }
212
213 UBiDiLevel currentLevel() const {
214 return fLevel;
215 }
216private:
217 ICUBiDi fBidi;
218 const char* fEndOfCurrentRun;
Hal Canary4014ba62018-07-24 11:33:21 -0400219 const char* fEndOfAllRuns;
Ben Wagner8d45a382017-11-16 10:08:28 -0500220 int32_t fUTF16LogicalPosition;
221 UBiDiLevel fLevel;
222};
223
224class ScriptRunIterator : public RunIterator {
225public:
226 static SkTLazy<ScriptRunIterator> Make(const char* utf8, size_t utf8Bytes,
227 hb_unicode_funcs_t* hbUnicode)
228 {
229 SkTLazy<ScriptRunIterator> ret;
230 ret.init(utf8, utf8Bytes, hbUnicode);
231 return ret;
232 }
233 ScriptRunIterator(const char* utf8, size_t utf8Bytes, hb_unicode_funcs_t* hbUnicode)
234 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
235 , fHBUnicode(hbUnicode)
236 , fCurrentScript(HB_SCRIPT_UNKNOWN)
237 {}
238 void consume() override {
239 SkASSERT(fCurrent < fEnd);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400240 SkUnichar u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500241 fCurrentScript = hb_unicode_script(fHBUnicode, u);
242 while (fCurrent < fEnd) {
243 const char* prev = fCurrent;
Hal Canaryf107a2f2018-07-25 16:52:48 -0400244 u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500245 const hb_script_t script = hb_unicode_script(fHBUnicode, u);
246 if (script != fCurrentScript) {
247 if (fCurrentScript == HB_SCRIPT_INHERITED || fCurrentScript == HB_SCRIPT_COMMON) {
248 fCurrentScript = script;
249 } else if (script == HB_SCRIPT_INHERITED || script == HB_SCRIPT_COMMON) {
250 continue;
251 } else {
252 fCurrent = prev;
253 break;
254 }
255 }
256 }
257 if (fCurrentScript == HB_SCRIPT_INHERITED) {
258 fCurrentScript = HB_SCRIPT_COMMON;
259 }
260 }
261 const char* endOfCurrentRun() const override {
262 return fCurrent;
263 }
264 bool atEnd() const override {
265 return fCurrent == fEnd;
266 }
267
268 hb_script_t currentScript() const {
269 return fCurrentScript;
270 }
271private:
272 const char* fCurrent;
273 const char* fEnd;
274 hb_unicode_funcs_t* fHBUnicode;
275 hb_script_t fCurrentScript;
276};
277
278class FontRunIterator : public RunIterator {
279public:
280 static SkTLazy<FontRunIterator> Make(const char* utf8, size_t utf8Bytes,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400281 SkFont font,
Ben Wagner8d45a382017-11-16 10:08:28 -0500282 sk_sp<SkFontMgr> fallbackMgr)
283 {
284 SkTLazy<FontRunIterator> ret;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400285 font.setTypeface(font.refTypefaceOrDefault());
286 HBFont hbFont = create_hb_font(font.getTypeface());
287 if (!hbFont) {
288 SkDebugf("create_hb_font failed!\n");
289 return ret;
290 }
291 ret.init(utf8, utf8Bytes, std::move(font), std::move(hbFont), std::move(fallbackMgr));
Ben Wagner8d45a382017-11-16 10:08:28 -0500292 return ret;
293 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400294 FontRunIterator(const char* utf8, size_t utf8Bytes, SkFont font,
295 HBFont hbFont, sk_sp<SkFontMgr> fallbackMgr)
Ben Wagner8d45a382017-11-16 10:08:28 -0500296 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
297 , fFallbackMgr(std::move(fallbackMgr))
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400298 , fHBFont(std::move(hbFont)), fFont(std::move(font))
299 , fFallbackHBFont(nullptr), fFallbackFont(fFont)
300 , fCurrentHBFont(fHBFont.get()), fCurrentFont(&fFont)
301 {
302 fFallbackFont.setTypeface(nullptr);
303 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500304 void consume() override {
305 SkASSERT(fCurrent < fEnd);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400306 SkUnichar u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500307 // If the starting typeface can handle this character, use it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400308 if (fFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1)) {
309 fCurrentFont = &fFont;
310 fCurrentHBFont = fHBFont.get();
Ben Wagnera900ad52018-08-31 17:48:19 -0400311 // If the current fallback can handle this character, use it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400312 } else if (fFallbackFont.getTypeface() &&
313 fFallbackFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1))
Ben Wagnera900ad52018-08-31 17:48:19 -0400314 {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400315 fCurrentFont = &fFallbackFont;
Ben Wagnera900ad52018-08-31 17:48:19 -0400316 fCurrentHBFont = fFallbackHBFont.get();
Ben Wagner8d45a382017-11-16 10:08:28 -0500317 // If not, try to find a fallback typeface
318 } else {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400319 fFallbackFont.setTypeface(sk_ref_sp(fFallbackMgr->matchFamilyStyleCharacter(
320 nullptr, fFont.getTypeface()->fontStyle(), nullptr, 0, u)));
321 fFallbackHBFont = create_hb_font(fFallbackFont.getTypeface());
322 fCurrentFont = &fFallbackFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500323 fCurrentHBFont = fFallbackHBFont.get();
Ben Wagner8d45a382017-11-16 10:08:28 -0500324 }
325
326 while (fCurrent < fEnd) {
327 const char* prev = fCurrent;
Hal Canaryf107a2f2018-07-25 16:52:48 -0400328 u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500329
Ben Wagnera900ad52018-08-31 17:48:19 -0400330 // If not using initial typeface and initial typeface has this character, stop fallback.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400331 if (fCurrentFont->getTypeface() != fFont.getTypeface() &&
332 fFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1))
Ben Wagner8d45a382017-11-16 10:08:28 -0500333 {
334 fCurrent = prev;
335 return;
336 }
337 // If the current typeface cannot handle this character, stop using it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400338 if (!fCurrentFont->getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1)) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500339 fCurrent = prev;
340 return;
341 }
342 }
343 }
344 const char* endOfCurrentRun() const override {
345 return fCurrent;
346 }
347 bool atEnd() const override {
348 return fCurrent == fEnd;
349 }
350
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400351 SkFont* currentFont() const {
352 return fCurrentFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500353 }
354 hb_font_t* currentHBFont() const {
355 return fCurrentHBFont;
356 }
357private:
358 const char* fCurrent;
359 const char* fEnd;
360 sk_sp<SkFontMgr> fFallbackMgr;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400361 HBFont fHBFont;
362 SkFont fFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500363 HBFont fFallbackHBFont;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400364 SkFont fFallbackFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500365 hb_font_t* fCurrentHBFont;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400366 SkFont* fCurrentFont;
367};
368
369class LanguageRunIterator : public RunIterator {
370public:
371 static SkTLazy<LanguageRunIterator> Make(const char* utf8, size_t utf8Bytes) {
372 SkTLazy<LanguageRunIterator> ret;
373 ret.init(utf8, utf8Bytes);
374 return ret;
375 }
376 LanguageRunIterator(const char* utf8, size_t utf8Bytes)
377 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
378 , fLanguage(hb_language_from_string(std::locale().name().c_str(), -1))
379 { }
380 void consume() override {
381 // Ideally something like cld2/3 could be used, or user signals.
382 SkASSERT(fCurrent < fEnd);
383 fCurrent = fEnd;
384 }
385 const char* endOfCurrentRun() const override {
386 return fCurrent;
387 }
388 bool atEnd() const override {
389 return fCurrent == fEnd;
390 }
391
392 hb_language_t currentLanguage() const {
393 return fLanguage;
394 }
395private:
396 const char* fCurrent;
397 const char* fEnd;
398 hb_language_t fLanguage;
Ben Wagner8d45a382017-11-16 10:08:28 -0500399};
400
401class RunIteratorQueue {
402public:
403 void insert(RunIterator* runIterator) {
404 fRunIterators.insert(runIterator);
405 }
406
407 bool advanceRuns() {
408 const RunIterator* leastRun = fRunIterators.peek();
409 if (leastRun->atEnd()) {
410 SkASSERT(this->allRunsAreAtEnd());
411 return false;
412 }
413 const char* leastEnd = leastRun->endOfCurrentRun();
414 RunIterator* currentRun = nullptr;
415 SkDEBUGCODE(const char* previousEndOfCurrentRun);
416 while ((currentRun = fRunIterators.peek())->endOfCurrentRun() <= leastEnd) {
417 fRunIterators.pop();
418 SkDEBUGCODE(previousEndOfCurrentRun = currentRun->endOfCurrentRun());
419 currentRun->consume();
420 SkASSERT(previousEndOfCurrentRun < currentRun->endOfCurrentRun());
421 fRunIterators.insert(currentRun);
422 }
423 return true;
424 }
425
426 const char* endOfCurrentRun() const {
427 return fRunIterators.peek()->endOfCurrentRun();
428 }
429
430private:
431 bool allRunsAreAtEnd() const {
432 for (int i = 0; i < fRunIterators.count(); ++i) {
433 if (!fRunIterators.at(i)->atEnd()) {
434 return false;
435 }
436 }
437 return true;
438 }
439
440 static bool CompareRunIterator(RunIterator* const& a, RunIterator* const& b) {
441 return *a < *b;
442 }
443 SkTDPQueue<RunIterator*, CompareRunIterator> fRunIterators;
444};
445
446struct ShapedGlyph {
447 SkGlyphID fID;
448 uint32_t fCluster;
449 SkPoint fOffset;
450 SkVector fAdvance;
451 bool fMayLineBreakBefore;
452 bool fMustLineBreakBefore;
453 bool fHasVisual;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400454 bool fGraphemeBreakBefore;
455 bool fUnsafeToBreak;
Ben Wagner8d45a382017-11-16 10:08:28 -0500456};
457struct ShapedRun {
Mike Reed6d595682018-12-05 17:28:14 -0500458 ShapedRun(const char* utf8Start, const char* utf8End, int numGlyphs, const SkFont& font,
Ben Wagner8d45a382017-11-16 10:08:28 -0500459 UBiDiLevel level, std::unique_ptr<ShapedGlyph[]> glyphs)
Mike Reed6d595682018-12-05 17:28:14 -0500460 : fUtf8Start(utf8Start), fUtf8End(utf8End), fNumGlyphs(numGlyphs), fFont(font)
Ben Wagner8d45a382017-11-16 10:08:28 -0500461 , fLevel(level), fGlyphs(std::move(glyphs))
462 {}
463
464 const char* fUtf8Start;
465 const char* fUtf8End;
466 int fNumGlyphs;
Mike Reed6d595682018-12-05 17:28:14 -0500467 SkFont fFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500468 UBiDiLevel fLevel;
469 std::unique_ptr<ShapedGlyph[]> fGlyphs;
Florin Malita950243d2019-01-11 11:08:35 -0500470 SkVector fAdvance = { 0, 0 };
Ben Wagner8d45a382017-11-16 10:08:28 -0500471};
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400472struct ShapedLine {
473 SkTArray<ShapedRun> runs;
474 SkVector fAdvance = { 0, 0 };
475};
Ben Wagner8d45a382017-11-16 10:08:28 -0500476
477static constexpr bool is_LTR(UBiDiLevel level) {
478 return (level & 1) == 0;
479}
480
Florin Malita950243d2019-01-11 11:08:35 -0500481static void append(SkShaper::RunHandler* handler, const SkShaper::RunHandler::RunInfo& runInfo,
482 const ShapedRun& run, int start, int end,
Florin Malita9867f612018-12-12 10:54:49 -0500483 SkPoint* p) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500484 unsigned len = end - start;
Florin Malita9867f612018-12-12 10:54:49 -0500485
Florin Malita950243d2019-01-11 11:08:35 -0500486 const auto buffer = handler->newRunBuffer(runInfo, run.fFont, len, run.fUtf8End - run.fUtf8Start);
Florin Malita9867f612018-12-12 10:54:49 -0500487 SkASSERT(buffer.glyphs);
488 SkASSERT(buffer.positions);
489
490 if (buffer.utf8text) {
491 memcpy(buffer.utf8text, run.fUtf8Start, run.fUtf8End - run.fUtf8Start);
492 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500493
494 for (unsigned i = 0; i < len; i++) {
495 // Glyphs are in logical order, but output ltr since PDF readers seem to expect that.
496 const ShapedGlyph& glyph = run.fGlyphs[is_LTR(run.fLevel) ? start + i : end - 1 - i];
Florin Malita9867f612018-12-12 10:54:49 -0500497 buffer.glyphs[i] = glyph.fID;
498 buffer.positions[i] = SkPoint::Make(p->fX + glyph.fOffset.fX, p->fY - glyph.fOffset.fY);
499 if (buffer.clusters) {
500 buffer.clusters[i] = glyph.fCluster;
501 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500502 p->fX += glyph.fAdvance.fX;
503 p->fY += glyph.fAdvance.fY;
504 }
505}
506
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400507static void emit(const ShapedLine& line, SkShaper::RunHandler* handler,
508 SkPoint point, SkPoint& currentPoint, size_t& lineIndex)
509{
510 // Reorder the runs and glyphs per line and write them out.
511 SkScalar maxAscent = 0;
512 SkScalar maxDescent = 0;
513 SkScalar maxLeading = 0;
514 for (const ShapedRun& run : line.runs) {
515 SkFontMetrics metrics;
516 run.fFont.getMetrics(&metrics);
517 maxAscent = SkTMin(maxAscent, metrics.fAscent);
518 maxDescent = SkTMax(maxDescent, metrics.fDescent);
519 maxLeading = SkTMax(maxLeading, metrics.fLeading);
520 }
521
522 int numRuns = line.runs.size();
523 SkAutoSTMalloc<4, UBiDiLevel> runLevels(numRuns);
524 for (int i = 0; i < numRuns; ++i) {
525 runLevels[i] = line.runs[i].fLevel;
526 }
527 SkAutoSTMalloc<4, int32_t> logicalFromVisual(numRuns);
528 ubidi_reorderVisual(runLevels, numRuns, logicalFromVisual);
529
530 currentPoint.fY -= maxAscent;
531
532 for (int i = 0; i < numRuns; ++i) {
533 int logicalIndex = logicalFromVisual[i];
534
535 const auto& run = line.runs[logicalIndex];
536 const SkShaper::RunHandler::RunInfo info = {
537 lineIndex,
538 run.fAdvance,
539 maxAscent,
540 maxDescent,
541 maxLeading,
542 };
543 append(handler, info, run, 0, run.fNumGlyphs, &currentPoint);
544 }
545
546 currentPoint.fY += maxDescent + maxLeading;
547 currentPoint.fX = point.fX;
548
549 lineIndex++;
550}
551
Ben Wagner8d45a382017-11-16 10:08:28 -0500552struct ShapedRunGlyphIterator {
553 ShapedRunGlyphIterator(const SkTArray<ShapedRun>& origRuns)
554 : fRuns(&origRuns), fRunIndex(0), fGlyphIndex(0)
555 { }
556
557 ShapedRunGlyphIterator(const ShapedRunGlyphIterator& that) = default;
558 ShapedRunGlyphIterator& operator=(const ShapedRunGlyphIterator& that) = default;
559 bool operator==(const ShapedRunGlyphIterator& that) const {
560 return fRuns == that.fRuns &&
561 fRunIndex == that.fRunIndex &&
562 fGlyphIndex == that.fGlyphIndex;
563 }
564 bool operator!=(const ShapedRunGlyphIterator& that) const {
565 return fRuns != that.fRuns ||
566 fRunIndex != that.fRunIndex ||
567 fGlyphIndex != that.fGlyphIndex;
568 }
569
570 ShapedGlyph* next() {
571 const SkTArray<ShapedRun>& runs = *fRuns;
572 SkASSERT(fRunIndex < runs.count());
573 SkASSERT(fGlyphIndex < runs[fRunIndex].fNumGlyphs);
574
575 ++fGlyphIndex;
576 if (fGlyphIndex == runs[fRunIndex].fNumGlyphs) {
577 fGlyphIndex = 0;
578 ++fRunIndex;
579 if (fRunIndex >= runs.count()) {
580 return nullptr;
581 }
582 }
583 return &runs[fRunIndex].fGlyphs[fGlyphIndex];
584 }
585
586 ShapedGlyph* current() {
587 const SkTArray<ShapedRun>& runs = *fRuns;
588 if (fRunIndex >= runs.count()) {
589 return nullptr;
590 }
591 return &runs[fRunIndex].fGlyphs[fGlyphIndex];
592 }
593
594 const SkTArray<ShapedRun>* fRuns;
595 int fRunIndex;
596 int fGlyphIndex;
597};
598
599} // namespace
600
601struct SkShaper::Impl {
602 HBFont fHarfBuzzFont;
603 HBBuffer fBuffer;
604 sk_sp<SkTypeface> fTypeface;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400605 ICUBrk fLineBreakIterator;
606 ICUBrk fGraphemeBreakIterator;
607
608 SkPoint shapeCorrect(RunHandler* handler,
609 const char* utf8,
610 size_t utf8Bytes,
611 SkPoint point,
612 SkScalar width,
613 RunIteratorQueue& runSegmenter,
614 const BiDiRunIterator* bidi,
615 const LanguageRunIterator* language,
616 const ScriptRunIterator* script,
617 const FontRunIterator* font) const;
618
619 SkPoint shapeOk(RunHandler* handler,
620 const char* utf8,
621 size_t utf8Bytes,
622 SkPoint point,
623 SkScalar width,
624 RunIteratorQueue& runSegmenter,
625 const BiDiRunIterator* bidi,
626 const LanguageRunIterator* language,
627 const ScriptRunIterator* script,
628 const FontRunIterator* font) const;
629
630 ShapedRun shape(const char* utf8,
631 size_t utf8Bytes,
632 const char* utf8Start,
633 const char* utf8End,
634 const BiDiRunIterator* bidi,
635 const LanguageRunIterator* language,
636 const ScriptRunIterator* script,
637 const FontRunIterator* font) const;
Ben Wagner8d45a382017-11-16 10:08:28 -0500638};
639
Ben Wagnere0001732017-08-31 16:26:26 -0400640SkShaper::SkShaper(sk_sp<SkTypeface> tf) : fImpl(new Impl) {
Hal Canary61021922019-02-06 12:29:11 -0500641#if defined(SK_USING_THIRD_PARTY_ICU)
642 if (!SkLoadICU()) {
643 SkDebugf("SkLoadICU() failed!\n");
644 return;
645 }
646#endif
Ben Wagnere0001732017-08-31 16:26:26 -0400647 fImpl->fTypeface = tf ? std::move(tf) : SkTypeface::MakeDefault();
648 fImpl->fHarfBuzzFont = create_hb_font(fImpl->fTypeface.get());
Florin Malitaa4e1a632019-01-22 16:27:01 -0500649 if (!fImpl->fHarfBuzzFont) {
650 SkDebugf("create_hb_font failed!\n");
651 }
Ben Wagnera25fbef2017-08-30 13:56:19 -0400652 fImpl->fBuffer.reset(hb_buffer_create());
Ben Wagner8d45a382017-11-16 10:08:28 -0500653 SkASSERT(fImpl->fBuffer);
654
Ben Wagner8d45a382017-11-16 10:08:28 -0500655 UErrorCode status = U_ZERO_ERROR;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400656 fImpl->fLineBreakIterator.reset(ubrk_open(UBRK_LINE, "th", nullptr, 0, &status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500657 if (U_FAILURE(status)) {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400658 SkDebugf("Could not create line break iterator: %s", u_errorName(status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500659 SK_ABORT("");
660 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400661
662 fImpl->fGraphemeBreakIterator.reset(ubrk_open(UBRK_CHARACTER, "th", nullptr, 0, &status));
663 if (U_FAILURE(status)) {
664 SkDebugf("Could not create grapheme break iterator: %s", u_errorName(status));
665 SK_ABORT("");
666 }
667
Ben Wagnera25fbef2017-08-30 13:56:19 -0400668}
669
670SkShaper::~SkShaper() {}
671
Ben Wagner8d45a382017-11-16 10:08:28 -0500672bool SkShaper::good() const {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400673 return fImpl->fBuffer &&
674 fImpl->fLineBreakIterator &&
675 fImpl->fGraphemeBreakIterator;
Ben Wagner8d45a382017-11-16 10:08:28 -0500676}
Ben Wagnera25fbef2017-08-30 13:56:19 -0400677
Florin Malita950243d2019-01-11 11:08:35 -0500678SkPoint SkShaper::shape(RunHandler* handler,
Kevin Lubick57abfe92019-01-28 13:15:51 -0500679 const SkFont& srcFont,
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500680 const char* utf8,
681 size_t utf8Bytes,
682 bool leftToRight,
683 SkPoint point,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400684 SkScalar width) const
Ben Wagner8d45a382017-11-16 10:08:28 -0500685{
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400686 SkASSERT(handler);
687 sk_sp<SkFontMgr> fontMgr = SkFontMgr::RefDefault();
688 UBiDiLevel defaultLevel = leftToRight ? UBIDI_DEFAULT_LTR : UBIDI_DEFAULT_RTL;
689
Ben Wagner8d45a382017-11-16 10:08:28 -0500690 RunIteratorQueue runSegmenter;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400691
Ben Wagner8d45a382017-11-16 10:08:28 -0500692 SkTLazy<BiDiRunIterator> maybeBidi(BiDiRunIterator::Make(utf8, utf8Bytes, defaultLevel));
693 BiDiRunIterator* bidi = maybeBidi.getMaybeNull();
694 if (!bidi) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500695 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400696 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500697 runSegmenter.insert(bidi);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400698
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400699 SkTLazy<LanguageRunIterator> maybeLanguage(LanguageRunIterator::Make(utf8, utf8Bytes));
700 LanguageRunIterator* language = maybeLanguage.getMaybeNull();
701 if (!language) {
702 return point;
703 }
704 runSegmenter.insert(language);
705
Ben Wagner8d45a382017-11-16 10:08:28 -0500706 hb_unicode_funcs_t* hbUnicode = hb_buffer_get_unicode_funcs(fImpl->fBuffer.get());
707 SkTLazy<ScriptRunIterator> maybeScript(ScriptRunIterator::Make(utf8, utf8Bytes, hbUnicode));
708 ScriptRunIterator* script = maybeScript.getMaybeNull();
709 if (!script) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500710 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400711 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500712 runSegmenter.insert(script);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400713
Ben Wagner8d45a382017-11-16 10:08:28 -0500714 SkTLazy<FontRunIterator> maybeFont(FontRunIterator::Make(utf8, utf8Bytes,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400715 srcFont, std::move(fontMgr)));
Ben Wagner8d45a382017-11-16 10:08:28 -0500716 FontRunIterator* font = maybeFont.getMaybeNull();
717 if (!font) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500718 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400719 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500720 runSegmenter.insert(font);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400721
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400722 if (true) {
723 return fImpl->shapeCorrect(handler, utf8, utf8Bytes, point, width,
724 runSegmenter, bidi, language, script, font);
725 } else {
726 return fImpl->shapeOk(handler, utf8, utf8Bytes, point, width,
727 runSegmenter, bidi, language, script, font);
728 }
729}
730
731SkPoint SkShaper::Impl::shapeCorrect(RunHandler* handler,
732 const char* utf8,
733 size_t utf8Bytes,
734 SkPoint point,
735 SkScalar width,
736 RunIteratorQueue& runSegmenter,
737 const BiDiRunIterator* bidi,
738 const LanguageRunIterator* language,
739 const ScriptRunIterator* script,
740 const FontRunIterator* font) const
741{
742 ShapedLine line;
743 size_t lineIndex = 0;
744 SkPoint currentPoint = point;
745
746 const char* utf8Start = nullptr;
747 const char* utf8End = utf8;
748 while (runSegmenter.advanceRuns()) { // For each item
749 utf8Start = utf8End;
750 utf8End = runSegmenter.endOfCurrentRun();
751
752 ShapedRun model(nullptr, nullptr, 0, SkFont(), 0, nullptr);
753 bool modelNeedsRegenerated = true;
754 int modelOffset = 0;
755
756 struct TextProps {
757 int glyphLen = 0;
758 SkVector advance = {0, 0};
759 };
760 // map from character position to [safe to break, glyph position, advance]
761 std::unique_ptr<TextProps[]> modelText;
762 int modelTextOffset = 0;
763 SkVector modelTextAdvanceOffset = {0, 0};
764
765 while (utf8Start < utf8End) { // While there are still code points left in this item
766 size_t utf8runLength = utf8End - utf8Start;
767 if (modelNeedsRegenerated) {
768 model = shape(utf8, utf8Bytes,
769 utf8Start, utf8End,
770 bidi, language, script, font);
771 modelOffset = 0;
772
773 SkVector advance = {0, 0};
774 modelText.reset(new TextProps[utf8runLength + 1]());
775 for (int i = 0; i < model.fNumGlyphs; ++i) {
776 SkASSERT(model.fGlyphs[i].fCluster < utf8runLength);
777 if (!model.fGlyphs[i].fUnsafeToBreak) {
778 modelText[model.fGlyphs[i].fCluster].glyphLen = i;
779 modelText[model.fGlyphs[i].fCluster].advance = advance;
780 }
781 advance += model.fGlyphs[i].fAdvance;
782 }
783 // Assume it is always safe to break after the end of an item
784 modelText[utf8runLength].glyphLen = model.fNumGlyphs;
785 modelText[utf8runLength].advance = model.fAdvance;
786 modelTextOffset = 0;
787 modelTextAdvanceOffset = {0, 0};
788 modelNeedsRegenerated = false;
789 }
790
791 // TODO: break iterator per item, but just reset position if needed?
792 // Maybe break iterator with model?
793 UBreakIterator& breakIterator = *fLineBreakIterator;
794 {
795 UErrorCode status = U_ZERO_ERROR;
796 UText utf8UText = UTEXT_INITIALIZER;
797 utext_openUTF8(&utf8UText, utf8Start, utf8runLength, &status);
798 std::unique_ptr<UText, SkFunctionWrapper<UText*, UText, utext_close>> autoClose(&utf8UText);
799 if (U_FAILURE(status)) {
800 SkDebugf("Could not create utf8UText: %s", u_errorName(status));
801 return point;
802 }
803 ubrk_setUText(&breakIterator, &utf8UText, &status);
804 if (U_FAILURE(status)) {
805 SkDebugf("Could not setText on break iterator: %s", u_errorName(status));
806 return point;
807 }
808 }
809
810 ShapedRun best(nullptr, nullptr, 0, SkFont(), 0, nullptr);
811 best.fAdvance = { SK_ScalarNegativeInfinity, SK_ScalarNegativeInfinity };
812 SkScalar widthLeft = width - line.fAdvance.fX;
813
814 for (int32_t breakIteratorCurrent = ubrk_next(&breakIterator);
815 breakIteratorCurrent != UBRK_DONE;
816 breakIteratorCurrent = ubrk_next(&breakIterator))
817 {
818 // TODO: if past a safe to break, future safe to break will be at least as long
819
820 // TODO: adjust breakIteratorCurrent by ignorable whitespace
821 ShapedRun candidate = modelText[breakIteratorCurrent + modelTextOffset].glyphLen
822 ? ShapedRun(utf8Start, utf8Start + breakIteratorCurrent,
823 modelText[breakIteratorCurrent + modelTextOffset].glyphLen - modelOffset,
824 *font->currentFont(),
825 bidi->currentLevel(),
826 std::unique_ptr<ShapedGlyph[]>())
827 : shape(utf8, utf8Bytes,
828 utf8Start, utf8Start + breakIteratorCurrent,
829 bidi, language, script, font);
830 if (!candidate.fUtf8Start) {
831 //report error
832 return point;
833 }
834 if (!candidate.fGlyphs) {
835 candidate.fAdvance = modelText[breakIteratorCurrent + modelTextOffset].advance - modelTextAdvanceOffset;
836 }
837 auto score = [widthLeft](const ShapedRun& run) -> SkScalar {
838 if (run.fAdvance.fX < widthLeft) {
839 if (run.fUtf8Start == nullptr) {
840 return SK_ScalarNegativeInfinity;
841 } else {
842 return run.fUtf8End - run.fUtf8Start;
843 }
844 } else {
845 return widthLeft - run.fAdvance.fX;
846 }
847 };
848 if (score(best) < score(candidate)) {
849 best = std::move(candidate);
850 }
851 }
852
853 // If nothing fit (best score is negative) and the line is not empty
854 if (width < line.fAdvance.fX + best.fAdvance.fX && !line.runs.empty()) {
855 emit(line, handler, point, currentPoint, lineIndex);
856 line.runs.reset();
857 line.fAdvance = {0, 0};
858 } else {
859 if (!best.fGlyphs) {
860 best.fGlyphs.reset(new ShapedGlyph[best.fNumGlyphs]);
861 memcpy(best.fGlyphs.get(), model.fGlyphs.get() + modelOffset,
862 best.fNumGlyphs * sizeof(ShapedGlyph));
863 modelOffset += best.fNumGlyphs;
864 modelTextOffset += best.fUtf8End - best.fUtf8Start;
865 modelTextAdvanceOffset += best.fAdvance;
866 } else {
867 modelNeedsRegenerated = true;
868 }
869 utf8Start = best.fUtf8End;
870 line.fAdvance += best.fAdvance;
871 line.runs.emplace_back(std::move(best));
872
873 // If item broken, emit line (prevent remainder from accidentally fitting)
874 if (utf8Start != utf8End) {
875 emit(line, handler, point, currentPoint, lineIndex);
876 line.runs.reset();
877 line.fAdvance = {0, 0};
878 }
879 }
880 }
881 }
882 emit(line, handler, point, currentPoint, lineIndex);
883 return currentPoint;
884}
885
886SkPoint SkShaper::Impl::shapeOk(RunHandler* handler,
887 const char* utf8,
888 size_t utf8Bytes,
889 SkPoint point,
890 SkScalar width,
891 RunIteratorQueue& runSegmenter,
892 const BiDiRunIterator* bidi,
893 const LanguageRunIterator* language,
894 const ScriptRunIterator* script,
895 const FontRunIterator* font) const
896{
897 SkTArray<ShapedRun> runs;
898{
899 UBreakIterator& lineBreakIterator = *fLineBreakIterator;
900 UBreakIterator& graphemeBreakIterator = *fGraphemeBreakIterator;
Ben Wagner8d45a382017-11-16 10:08:28 -0500901 {
902 UErrorCode status = U_ZERO_ERROR;
903 UText utf8UText = UTEXT_INITIALIZER;
904 utext_openUTF8(&utf8UText, utf8, utf8Bytes, &status);
905 std::unique_ptr<UText, SkFunctionWrapper<UText*, UText, utext_close>> autoClose(&utf8UText);
906 if (U_FAILURE(status)) {
907 SkDebugf("Could not create utf8UText: %s", u_errorName(status));
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500908 return point;
Ben Wagner8d45a382017-11-16 10:08:28 -0500909 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400910
911 ubrk_setUText(&lineBreakIterator, &utf8UText, &status);
Ben Wagner8d45a382017-11-16 10:08:28 -0500912 if (U_FAILURE(status)) {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400913 SkDebugf("Could not setText on line break iterator: %s", u_errorName(status));
914 return point;
915 }
916 ubrk_setUText(&graphemeBreakIterator, &utf8UText, &status);
917 if (U_FAILURE(status)) {
918 SkDebugf("Could not setText on grapheme break iterator: %s", u_errorName(status));
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500919 return point;
Ben Wagner8d45a382017-11-16 10:08:28 -0500920 }
Ben Wagnera25fbef2017-08-30 13:56:19 -0400921 }
922
Ben Wagner8d45a382017-11-16 10:08:28 -0500923 const char* utf8Start = nullptr;
924 const char* utf8End = utf8;
925 while (runSegmenter.advanceRuns()) {
926 utf8Start = utf8End;
927 utf8End = runSegmenter.endOfCurrentRun();
928
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400929 runs.emplace_back(shape(utf8, utf8Bytes,
930 utf8Start, utf8End,
931 bidi, language, script, font));
932 ShapedRun& run = runs.back();
Ben Wagnera25fbef2017-08-30 13:56:19 -0400933
Ben Wagner8d45a382017-11-16 10:08:28 -0500934 int32_t clusterOffset = utf8Start - utf8;
935 uint32_t previousCluster = 0xFFFFFFFF;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400936 for (int i = 0; i < run.fNumGlyphs; ++i) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500937 ShapedGlyph& glyph = run.fGlyphs[i];
938 int32_t glyphCluster = glyph.fCluster + clusterOffset;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400939
940 int32_t lineBreakIteratorCurrent = ubrk_current(&lineBreakIterator);
941 while (lineBreakIteratorCurrent != UBRK_DONE &&
942 lineBreakIteratorCurrent < glyphCluster)
Ben Wagner8d45a382017-11-16 10:08:28 -0500943 {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400944 lineBreakIteratorCurrent = ubrk_next(&lineBreakIterator);
Ben Wagner2868b782017-08-31 14:12:27 -0400945 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500946 glyph.fMayLineBreakBefore = glyph.fCluster != previousCluster &&
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400947 lineBreakIteratorCurrent == glyphCluster;
948
949 int32_t graphemeBreakIteratorCurrent = ubrk_current(&graphemeBreakIterator);
950 while (graphemeBreakIteratorCurrent != UBRK_DONE &&
951 graphemeBreakIteratorCurrent < glyphCluster)
952 {
953 graphemeBreakIteratorCurrent = ubrk_next(&graphemeBreakIterator);
954 }
955 glyph.fGraphemeBreakBefore = glyph.fCluster != previousCluster &&
956 graphemeBreakIteratorCurrent == glyphCluster;
957
Ben Wagner8d45a382017-11-16 10:08:28 -0500958 previousCluster = glyph.fCluster;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400959 }
960 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500961}
962
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400963// Iterate over the glyphs in logical order to find potential line lengths.
Ben Wagner8d45a382017-11-16 10:08:28 -0500964{
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400965 /** The position of the beginning of the line. */
966 ShapedRunGlyphIterator beginning(runs);
967
968 /** The position of the candidate line break. */
969 ShapedRunGlyphIterator candidateLineBreak(runs);
970 SkScalar candidateLineBreakWidth = 0;
971
972 /** The position of the candidate grapheme break. */
973 ShapedRunGlyphIterator candidateGraphemeBreak(runs);
974 SkScalar candidateGraphemeBreakWidth = 0;
975
976 /** The position of the current location. */
977 ShapedRunGlyphIterator current(runs);
978 SkScalar currentWidth = 0;
979 while (ShapedGlyph* glyph = current.current()) {
980 // 'Break' at graphemes until a line boundary, then only at line boundaries.
981 // Only break at graphemes if no line boundary is valid.
982 if (current != beginning) {
983 if (glyph->fGraphemeBreakBefore || glyph->fMayLineBreakBefore) {
984 // TODO: preserve line breaks <= grapheme breaks
985 // and prevent line breaks inside graphemes
986 candidateGraphemeBreak = current;
987 candidateGraphemeBreakWidth = currentWidth;
988 if (glyph->fMayLineBreakBefore) {
989 candidateLineBreak = current;
990 candidateLineBreakWidth = currentWidth;
991 }
992 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500993 }
994
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400995 SkScalar glyphWidth = glyph->fAdvance.fX;
996 // Break when overwidth, the glyph has a visual representation, and some space is used.
997 if (width < currentWidth + glyphWidth && glyph->fHasVisual && candidateGraphemeBreakWidth > 0){
998 if (candidateLineBreak != beginning) {
999 beginning = candidateLineBreak;
1000 currentWidth -= candidateLineBreakWidth;
1001 candidateGraphemeBreakWidth -= candidateLineBreakWidth;
1002 candidateLineBreakWidth = 0;
1003 } else if (candidateGraphemeBreak != beginning) {
1004 beginning = candidateGraphemeBreak;
1005 candidateLineBreak = beginning;
1006 currentWidth -= candidateGraphemeBreakWidth;
1007 candidateGraphemeBreakWidth = 0;
1008 candidateLineBreakWidth = 0;
1009 } else {
1010 SK_ABORT("");
1011 }
1012
1013 if (width < currentWidth) {
1014 if (width < candidateGraphemeBreakWidth) {
1015 candidateGraphemeBreak = candidateLineBreak;
1016 candidateGraphemeBreakWidth = candidateLineBreakWidth;
1017 }
1018 current = candidateGraphemeBreak;
1019 currentWidth = candidateGraphemeBreakWidth;
1020 }
1021
1022 glyph = beginning.current();
1023 if (glyph) {
1024 glyph->fMustLineBreakBefore = true;
1025 }
1026
1027 } else {
1028 current.next();
1029 currentWidth += glyphWidth;
Ben Wagner8d45a382017-11-16 10:08:28 -05001030 }
Ben Wagner8d45a382017-11-16 10:08:28 -05001031 }
1032}
1033
1034// Reorder the runs and glyphs per line and write them out.
Ben Wagner5d4dd8b2018-01-25 14:37:17 -05001035 SkPoint currentPoint = point;
Ben Wagner8d45a382017-11-16 10:08:28 -05001036{
1037 ShapedRunGlyphIterator previousBreak(runs);
1038 ShapedRunGlyphIterator glyphIterator(runs);
1039 SkScalar maxAscent = 0;
1040 SkScalar maxDescent = 0;
1041 SkScalar maxLeading = 0;
1042 int previousRunIndex = -1;
Florin Malita950243d2019-01-11 11:08:35 -05001043 size_t lineIndex = 0;
Ben Wagner8d45a382017-11-16 10:08:28 -05001044 while (glyphIterator.current()) {
1045 int runIndex = glyphIterator.fRunIndex;
1046 int glyphIndex = glyphIterator.fGlyphIndex;
1047 ShapedGlyph* nextGlyph = glyphIterator.next();
1048
1049 if (previousRunIndex != runIndex) {
Mike Reedb5784ac2018-11-12 09:35:15 -05001050 SkFontMetrics metrics;
Mike Reed6d595682018-12-05 17:28:14 -05001051 runs[runIndex].fFont.getMetrics(&metrics);
Ben Wagner8d45a382017-11-16 10:08:28 -05001052 maxAscent = SkTMin(maxAscent, metrics.fAscent);
1053 maxDescent = SkTMax(maxDescent, metrics.fDescent);
1054 maxLeading = SkTMax(maxLeading, metrics.fLeading);
1055 previousRunIndex = runIndex;
1056 }
1057
1058 // Nothing can be written until the baseline is known.
1059 if (!(nextGlyph == nullptr || nextGlyph->fMustLineBreakBefore)) {
1060 continue;
1061 }
1062
1063 currentPoint.fY -= maxAscent;
1064
1065 int numRuns = runIndex - previousBreak.fRunIndex + 1;
1066 SkAutoSTMalloc<4, UBiDiLevel> runLevels(numRuns);
1067 for (int i = 0; i < numRuns; ++i) {
1068 runLevels[i] = runs[previousBreak.fRunIndex + i].fLevel;
1069 }
1070 SkAutoSTMalloc<4, int32_t> logicalFromVisual(numRuns);
1071 ubidi_reorderVisual(runLevels, numRuns, logicalFromVisual);
1072
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001073 // step through the runs in reverse visual order and the glyphs in reverse logical order
1074 // until a visible glyph is found and force them to the end of the visual line.
1075
Ben Wagner8d45a382017-11-16 10:08:28 -05001076 for (int i = 0; i < numRuns; ++i) {
1077 int logicalIndex = previousBreak.fRunIndex + logicalFromVisual[i];
1078
1079 int startGlyphIndex = (logicalIndex == previousBreak.fRunIndex)
1080 ? previousBreak.fGlyphIndex
1081 : 0;
1082 int endGlyphIndex = (logicalIndex == runIndex)
1083 ? glyphIndex + 1
1084 : runs[logicalIndex].fNumGlyphs;
Florin Malita950243d2019-01-11 11:08:35 -05001085
1086 const auto& run = runs[logicalIndex];
1087 const RunHandler::RunInfo info = {
1088 lineIndex,
1089 run.fAdvance,
1090 maxAscent,
1091 maxDescent,
1092 maxLeading,
1093 };
1094 append(handler, info, run, startGlyphIndex, endGlyphIndex, &currentPoint);
Ben Wagner8d45a382017-11-16 10:08:28 -05001095 }
1096
1097 currentPoint.fY += maxDescent + maxLeading;
1098 currentPoint.fX = point.fX;
1099 maxAscent = 0;
1100 maxDescent = 0;
1101 maxLeading = 0;
1102 previousRunIndex = -1;
Florin Malita950243d2019-01-11 11:08:35 -05001103 ++lineIndex;
Ben Wagner8d45a382017-11-16 10:08:28 -05001104 previousBreak = glyphIterator;
1105 }
1106}
1107
Ben Wagner5d4dd8b2018-01-25 14:37:17 -05001108 return currentPoint;
Ben Wagnera25fbef2017-08-30 13:56:19 -04001109}
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001110
1111
1112ShapedRun SkShaper::Impl::shape(const char* utf8,
Ben Wagner2fc14742019-02-06 16:37:44 -05001113 const size_t utf8Bytes,
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001114 const char* utf8Start,
1115 const char* utf8End,
1116 const BiDiRunIterator* bidi,
1117 const LanguageRunIterator* language,
1118 const ScriptRunIterator* script,
1119 const FontRunIterator* font) const
1120{
1121 ShapedRun run(nullptr, nullptr, 0, SkFont(), 0, nullptr);
1122
1123 hb_buffer_t* buffer = fBuffer.get();
1124 SkAutoTCallVProc<hb_buffer_t, hb_buffer_clear_contents> autoClearBuffer(buffer);
1125 hb_buffer_set_content_type(buffer, HB_BUFFER_CONTENT_TYPE_UNICODE);
1126 hb_buffer_set_cluster_level(buffer, HB_BUFFER_CLUSTER_LEVEL_MONOTONE_CHARACTERS);
1127
Ben Wagner2fc14742019-02-06 16:37:44 -05001128 // See 763e5466c0a03a7c27020e1e2598e488612529a7 for documentation.
1129 hb_buffer_set_flags(buffer, HB_BUFFER_FLAG_BOT | HB_BUFFER_FLAG_EOT);
1130
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001131 // Add precontext.
1132 hb_buffer_add_utf8(buffer, utf8, utf8Start - utf8, utf8Start - utf8, 0);
1133
1134 // Populate the hb_buffer directly with utf8 cluster indexes.
1135 const char* utf8Current = utf8Start;
1136 while (utf8Current < utf8End) {
1137 unsigned int cluster = utf8Current - utf8Start;
1138 hb_codepoint_t u = utf8_next(&utf8Current, utf8End);
1139 hb_buffer_add(buffer, u, cluster);
1140 }
1141
1142 // Add postcontext.
1143 hb_buffer_add_utf8(buffer, utf8Current, utf8 + utf8Bytes - utf8Current, 0, 0);
1144
1145 size_t utf8runLength = utf8End - utf8Start;
1146 if (!SkTFitsIn<int>(utf8runLength)) {
1147 SkDebugf("Shaping error: utf8 too long");
1148 return run;
1149 }
1150 hb_direction_t direction = is_LTR(bidi->currentLevel()) ? HB_DIRECTION_LTR:HB_DIRECTION_RTL;
1151 hb_buffer_set_direction(buffer, direction);
1152 hb_buffer_set_script(buffer, script->currentScript());
1153 hb_buffer_set_language(buffer, language->currentLanguage());
1154 hb_buffer_guess_segment_properties(buffer);
1155 // TODO: features
1156 if (!font->currentHBFont()) {
1157 return run;
1158 }
1159 hb_shape(font->currentHBFont(), buffer, nullptr, 0);
1160 unsigned len = hb_buffer_get_length(buffer);
1161 if (len == 0) {
1162 // TODO: this isn't an error, make it look different
1163 return run;
1164 }
1165
1166 if (direction == HB_DIRECTION_RTL) {
1167 // Put the clusters back in logical order.
1168 // Note that the advances remain ltr.
1169 hb_buffer_reverse(buffer);
1170 }
1171 hb_glyph_info_t* info = hb_buffer_get_glyph_infos(buffer, nullptr);
1172 hb_glyph_position_t* pos = hb_buffer_get_glyph_positions(buffer, nullptr);
1173
1174 if (!SkTFitsIn<int>(len)) {
1175 SkDebugf("Shaping error: too many glyphs");
1176 return run;
1177 }
1178
1179 run = ShapedRun(utf8Start, utf8End, len, *font->currentFont(),
1180 bidi->currentLevel(),
1181 std::unique_ptr<ShapedGlyph[]>(new ShapedGlyph[len]));
1182 int scaleX, scaleY;
1183 hb_font_get_scale(font->currentHBFont(), &scaleX, &scaleY);
1184 double textSizeY = run.fFont.getSize() / scaleY;
1185 double textSizeX = run.fFont.getSize() / scaleX * run.fFont.getScaleX();
1186 SkVector runAdvance = { 0, 0 };
1187 for (unsigned i = 0; i < len; i++) {
1188 ShapedGlyph& glyph = run.fGlyphs[i];
1189 glyph.fID = info[i].codepoint;
1190 glyph.fCluster = info[i].cluster;
1191 glyph.fOffset.fX = pos[i].x_offset * textSizeX;
1192 glyph.fOffset.fY = pos[i].y_offset * textSizeY;
1193 glyph.fAdvance.fX = pos[i].x_advance * textSizeX;
1194 glyph.fAdvance.fY = pos[i].y_advance * textSizeY;
1195
1196 SkRect bounds;
1197 SkScalar advance;
1198 SkPaint p;
1199 run.fFont.getWidthsBounds(&glyph.fID, 1, &advance, &bounds, &p);
1200 glyph.fHasVisual = !bounds.isEmpty(); //!font->currentTypeface()->glyphBoundsAreZero(glyph.fID);
1201 glyph.fUnsafeToBreak = info[i].mask & HB_GLYPH_FLAG_UNSAFE_TO_BREAK;
1202 glyph.fMustLineBreakBefore = false;
1203
1204 runAdvance += glyph.fAdvance;
1205 }
1206 run.fAdvance = runAdvance;
1207
1208 return run;
1209}