blob: 57f3df63350c5f35eb96437321fec528856ee9d4 [file] [log] [blame]
Ben Wagnera25fbef2017-08-30 13:56:19 -04001/*
2 * Copyright 2016 Google Inc.
3 *
4 * Use of this source code is governed by a BSD-style license that can be
5 * found in the LICENSE file.
6 */
7
Ben Wagner2fc14742019-02-06 16:37:44 -05008#include "SkBitmaskEnum.h"
Hal Canary61021922019-02-06 12:29:11 -05009#include "SkFont.h"
Ben Wagner17774242018-08-07 14:31:33 -040010#include "SkFontArguments.h"
Hal Canary61021922019-02-06 12:29:11 -050011#include "SkFontMetrics.h"
Ben Wagner67e3a302017-09-05 14:46:19 -040012#include "SkFontMgr.h"
Ben Wagner17774242018-08-07 14:31:33 -040013#include "SkMalloc.h"
Ben Wagner17774242018-08-07 14:31:33 -040014#include "SkPoint.h"
15#include "SkRefCnt.h"
16#include "SkScalar.h"
Ben Wagnera25fbef2017-08-30 13:56:19 -040017#include "SkShaper.h"
18#include "SkStream.h"
Ben Wagner17774242018-08-07 14:31:33 -040019#include "SkString.h"
20#include "SkTArray.h"
Ben Wagner8d45a382017-11-16 10:08:28 -050021#include "SkTDPQueue.h"
Ben Wagner17774242018-08-07 14:31:33 -040022#include "SkTFitsIn.h"
Ben Wagner8d45a382017-11-16 10:08:28 -050023#include "SkTLazy.h"
Ben Wagnere0001732017-08-31 16:26:26 -040024#include "SkTemplates.h"
Hal Canaryc640d0d2018-06-13 09:59:02 -040025#include "SkTo.h"
Ben Wagnera25fbef2017-08-30 13:56:19 -040026#include "SkTypeface.h"
Ben Wagner17774242018-08-07 14:31:33 -040027#include "SkTypes.h"
28#include "SkUTF.h"
29
30#include <hb.h>
31#include <hb-ot.h>
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050032#include <unicode/ubrk.h>
Ben Wagner17774242018-08-07 14:31:33 -040033#include <unicode/ubidi.h>
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050034#include <unicode/ustring.h>
Ben Wagner17774242018-08-07 14:31:33 -040035#include <unicode/urename.h>
36#include <unicode/utext.h>
37#include <unicode/utypes.h>
38
Ben Wagner0ec8ec22018-09-04 18:17:13 -040039#include <cstring>
40#include <locale>
Ben Wagner17774242018-08-07 14:31:33 -040041#include <memory>
42#include <utility>
Ben Wagnera25fbef2017-08-30 13:56:19 -040043
Hal Canary61021922019-02-06 12:29:11 -050044#if defined(SK_USING_THIRD_PARTY_ICU)
Hal Canary32498f02019-02-04 15:36:31 -050045#include "SkLoadICU.h"
Hal Canary61021922019-02-06 12:29:11 -050046#endif
Hal Canary32498f02019-02-04 15:36:31 -050047
Ben Wagner2fc14742019-02-06 16:37:44 -050048namespace skstd {
49template <> struct is_bitmask_enum<hb_buffer_flags_t> : std::true_type {};
50}
51
Ben Wagnera25fbef2017-08-30 13:56:19 -040052namespace {
53template <class T, void(*P)(T*)> using resource = std::unique_ptr<T, SkFunctionWrapper<void, T, P>>;
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -050054using HBBlob = resource<hb_blob_t , hb_blob_destroy >;
55using HBFace = resource<hb_face_t , hb_face_destroy >;
56using HBFont = resource<hb_font_t , hb_font_destroy >;
57using HBBuffer = resource<hb_buffer_t , hb_buffer_destroy>;
58using ICUBiDi = resource<UBiDi , ubidi_close >;
Ben Wagner0ec8ec22018-09-04 18:17:13 -040059using ICUBrk = resource<UBreakIterator, ubrk_close >;
Ben Wagnera25fbef2017-08-30 13:56:19 -040060
61HBBlob stream_to_blob(std::unique_ptr<SkStreamAsset> asset) {
62 size_t size = asset->getLength();
63 HBBlob blob;
64 if (const void* base = asset->getMemoryBase()) {
65 blob.reset(hb_blob_create((char*)base, SkToUInt(size),
66 HB_MEMORY_MODE_READONLY, asset.release(),
67 [](void* p) { delete (SkStreamAsset*)p; }));
68 } else {
69 // SkDebugf("Extra SkStreamAsset copy\n");
70 void* ptr = size ? sk_malloc_throw(size) : nullptr;
71 asset->read(ptr, size);
72 blob.reset(hb_blob_create((char*)ptr, SkToUInt(size),
73 HB_MEMORY_MODE_READONLY, ptr, sk_free));
74 }
75 SkASSERT(blob);
76 hb_blob_make_immutable(blob.get());
77 return blob;
78}
Ben Wagnera25fbef2017-08-30 13:56:19 -040079
Ben Wagner8d45a382017-11-16 10:08:28 -050080HBFont create_hb_font(SkTypeface* tf) {
Hal Canary0dfa2082018-10-31 13:02:49 -040081 if (!tf) {
82 return nullptr;
83 }
Ben Wagnera25fbef2017-08-30 13:56:19 -040084 int index;
Hal Canaryddef43f2018-11-16 10:53:51 -050085 std::unique_ptr<SkStreamAsset> typefaceAsset(tf->openStream(&index));
86 if (!typefaceAsset) {
87 SkString name;
88 tf->getFamilyName(&name);
89 SkDebugf("Typeface '%s' has no data :(\n", name.c_str());
90 return nullptr;
91 }
92 HBBlob blob(stream_to_blob(std::move(typefaceAsset)));
Ben Wagnera25fbef2017-08-30 13:56:19 -040093 HBFace face(hb_face_create(blob.get(), (unsigned)index));
94 SkASSERT(face);
95 if (!face) {
Ben Wagnere0001732017-08-31 16:26:26 -040096 return nullptr;
Ben Wagnera25fbef2017-08-30 13:56:19 -040097 }
98 hb_face_set_index(face.get(), (unsigned)index);
Ben Wagnere0001732017-08-31 16:26:26 -040099 hb_face_set_upem(face.get(), tf->getUnitsPerEm());
Ben Wagnera25fbef2017-08-30 13:56:19 -0400100
Ben Wagnere0001732017-08-31 16:26:26 -0400101 HBFont font(hb_font_create(face.get()));
102 SkASSERT(font);
103 if (!font) {
104 return nullptr;
105 }
Ben Wagnere0001732017-08-31 16:26:26 -0400106 hb_ot_font_set_funcs(font.get());
107 int axis_count = tf->getVariationDesignPosition(nullptr, 0);
108 if (axis_count > 0) {
109 SkAutoSTMalloc<4, SkFontArguments::VariationPosition::Coordinate> axis_values(axis_count);
110 if (tf->getVariationDesignPosition(axis_values, axis_count) == axis_count) {
111 hb_font_set_variations(font.get(),
112 reinterpret_cast<hb_variation_t*>(axis_values.get()),
113 axis_count);
114 }
115 }
116 return font;
117}
118
Hal Canaryf107a2f2018-07-25 16:52:48 -0400119/** this version replaces invalid utf-8 sequences with code point U+FFFD. */
120static inline SkUnichar utf8_next(const char** ptr, const char* end) {
121 SkUnichar val = SkUTF::NextUTF8(ptr, end);
122 if (val < 0) {
123 return 0xFFFD; // REPLACEMENT CHARACTER
124 }
125 return val;
126}
127
/** Interface for something that splits the utf8 text into consecutive runs. */
class RunIterator {
public:
    virtual ~RunIterator() = default;

    /** Advances to the next run. */
    virtual void consume() = 0;

    /** Pointer one past the last (utf8) element in the current run. */
    virtual const char* endOfCurrentRun() const = 0;

    /** True once there is nothing further to consume. */
    virtual bool atEnd() const = 0;

    /** Orders iterators by where their current run ends. */
    bool operator<(const RunIterator& that) const {
        return that.endOfCurrentRun() > this->endOfCurrentRun();
    }
};
139
140class BiDiRunIterator : public RunIterator {
141public:
142 static SkTLazy<BiDiRunIterator> Make(const char* utf8, size_t utf8Bytes, UBiDiLevel level) {
143 SkTLazy<BiDiRunIterator> ret;
144
145 // ubidi only accepts utf16 (though internally it basically works on utf32 chars).
146 // We want an ubidi_setPara(UBiDi*, UText*, UBiDiLevel, UBiDiLevel*, UErrorCode*);
147 if (!SkTFitsIn<int32_t>(utf8Bytes)) {
148 SkDebugf("Bidi error: text too long");
149 return ret;
150 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500151
152 UErrorCode status = U_ZERO_ERROR;
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -0500153
154 // Getting the length like this seems to always set U_BUFFER_OVERFLOW_ERROR
155 int32_t utf16Units;
156 u_strFromUTF8(nullptr, 0, &utf16Units, utf8, utf8Bytes, &status);
157 status = U_ZERO_ERROR;
158 std::unique_ptr<UChar[]> utf16(new UChar[utf16Units]);
159 u_strFromUTF8(utf16.get(), utf16Units, nullptr, utf8, utf8Bytes, &status);
160 if (U_FAILURE(status)) {
161 SkDebugf("Invalid utf8 input: %s", u_errorName(status));
162 return ret;
163 }
164
165 ICUBiDi bidi(ubidi_openSized(utf16Units, 0, &status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500166 if (U_FAILURE(status)) {
167 SkDebugf("Bidi error: %s", u_errorName(status));
168 return ret;
169 }
170 SkASSERT(bidi);
171
172 // The required lifetime of utf16 isn't well documented.
173 // It appears it isn't used after ubidi_setPara except through ubidi_getText.
Ben Wagnerc5aa8eb2019-01-24 16:15:55 -0500174 ubidi_setPara(bidi.get(), utf16.get(), utf16Units, level, nullptr, &status);
Ben Wagner8d45a382017-11-16 10:08:28 -0500175 if (U_FAILURE(status)) {
176 SkDebugf("Bidi error: %s", u_errorName(status));
177 return ret;
178 }
179
Hal Canary4014ba62018-07-24 11:33:21 -0400180 ret.init(utf8, utf8 + utf8Bytes, std::move(bidi));
Ben Wagner8d45a382017-11-16 10:08:28 -0500181 return ret;
182 }
Hal Canary4014ba62018-07-24 11:33:21 -0400183 BiDiRunIterator(const char* utf8, const char* end, ICUBiDi bidi)
Ben Wagner8d45a382017-11-16 10:08:28 -0500184 : fBidi(std::move(bidi))
185 , fEndOfCurrentRun(utf8)
Hal Canary4014ba62018-07-24 11:33:21 -0400186 , fEndOfAllRuns(end)
Ben Wagner8d45a382017-11-16 10:08:28 -0500187 , fUTF16LogicalPosition(0)
188 , fLevel(UBIDI_DEFAULT_LTR)
189 {}
190 void consume() override {
191 SkASSERT(fUTF16LogicalPosition < ubidi_getLength(fBidi.get()));
192 int32_t endPosition = ubidi_getLength(fBidi.get());
193 fLevel = ubidi_getLevelAt(fBidi.get(), fUTF16LogicalPosition);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400194 SkUnichar u = utf8_next(&fEndOfCurrentRun, fEndOfAllRuns);
195 fUTF16LogicalPosition += SkUTF::ToUTF16(u);
Ben Wagner8d45a382017-11-16 10:08:28 -0500196 UBiDiLevel level;
197 while (fUTF16LogicalPosition < endPosition) {
198 level = ubidi_getLevelAt(fBidi.get(), fUTF16LogicalPosition);
199 if (level != fLevel) {
200 break;
201 }
Hal Canaryf107a2f2018-07-25 16:52:48 -0400202 u = utf8_next(&fEndOfCurrentRun, fEndOfAllRuns);
203 fUTF16LogicalPosition += SkUTF::ToUTF16(u);
Ben Wagner8d45a382017-11-16 10:08:28 -0500204 }
205 }
206 const char* endOfCurrentRun() const override {
207 return fEndOfCurrentRun;
208 }
209 bool atEnd() const override {
210 return fUTF16LogicalPosition == ubidi_getLength(fBidi.get());
211 }
212
213 UBiDiLevel currentLevel() const {
214 return fLevel;
215 }
216private:
217 ICUBiDi fBidi;
218 const char* fEndOfCurrentRun;
Hal Canary4014ba62018-07-24 11:33:21 -0400219 const char* fEndOfAllRuns;
Ben Wagner8d45a382017-11-16 10:08:28 -0500220 int32_t fUTF16LogicalPosition;
221 UBiDiLevel fLevel;
222};
223
224class ScriptRunIterator : public RunIterator {
225public:
226 static SkTLazy<ScriptRunIterator> Make(const char* utf8, size_t utf8Bytes,
227 hb_unicode_funcs_t* hbUnicode)
228 {
229 SkTLazy<ScriptRunIterator> ret;
230 ret.init(utf8, utf8Bytes, hbUnicode);
231 return ret;
232 }
233 ScriptRunIterator(const char* utf8, size_t utf8Bytes, hb_unicode_funcs_t* hbUnicode)
234 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
235 , fHBUnicode(hbUnicode)
236 , fCurrentScript(HB_SCRIPT_UNKNOWN)
237 {}
238 void consume() override {
239 SkASSERT(fCurrent < fEnd);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400240 SkUnichar u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500241 fCurrentScript = hb_unicode_script(fHBUnicode, u);
242 while (fCurrent < fEnd) {
243 const char* prev = fCurrent;
Hal Canaryf107a2f2018-07-25 16:52:48 -0400244 u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500245 const hb_script_t script = hb_unicode_script(fHBUnicode, u);
246 if (script != fCurrentScript) {
247 if (fCurrentScript == HB_SCRIPT_INHERITED || fCurrentScript == HB_SCRIPT_COMMON) {
248 fCurrentScript = script;
249 } else if (script == HB_SCRIPT_INHERITED || script == HB_SCRIPT_COMMON) {
250 continue;
251 } else {
252 fCurrent = prev;
253 break;
254 }
255 }
256 }
257 if (fCurrentScript == HB_SCRIPT_INHERITED) {
258 fCurrentScript = HB_SCRIPT_COMMON;
259 }
260 }
261 const char* endOfCurrentRun() const override {
262 return fCurrent;
263 }
264 bool atEnd() const override {
265 return fCurrent == fEnd;
266 }
267
268 hb_script_t currentScript() const {
269 return fCurrentScript;
270 }
271private:
272 const char* fCurrent;
273 const char* fEnd;
274 hb_unicode_funcs_t* fHBUnicode;
275 hb_script_t fCurrentScript;
276};
277
278class FontRunIterator : public RunIterator {
279public:
280 static SkTLazy<FontRunIterator> Make(const char* utf8, size_t utf8Bytes,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400281 SkFont font,
Ben Wagner8d45a382017-11-16 10:08:28 -0500282 sk_sp<SkFontMgr> fallbackMgr)
283 {
284 SkTLazy<FontRunIterator> ret;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400285 font.setTypeface(font.refTypefaceOrDefault());
286 HBFont hbFont = create_hb_font(font.getTypeface());
287 if (!hbFont) {
288 SkDebugf("create_hb_font failed!\n");
289 return ret;
290 }
291 ret.init(utf8, utf8Bytes, std::move(font), std::move(hbFont), std::move(fallbackMgr));
Ben Wagner8d45a382017-11-16 10:08:28 -0500292 return ret;
293 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400294 FontRunIterator(const char* utf8, size_t utf8Bytes, SkFont font,
295 HBFont hbFont, sk_sp<SkFontMgr> fallbackMgr)
Ben Wagner8d45a382017-11-16 10:08:28 -0500296 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
297 , fFallbackMgr(std::move(fallbackMgr))
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400298 , fHBFont(std::move(hbFont)), fFont(std::move(font))
299 , fFallbackHBFont(nullptr), fFallbackFont(fFont)
300 , fCurrentHBFont(fHBFont.get()), fCurrentFont(&fFont)
301 {
302 fFallbackFont.setTypeface(nullptr);
303 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500304 void consume() override {
305 SkASSERT(fCurrent < fEnd);
Hal Canaryf107a2f2018-07-25 16:52:48 -0400306 SkUnichar u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500307 // If the starting typeface can handle this character, use it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400308 if (fFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1)) {
309 fCurrentFont = &fFont;
310 fCurrentHBFont = fHBFont.get();
Ben Wagnera900ad52018-08-31 17:48:19 -0400311 // If the current fallback can handle this character, use it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400312 } else if (fFallbackFont.getTypeface() &&
313 fFallbackFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1))
Ben Wagnera900ad52018-08-31 17:48:19 -0400314 {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400315 fCurrentFont = &fFallbackFont;
Ben Wagnera900ad52018-08-31 17:48:19 -0400316 fCurrentHBFont = fFallbackHBFont.get();
Ben Wagner8d45a382017-11-16 10:08:28 -0500317 // If not, try to find a fallback typeface
318 } else {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400319 fFallbackFont.setTypeface(sk_ref_sp(fFallbackMgr->matchFamilyStyleCharacter(
320 nullptr, fFont.getTypeface()->fontStyle(), nullptr, 0, u)));
321 fFallbackHBFont = create_hb_font(fFallbackFont.getTypeface());
322 fCurrentFont = &fFallbackFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500323 fCurrentHBFont = fFallbackHBFont.get();
Ben Wagner8d45a382017-11-16 10:08:28 -0500324 }
325
326 while (fCurrent < fEnd) {
327 const char* prev = fCurrent;
Hal Canaryf107a2f2018-07-25 16:52:48 -0400328 u = utf8_next(&fCurrent, fEnd);
Ben Wagner8d45a382017-11-16 10:08:28 -0500329
Ben Wagnera900ad52018-08-31 17:48:19 -0400330 // If not using initial typeface and initial typeface has this character, stop fallback.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400331 if (fCurrentFont->getTypeface() != fFont.getTypeface() &&
332 fFont.getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1))
Ben Wagner8d45a382017-11-16 10:08:28 -0500333 {
334 fCurrent = prev;
335 return;
336 }
337 // If the current typeface cannot handle this character, stop using it.
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400338 if (!fCurrentFont->getTypeface()->charsToGlyphs(&u, SkTypeface::kUTF32_Encoding, nullptr, 1)) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500339 fCurrent = prev;
340 return;
341 }
342 }
343 }
344 const char* endOfCurrentRun() const override {
345 return fCurrent;
346 }
347 bool atEnd() const override {
348 return fCurrent == fEnd;
349 }
350
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400351 SkFont* currentFont() const {
352 return fCurrentFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500353 }
354 hb_font_t* currentHBFont() const {
355 return fCurrentHBFont;
356 }
357private:
358 const char* fCurrent;
359 const char* fEnd;
360 sk_sp<SkFontMgr> fFallbackMgr;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400361 HBFont fHBFont;
362 SkFont fFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500363 HBFont fFallbackHBFont;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400364 SkFont fFallbackFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500365 hb_font_t* fCurrentHBFont;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400366 SkFont* fCurrentFont;
367};
368
369class LanguageRunIterator : public RunIterator {
370public:
371 static SkTLazy<LanguageRunIterator> Make(const char* utf8, size_t utf8Bytes) {
372 SkTLazy<LanguageRunIterator> ret;
373 ret.init(utf8, utf8Bytes);
374 return ret;
375 }
376 LanguageRunIterator(const char* utf8, size_t utf8Bytes)
377 : fCurrent(utf8), fEnd(fCurrent + utf8Bytes)
378 , fLanguage(hb_language_from_string(std::locale().name().c_str(), -1))
379 { }
380 void consume() override {
381 // Ideally something like cld2/3 could be used, or user signals.
382 SkASSERT(fCurrent < fEnd);
383 fCurrent = fEnd;
384 }
385 const char* endOfCurrentRun() const override {
386 return fCurrent;
387 }
388 bool atEnd() const override {
389 return fCurrent == fEnd;
390 }
391
392 hb_language_t currentLanguage() const {
393 return fLanguage;
394 }
395private:
396 const char* fCurrent;
397 const char* fEnd;
398 hb_language_t fLanguage;
Ben Wagner8d45a382017-11-16 10:08:28 -0500399};
400
401class RunIteratorQueue {
402public:
403 void insert(RunIterator* runIterator) {
404 fRunIterators.insert(runIterator);
405 }
406
407 bool advanceRuns() {
408 const RunIterator* leastRun = fRunIterators.peek();
409 if (leastRun->atEnd()) {
410 SkASSERT(this->allRunsAreAtEnd());
411 return false;
412 }
413 const char* leastEnd = leastRun->endOfCurrentRun();
414 RunIterator* currentRun = nullptr;
415 SkDEBUGCODE(const char* previousEndOfCurrentRun);
416 while ((currentRun = fRunIterators.peek())->endOfCurrentRun() <= leastEnd) {
417 fRunIterators.pop();
418 SkDEBUGCODE(previousEndOfCurrentRun = currentRun->endOfCurrentRun());
419 currentRun->consume();
420 SkASSERT(previousEndOfCurrentRun < currentRun->endOfCurrentRun());
421 fRunIterators.insert(currentRun);
422 }
423 return true;
424 }
425
426 const char* endOfCurrentRun() const {
427 return fRunIterators.peek()->endOfCurrentRun();
428 }
429
430private:
431 bool allRunsAreAtEnd() const {
432 for (int i = 0; i < fRunIterators.count(); ++i) {
433 if (!fRunIterators.at(i)->atEnd()) {
434 return false;
435 }
436 }
437 return true;
438 }
439
440 static bool CompareRunIterator(RunIterator* const& a, RunIterator* const& b) {
441 return *a < *b;
442 }
443 SkTDPQueue<RunIterator*, CompareRunIterator> fRunIterators;
444};
445
446struct ShapedGlyph {
447 SkGlyphID fID;
448 uint32_t fCluster;
449 SkPoint fOffset;
450 SkVector fAdvance;
451 bool fMayLineBreakBefore;
452 bool fMustLineBreakBefore;
453 bool fHasVisual;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400454 bool fGraphemeBreakBefore;
455 bool fUnsafeToBreak;
Ben Wagner8d45a382017-11-16 10:08:28 -0500456};
457struct ShapedRun {
Mike Reed6d595682018-12-05 17:28:14 -0500458 ShapedRun(const char* utf8Start, const char* utf8End, int numGlyphs, const SkFont& font,
Ben Wagner8d45a382017-11-16 10:08:28 -0500459 UBiDiLevel level, std::unique_ptr<ShapedGlyph[]> glyphs)
Mike Reed6d595682018-12-05 17:28:14 -0500460 : fUtf8Start(utf8Start), fUtf8End(utf8End), fNumGlyphs(numGlyphs), fFont(font)
Ben Wagner8d45a382017-11-16 10:08:28 -0500461 , fLevel(level), fGlyphs(std::move(glyphs))
462 {}
463
464 const char* fUtf8Start;
465 const char* fUtf8End;
466 int fNumGlyphs;
Mike Reed6d595682018-12-05 17:28:14 -0500467 SkFont fFont;
Ben Wagner8d45a382017-11-16 10:08:28 -0500468 UBiDiLevel fLevel;
469 std::unique_ptr<ShapedGlyph[]> fGlyphs;
Florin Malita950243d2019-01-11 11:08:35 -0500470 SkVector fAdvance = { 0, 0 };
Ben Wagner8d45a382017-11-16 10:08:28 -0500471};
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400472struct ShapedLine {
473 SkTArray<ShapedRun> runs;
474 SkVector fAdvance = { 0, 0 };
475};
Ben Wagner8d45a382017-11-16 10:08:28 -0500476
477static constexpr bool is_LTR(UBiDiLevel level) {
478 return (level & 1) == 0;
479}
480
Florin Malita950243d2019-01-11 11:08:35 -0500481static void append(SkShaper::RunHandler* handler, const SkShaper::RunHandler::RunInfo& runInfo,
482 const ShapedRun& run, int start, int end,
Florin Malita9867f612018-12-12 10:54:49 -0500483 SkPoint* p) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500484 unsigned len = end - start;
Florin Malita9867f612018-12-12 10:54:49 -0500485
Florin Malita950243d2019-01-11 11:08:35 -0500486 const auto buffer = handler->newRunBuffer(runInfo, run.fFont, len, run.fUtf8End - run.fUtf8Start);
Florin Malita9867f612018-12-12 10:54:49 -0500487 SkASSERT(buffer.glyphs);
488 SkASSERT(buffer.positions);
489
490 if (buffer.utf8text) {
491 memcpy(buffer.utf8text, run.fUtf8Start, run.fUtf8End - run.fUtf8Start);
492 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500493
494 for (unsigned i = 0; i < len; i++) {
495 // Glyphs are in logical order, but output ltr since PDF readers seem to expect that.
496 const ShapedGlyph& glyph = run.fGlyphs[is_LTR(run.fLevel) ? start + i : end - 1 - i];
Florin Malita9867f612018-12-12 10:54:49 -0500497 buffer.glyphs[i] = glyph.fID;
498 buffer.positions[i] = SkPoint::Make(p->fX + glyph.fOffset.fX, p->fY - glyph.fOffset.fY);
499 if (buffer.clusters) {
500 buffer.clusters[i] = glyph.fCluster;
501 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500502 p->fX += glyph.fAdvance.fX;
503 p->fY += glyph.fAdvance.fY;
504 }
505}
506
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400507static void emit(const ShapedLine& line, SkShaper::RunHandler* handler,
Florin Malita500133b2019-02-07 10:56:55 -0500508 SkPoint point, SkPoint& currentPoint)
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400509{
510 // Reorder the runs and glyphs per line and write them out.
511 SkScalar maxAscent = 0;
512 SkScalar maxDescent = 0;
513 SkScalar maxLeading = 0;
514 for (const ShapedRun& run : line.runs) {
515 SkFontMetrics metrics;
516 run.fFont.getMetrics(&metrics);
517 maxAscent = SkTMin(maxAscent, metrics.fAscent);
518 maxDescent = SkTMax(maxDescent, metrics.fDescent);
519 maxLeading = SkTMax(maxLeading, metrics.fLeading);
520 }
521
522 int numRuns = line.runs.size();
523 SkAutoSTMalloc<4, UBiDiLevel> runLevels(numRuns);
524 for (int i = 0; i < numRuns; ++i) {
525 runLevels[i] = line.runs[i].fLevel;
526 }
527 SkAutoSTMalloc<4, int32_t> logicalFromVisual(numRuns);
528 ubidi_reorderVisual(runLevels, numRuns, logicalFromVisual);
529
530 currentPoint.fY -= maxAscent;
531
532 for (int i = 0; i < numRuns; ++i) {
533 int logicalIndex = logicalFromVisual[i];
534
535 const auto& run = line.runs[logicalIndex];
536 const SkShaper::RunHandler::RunInfo info = {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400537 run.fAdvance,
538 maxAscent,
539 maxDescent,
540 maxLeading,
541 };
542 append(handler, info, run, 0, run.fNumGlyphs, &currentPoint);
543 }
544
545 currentPoint.fY += maxDescent + maxLeading;
546 currentPoint.fX = point.fX;
547
Florin Malita500133b2019-02-07 10:56:55 -0500548 handler->commitLine();
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400549}
550
Ben Wagner8d45a382017-11-16 10:08:28 -0500551struct ShapedRunGlyphIterator {
552 ShapedRunGlyphIterator(const SkTArray<ShapedRun>& origRuns)
553 : fRuns(&origRuns), fRunIndex(0), fGlyphIndex(0)
554 { }
555
556 ShapedRunGlyphIterator(const ShapedRunGlyphIterator& that) = default;
557 ShapedRunGlyphIterator& operator=(const ShapedRunGlyphIterator& that) = default;
558 bool operator==(const ShapedRunGlyphIterator& that) const {
559 return fRuns == that.fRuns &&
560 fRunIndex == that.fRunIndex &&
561 fGlyphIndex == that.fGlyphIndex;
562 }
563 bool operator!=(const ShapedRunGlyphIterator& that) const {
564 return fRuns != that.fRuns ||
565 fRunIndex != that.fRunIndex ||
566 fGlyphIndex != that.fGlyphIndex;
567 }
568
569 ShapedGlyph* next() {
570 const SkTArray<ShapedRun>& runs = *fRuns;
571 SkASSERT(fRunIndex < runs.count());
572 SkASSERT(fGlyphIndex < runs[fRunIndex].fNumGlyphs);
573
574 ++fGlyphIndex;
575 if (fGlyphIndex == runs[fRunIndex].fNumGlyphs) {
576 fGlyphIndex = 0;
577 ++fRunIndex;
578 if (fRunIndex >= runs.count()) {
579 return nullptr;
580 }
581 }
582 return &runs[fRunIndex].fGlyphs[fGlyphIndex];
583 }
584
585 ShapedGlyph* current() {
586 const SkTArray<ShapedRun>& runs = *fRuns;
587 if (fRunIndex >= runs.count()) {
588 return nullptr;
589 }
590 return &runs[fRunIndex].fGlyphs[fGlyphIndex];
591 }
592
593 const SkTArray<ShapedRun>* fRuns;
594 int fRunIndex;
595 int fGlyphIndex;
596};
597
598} // namespace
599
600struct SkShaper::Impl {
601 HBFont fHarfBuzzFont;
602 HBBuffer fBuffer;
603 sk_sp<SkTypeface> fTypeface;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400604 ICUBrk fLineBreakIterator;
605 ICUBrk fGraphemeBreakIterator;
606
607 SkPoint shapeCorrect(RunHandler* handler,
608 const char* utf8,
609 size_t utf8Bytes,
610 SkPoint point,
611 SkScalar width,
612 RunIteratorQueue& runSegmenter,
613 const BiDiRunIterator* bidi,
614 const LanguageRunIterator* language,
615 const ScriptRunIterator* script,
616 const FontRunIterator* font) const;
617
618 SkPoint shapeOk(RunHandler* handler,
619 const char* utf8,
620 size_t utf8Bytes,
621 SkPoint point,
622 SkScalar width,
623 RunIteratorQueue& runSegmenter,
624 const BiDiRunIterator* bidi,
625 const LanguageRunIterator* language,
626 const ScriptRunIterator* script,
627 const FontRunIterator* font) const;
628
629 ShapedRun shape(const char* utf8,
630 size_t utf8Bytes,
631 const char* utf8Start,
632 const char* utf8End,
633 const BiDiRunIterator* bidi,
634 const LanguageRunIterator* language,
635 const ScriptRunIterator* script,
636 const FontRunIterator* font) const;
Ben Wagner8d45a382017-11-16 10:08:28 -0500637};
638
Ben Wagnere0001732017-08-31 16:26:26 -0400639SkShaper::SkShaper(sk_sp<SkTypeface> tf) : fImpl(new Impl) {
Hal Canary61021922019-02-06 12:29:11 -0500640#if defined(SK_USING_THIRD_PARTY_ICU)
641 if (!SkLoadICU()) {
642 SkDebugf("SkLoadICU() failed!\n");
643 return;
644 }
645#endif
Ben Wagnere0001732017-08-31 16:26:26 -0400646 fImpl->fTypeface = tf ? std::move(tf) : SkTypeface::MakeDefault();
647 fImpl->fHarfBuzzFont = create_hb_font(fImpl->fTypeface.get());
Florin Malitaa4e1a632019-01-22 16:27:01 -0500648 if (!fImpl->fHarfBuzzFont) {
649 SkDebugf("create_hb_font failed!\n");
650 }
Ben Wagnera25fbef2017-08-30 13:56:19 -0400651 fImpl->fBuffer.reset(hb_buffer_create());
Ben Wagner8d45a382017-11-16 10:08:28 -0500652 SkASSERT(fImpl->fBuffer);
653
Ben Wagner8d45a382017-11-16 10:08:28 -0500654 UErrorCode status = U_ZERO_ERROR;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400655 fImpl->fLineBreakIterator.reset(ubrk_open(UBRK_LINE, "th", nullptr, 0, &status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500656 if (U_FAILURE(status)) {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400657 SkDebugf("Could not create line break iterator: %s", u_errorName(status));
Ben Wagner8d45a382017-11-16 10:08:28 -0500658 SK_ABORT("");
659 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400660
661 fImpl->fGraphemeBreakIterator.reset(ubrk_open(UBRK_CHARACTER, "th", nullptr, 0, &status));
662 if (U_FAILURE(status)) {
663 SkDebugf("Could not create grapheme break iterator: %s", u_errorName(status));
664 SK_ABORT("");
665 }
666
Ben Wagnera25fbef2017-08-30 13:56:19 -0400667}
668
669SkShaper::~SkShaper() {}
670
Ben Wagner8d45a382017-11-16 10:08:28 -0500671bool SkShaper::good() const {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400672 return fImpl->fBuffer &&
673 fImpl->fLineBreakIterator &&
674 fImpl->fGraphemeBreakIterator;
Ben Wagner8d45a382017-11-16 10:08:28 -0500675}
Ben Wagnera25fbef2017-08-30 13:56:19 -0400676
Florin Malita950243d2019-01-11 11:08:35 -0500677SkPoint SkShaper::shape(RunHandler* handler,
Kevin Lubick57abfe92019-01-28 13:15:51 -0500678 const SkFont& srcFont,
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500679 const char* utf8,
680 size_t utf8Bytes,
681 bool leftToRight,
682 SkPoint point,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400683 SkScalar width) const
Ben Wagner8d45a382017-11-16 10:08:28 -0500684{
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400685 SkASSERT(handler);
686 sk_sp<SkFontMgr> fontMgr = SkFontMgr::RefDefault();
687 UBiDiLevel defaultLevel = leftToRight ? UBIDI_DEFAULT_LTR : UBIDI_DEFAULT_RTL;
688
Ben Wagner8d45a382017-11-16 10:08:28 -0500689 RunIteratorQueue runSegmenter;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400690
Ben Wagner8d45a382017-11-16 10:08:28 -0500691 SkTLazy<BiDiRunIterator> maybeBidi(BiDiRunIterator::Make(utf8, utf8Bytes, defaultLevel));
692 BiDiRunIterator* bidi = maybeBidi.getMaybeNull();
693 if (!bidi) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500694 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400695 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500696 runSegmenter.insert(bidi);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400697
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400698 SkTLazy<LanguageRunIterator> maybeLanguage(LanguageRunIterator::Make(utf8, utf8Bytes));
699 LanguageRunIterator* language = maybeLanguage.getMaybeNull();
700 if (!language) {
701 return point;
702 }
703 runSegmenter.insert(language);
704
Ben Wagner8d45a382017-11-16 10:08:28 -0500705 hb_unicode_funcs_t* hbUnicode = hb_buffer_get_unicode_funcs(fImpl->fBuffer.get());
706 SkTLazy<ScriptRunIterator> maybeScript(ScriptRunIterator::Make(utf8, utf8Bytes, hbUnicode));
707 ScriptRunIterator* script = maybeScript.getMaybeNull();
708 if (!script) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500709 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400710 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500711 runSegmenter.insert(script);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400712
Ben Wagner8d45a382017-11-16 10:08:28 -0500713 SkTLazy<FontRunIterator> maybeFont(FontRunIterator::Make(utf8, utf8Bytes,
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400714 srcFont, std::move(fontMgr)));
Ben Wagner8d45a382017-11-16 10:08:28 -0500715 FontRunIterator* font = maybeFont.getMaybeNull();
716 if (!font) {
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500717 return point;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400718 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500719 runSegmenter.insert(font);
Ben Wagnera25fbef2017-08-30 13:56:19 -0400720
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400721 if (true) {
722 return fImpl->shapeCorrect(handler, utf8, utf8Bytes, point, width,
723 runSegmenter, bidi, language, script, font);
724 } else {
725 return fImpl->shapeOk(handler, utf8, utf8Bytes, point, width,
726 runSegmenter, bidi, language, script, font);
727 }
728}
729
730SkPoint SkShaper::Impl::shapeCorrect(RunHandler* handler,
731 const char* utf8,
732 size_t utf8Bytes,
733 SkPoint point,
734 SkScalar width,
735 RunIteratorQueue& runSegmenter,
736 const BiDiRunIterator* bidi,
737 const LanguageRunIterator* language,
738 const ScriptRunIterator* script,
739 const FontRunIterator* font) const
740{
741 ShapedLine line;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400742 SkPoint currentPoint = point;
743
744 const char* utf8Start = nullptr;
745 const char* utf8End = utf8;
746 while (runSegmenter.advanceRuns()) { // For each item
747 utf8Start = utf8End;
748 utf8End = runSegmenter.endOfCurrentRun();
749
750 ShapedRun model(nullptr, nullptr, 0, SkFont(), 0, nullptr);
751 bool modelNeedsRegenerated = true;
752 int modelOffset = 0;
753
754 struct TextProps {
755 int glyphLen = 0;
756 SkVector advance = {0, 0};
757 };
758 // map from character position to [safe to break, glyph position, advance]
759 std::unique_ptr<TextProps[]> modelText;
760 int modelTextOffset = 0;
761 SkVector modelTextAdvanceOffset = {0, 0};
762
763 while (utf8Start < utf8End) { // While there are still code points left in this item
764 size_t utf8runLength = utf8End - utf8Start;
765 if (modelNeedsRegenerated) {
766 model = shape(utf8, utf8Bytes,
767 utf8Start, utf8End,
768 bidi, language, script, font);
769 modelOffset = 0;
770
771 SkVector advance = {0, 0};
772 modelText.reset(new TextProps[utf8runLength + 1]());
773 for (int i = 0; i < model.fNumGlyphs; ++i) {
774 SkASSERT(model.fGlyphs[i].fCluster < utf8runLength);
775 if (!model.fGlyphs[i].fUnsafeToBreak) {
776 modelText[model.fGlyphs[i].fCluster].glyphLen = i;
777 modelText[model.fGlyphs[i].fCluster].advance = advance;
778 }
779 advance += model.fGlyphs[i].fAdvance;
780 }
781 // Assume it is always safe to break after the end of an item
782 modelText[utf8runLength].glyphLen = model.fNumGlyphs;
783 modelText[utf8runLength].advance = model.fAdvance;
784 modelTextOffset = 0;
785 modelTextAdvanceOffset = {0, 0};
786 modelNeedsRegenerated = false;
787 }
788
789 // TODO: break iterator per item, but just reset position if needed?
790 // Maybe break iterator with model?
791 UBreakIterator& breakIterator = *fLineBreakIterator;
792 {
793 UErrorCode status = U_ZERO_ERROR;
794 UText utf8UText = UTEXT_INITIALIZER;
795 utext_openUTF8(&utf8UText, utf8Start, utf8runLength, &status);
796 std::unique_ptr<UText, SkFunctionWrapper<UText*, UText, utext_close>> autoClose(&utf8UText);
797 if (U_FAILURE(status)) {
798 SkDebugf("Could not create utf8UText: %s", u_errorName(status));
799 return point;
800 }
801 ubrk_setUText(&breakIterator, &utf8UText, &status);
802 if (U_FAILURE(status)) {
803 SkDebugf("Could not setText on break iterator: %s", u_errorName(status));
804 return point;
805 }
806 }
807
808 ShapedRun best(nullptr, nullptr, 0, SkFont(), 0, nullptr);
809 best.fAdvance = { SK_ScalarNegativeInfinity, SK_ScalarNegativeInfinity };
810 SkScalar widthLeft = width - line.fAdvance.fX;
811
812 for (int32_t breakIteratorCurrent = ubrk_next(&breakIterator);
813 breakIteratorCurrent != UBRK_DONE;
814 breakIteratorCurrent = ubrk_next(&breakIterator))
815 {
816 // TODO: if past a safe to break, future safe to break will be at least as long
817
818 // TODO: adjust breakIteratorCurrent by ignorable whitespace
819 ShapedRun candidate = modelText[breakIteratorCurrent + modelTextOffset].glyphLen
820 ? ShapedRun(utf8Start, utf8Start + breakIteratorCurrent,
821 modelText[breakIteratorCurrent + modelTextOffset].glyphLen - modelOffset,
822 *font->currentFont(),
823 bidi->currentLevel(),
824 std::unique_ptr<ShapedGlyph[]>())
825 : shape(utf8, utf8Bytes,
826 utf8Start, utf8Start + breakIteratorCurrent,
827 bidi, language, script, font);
828 if (!candidate.fUtf8Start) {
829 //report error
830 return point;
831 }
832 if (!candidate.fGlyphs) {
833 candidate.fAdvance = modelText[breakIteratorCurrent + modelTextOffset].advance - modelTextAdvanceOffset;
834 }
835 auto score = [widthLeft](const ShapedRun& run) -> SkScalar {
836 if (run.fAdvance.fX < widthLeft) {
837 if (run.fUtf8Start == nullptr) {
838 return SK_ScalarNegativeInfinity;
839 } else {
840 return run.fUtf8End - run.fUtf8Start;
841 }
842 } else {
843 return widthLeft - run.fAdvance.fX;
844 }
845 };
846 if (score(best) < score(candidate)) {
847 best = std::move(candidate);
848 }
849 }
850
851 // If nothing fit (best score is negative) and the line is not empty
852 if (width < line.fAdvance.fX + best.fAdvance.fX && !line.runs.empty()) {
Florin Malita500133b2019-02-07 10:56:55 -0500853 emit(line, handler, point, currentPoint);
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400854 line.runs.reset();
855 line.fAdvance = {0, 0};
856 } else {
857 if (!best.fGlyphs) {
858 best.fGlyphs.reset(new ShapedGlyph[best.fNumGlyphs]);
859 memcpy(best.fGlyphs.get(), model.fGlyphs.get() + modelOffset,
860 best.fNumGlyphs * sizeof(ShapedGlyph));
861 modelOffset += best.fNumGlyphs;
862 modelTextOffset += best.fUtf8End - best.fUtf8Start;
863 modelTextAdvanceOffset += best.fAdvance;
864 } else {
865 modelNeedsRegenerated = true;
866 }
867 utf8Start = best.fUtf8End;
868 line.fAdvance += best.fAdvance;
869 line.runs.emplace_back(std::move(best));
870
871 // If item broken, emit line (prevent remainder from accidentally fitting)
872 if (utf8Start != utf8End) {
Florin Malita500133b2019-02-07 10:56:55 -0500873 emit(line, handler, point, currentPoint);
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400874 line.runs.reset();
875 line.fAdvance = {0, 0};
876 }
877 }
878 }
879 }
Florin Malita500133b2019-02-07 10:56:55 -0500880 emit(line, handler, point, currentPoint);
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400881 return currentPoint;
882}
883
884SkPoint SkShaper::Impl::shapeOk(RunHandler* handler,
885 const char* utf8,
886 size_t utf8Bytes,
887 SkPoint point,
888 SkScalar width,
889 RunIteratorQueue& runSegmenter,
890 const BiDiRunIterator* bidi,
891 const LanguageRunIterator* language,
892 const ScriptRunIterator* script,
893 const FontRunIterator* font) const
894{
895 SkTArray<ShapedRun> runs;
896{
897 UBreakIterator& lineBreakIterator = *fLineBreakIterator;
898 UBreakIterator& graphemeBreakIterator = *fGraphemeBreakIterator;
Ben Wagner8d45a382017-11-16 10:08:28 -0500899 {
900 UErrorCode status = U_ZERO_ERROR;
901 UText utf8UText = UTEXT_INITIALIZER;
902 utext_openUTF8(&utf8UText, utf8, utf8Bytes, &status);
903 std::unique_ptr<UText, SkFunctionWrapper<UText*, UText, utext_close>> autoClose(&utf8UText);
904 if (U_FAILURE(status)) {
905 SkDebugf("Could not create utf8UText: %s", u_errorName(status));
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500906 return point;
Ben Wagner8d45a382017-11-16 10:08:28 -0500907 }
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400908
909 ubrk_setUText(&lineBreakIterator, &utf8UText, &status);
Ben Wagner8d45a382017-11-16 10:08:28 -0500910 if (U_FAILURE(status)) {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400911 SkDebugf("Could not setText on line break iterator: %s", u_errorName(status));
912 return point;
913 }
914 ubrk_setUText(&graphemeBreakIterator, &utf8UText, &status);
915 if (U_FAILURE(status)) {
916 SkDebugf("Could not setText on grapheme break iterator: %s", u_errorName(status));
Ben Wagner5d4dd8b2018-01-25 14:37:17 -0500917 return point;
Ben Wagner8d45a382017-11-16 10:08:28 -0500918 }
Ben Wagnera25fbef2017-08-30 13:56:19 -0400919 }
920
Ben Wagner8d45a382017-11-16 10:08:28 -0500921 const char* utf8Start = nullptr;
922 const char* utf8End = utf8;
923 while (runSegmenter.advanceRuns()) {
924 utf8Start = utf8End;
925 utf8End = runSegmenter.endOfCurrentRun();
926
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400927 runs.emplace_back(shape(utf8, utf8Bytes,
928 utf8Start, utf8End,
929 bidi, language, script, font));
930 ShapedRun& run = runs.back();
Ben Wagnera25fbef2017-08-30 13:56:19 -0400931
Ben Wagner8d45a382017-11-16 10:08:28 -0500932 int32_t clusterOffset = utf8Start - utf8;
933 uint32_t previousCluster = 0xFFFFFFFF;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400934 for (int i = 0; i < run.fNumGlyphs; ++i) {
Ben Wagner8d45a382017-11-16 10:08:28 -0500935 ShapedGlyph& glyph = run.fGlyphs[i];
936 int32_t glyphCluster = glyph.fCluster + clusterOffset;
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400937
938 int32_t lineBreakIteratorCurrent = ubrk_current(&lineBreakIterator);
939 while (lineBreakIteratorCurrent != UBRK_DONE &&
940 lineBreakIteratorCurrent < glyphCluster)
Ben Wagner8d45a382017-11-16 10:08:28 -0500941 {
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400942 lineBreakIteratorCurrent = ubrk_next(&lineBreakIterator);
Ben Wagner2868b782017-08-31 14:12:27 -0400943 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500944 glyph.fMayLineBreakBefore = glyph.fCluster != previousCluster &&
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400945 lineBreakIteratorCurrent == glyphCluster;
946
947 int32_t graphemeBreakIteratorCurrent = ubrk_current(&graphemeBreakIterator);
948 while (graphemeBreakIteratorCurrent != UBRK_DONE &&
949 graphemeBreakIteratorCurrent < glyphCluster)
950 {
951 graphemeBreakIteratorCurrent = ubrk_next(&graphemeBreakIterator);
952 }
953 glyph.fGraphemeBreakBefore = glyph.fCluster != previousCluster &&
954 graphemeBreakIteratorCurrent == glyphCluster;
955
Ben Wagner8d45a382017-11-16 10:08:28 -0500956 previousCluster = glyph.fCluster;
Ben Wagnera25fbef2017-08-30 13:56:19 -0400957 }
958 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500959}
960
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400961// Iterate over the glyphs in logical order to find potential line lengths.
Ben Wagner8d45a382017-11-16 10:08:28 -0500962{
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400963 /** The position of the beginning of the line. */
964 ShapedRunGlyphIterator beginning(runs);
965
966 /** The position of the candidate line break. */
967 ShapedRunGlyphIterator candidateLineBreak(runs);
968 SkScalar candidateLineBreakWidth = 0;
969
970 /** The position of the candidate grapheme break. */
971 ShapedRunGlyphIterator candidateGraphemeBreak(runs);
972 SkScalar candidateGraphemeBreakWidth = 0;
973
974 /** The position of the current location. */
975 ShapedRunGlyphIterator current(runs);
976 SkScalar currentWidth = 0;
977 while (ShapedGlyph* glyph = current.current()) {
978 // 'Break' at graphemes until a line boundary, then only at line boundaries.
979 // Only break at graphemes if no line boundary is valid.
980 if (current != beginning) {
981 if (glyph->fGraphemeBreakBefore || glyph->fMayLineBreakBefore) {
982 // TODO: preserve line breaks <= grapheme breaks
983 // and prevent line breaks inside graphemes
984 candidateGraphemeBreak = current;
985 candidateGraphemeBreakWidth = currentWidth;
986 if (glyph->fMayLineBreakBefore) {
987 candidateLineBreak = current;
988 candidateLineBreakWidth = currentWidth;
989 }
990 }
Ben Wagner8d45a382017-11-16 10:08:28 -0500991 }
992
Ben Wagner0ec8ec22018-09-04 18:17:13 -0400993 SkScalar glyphWidth = glyph->fAdvance.fX;
994 // Break when overwidth, the glyph has a visual representation, and some space is used.
995 if (width < currentWidth + glyphWidth && glyph->fHasVisual && candidateGraphemeBreakWidth > 0){
996 if (candidateLineBreak != beginning) {
997 beginning = candidateLineBreak;
998 currentWidth -= candidateLineBreakWidth;
999 candidateGraphemeBreakWidth -= candidateLineBreakWidth;
1000 candidateLineBreakWidth = 0;
1001 } else if (candidateGraphemeBreak != beginning) {
1002 beginning = candidateGraphemeBreak;
1003 candidateLineBreak = beginning;
1004 currentWidth -= candidateGraphemeBreakWidth;
1005 candidateGraphemeBreakWidth = 0;
1006 candidateLineBreakWidth = 0;
1007 } else {
1008 SK_ABORT("");
1009 }
1010
1011 if (width < currentWidth) {
1012 if (width < candidateGraphemeBreakWidth) {
1013 candidateGraphemeBreak = candidateLineBreak;
1014 candidateGraphemeBreakWidth = candidateLineBreakWidth;
1015 }
1016 current = candidateGraphemeBreak;
1017 currentWidth = candidateGraphemeBreakWidth;
1018 }
1019
1020 glyph = beginning.current();
1021 if (glyph) {
1022 glyph->fMustLineBreakBefore = true;
1023 }
1024
1025 } else {
1026 current.next();
1027 currentWidth += glyphWidth;
Ben Wagner8d45a382017-11-16 10:08:28 -05001028 }
Ben Wagner8d45a382017-11-16 10:08:28 -05001029 }
1030}
1031
1032// Reorder the runs and glyphs per line and write them out.
Ben Wagner5d4dd8b2018-01-25 14:37:17 -05001033 SkPoint currentPoint = point;
Ben Wagner8d45a382017-11-16 10:08:28 -05001034{
1035 ShapedRunGlyphIterator previousBreak(runs);
1036 ShapedRunGlyphIterator glyphIterator(runs);
1037 SkScalar maxAscent = 0;
1038 SkScalar maxDescent = 0;
1039 SkScalar maxLeading = 0;
1040 int previousRunIndex = -1;
1041 while (glyphIterator.current()) {
1042 int runIndex = glyphIterator.fRunIndex;
1043 int glyphIndex = glyphIterator.fGlyphIndex;
1044 ShapedGlyph* nextGlyph = glyphIterator.next();
1045
1046 if (previousRunIndex != runIndex) {
Mike Reedb5784ac2018-11-12 09:35:15 -05001047 SkFontMetrics metrics;
Mike Reed6d595682018-12-05 17:28:14 -05001048 runs[runIndex].fFont.getMetrics(&metrics);
Ben Wagner8d45a382017-11-16 10:08:28 -05001049 maxAscent = SkTMin(maxAscent, metrics.fAscent);
1050 maxDescent = SkTMax(maxDescent, metrics.fDescent);
1051 maxLeading = SkTMax(maxLeading, metrics.fLeading);
1052 previousRunIndex = runIndex;
1053 }
1054
1055 // Nothing can be written until the baseline is known.
1056 if (!(nextGlyph == nullptr || nextGlyph->fMustLineBreakBefore)) {
1057 continue;
1058 }
1059
1060 currentPoint.fY -= maxAscent;
1061
1062 int numRuns = runIndex - previousBreak.fRunIndex + 1;
1063 SkAutoSTMalloc<4, UBiDiLevel> runLevels(numRuns);
1064 for (int i = 0; i < numRuns; ++i) {
1065 runLevels[i] = runs[previousBreak.fRunIndex + i].fLevel;
1066 }
1067 SkAutoSTMalloc<4, int32_t> logicalFromVisual(numRuns);
1068 ubidi_reorderVisual(runLevels, numRuns, logicalFromVisual);
1069
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001070 // step through the runs in reverse visual order and the glyphs in reverse logical order
1071 // until a visible glyph is found and force them to the end of the visual line.
1072
Ben Wagner8d45a382017-11-16 10:08:28 -05001073 for (int i = 0; i < numRuns; ++i) {
1074 int logicalIndex = previousBreak.fRunIndex + logicalFromVisual[i];
1075
1076 int startGlyphIndex = (logicalIndex == previousBreak.fRunIndex)
1077 ? previousBreak.fGlyphIndex
1078 : 0;
1079 int endGlyphIndex = (logicalIndex == runIndex)
1080 ? glyphIndex + 1
1081 : runs[logicalIndex].fNumGlyphs;
Florin Malita950243d2019-01-11 11:08:35 -05001082
1083 const auto& run = runs[logicalIndex];
1084 const RunHandler::RunInfo info = {
Florin Malita950243d2019-01-11 11:08:35 -05001085 run.fAdvance,
1086 maxAscent,
1087 maxDescent,
1088 maxLeading,
1089 };
1090 append(handler, info, run, startGlyphIndex, endGlyphIndex, &currentPoint);
Ben Wagner8d45a382017-11-16 10:08:28 -05001091 }
1092
Florin Malita500133b2019-02-07 10:56:55 -05001093 handler->commitLine();
1094
Ben Wagner8d45a382017-11-16 10:08:28 -05001095 currentPoint.fY += maxDescent + maxLeading;
1096 currentPoint.fX = point.fX;
1097 maxAscent = 0;
1098 maxDescent = 0;
1099 maxLeading = 0;
1100 previousRunIndex = -1;
1101 previousBreak = glyphIterator;
1102 }
1103}
1104
Ben Wagner5d4dd8b2018-01-25 14:37:17 -05001105 return currentPoint;
Ben Wagnera25fbef2017-08-30 13:56:19 -04001106}
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001107
1108
1109ShapedRun SkShaper::Impl::shape(const char* utf8,
Ben Wagner2fc14742019-02-06 16:37:44 -05001110 const size_t utf8Bytes,
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001111 const char* utf8Start,
1112 const char* utf8End,
1113 const BiDiRunIterator* bidi,
1114 const LanguageRunIterator* language,
1115 const ScriptRunIterator* script,
1116 const FontRunIterator* font) const
1117{
1118 ShapedRun run(nullptr, nullptr, 0, SkFont(), 0, nullptr);
1119
1120 hb_buffer_t* buffer = fBuffer.get();
1121 SkAutoTCallVProc<hb_buffer_t, hb_buffer_clear_contents> autoClearBuffer(buffer);
1122 hb_buffer_set_content_type(buffer, HB_BUFFER_CONTENT_TYPE_UNICODE);
1123 hb_buffer_set_cluster_level(buffer, HB_BUFFER_CLUSTER_LEVEL_MONOTONE_CHARACTERS);
1124
Ben Wagner2fc14742019-02-06 16:37:44 -05001125 // See 763e5466c0a03a7c27020e1e2598e488612529a7 for documentation.
1126 hb_buffer_set_flags(buffer, HB_BUFFER_FLAG_BOT | HB_BUFFER_FLAG_EOT);
1127
Ben Wagner0ec8ec22018-09-04 18:17:13 -04001128 // Add precontext.
1129 hb_buffer_add_utf8(buffer, utf8, utf8Start - utf8, utf8Start - utf8, 0);
1130
1131 // Populate the hb_buffer directly with utf8 cluster indexes.
1132 const char* utf8Current = utf8Start;
1133 while (utf8Current < utf8End) {
1134 unsigned int cluster = utf8Current - utf8Start;
1135 hb_codepoint_t u = utf8_next(&utf8Current, utf8End);
1136 hb_buffer_add(buffer, u, cluster);
1137 }
1138
1139 // Add postcontext.
1140 hb_buffer_add_utf8(buffer, utf8Current, utf8 + utf8Bytes - utf8Current, 0, 0);
1141
1142 size_t utf8runLength = utf8End - utf8Start;
1143 if (!SkTFitsIn<int>(utf8runLength)) {
1144 SkDebugf("Shaping error: utf8 too long");
1145 return run;
1146 }
1147 hb_direction_t direction = is_LTR(bidi->currentLevel()) ? HB_DIRECTION_LTR:HB_DIRECTION_RTL;
1148 hb_buffer_set_direction(buffer, direction);
1149 hb_buffer_set_script(buffer, script->currentScript());
1150 hb_buffer_set_language(buffer, language->currentLanguage());
1151 hb_buffer_guess_segment_properties(buffer);
1152 // TODO: features
1153 if (!font->currentHBFont()) {
1154 return run;
1155 }
1156 hb_shape(font->currentHBFont(), buffer, nullptr, 0);
1157 unsigned len = hb_buffer_get_length(buffer);
1158 if (len == 0) {
1159 // TODO: this isn't an error, make it look different
1160 return run;
1161 }
1162
1163 if (direction == HB_DIRECTION_RTL) {
1164 // Put the clusters back in logical order.
1165 // Note that the advances remain ltr.
1166 hb_buffer_reverse(buffer);
1167 }
1168 hb_glyph_info_t* info = hb_buffer_get_glyph_infos(buffer, nullptr);
1169 hb_glyph_position_t* pos = hb_buffer_get_glyph_positions(buffer, nullptr);
1170
1171 if (!SkTFitsIn<int>(len)) {
1172 SkDebugf("Shaping error: too many glyphs");
1173 return run;
1174 }
1175
1176 run = ShapedRun(utf8Start, utf8End, len, *font->currentFont(),
1177 bidi->currentLevel(),
1178 std::unique_ptr<ShapedGlyph[]>(new ShapedGlyph[len]));
1179 int scaleX, scaleY;
1180 hb_font_get_scale(font->currentHBFont(), &scaleX, &scaleY);
1181 double textSizeY = run.fFont.getSize() / scaleY;
1182 double textSizeX = run.fFont.getSize() / scaleX * run.fFont.getScaleX();
1183 SkVector runAdvance = { 0, 0 };
1184 for (unsigned i = 0; i < len; i++) {
1185 ShapedGlyph& glyph = run.fGlyphs[i];
1186 glyph.fID = info[i].codepoint;
1187 glyph.fCluster = info[i].cluster;
1188 glyph.fOffset.fX = pos[i].x_offset * textSizeX;
1189 glyph.fOffset.fY = pos[i].y_offset * textSizeY;
1190 glyph.fAdvance.fX = pos[i].x_advance * textSizeX;
1191 glyph.fAdvance.fY = pos[i].y_advance * textSizeY;
1192
1193 SkRect bounds;
1194 SkScalar advance;
1195 SkPaint p;
1196 run.fFont.getWidthsBounds(&glyph.fID, 1, &advance, &bounds, &p);
1197 glyph.fHasVisual = !bounds.isEmpty(); //!font->currentTypeface()->glyphBoundsAreZero(glyph.fID);
1198 glyph.fUnsafeToBreak = info[i].mask & HB_GLYPH_FLAG_UNSAFE_TO_BREAK;
1199 glyph.fMustLineBreakBefore = false;
1200
1201 runAdvance += glyph.fAdvance;
1202 }
1203 run.fAdvance = runAdvance;
1204
1205 return run;
1206}