xref: /aosp_15_r20/external/skia/modules/skshaper/src/SkShaper_skunicode.cpp (revision c8dee2aa9b3f27cf6c858bd81872bdeb2c07ed17)
1*c8dee2aaSAndroid Build Coastguard Worker /*
2*c8dee2aaSAndroid Build Coastguard Worker  * Copyright 2023 Google Inc.
3*c8dee2aaSAndroid Build Coastguard Worker  *
4*c8dee2aaSAndroid Build Coastguard Worker  * Use of this source code is governed by a BSD-style license that can be
5*c8dee2aaSAndroid Build Coastguard Worker  * found in the LICENSE file.
6*c8dee2aaSAndroid Build Coastguard Worker  */
7*c8dee2aaSAndroid Build Coastguard Worker #include "include/core/SkRefCnt.h"
8*c8dee2aaSAndroid Build Coastguard Worker #include "include/private/base/SkAssert.h"
9*c8dee2aaSAndroid Build Coastguard Worker #include "include/private/base/SkDebug.h"
10*c8dee2aaSAndroid Build Coastguard Worker #include "include/private/base/SkTFitsIn.h"
11*c8dee2aaSAndroid Build Coastguard Worker #include "modules/skshaper/include/SkShaper.h"
12*c8dee2aaSAndroid Build Coastguard Worker #include "modules/skshaper/include/SkShaper_skunicode.h"
13*c8dee2aaSAndroid Build Coastguard Worker #include "modules/skunicode/include/SkUnicode.h"
14*c8dee2aaSAndroid Build Coastguard Worker #include "src/base/SkUTF.h"
15*c8dee2aaSAndroid Build Coastguard Worker 
16*c8dee2aaSAndroid Build Coastguard Worker #include <cstddef>
17*c8dee2aaSAndroid Build Coastguard Worker #include <cstdint>
18*c8dee2aaSAndroid Build Coastguard Worker #include <memory>
19*c8dee2aaSAndroid Build Coastguard Worker #include <utility>
20*c8dee2aaSAndroid Build Coastguard Worker 
21*c8dee2aaSAndroid Build Coastguard Worker using SkUnicodeBidi = std::unique_ptr<SkBidiIterator>;
22*c8dee2aaSAndroid Build Coastguard Worker 
23*c8dee2aaSAndroid Build Coastguard Worker /** Replaces invalid utf-8 sequences with REPLACEMENT CHARACTER U+FFFD. */
utf8_next(const char ** ptr,const char * end)24*c8dee2aaSAndroid Build Coastguard Worker static inline SkUnichar utf8_next(const char** ptr, const char* end) {
25*c8dee2aaSAndroid Build Coastguard Worker     SkUnichar val = SkUTF::NextUTF8(ptr, end);
26*c8dee2aaSAndroid Build Coastguard Worker     return val < 0 ? 0xFFFD : val;
27*c8dee2aaSAndroid Build Coastguard Worker }
28*c8dee2aaSAndroid Build Coastguard Worker 
29*c8dee2aaSAndroid Build Coastguard Worker class SkUnicodeBidiRunIterator final : public SkShaper::BiDiRunIterator {
30*c8dee2aaSAndroid Build Coastguard Worker public:
SkUnicodeBidiRunIterator(const char * utf8,const char * end,SkUnicodeBidi bidi)31*c8dee2aaSAndroid Build Coastguard Worker     SkUnicodeBidiRunIterator(const char* utf8, const char* end, SkUnicodeBidi bidi)
32*c8dee2aaSAndroid Build Coastguard Worker         : fBidi(std::move(bidi))
33*c8dee2aaSAndroid Build Coastguard Worker         , fEndOfCurrentRun(utf8)
34*c8dee2aaSAndroid Build Coastguard Worker         , fBegin(utf8)
35*c8dee2aaSAndroid Build Coastguard Worker         , fEnd(end)
36*c8dee2aaSAndroid Build Coastguard Worker         , fUTF16LogicalPosition(0)
37*c8dee2aaSAndroid Build Coastguard Worker         , fLevel(SkBidiIterator::kLTR)
38*c8dee2aaSAndroid Build Coastguard Worker     {}
39*c8dee2aaSAndroid Build Coastguard Worker 
consume()40*c8dee2aaSAndroid Build Coastguard Worker     void consume() override {
41*c8dee2aaSAndroid Build Coastguard Worker         SkASSERT(fUTF16LogicalPosition < fBidi->getLength());
42*c8dee2aaSAndroid Build Coastguard Worker         int32_t endPosition = fBidi->getLength();
43*c8dee2aaSAndroid Build Coastguard Worker         fLevel = fBidi->getLevelAt(fUTF16LogicalPosition);
44*c8dee2aaSAndroid Build Coastguard Worker         SkUnichar u = utf8_next(&fEndOfCurrentRun, fEnd);
45*c8dee2aaSAndroid Build Coastguard Worker         fUTF16LogicalPosition += SkUTF::ToUTF16(u);
46*c8dee2aaSAndroid Build Coastguard Worker         SkBidiIterator::Level level;
47*c8dee2aaSAndroid Build Coastguard Worker         while (fUTF16LogicalPosition < endPosition) {
48*c8dee2aaSAndroid Build Coastguard Worker             level = fBidi->getLevelAt(fUTF16LogicalPosition);
49*c8dee2aaSAndroid Build Coastguard Worker             if (level != fLevel) {
50*c8dee2aaSAndroid Build Coastguard Worker                 break;
51*c8dee2aaSAndroid Build Coastguard Worker             }
52*c8dee2aaSAndroid Build Coastguard Worker             u = utf8_next(&fEndOfCurrentRun, fEnd);
53*c8dee2aaSAndroid Build Coastguard Worker 
54*c8dee2aaSAndroid Build Coastguard Worker             fUTF16LogicalPosition += SkUTF::ToUTF16(u);
55*c8dee2aaSAndroid Build Coastguard Worker         }
56*c8dee2aaSAndroid Build Coastguard Worker     }
endOfCurrentRun() const57*c8dee2aaSAndroid Build Coastguard Worker     size_t endOfCurrentRun() const override {
58*c8dee2aaSAndroid Build Coastguard Worker         return fEndOfCurrentRun - fBegin;
59*c8dee2aaSAndroid Build Coastguard Worker     }
atEnd() const60*c8dee2aaSAndroid Build Coastguard Worker     bool atEnd() const override {
61*c8dee2aaSAndroid Build Coastguard Worker         return fUTF16LogicalPosition == fBidi->getLength();
62*c8dee2aaSAndroid Build Coastguard Worker     }
currentLevel() const63*c8dee2aaSAndroid Build Coastguard Worker     SkBidiIterator::Level currentLevel() const override {
64*c8dee2aaSAndroid Build Coastguard Worker         return fLevel;
65*c8dee2aaSAndroid Build Coastguard Worker     }
66*c8dee2aaSAndroid Build Coastguard Worker private:
67*c8dee2aaSAndroid Build Coastguard Worker     SkUnicodeBidi fBidi;
68*c8dee2aaSAndroid Build Coastguard Worker     char const * fEndOfCurrentRun;
69*c8dee2aaSAndroid Build Coastguard Worker     char const * const fBegin;
70*c8dee2aaSAndroid Build Coastguard Worker     char const * const fEnd;
71*c8dee2aaSAndroid Build Coastguard Worker     int32_t fUTF16LogicalPosition;
72*c8dee2aaSAndroid Build Coastguard Worker     SkBidiIterator::Level fLevel;
73*c8dee2aaSAndroid Build Coastguard Worker };
74*c8dee2aaSAndroid Build Coastguard Worker 
75*c8dee2aaSAndroid Build Coastguard Worker #if !defined(SK_DISABLE_LEGACY_SKSHAPER_FUNCTIONS)
76*c8dee2aaSAndroid Build Coastguard Worker 
77*c8dee2aaSAndroid Build Coastguard Worker #if defined(SK_UNICODE_ICU_IMPLEMENTATION)
78*c8dee2aaSAndroid Build Coastguard Worker #include "modules/skunicode/include/SkUnicode_icu.h"
79*c8dee2aaSAndroid Build Coastguard Worker #endif
80*c8dee2aaSAndroid Build Coastguard Worker 
81*c8dee2aaSAndroid Build Coastguard Worker #if defined(SK_UNICODE_LIBGRAPHEME_IMPLEMENTATION)
82*c8dee2aaSAndroid Build Coastguard Worker #include "modules/skunicode/include/SkUnicode_libgrapheme.h"
83*c8dee2aaSAndroid Build Coastguard Worker #endif
84*c8dee2aaSAndroid Build Coastguard Worker 
85*c8dee2aaSAndroid Build Coastguard Worker #if defined(SK_UNICODE_ICU4X_IMPLEMENTATION)
86*c8dee2aaSAndroid Build Coastguard Worker #include "modules/skunicode/include/SkUnicode_icu4x.h"
87*c8dee2aaSAndroid Build Coastguard Worker #endif
88*c8dee2aaSAndroid Build Coastguard Worker 
get_unicode()89*c8dee2aaSAndroid Build Coastguard Worker sk_sp<SkUnicode> get_unicode() {
90*c8dee2aaSAndroid Build Coastguard Worker #if defined(SK_UNICODE_ICU_IMPLEMENTATION)
91*c8dee2aaSAndroid Build Coastguard Worker     if (auto unicode = SkUnicodes::ICU::Make()) {
92*c8dee2aaSAndroid Build Coastguard Worker         return unicode;
93*c8dee2aaSAndroid Build Coastguard Worker     }
94*c8dee2aaSAndroid Build Coastguard Worker #endif  // defined(SK_UNICODE_ICU_IMPLEMENTATION)
95*c8dee2aaSAndroid Build Coastguard Worker #if defined(SK_UNICODE_LIBGRAPHEME_IMPLEMENTATION)
96*c8dee2aaSAndroid Build Coastguard Worker     if (auto unicode = SkUnicodes::Libgrapheme::Make()) {
97*c8dee2aaSAndroid Build Coastguard Worker         return unicode;
98*c8dee2aaSAndroid Build Coastguard Worker     }
99*c8dee2aaSAndroid Build Coastguard Worker #endif
100*c8dee2aaSAndroid Build Coastguard Worker #if defined(SK_UNICODE_ICU4X_IMPLEMENTATION)
101*c8dee2aaSAndroid Build Coastguard Worker     if (auto unicode = SkUnicodes::ICU4X::Make()) {
102*c8dee2aaSAndroid Build Coastguard Worker         return unicode;
103*c8dee2aaSAndroid Build Coastguard Worker     }
104*c8dee2aaSAndroid Build Coastguard Worker #endif
105*c8dee2aaSAndroid Build Coastguard Worker     return nullptr;
106*c8dee2aaSAndroid Build Coastguard Worker }
107*c8dee2aaSAndroid Build Coastguard Worker 
MakeIcuBiDiRunIterator(const char * utf8,size_t utf8Bytes,uint8_t bidiLevel)108*c8dee2aaSAndroid Build Coastguard Worker std::unique_ptr<SkShaper::BiDiRunIterator> SkShaper::MakeIcuBiDiRunIterator(const char* utf8,
109*c8dee2aaSAndroid Build Coastguard Worker                                                                             size_t utf8Bytes,
110*c8dee2aaSAndroid Build Coastguard Worker                                                                             uint8_t bidiLevel) {
111*c8dee2aaSAndroid Build Coastguard Worker     static auto unicode = get_unicode();
112*c8dee2aaSAndroid Build Coastguard Worker     if (!unicode) {
113*c8dee2aaSAndroid Build Coastguard Worker         return nullptr;
114*c8dee2aaSAndroid Build Coastguard Worker     }
115*c8dee2aaSAndroid Build Coastguard Worker     return SkShapers::unicode::BidiRunIterator(unicode, utf8, utf8Bytes, bidiLevel);
116*c8dee2aaSAndroid Build Coastguard Worker }
117*c8dee2aaSAndroid Build Coastguard Worker #endif  //  !defined(SK_DISABLE_LEGACY_SKSHAPER_FUNCTIONS)
118*c8dee2aaSAndroid Build Coastguard Worker 
119*c8dee2aaSAndroid Build Coastguard Worker namespace SkShapers::unicode {
BidiRunIterator(sk_sp<SkUnicode> unicode,const char * utf8,size_t utf8Bytes,uint8_t bidiLevel)120*c8dee2aaSAndroid Build Coastguard Worker std::unique_ptr<SkShaper::BiDiRunIterator> BidiRunIterator(sk_sp<SkUnicode> unicode,
121*c8dee2aaSAndroid Build Coastguard Worker                                                            const char* utf8,
122*c8dee2aaSAndroid Build Coastguard Worker                                                            size_t utf8Bytes,
123*c8dee2aaSAndroid Build Coastguard Worker                                                            uint8_t bidiLevel) {
124*c8dee2aaSAndroid Build Coastguard Worker     if (!unicode) {
125*c8dee2aaSAndroid Build Coastguard Worker         return nullptr;
126*c8dee2aaSAndroid Build Coastguard Worker     }
127*c8dee2aaSAndroid Build Coastguard Worker     // ubidi only accepts utf16 (though internally it basically works on utf32 chars).
128*c8dee2aaSAndroid Build Coastguard Worker     // We want an ubidi_setPara(UBiDi*, UText*, UBiDiLevel, UBiDiLevel*, UErrorCode*);
129*c8dee2aaSAndroid Build Coastguard Worker     if (!SkTFitsIn<int32_t>(utf8Bytes)) {
130*c8dee2aaSAndroid Build Coastguard Worker         SkDEBUGF("Bidi error: text too long");
131*c8dee2aaSAndroid Build Coastguard Worker         return nullptr;
132*c8dee2aaSAndroid Build Coastguard Worker     }
133*c8dee2aaSAndroid Build Coastguard Worker 
134*c8dee2aaSAndroid Build Coastguard Worker     int32_t utf16Units = SkUTF::UTF8ToUTF16(nullptr, 0, utf8, utf8Bytes);
135*c8dee2aaSAndroid Build Coastguard Worker     if (utf16Units < 0) {
136*c8dee2aaSAndroid Build Coastguard Worker         SkDEBUGF("Invalid utf8 input\n");
137*c8dee2aaSAndroid Build Coastguard Worker         return nullptr;
138*c8dee2aaSAndroid Build Coastguard Worker     }
139*c8dee2aaSAndroid Build Coastguard Worker 
140*c8dee2aaSAndroid Build Coastguard Worker     std::unique_ptr<uint16_t[]> utf16(new uint16_t[utf16Units]);
141*c8dee2aaSAndroid Build Coastguard Worker     (void)SkUTF::UTF8ToUTF16(utf16.get(), utf16Units, utf8, utf8Bytes);
142*c8dee2aaSAndroid Build Coastguard Worker 
143*c8dee2aaSAndroid Build Coastguard Worker     auto bidiDir = (bidiLevel % 2 == 0) ? SkBidiIterator::kLTR : SkBidiIterator::kRTL;
144*c8dee2aaSAndroid Build Coastguard Worker     SkUnicodeBidi bidi = unicode->makeBidiIterator(utf16.get(), utf16Units, bidiDir);
145*c8dee2aaSAndroid Build Coastguard Worker     if (!bidi) {
146*c8dee2aaSAndroid Build Coastguard Worker         SkDEBUGF("Bidi error\n");
147*c8dee2aaSAndroid Build Coastguard Worker         return nullptr;
148*c8dee2aaSAndroid Build Coastguard Worker     }
149*c8dee2aaSAndroid Build Coastguard Worker 
150*c8dee2aaSAndroid Build Coastguard Worker     return std::make_unique<SkUnicodeBidiRunIterator>(utf8, utf8 + utf8Bytes, std::move(bidi));
151*c8dee2aaSAndroid Build Coastguard Worker }
152*c8dee2aaSAndroid Build Coastguard Worker }  // namespace SkShapers::unicode
153