xref: /aosp_15_r20/external/libtextclassifier/native/annotator/zlib-utils.cc (revision 993b0882672172b81d12fad7a7ac0c3e5c824a12)
1*993b0882SAndroid Build Coastguard Worker /*
2*993b0882SAndroid Build Coastguard Worker  * Copyright (C) 2018 The Android Open Source Project
3*993b0882SAndroid Build Coastguard Worker  *
4*993b0882SAndroid Build Coastguard Worker  * Licensed under the Apache License, Version 2.0 (the "License");
5*993b0882SAndroid Build Coastguard Worker  * you may not use this file except in compliance with the License.
6*993b0882SAndroid Build Coastguard Worker  * You may obtain a copy of the License at
7*993b0882SAndroid Build Coastguard Worker  *
8*993b0882SAndroid Build Coastguard Worker  *      http://www.apache.org/licenses/LICENSE-2.0
9*993b0882SAndroid Build Coastguard Worker  *
10*993b0882SAndroid Build Coastguard Worker  * Unless required by applicable law or agreed to in writing, software
11*993b0882SAndroid Build Coastguard Worker  * distributed under the License is distributed on an "AS IS" BASIS,
12*993b0882SAndroid Build Coastguard Worker  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*993b0882SAndroid Build Coastguard Worker  * See the License for the specific language governing permissions and
14*993b0882SAndroid Build Coastguard Worker  * limitations under the License.
15*993b0882SAndroid Build Coastguard Worker  */
16*993b0882SAndroid Build Coastguard Worker 
17*993b0882SAndroid Build Coastguard Worker #include "annotator/zlib-utils.h"
18*993b0882SAndroid Build Coastguard Worker 
19*993b0882SAndroid Build Coastguard Worker #include <memory>
20*993b0882SAndroid Build Coastguard Worker 
21*993b0882SAndroid Build Coastguard Worker #include "utils/base/logging.h"
22*993b0882SAndroid Build Coastguard Worker #include "utils/intents/zlib-utils.h"
23*993b0882SAndroid Build Coastguard Worker #include "utils/zlib/zlib.h"
24*993b0882SAndroid Build Coastguard Worker 
25*993b0882SAndroid Build Coastguard Worker namespace libtextclassifier3 {
26*993b0882SAndroid Build Coastguard Worker 
27*993b0882SAndroid Build Coastguard Worker // Compress rule fields in the model.
CompressModel(ModelT * model)28*993b0882SAndroid Build Coastguard Worker bool CompressModel(ModelT* model) {
29*993b0882SAndroid Build Coastguard Worker   std::unique_ptr<ZlibCompressor> zlib_compressor = ZlibCompressor::Instance();
30*993b0882SAndroid Build Coastguard Worker   if (!zlib_compressor) {
31*993b0882SAndroid Build Coastguard Worker     TC3_LOG(ERROR) << "Cannot compress model.";
32*993b0882SAndroid Build Coastguard Worker     return false;
33*993b0882SAndroid Build Coastguard Worker   }
34*993b0882SAndroid Build Coastguard Worker 
35*993b0882SAndroid Build Coastguard Worker   // Compress regex rules.
36*993b0882SAndroid Build Coastguard Worker   if (model->regex_model != nullptr) {
37*993b0882SAndroid Build Coastguard Worker     for (int i = 0; i < model->regex_model->patterns.size(); i++) {
38*993b0882SAndroid Build Coastguard Worker       RegexModel_::PatternT* pattern = model->regex_model->patterns[i].get();
39*993b0882SAndroid Build Coastguard Worker       pattern->compressed_pattern.reset(new CompressedBufferT);
40*993b0882SAndroid Build Coastguard Worker       zlib_compressor->Compress(pattern->pattern,
41*993b0882SAndroid Build Coastguard Worker                                 pattern->compressed_pattern.get());
42*993b0882SAndroid Build Coastguard Worker       pattern->pattern.clear();
43*993b0882SAndroid Build Coastguard Worker     }
44*993b0882SAndroid Build Coastguard Worker   }
45*993b0882SAndroid Build Coastguard Worker 
46*993b0882SAndroid Build Coastguard Worker   // Compress date-time rules.
47*993b0882SAndroid Build Coastguard Worker   if (model->datetime_model != nullptr) {
48*993b0882SAndroid Build Coastguard Worker     for (int i = 0; i < model->datetime_model->patterns.size(); i++) {
49*993b0882SAndroid Build Coastguard Worker       DatetimeModelPatternT* pattern = model->datetime_model->patterns[i].get();
50*993b0882SAndroid Build Coastguard Worker       for (int j = 0; j < pattern->regexes.size(); j++) {
51*993b0882SAndroid Build Coastguard Worker         DatetimeModelPattern_::RegexT* regex = pattern->regexes[j].get();
52*993b0882SAndroid Build Coastguard Worker         regex->compressed_pattern.reset(new CompressedBufferT);
53*993b0882SAndroid Build Coastguard Worker         zlib_compressor->Compress(regex->pattern,
54*993b0882SAndroid Build Coastguard Worker                                   regex->compressed_pattern.get());
55*993b0882SAndroid Build Coastguard Worker         regex->pattern.clear();
56*993b0882SAndroid Build Coastguard Worker       }
57*993b0882SAndroid Build Coastguard Worker     }
58*993b0882SAndroid Build Coastguard Worker     for (int i = 0; i < model->datetime_model->extractors.size(); i++) {
59*993b0882SAndroid Build Coastguard Worker       DatetimeModelExtractorT* extractor =
60*993b0882SAndroid Build Coastguard Worker           model->datetime_model->extractors[i].get();
61*993b0882SAndroid Build Coastguard Worker       extractor->compressed_pattern.reset(new CompressedBufferT);
62*993b0882SAndroid Build Coastguard Worker       zlib_compressor->Compress(extractor->pattern,
63*993b0882SAndroid Build Coastguard Worker                                 extractor->compressed_pattern.get());
64*993b0882SAndroid Build Coastguard Worker       extractor->pattern.clear();
65*993b0882SAndroid Build Coastguard Worker     }
66*993b0882SAndroid Build Coastguard Worker   }
67*993b0882SAndroid Build Coastguard Worker 
68*993b0882SAndroid Build Coastguard Worker   // Compress intent generator.
69*993b0882SAndroid Build Coastguard Worker   if (model->intent_options != nullptr) {
70*993b0882SAndroid Build Coastguard Worker     CompressIntentModel(model->intent_options.get());
71*993b0882SAndroid Build Coastguard Worker   }
72*993b0882SAndroid Build Coastguard Worker 
73*993b0882SAndroid Build Coastguard Worker   return true;
74*993b0882SAndroid Build Coastguard Worker }
75*993b0882SAndroid Build Coastguard Worker 
DecompressModel(ModelT * model)76*993b0882SAndroid Build Coastguard Worker bool DecompressModel(ModelT* model) {
77*993b0882SAndroid Build Coastguard Worker   std::unique_ptr<ZlibDecompressor> zlib_decompressor =
78*993b0882SAndroid Build Coastguard Worker       ZlibDecompressor::Instance();
79*993b0882SAndroid Build Coastguard Worker   if (!zlib_decompressor) {
80*993b0882SAndroid Build Coastguard Worker     TC3_LOG(ERROR) << "Cannot initialize decompressor.";
81*993b0882SAndroid Build Coastguard Worker     return false;
82*993b0882SAndroid Build Coastguard Worker   }
83*993b0882SAndroid Build Coastguard Worker 
84*993b0882SAndroid Build Coastguard Worker   // Decompress regex rules.
85*993b0882SAndroid Build Coastguard Worker   if (model->regex_model != nullptr) {
86*993b0882SAndroid Build Coastguard Worker     for (int i = 0; i < model->regex_model->patterns.size(); i++) {
87*993b0882SAndroid Build Coastguard Worker       RegexModel_::PatternT* pattern = model->regex_model->patterns[i].get();
88*993b0882SAndroid Build Coastguard Worker       if (!zlib_decompressor->MaybeDecompress(pattern->compressed_pattern.get(),
89*993b0882SAndroid Build Coastguard Worker                                               &pattern->pattern)) {
90*993b0882SAndroid Build Coastguard Worker         TC3_LOG(ERROR) << "Cannot decompress pattern: " << i;
91*993b0882SAndroid Build Coastguard Worker         return false;
92*993b0882SAndroid Build Coastguard Worker       }
93*993b0882SAndroid Build Coastguard Worker       pattern->compressed_pattern.reset(nullptr);
94*993b0882SAndroid Build Coastguard Worker     }
95*993b0882SAndroid Build Coastguard Worker   }
96*993b0882SAndroid Build Coastguard Worker 
97*993b0882SAndroid Build Coastguard Worker   // Decompress date-time rules.
98*993b0882SAndroid Build Coastguard Worker   if (model->datetime_model != nullptr) {
99*993b0882SAndroid Build Coastguard Worker     for (int i = 0; i < model->datetime_model->patterns.size(); i++) {
100*993b0882SAndroid Build Coastguard Worker       DatetimeModelPatternT* pattern = model->datetime_model->patterns[i].get();
101*993b0882SAndroid Build Coastguard Worker       for (int j = 0; j < pattern->regexes.size(); j++) {
102*993b0882SAndroid Build Coastguard Worker         DatetimeModelPattern_::RegexT* regex = pattern->regexes[j].get();
103*993b0882SAndroid Build Coastguard Worker         if (!zlib_decompressor->MaybeDecompress(regex->compressed_pattern.get(),
104*993b0882SAndroid Build Coastguard Worker                                                 &regex->pattern)) {
105*993b0882SAndroid Build Coastguard Worker           TC3_LOG(ERROR) << "Cannot decompress pattern: " << i << " " << j;
106*993b0882SAndroid Build Coastguard Worker           return false;
107*993b0882SAndroid Build Coastguard Worker         }
108*993b0882SAndroid Build Coastguard Worker         regex->compressed_pattern.reset(nullptr);
109*993b0882SAndroid Build Coastguard Worker       }
110*993b0882SAndroid Build Coastguard Worker     }
111*993b0882SAndroid Build Coastguard Worker     for (int i = 0; i < model->datetime_model->extractors.size(); i++) {
112*993b0882SAndroid Build Coastguard Worker       DatetimeModelExtractorT* extractor =
113*993b0882SAndroid Build Coastguard Worker           model->datetime_model->extractors[i].get();
114*993b0882SAndroid Build Coastguard Worker       if (!zlib_decompressor->MaybeDecompress(
115*993b0882SAndroid Build Coastguard Worker               extractor->compressed_pattern.get(), &extractor->pattern)) {
116*993b0882SAndroid Build Coastguard Worker         TC3_LOG(ERROR) << "Cannot decompress pattern: " << i;
117*993b0882SAndroid Build Coastguard Worker         return false;
118*993b0882SAndroid Build Coastguard Worker       }
119*993b0882SAndroid Build Coastguard Worker       extractor->compressed_pattern.reset(nullptr);
120*993b0882SAndroid Build Coastguard Worker     }
121*993b0882SAndroid Build Coastguard Worker   }
122*993b0882SAndroid Build Coastguard Worker 
123*993b0882SAndroid Build Coastguard Worker   if (model->intent_options != nullptr) {
124*993b0882SAndroid Build Coastguard Worker     DecompressIntentModel(model->intent_options.get());
125*993b0882SAndroid Build Coastguard Worker   }
126*993b0882SAndroid Build Coastguard Worker 
127*993b0882SAndroid Build Coastguard Worker   return true;
128*993b0882SAndroid Build Coastguard Worker }
129*993b0882SAndroid Build Coastguard Worker 
CompressSerializedModel(const std::string & model)130*993b0882SAndroid Build Coastguard Worker std::string CompressSerializedModel(const std::string& model) {
131*993b0882SAndroid Build Coastguard Worker   std::unique_ptr<ModelT> unpacked_model = UnPackModel(model.c_str());
132*993b0882SAndroid Build Coastguard Worker   TC3_CHECK(unpacked_model != nullptr);
133*993b0882SAndroid Build Coastguard Worker   TC3_CHECK(CompressModel(unpacked_model.get()));
134*993b0882SAndroid Build Coastguard Worker   flatbuffers::FlatBufferBuilder builder;
135*993b0882SAndroid Build Coastguard Worker   FinishModelBuffer(builder, Model::Pack(builder, unpacked_model.get()));
136*993b0882SAndroid Build Coastguard Worker   return std::string(reinterpret_cast<const char*>(builder.GetBufferPointer()),
137*993b0882SAndroid Build Coastguard Worker                      builder.GetSize());
138*993b0882SAndroid Build Coastguard Worker }
139*993b0882SAndroid Build Coastguard Worker 
140*993b0882SAndroid Build Coastguard Worker }  // namespace libtextclassifier3
141