/*
 * Copyright (C) 2018 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16*993b0882SAndroid Build Coastguard Worker
17*993b0882SAndroid Build Coastguard Worker #include "annotator/model-executor.h"
18*993b0882SAndroid Build Coastguard Worker
19*993b0882SAndroid Build Coastguard Worker #include "annotator/quantization.h"
20*993b0882SAndroid Build Coastguard Worker #include "utils/base/logging.h"
21*993b0882SAndroid Build Coastguard Worker
22*993b0882SAndroid Build Coastguard Worker namespace libtextclassifier3 {
23*993b0882SAndroid Build Coastguard Worker
// Runs `interpreter` on `features` and returns a view of the logits output.
//
// Steps: resize the feature input tensor (kInputIndexFeatures) to
// features.shape(), allocate tensors, set the features as input, invoke the
// interpreter, and return the output tensor at kOutputIndexLogits as a view.
//
// Returns TensorView<float>::Invalid() if `interpreter` is null or if any of
// the resize, allocation or invocation steps does not return kTfLiteOk.
TensorView<float> ModelExecutor::ComputeLogits(
    const TensorView<float>& features, tflite::Interpreter* interpreter) const {
  if (!interpreter) {
    return TensorView<float>::Invalid();
  }

  // A failed resize must not be ignored: otherwise the features would be
  // written into an input tensor that still has its previous shape.
  if (interpreter->ResizeInputTensor(kInputIndexFeatures, features.shape()) !=
      kTfLiteOk) {
    TC3_VLOG(1) << "Resizing the input tensor failed.";
    return TensorView<float>::Invalid();
  }
  if (interpreter->AllocateTensors() != kTfLiteOk) {
    TC3_VLOG(1) << "Allocation failed.";
    return TensorView<float>::Invalid();
  }

  SetInput<float>(kInputIndexFeatures, features, interpreter);

  if (interpreter->Invoke() != kTfLiteOk) {
    TC3_VLOG(1) << "Interpreter failed.";
    return TensorView<float>::Invalid();
  }

  return OutputView<float>(kOutputIndexLogits, interpreter);
}
44*993b0882SAndroid Build Coastguard Worker
FromBuffer(const flatbuffers::Vector<uint8_t> * model_spec_buffer,int embedding_size,int quantization_bits,const Model_::EmbeddingPruningMask * embedding_pruning_mask)45*993b0882SAndroid Build Coastguard Worker std::unique_ptr<TFLiteEmbeddingExecutor> TFLiteEmbeddingExecutor::FromBuffer(
46*993b0882SAndroid Build Coastguard Worker const flatbuffers::Vector<uint8_t>* model_spec_buffer, int embedding_size,
47*993b0882SAndroid Build Coastguard Worker int quantization_bits,
48*993b0882SAndroid Build Coastguard Worker const Model_::EmbeddingPruningMask* embedding_pruning_mask) {
49*993b0882SAndroid Build Coastguard Worker std::unique_ptr<TfLiteModelExecutor> executor =
50*993b0882SAndroid Build Coastguard Worker TfLiteModelExecutor::FromBuffer(model_spec_buffer);
51*993b0882SAndroid Build Coastguard Worker if (!executor) {
52*993b0882SAndroid Build Coastguard Worker TC3_LOG(ERROR) << "Could not load TFLite model for embeddings.";
53*993b0882SAndroid Build Coastguard Worker return nullptr;
54*993b0882SAndroid Build Coastguard Worker }
55*993b0882SAndroid Build Coastguard Worker
56*993b0882SAndroid Build Coastguard Worker std::unique_ptr<tflite::Interpreter> interpreter =
57*993b0882SAndroid Build Coastguard Worker executor->CreateInterpreter();
58*993b0882SAndroid Build Coastguard Worker if (!interpreter) {
59*993b0882SAndroid Build Coastguard Worker TC3_LOG(ERROR) << "Could not build TFLite interpreter for embeddings.";
60*993b0882SAndroid Build Coastguard Worker return nullptr;
61*993b0882SAndroid Build Coastguard Worker }
62*993b0882SAndroid Build Coastguard Worker
63*993b0882SAndroid Build Coastguard Worker if (interpreter->tensors_size() != 2) {
64*993b0882SAndroid Build Coastguard Worker return nullptr;
65*993b0882SAndroid Build Coastguard Worker }
66*993b0882SAndroid Build Coastguard Worker const TfLiteTensor* embeddings = interpreter->tensor(0);
67*993b0882SAndroid Build Coastguard Worker if (embeddings->dims->size != 2) {
68*993b0882SAndroid Build Coastguard Worker return nullptr;
69*993b0882SAndroid Build Coastguard Worker }
70*993b0882SAndroid Build Coastguard Worker int num_buckets = embeddings->dims->data[0];
71*993b0882SAndroid Build Coastguard Worker const TfLiteTensor* scales = interpreter->tensor(1);
72*993b0882SAndroid Build Coastguard Worker if (scales->dims->size != 2 || scales->dims->data[0] != num_buckets ||
73*993b0882SAndroid Build Coastguard Worker scales->dims->data[1] != 1) {
74*993b0882SAndroid Build Coastguard Worker return nullptr;
75*993b0882SAndroid Build Coastguard Worker }
76*993b0882SAndroid Build Coastguard Worker int bytes_per_embedding = embeddings->dims->data[1];
77*993b0882SAndroid Build Coastguard Worker if (!CheckQuantizationParams(bytes_per_embedding, quantization_bits,
78*993b0882SAndroid Build Coastguard Worker embedding_size)) {
79*993b0882SAndroid Build Coastguard Worker TC3_LOG(ERROR) << "Mismatch in quantization parameters.";
80*993b0882SAndroid Build Coastguard Worker return nullptr;
81*993b0882SAndroid Build Coastguard Worker }
82*993b0882SAndroid Build Coastguard Worker
83*993b0882SAndroid Build Coastguard Worker return std::unique_ptr<TFLiteEmbeddingExecutor>(new TFLiteEmbeddingExecutor(
84*993b0882SAndroid Build Coastguard Worker std::move(executor), quantization_bits, num_buckets, bytes_per_embedding,
85*993b0882SAndroid Build Coastguard Worker embedding_size, scales, embeddings, std::move(interpreter),
86*993b0882SAndroid Build Coastguard Worker embedding_pruning_mask));
87*993b0882SAndroid Build Coastguard Worker }
88*993b0882SAndroid Build Coastguard Worker
TFLiteEmbeddingExecutor(std::unique_ptr<TfLiteModelExecutor> executor,int quantization_bits,int num_buckets,int bytes_per_embedding,int output_embedding_size,const TfLiteTensor * scales,const TfLiteTensor * embeddings,std::unique_ptr<tflite::Interpreter> interpreter,const Model_::EmbeddingPruningMask * embedding_pruning_mask)89*993b0882SAndroid Build Coastguard Worker TFLiteEmbeddingExecutor::TFLiteEmbeddingExecutor(
90*993b0882SAndroid Build Coastguard Worker std::unique_ptr<TfLiteModelExecutor> executor, int quantization_bits,
91*993b0882SAndroid Build Coastguard Worker int num_buckets, int bytes_per_embedding, int output_embedding_size,
92*993b0882SAndroid Build Coastguard Worker const TfLiteTensor* scales, const TfLiteTensor* embeddings,
93*993b0882SAndroid Build Coastguard Worker std::unique_ptr<tflite::Interpreter> interpreter,
94*993b0882SAndroid Build Coastguard Worker const Model_::EmbeddingPruningMask* embedding_pruning_mask)
95*993b0882SAndroid Build Coastguard Worker : executor_(std::move(executor)),
96*993b0882SAndroid Build Coastguard Worker quantization_bits_(quantization_bits),
97*993b0882SAndroid Build Coastguard Worker num_buckets_(num_buckets),
98*993b0882SAndroid Build Coastguard Worker bytes_per_embedding_(bytes_per_embedding),
99*993b0882SAndroid Build Coastguard Worker output_embedding_size_(output_embedding_size),
100*993b0882SAndroid Build Coastguard Worker scales_(scales),
101*993b0882SAndroid Build Coastguard Worker embeddings_(embeddings),
102*993b0882SAndroid Build Coastguard Worker interpreter_(std::move(interpreter)) {
103*993b0882SAndroid Build Coastguard Worker if ((embedding_pruning_mask != nullptr) &&
104*993b0882SAndroid Build Coastguard Worker (embedding_pruning_mask->enabled())) {
105*993b0882SAndroid Build Coastguard Worker for (int i = 0; i < embedding_pruning_mask->pruning_mask()->size(); i++) {
106*993b0882SAndroid Build Coastguard Worker pruning_mask_.push_back((*(embedding_pruning_mask->pruning_mask()))[i]);
107*993b0882SAndroid Build Coastguard Worker }
108*993b0882SAndroid Build Coastguard Worker ComputePrefixCounts();
109*993b0882SAndroid Build Coastguard Worker full_num_buckets_ = embedding_pruning_mask->full_num_buckets();
110*993b0882SAndroid Build Coastguard Worker pruned_row_bucket_id_ = embedding_pruning_mask->pruned_row_bucket_id();
111*993b0882SAndroid Build Coastguard Worker } else {
112*993b0882SAndroid Build Coastguard Worker full_num_buckets_ = num_buckets;
113*993b0882SAndroid Build Coastguard Worker }
114*993b0882SAndroid Build Coastguard Worker }
115*993b0882SAndroid Build Coastguard Worker
ComputePrefixCounts()116*993b0882SAndroid Build Coastguard Worker void TFLiteEmbeddingExecutor::ComputePrefixCounts() {
117*993b0882SAndroid Build Coastguard Worker // Pre-compute the prefix sums.
118*993b0882SAndroid Build Coastguard Worker // For each i in {0, 1,...,pruning_mask_.size()-1}, we compute number of 1s
119*993b0882SAndroid Build Coastguard Worker // in binary representations of the uint64 values in pruning_mask_ before
120*993b0882SAndroid Build Coastguard Worker // index i. We set pruned_row_bucket_id_ to the total number of 1s
121*993b0882SAndroid Build Coastguard Worker // in binary representations of all values in pruning_mask_.
122*993b0882SAndroid Build Coastguard Worker int count = 0;
123*993b0882SAndroid Build Coastguard Worker for (const uint64 mask : pruning_mask_) {
124*993b0882SAndroid Build Coastguard Worker prefix_counts_.push_back(count);
125*993b0882SAndroid Build Coastguard Worker count += __builtin_popcountll(mask);
126*993b0882SAndroid Build Coastguard Worker }
127*993b0882SAndroid Build Coastguard Worker }
128*993b0882SAndroid Build Coastguard Worker
PruneBucketId(int bucket_id) const129*993b0882SAndroid Build Coastguard Worker int TFLiteEmbeddingExecutor::PruneBucketId(int bucket_id) const {
130*993b0882SAndroid Build Coastguard Worker // Implements auxiliary data structure for computing the pruned index of a
131*993b0882SAndroid Build Coastguard Worker // given bucket_id.
132*993b0882SAndroid Build Coastguard Worker // If bucket_id is present in pruning_mask_, we compute floor(bucket_id/64),
133*993b0882SAndroid Build Coastguard Worker // look it up in the auxiliary array prefix_counts_, and add to it the number
134*993b0882SAndroid Build Coastguard Worker // of 1s before before bucket_id % 64 in the 64-bit sequence
135*993b0882SAndroid Build Coastguard Worker // pruning_mask_[floor(bucket_id/64)].
136*993b0882SAndroid Build Coastguard Worker // If bucket_id is absent from pruning_mask_, we return pruned_row_bucket_id_.
137*993b0882SAndroid Build Coastguard Worker const int bucket_id_major = bucket_id >> 6;
138*993b0882SAndroid Build Coastguard Worker const int bucket_id_minor = bucket_id & 63;
139*993b0882SAndroid Build Coastguard Worker uint64_t one = 1;
140*993b0882SAndroid Build Coastguard Worker if (!(pruning_mask_[bucket_id_major] & (one << bucket_id_minor)))
141*993b0882SAndroid Build Coastguard Worker return pruned_row_bucket_id_;
142*993b0882SAndroid Build Coastguard Worker const uint64 zero = 0;
143*993b0882SAndroid Build Coastguard Worker uint64 minor_mask;
144*993b0882SAndroid Build Coastguard Worker if (bucket_id_minor == 0)
145*993b0882SAndroid Build Coastguard Worker minor_mask = zero;
146*993b0882SAndroid Build Coastguard Worker else
147*993b0882SAndroid Build Coastguard Worker minor_mask = ((~zero) >> (64 - bucket_id_minor));
148*993b0882SAndroid Build Coastguard Worker return prefix_counts_[bucket_id_major] +
149*993b0882SAndroid Build Coastguard Worker __builtin_popcountll(pruning_mask_[bucket_id_major] & minor_mask);
150*993b0882SAndroid Build Coastguard Worker }
151*993b0882SAndroid Build Coastguard Worker
AddEmbedding(const TensorView<int> & sparse_features,float * dest,int dest_size) const152*993b0882SAndroid Build Coastguard Worker bool TFLiteEmbeddingExecutor::AddEmbedding(
153*993b0882SAndroid Build Coastguard Worker const TensorView<int>& sparse_features, float* dest, int dest_size) const {
154*993b0882SAndroid Build Coastguard Worker if (dest_size != output_embedding_size_) {
155*993b0882SAndroid Build Coastguard Worker TC3_LOG(ERROR) << "Mismatching dest_size and output_embedding_size: "
156*993b0882SAndroid Build Coastguard Worker << dest_size << " " << output_embedding_size_;
157*993b0882SAndroid Build Coastguard Worker return false;
158*993b0882SAndroid Build Coastguard Worker }
159*993b0882SAndroid Build Coastguard Worker const int num_sparse_features = sparse_features.size();
160*993b0882SAndroid Build Coastguard Worker for (int i = 0; i < num_sparse_features; ++i) {
161*993b0882SAndroid Build Coastguard Worker const int bucket_id = sparse_features.data()[i];
162*993b0882SAndroid Build Coastguard Worker int full_num_buckets;
163*993b0882SAndroid Build Coastguard Worker if (!pruning_mask_.empty()) {
164*993b0882SAndroid Build Coastguard Worker full_num_buckets = full_num_buckets_;
165*993b0882SAndroid Build Coastguard Worker } else {
166*993b0882SAndroid Build Coastguard Worker full_num_buckets = num_buckets_;
167*993b0882SAndroid Build Coastguard Worker }
168*993b0882SAndroid Build Coastguard Worker if (bucket_id >= full_num_buckets) {
169*993b0882SAndroid Build Coastguard Worker return false;
170*993b0882SAndroid Build Coastguard Worker }
171*993b0882SAndroid Build Coastguard Worker int final_bucket_id;
172*993b0882SAndroid Build Coastguard Worker if (!pruning_mask_.empty()) {
173*993b0882SAndroid Build Coastguard Worker final_bucket_id = PruneBucketId(bucket_id);
174*993b0882SAndroid Build Coastguard Worker } else {
175*993b0882SAndroid Build Coastguard Worker final_bucket_id = bucket_id;
176*993b0882SAndroid Build Coastguard Worker }
177*993b0882SAndroid Build Coastguard Worker if (!DequantizeAdd(scales_->data.f, embeddings_->data.uint8,
178*993b0882SAndroid Build Coastguard Worker bytes_per_embedding_, num_sparse_features,
179*993b0882SAndroid Build Coastguard Worker quantization_bits_, final_bucket_id, dest, dest_size)) {
180*993b0882SAndroid Build Coastguard Worker return false;
181*993b0882SAndroid Build Coastguard Worker }
182*993b0882SAndroid Build Coastguard Worker }
183*993b0882SAndroid Build Coastguard Worker return true;
184*993b0882SAndroid Build Coastguard Worker }
185*993b0882SAndroid Build Coastguard Worker
186*993b0882SAndroid Build Coastguard Worker } // namespace libtextclassifier3
187