xref: /aosp_15_r20/external/libtextclassifier/native/annotator/quantization.cc (revision 993b0882672172b81d12fad7a7ac0c3e5c824a12)
/*
 * Copyright (C) 2018 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16*993b0882SAndroid Build Coastguard Worker 
#include "annotator/quantization.h"

#include <cstddef>

#include "utils/base/logging.h"
20*993b0882SAndroid Build Coastguard Worker 
21*993b0882SAndroid Build Coastguard Worker namespace libtextclassifier3 {
22*993b0882SAndroid Build Coastguard Worker namespace {
// Converts a single quantized embedding component into its float contribution.
//
// Computes (value - quantization_bias) * multiplier, scaled by
// 1 / num_sparse_features. Because of the 1.0 literal the arithmetic is
// carried out in double precision and narrowed to float on return.
//
// num_sparse_features: divisor applied to the dequantized value.
// quantization_bias:   offset subtracted from the raw quantized value.
// multiplier:          scale factor applied to the biased value.
// value:               raw quantized value.
float DequantizeValue(int num_sparse_features, int quantization_bias,
                      float multiplier, int value) {
  return 1.0 / num_sparse_features * (value - quantization_bias) * multiplier;
}
27*993b0882SAndroid Build Coastguard Worker 
DequantizeAdd8bit(const float * scales,const uint8 * embeddings,int bytes_per_embedding,const int num_sparse_features,const int bucket_id,float * dest,int dest_size)28*993b0882SAndroid Build Coastguard Worker void DequantizeAdd8bit(const float* scales, const uint8* embeddings,
29*993b0882SAndroid Build Coastguard Worker                        int bytes_per_embedding, const int num_sparse_features,
30*993b0882SAndroid Build Coastguard Worker                        const int bucket_id, float* dest, int dest_size) {
31*993b0882SAndroid Build Coastguard Worker   static const int kQuantizationBias8bit = 128;
32*993b0882SAndroid Build Coastguard Worker   const float multiplier = scales[bucket_id];
33*993b0882SAndroid Build Coastguard Worker   for (int k = 0; k < dest_size; ++k) {
34*993b0882SAndroid Build Coastguard Worker     dest[k] +=
35*993b0882SAndroid Build Coastguard Worker         DequantizeValue(num_sparse_features, kQuantizationBias8bit, multiplier,
36*993b0882SAndroid Build Coastguard Worker                         embeddings[bucket_id * bytes_per_embedding + k]);
37*993b0882SAndroid Build Coastguard Worker   }
38*993b0882SAndroid Build Coastguard Worker }
39*993b0882SAndroid Build Coastguard Worker 
DequantizeAddNBit(const float * scales,const uint8 * embeddings,int bytes_per_embedding,int num_sparse_features,int quantization_bits,int bucket_id,float * dest,int dest_size)40*993b0882SAndroid Build Coastguard Worker void DequantizeAddNBit(const float* scales, const uint8* embeddings,
41*993b0882SAndroid Build Coastguard Worker                        int bytes_per_embedding, int num_sparse_features,
42*993b0882SAndroid Build Coastguard Worker                        int quantization_bits, int bucket_id, float* dest,
43*993b0882SAndroid Build Coastguard Worker                        int dest_size) {
44*993b0882SAndroid Build Coastguard Worker   const int quantization_bias = 1 << (quantization_bits - 1);
45*993b0882SAndroid Build Coastguard Worker   const float multiplier = scales[bucket_id];
46*993b0882SAndroid Build Coastguard Worker   for (int i = 0; i < dest_size; ++i) {
47*993b0882SAndroid Build Coastguard Worker     const int bit_offset = i * quantization_bits;
48*993b0882SAndroid Build Coastguard Worker     const int read16_offset = bit_offset / 8;
49*993b0882SAndroid Build Coastguard Worker 
50*993b0882SAndroid Build Coastguard Worker     uint16 data = embeddings[bucket_id * bytes_per_embedding + read16_offset];
51*993b0882SAndroid Build Coastguard Worker     // If we are not at the end of the embedding row, we can read 2-byte uint16,
52*993b0882SAndroid Build Coastguard Worker     // but if we are, we need to only read uint8.
53*993b0882SAndroid Build Coastguard Worker     if (read16_offset < bytes_per_embedding - 1) {
54*993b0882SAndroid Build Coastguard Worker       data |= embeddings[bucket_id * bytes_per_embedding + read16_offset + 1]
55*993b0882SAndroid Build Coastguard Worker               << 8;
56*993b0882SAndroid Build Coastguard Worker     }
57*993b0882SAndroid Build Coastguard Worker     int value = (data >> (bit_offset % 8)) & ((1 << quantization_bits) - 1);
58*993b0882SAndroid Build Coastguard Worker     dest[i] += DequantizeValue(num_sparse_features, quantization_bias,
59*993b0882SAndroid Build Coastguard Worker                                multiplier, value);
60*993b0882SAndroid Build Coastguard Worker   }
61*993b0882SAndroid Build Coastguard Worker }
62*993b0882SAndroid Build Coastguard Worker }  // namespace
63*993b0882SAndroid Build Coastguard Worker 
// Returns true when a row of `bytes_per_embedding` bytes has room for at least
// `output_embedding_size` components of `quantization_bits` bits each.
//
// A non-positive `quantization_bits` is rejected (returns false) rather than
// being used as a divisor, which would otherwise divide by zero for 0.
bool CheckQuantizationParams(int bytes_per_embedding, int quantization_bits,
                             int output_embedding_size) {
  if (quantization_bits <= 0) {
    return false;
  }

  // Number of whole components that fit in one row.
  const int components_per_row = bytes_per_embedding * 8 / quantization_bits;
  return components_per_row >= output_embedding_size;
}
72*993b0882SAndroid Build Coastguard Worker 
DequantizeAdd(const float * scales,const uint8 * embeddings,int bytes_per_embedding,int num_sparse_features,int quantization_bits,int bucket_id,float * dest,int dest_size)73*993b0882SAndroid Build Coastguard Worker bool DequantizeAdd(const float* scales, const uint8* embeddings,
74*993b0882SAndroid Build Coastguard Worker                    int bytes_per_embedding, int num_sparse_features,
75*993b0882SAndroid Build Coastguard Worker                    int quantization_bits, int bucket_id, float* dest,
76*993b0882SAndroid Build Coastguard Worker                    int dest_size) {
77*993b0882SAndroid Build Coastguard Worker   if (quantization_bits == 8) {
78*993b0882SAndroid Build Coastguard Worker     DequantizeAdd8bit(scales, embeddings, bytes_per_embedding,
79*993b0882SAndroid Build Coastguard Worker                       num_sparse_features, bucket_id, dest, dest_size);
80*993b0882SAndroid Build Coastguard Worker   } else if (quantization_bits != 8) {
81*993b0882SAndroid Build Coastguard Worker     DequantizeAddNBit(scales, embeddings, bytes_per_embedding,
82*993b0882SAndroid Build Coastguard Worker                       num_sparse_features, quantization_bits, bucket_id, dest,
83*993b0882SAndroid Build Coastguard Worker                       dest_size);
84*993b0882SAndroid Build Coastguard Worker   } else {
85*993b0882SAndroid Build Coastguard Worker     TC3_LOG(ERROR) << "Unsupported quantization_bits: " << quantization_bits;
86*993b0882SAndroid Build Coastguard Worker     return false;
87*993b0882SAndroid Build Coastguard Worker   }
88*993b0882SAndroid Build Coastguard Worker 
89*993b0882SAndroid Build Coastguard Worker   return true;
90*993b0882SAndroid Build Coastguard Worker }
91*993b0882SAndroid Build Coastguard Worker 
92*993b0882SAndroid Build Coastguard Worker }  // namespace libtextclassifier3
93