/*
 * Copyright (C) 2018 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16*993b0882SAndroid Build Coastguard Worker
17*993b0882SAndroid Build Coastguard Worker #include "annotator/quantization.h"
18*993b0882SAndroid Build Coastguard Worker
19*993b0882SAndroid Build Coastguard Worker #include "utils/base/logging.h"
20*993b0882SAndroid Build Coastguard Worker
21*993b0882SAndroid Build Coastguard Worker namespace libtextclassifier3 {
22*993b0882SAndroid Build Coastguard Worker namespace {
// Converts one quantized integer into its float contribution.
//
// The value is re-centered by subtracting `quantization_bias`, weighted by
// 1 / num_sparse_features, and scaled by `multiplier`. The arithmetic is
// carried out in double precision and narrowed to float on return.
float DequantizeValue(int num_sparse_features, int quantization_bias,
                      float multiplier, int value) {
  const double per_feature_weight = 1.0 / num_sparse_features;
  const int centered_value = value - quantization_bias;
  const double weighted_value = per_feature_weight * centered_value;
  return weighted_value * multiplier;
}
27*993b0882SAndroid Build Coastguard Worker
DequantizeAdd8bit(const float * scales,const uint8 * embeddings,int bytes_per_embedding,const int num_sparse_features,const int bucket_id,float * dest,int dest_size)28*993b0882SAndroid Build Coastguard Worker void DequantizeAdd8bit(const float* scales, const uint8* embeddings,
29*993b0882SAndroid Build Coastguard Worker int bytes_per_embedding, const int num_sparse_features,
30*993b0882SAndroid Build Coastguard Worker const int bucket_id, float* dest, int dest_size) {
31*993b0882SAndroid Build Coastguard Worker static const int kQuantizationBias8bit = 128;
32*993b0882SAndroid Build Coastguard Worker const float multiplier = scales[bucket_id];
33*993b0882SAndroid Build Coastguard Worker for (int k = 0; k < dest_size; ++k) {
34*993b0882SAndroid Build Coastguard Worker dest[k] +=
35*993b0882SAndroid Build Coastguard Worker DequantizeValue(num_sparse_features, kQuantizationBias8bit, multiplier,
36*993b0882SAndroid Build Coastguard Worker embeddings[bucket_id * bytes_per_embedding + k]);
37*993b0882SAndroid Build Coastguard Worker }
38*993b0882SAndroid Build Coastguard Worker }
39*993b0882SAndroid Build Coastguard Worker
DequantizeAddNBit(const float * scales,const uint8 * embeddings,int bytes_per_embedding,int num_sparse_features,int quantization_bits,int bucket_id,float * dest,int dest_size)40*993b0882SAndroid Build Coastguard Worker void DequantizeAddNBit(const float* scales, const uint8* embeddings,
41*993b0882SAndroid Build Coastguard Worker int bytes_per_embedding, int num_sparse_features,
42*993b0882SAndroid Build Coastguard Worker int quantization_bits, int bucket_id, float* dest,
43*993b0882SAndroid Build Coastguard Worker int dest_size) {
44*993b0882SAndroid Build Coastguard Worker const int quantization_bias = 1 << (quantization_bits - 1);
45*993b0882SAndroid Build Coastguard Worker const float multiplier = scales[bucket_id];
46*993b0882SAndroid Build Coastguard Worker for (int i = 0; i < dest_size; ++i) {
47*993b0882SAndroid Build Coastguard Worker const int bit_offset = i * quantization_bits;
48*993b0882SAndroid Build Coastguard Worker const int read16_offset = bit_offset / 8;
49*993b0882SAndroid Build Coastguard Worker
50*993b0882SAndroid Build Coastguard Worker uint16 data = embeddings[bucket_id * bytes_per_embedding + read16_offset];
51*993b0882SAndroid Build Coastguard Worker // If we are not at the end of the embedding row, we can read 2-byte uint16,
52*993b0882SAndroid Build Coastguard Worker // but if we are, we need to only read uint8.
53*993b0882SAndroid Build Coastguard Worker if (read16_offset < bytes_per_embedding - 1) {
54*993b0882SAndroid Build Coastguard Worker data |= embeddings[bucket_id * bytes_per_embedding + read16_offset + 1]
55*993b0882SAndroid Build Coastguard Worker << 8;
56*993b0882SAndroid Build Coastguard Worker }
57*993b0882SAndroid Build Coastguard Worker int value = (data >> (bit_offset % 8)) & ((1 << quantization_bits) - 1);
58*993b0882SAndroid Build Coastguard Worker dest[i] += DequantizeValue(num_sparse_features, quantization_bias,
59*993b0882SAndroid Build Coastguard Worker multiplier, value);
60*993b0882SAndroid Build Coastguard Worker }
61*993b0882SAndroid Build Coastguard Worker }
62*993b0882SAndroid Build Coastguard Worker } // namespace
63*993b0882SAndroid Build Coastguard Worker
// Returns true when a row of `bytes_per_embedding` bytes can hold at least
// `output_embedding_size` values of `quantization_bits` bits each, i.e. when
// floor(bytes_per_embedding * 8 / quantization_bits) >= output_embedding_size.
//
// Returns false for a non-positive `quantization_bits`: such a width cannot
// describe a packed value, and a width of zero would otherwise divide by zero.
bool CheckQuantizationParams(int bytes_per_embedding, int quantization_bits,
                             int output_embedding_size) {
  if (quantization_bits <= 0) {
    return false;
  }

  // Widen before multiplying so that large row sizes cannot overflow `int`.
  const long long bits_per_row = static_cast<long long>(bytes_per_embedding) * 8;
  const long long values_per_row = bits_per_row / quantization_bits;
  return values_per_row >= output_embedding_size;
}
72*993b0882SAndroid Build Coastguard Worker
DequantizeAdd(const float * scales,const uint8 * embeddings,int bytes_per_embedding,int num_sparse_features,int quantization_bits,int bucket_id,float * dest,int dest_size)73*993b0882SAndroid Build Coastguard Worker bool DequantizeAdd(const float* scales, const uint8* embeddings,
74*993b0882SAndroid Build Coastguard Worker int bytes_per_embedding, int num_sparse_features,
75*993b0882SAndroid Build Coastguard Worker int quantization_bits, int bucket_id, float* dest,
76*993b0882SAndroid Build Coastguard Worker int dest_size) {
77*993b0882SAndroid Build Coastguard Worker if (quantization_bits == 8) {
78*993b0882SAndroid Build Coastguard Worker DequantizeAdd8bit(scales, embeddings, bytes_per_embedding,
79*993b0882SAndroid Build Coastguard Worker num_sparse_features, bucket_id, dest, dest_size);
80*993b0882SAndroid Build Coastguard Worker } else if (quantization_bits != 8) {
81*993b0882SAndroid Build Coastguard Worker DequantizeAddNBit(scales, embeddings, bytes_per_embedding,
82*993b0882SAndroid Build Coastguard Worker num_sparse_features, quantization_bits, bucket_id, dest,
83*993b0882SAndroid Build Coastguard Worker dest_size);
84*993b0882SAndroid Build Coastguard Worker } else {
85*993b0882SAndroid Build Coastguard Worker TC3_LOG(ERROR) << "Unsupported quantization_bits: " << quantization_bits;
86*993b0882SAndroid Build Coastguard Worker return false;
87*993b0882SAndroid Build Coastguard Worker }
88*993b0882SAndroid Build Coastguard Worker
89*993b0882SAndroid Build Coastguard Worker return true;
90*993b0882SAndroid Build Coastguard Worker }
91*993b0882SAndroid Build Coastguard Worker
92*993b0882SAndroid Build Coastguard Worker } // namespace libtextclassifier3
93