1*77c1e3ccSAndroid Build Coastguard Worker /*
2*77c1e3ccSAndroid Build Coastguard Worker * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3*77c1e3ccSAndroid Build Coastguard Worker *
4*77c1e3ccSAndroid Build Coastguard Worker * This source code is subject to the terms of the BSD 2 Clause License and
5*77c1e3ccSAndroid Build Coastguard Worker * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6*77c1e3ccSAndroid Build Coastguard Worker * was not distributed with this source code in the LICENSE file, you can
7*77c1e3ccSAndroid Build Coastguard Worker * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8*77c1e3ccSAndroid Build Coastguard Worker * Media Patent License 1.0 was not distributed with this source code in the
9*77c1e3ccSAndroid Build Coastguard Worker * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10*77c1e3ccSAndroid Build Coastguard Worker */
11*77c1e3ccSAndroid Build Coastguard Worker
12*77c1e3ccSAndroid Build Coastguard Worker #include <assert.h>
13*77c1e3ccSAndroid Build Coastguard Worker #include <stdint.h>
14*77c1e3ccSAndroid Build Coastguard Worker #include <stdlib.h>
15*77c1e3ccSAndroid Build Coastguard Worker #include <string.h>
16*77c1e3ccSAndroid Build Coastguard Worker
17*77c1e3ccSAndroid Build Coastguard Worker #include "av1/common/blockd.h"
18*77c1e3ccSAndroid Build Coastguard Worker #include "av1/encoder/palette.h"
19*77c1e3ccSAndroid Build Coastguard Worker #include "av1/encoder/random.h"
20*77c1e3ccSAndroid Build Coastguard Worker
// This file is a template: the includer must define AV1_K_MEANS_DIM (the
// number of int16_t components per data point) before including it.
#ifndef AV1_K_MEANS_DIM
#error "This template requires AV1_K_MEANS_DIM to be defined"
#endif

// Name-mangling helpers. Each has an extra level of indirection so that
// AV1_K_MEANS_DIM is macro-expanded to its value before it is used.
//
// RENAME(x) forwards to AV1_K_MEANS_RENAME(x, <dim>), which is not defined in
// this file (presumably it comes from one of the headers included above --
// verify).
#define RENAME_(x, y) AV1_K_MEANS_RENAME(x, y)
#define RENAME(x) RENAME_(x, AV1_K_MEANS_DIM)
// RENAME_C(x) produces x_dim<dim>_c, e.g. foo_dim2_c when AV1_K_MEANS_DIM is 2.
#define K_MEANS_RENAME_C(x, y) x##_dim##y##_c
#define RENAME_C_(x, y) K_MEANS_RENAME_C(x, y)
#define RENAME_C(x) RENAME_C_(x, AV1_K_MEANS_DIM)
30*77c1e3ccSAndroid Build Coastguard Worker
31*77c1e3ccSAndroid Build Coastguard Worker // Though we want to compute the smallest L2 norm, in 1 dimension,
32*77c1e3ccSAndroid Build Coastguard Worker // it is equivalent to find the smallest L1 norm and then square it.
33*77c1e3ccSAndroid Build Coastguard Worker // This is preferrable for speed, especially on the SIMD side.
RENAME(calc_dist)34*77c1e3ccSAndroid Build Coastguard Worker static int RENAME(calc_dist)(const int16_t *p1, const int16_t *p2) {
35*77c1e3ccSAndroid Build Coastguard Worker #if AV1_K_MEANS_DIM == 1
36*77c1e3ccSAndroid Build Coastguard Worker return abs(p1[0] - p2[0]);
37*77c1e3ccSAndroid Build Coastguard Worker #else
38*77c1e3ccSAndroid Build Coastguard Worker int dist = 0;
39*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < AV1_K_MEANS_DIM; ++i) {
40*77c1e3ccSAndroid Build Coastguard Worker const int diff = p1[i] - p2[i];
41*77c1e3ccSAndroid Build Coastguard Worker dist += diff * diff;
42*77c1e3ccSAndroid Build Coastguard Worker }
43*77c1e3ccSAndroid Build Coastguard Worker return dist;
44*77c1e3ccSAndroid Build Coastguard Worker #endif
45*77c1e3ccSAndroid Build Coastguard Worker }
46*77c1e3ccSAndroid Build Coastguard Worker
RENAME_C(av1_calc_indices)47*77c1e3ccSAndroid Build Coastguard Worker void RENAME_C(av1_calc_indices)(const int16_t *data, const int16_t *centroids,
48*77c1e3ccSAndroid Build Coastguard Worker uint8_t *indices, int64_t *dist, int n, int k) {
49*77c1e3ccSAndroid Build Coastguard Worker if (dist) {
50*77c1e3ccSAndroid Build Coastguard Worker *dist = 0;
51*77c1e3ccSAndroid Build Coastguard Worker }
52*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < n; ++i) {
53*77c1e3ccSAndroid Build Coastguard Worker int min_dist = RENAME(calc_dist)(data + i * AV1_K_MEANS_DIM, centroids);
54*77c1e3ccSAndroid Build Coastguard Worker indices[i] = 0;
55*77c1e3ccSAndroid Build Coastguard Worker for (int j = 1; j < k; ++j) {
56*77c1e3ccSAndroid Build Coastguard Worker const int this_dist = RENAME(calc_dist)(data + i * AV1_K_MEANS_DIM,
57*77c1e3ccSAndroid Build Coastguard Worker centroids + j * AV1_K_MEANS_DIM);
58*77c1e3ccSAndroid Build Coastguard Worker if (this_dist < min_dist) {
59*77c1e3ccSAndroid Build Coastguard Worker min_dist = this_dist;
60*77c1e3ccSAndroid Build Coastguard Worker indices[i] = j;
61*77c1e3ccSAndroid Build Coastguard Worker }
62*77c1e3ccSAndroid Build Coastguard Worker }
63*77c1e3ccSAndroid Build Coastguard Worker if (dist) {
64*77c1e3ccSAndroid Build Coastguard Worker #if AV1_K_MEANS_DIM == 1
65*77c1e3ccSAndroid Build Coastguard Worker *dist += min_dist * min_dist;
66*77c1e3ccSAndroid Build Coastguard Worker #else
67*77c1e3ccSAndroid Build Coastguard Worker *dist += min_dist;
68*77c1e3ccSAndroid Build Coastguard Worker #endif
69*77c1e3ccSAndroid Build Coastguard Worker }
70*77c1e3ccSAndroid Build Coastguard Worker }
71*77c1e3ccSAndroid Build Coastguard Worker }
72*77c1e3ccSAndroid Build Coastguard Worker
RENAME(calc_centroids)73*77c1e3ccSAndroid Build Coastguard Worker static void RENAME(calc_centroids)(const int16_t *data, int16_t *centroids,
74*77c1e3ccSAndroid Build Coastguard Worker const uint8_t *indices, int n, int k) {
75*77c1e3ccSAndroid Build Coastguard Worker int i, j;
76*77c1e3ccSAndroid Build Coastguard Worker int count[PALETTE_MAX_SIZE] = { 0 };
77*77c1e3ccSAndroid Build Coastguard Worker int centroids_sum[AV1_K_MEANS_DIM * PALETTE_MAX_SIZE];
78*77c1e3ccSAndroid Build Coastguard Worker unsigned int rand_state = (unsigned int)data[0];
79*77c1e3ccSAndroid Build Coastguard Worker assert(n <= 32768);
80*77c1e3ccSAndroid Build Coastguard Worker memset(centroids_sum, 0, sizeof(centroids_sum[0]) * k * AV1_K_MEANS_DIM);
81*77c1e3ccSAndroid Build Coastguard Worker
82*77c1e3ccSAndroid Build Coastguard Worker for (i = 0; i < n; ++i) {
83*77c1e3ccSAndroid Build Coastguard Worker const int index = indices[i];
84*77c1e3ccSAndroid Build Coastguard Worker assert(index < k);
85*77c1e3ccSAndroid Build Coastguard Worker ++count[index];
86*77c1e3ccSAndroid Build Coastguard Worker for (j = 0; j < AV1_K_MEANS_DIM; ++j) {
87*77c1e3ccSAndroid Build Coastguard Worker centroids_sum[index * AV1_K_MEANS_DIM + j] +=
88*77c1e3ccSAndroid Build Coastguard Worker data[i * AV1_K_MEANS_DIM + j];
89*77c1e3ccSAndroid Build Coastguard Worker }
90*77c1e3ccSAndroid Build Coastguard Worker }
91*77c1e3ccSAndroid Build Coastguard Worker
92*77c1e3ccSAndroid Build Coastguard Worker for (i = 0; i < k; ++i) {
93*77c1e3ccSAndroid Build Coastguard Worker if (count[i] == 0) {
94*77c1e3ccSAndroid Build Coastguard Worker memcpy(centroids + i * AV1_K_MEANS_DIM,
95*77c1e3ccSAndroid Build Coastguard Worker data + (lcg_rand16(&rand_state) % n) * AV1_K_MEANS_DIM,
96*77c1e3ccSAndroid Build Coastguard Worker sizeof(centroids[0]) * AV1_K_MEANS_DIM);
97*77c1e3ccSAndroid Build Coastguard Worker } else {
98*77c1e3ccSAndroid Build Coastguard Worker for (j = 0; j < AV1_K_MEANS_DIM; ++j) {
99*77c1e3ccSAndroid Build Coastguard Worker centroids[i * AV1_K_MEANS_DIM + j] =
100*77c1e3ccSAndroid Build Coastguard Worker DIVIDE_AND_ROUND(centroids_sum[i * AV1_K_MEANS_DIM + j], count[i]);
101*77c1e3ccSAndroid Build Coastguard Worker }
102*77c1e3ccSAndroid Build Coastguard Worker }
103*77c1e3ccSAndroid Build Coastguard Worker }
104*77c1e3ccSAndroid Build Coastguard Worker }
105*77c1e3ccSAndroid Build Coastguard Worker
RENAME(av1_k_means)106*77c1e3ccSAndroid Build Coastguard Worker void RENAME(av1_k_means)(const int16_t *data, int16_t *centroids,
107*77c1e3ccSAndroid Build Coastguard Worker uint8_t *indices, int n, int k, int max_itr) {
108*77c1e3ccSAndroid Build Coastguard Worker int16_t centroids_tmp[AV1_K_MEANS_DIM * PALETTE_MAX_SIZE];
109*77c1e3ccSAndroid Build Coastguard Worker uint8_t indices_tmp[MAX_PALETTE_BLOCK_WIDTH * MAX_PALETTE_BLOCK_HEIGHT];
110*77c1e3ccSAndroid Build Coastguard Worker int16_t *meta_centroids[2] = { centroids, centroids_tmp };
111*77c1e3ccSAndroid Build Coastguard Worker uint8_t *meta_indices[2] = { indices, indices_tmp };
112*77c1e3ccSAndroid Build Coastguard Worker int i, l = 0, prev_l, best_l = 0;
113*77c1e3ccSAndroid Build Coastguard Worker int64_t this_dist;
114*77c1e3ccSAndroid Build Coastguard Worker
115*77c1e3ccSAndroid Build Coastguard Worker assert(n <= MAX_PALETTE_BLOCK_WIDTH * MAX_PALETTE_BLOCK_HEIGHT);
116*77c1e3ccSAndroid Build Coastguard Worker
117*77c1e3ccSAndroid Build Coastguard Worker #if AV1_K_MEANS_DIM == 1
118*77c1e3ccSAndroid Build Coastguard Worker av1_calc_indices_dim1(data, centroids, indices, &this_dist, n, k);
119*77c1e3ccSAndroid Build Coastguard Worker #else
120*77c1e3ccSAndroid Build Coastguard Worker av1_calc_indices_dim2(data, centroids, indices, &this_dist, n, k);
121*77c1e3ccSAndroid Build Coastguard Worker #endif
122*77c1e3ccSAndroid Build Coastguard Worker
123*77c1e3ccSAndroid Build Coastguard Worker for (i = 0; i < max_itr; ++i) {
124*77c1e3ccSAndroid Build Coastguard Worker const int64_t prev_dist = this_dist;
125*77c1e3ccSAndroid Build Coastguard Worker prev_l = l;
126*77c1e3ccSAndroid Build Coastguard Worker l = (l == 1) ? 0 : 1;
127*77c1e3ccSAndroid Build Coastguard Worker
128*77c1e3ccSAndroid Build Coastguard Worker RENAME(calc_centroids)(data, meta_centroids[l], meta_indices[prev_l], n, k);
129*77c1e3ccSAndroid Build Coastguard Worker if (!memcmp(meta_centroids[l], meta_centroids[prev_l],
130*77c1e3ccSAndroid Build Coastguard Worker sizeof(centroids[0]) * k * AV1_K_MEANS_DIM)) {
131*77c1e3ccSAndroid Build Coastguard Worker break;
132*77c1e3ccSAndroid Build Coastguard Worker }
133*77c1e3ccSAndroid Build Coastguard Worker #if AV1_K_MEANS_DIM == 1
134*77c1e3ccSAndroid Build Coastguard Worker av1_calc_indices_dim1(data, meta_centroids[l], meta_indices[l], &this_dist,
135*77c1e3ccSAndroid Build Coastguard Worker n, k);
136*77c1e3ccSAndroid Build Coastguard Worker #else
137*77c1e3ccSAndroid Build Coastguard Worker av1_calc_indices_dim2(data, meta_centroids[l], meta_indices[l], &this_dist,
138*77c1e3ccSAndroid Build Coastguard Worker n, k);
139*77c1e3ccSAndroid Build Coastguard Worker #endif
140*77c1e3ccSAndroid Build Coastguard Worker
141*77c1e3ccSAndroid Build Coastguard Worker if (this_dist > prev_dist) {
142*77c1e3ccSAndroid Build Coastguard Worker best_l = prev_l;
143*77c1e3ccSAndroid Build Coastguard Worker break;
144*77c1e3ccSAndroid Build Coastguard Worker }
145*77c1e3ccSAndroid Build Coastguard Worker }
146*77c1e3ccSAndroid Build Coastguard Worker if (i == max_itr) best_l = l;
147*77c1e3ccSAndroid Build Coastguard Worker if (best_l != 0) {
148*77c1e3ccSAndroid Build Coastguard Worker memcpy(centroids, meta_centroids[1],
149*77c1e3ccSAndroid Build Coastguard Worker sizeof(centroids[0]) * k * AV1_K_MEANS_DIM);
150*77c1e3ccSAndroid Build Coastguard Worker memcpy(indices, meta_indices[1], sizeof(indices[0]) * n);
151*77c1e3ccSAndroid Build Coastguard Worker }
152*77c1e3ccSAndroid Build Coastguard Worker }
153*77c1e3ccSAndroid Build Coastguard Worker #undef RENAME_
154*77c1e3ccSAndroid Build Coastguard Worker #undef RENAME
155*77c1e3ccSAndroid Build Coastguard Worker #undef K_MEANS_RENAME_C
156*77c1e3ccSAndroid Build Coastguard Worker #undef RENAME_C_
157*77c1e3ccSAndroid Build Coastguard Worker #undef RENAME_C
158