1*b2055c35SXin Li // Copyright 2011 Google Inc. All Rights Reserved.
2*b2055c35SXin Li //
3*b2055c35SXin Li // Use of this source code is governed by a BSD-style license
4*b2055c35SXin Li // that can be found in the COPYING file in the root of the source
5*b2055c35SXin Li // tree. An additional intellectual property rights grant can be found
6*b2055c35SXin Li // in the file PATENTS. All contributing project authors may
7*b2055c35SXin Li // be found in the AUTHORS file in the root of the source tree.
8*b2055c35SXin Li // -----------------------------------------------------------------------------
9*b2055c35SXin Li //
10*b2055c35SXin Li // Quantize levels for specified number of quantization-levels ([2, 256]).
11*b2055c35SXin Li // Min and max values are preserved (usual 0 and 255 for alpha plane).
12*b2055c35SXin Li //
13*b2055c35SXin Li // Author: Skal ([email protected])
14*b2055c35SXin Li
15*b2055c35SXin Li #include <assert.h>
16*b2055c35SXin Li
17*b2055c35SXin Li #include "src/utils/quant_levels_utils.h"
18*b2055c35SXin Li
19*b2055c35SXin Li #define NUM_SYMBOLS 256
20*b2055c35SXin Li
21*b2055c35SXin Li #define MAX_ITER 6 // Maximum number of convergence steps.
22*b2055c35SXin Li #define ERROR_THRESHOLD 1e-4 // MSE stopping criterion.
23*b2055c35SXin Li
24*b2055c35SXin Li // -----------------------------------------------------------------------------
25*b2055c35SXin Li // Quantize levels.
26*b2055c35SXin Li
QuantizeLevels(uint8_t * const data,int width,int height,int num_levels,uint64_t * const sse)27*b2055c35SXin Li int QuantizeLevels(uint8_t* const data, int width, int height,
28*b2055c35SXin Li int num_levels, uint64_t* const sse) {
29*b2055c35SXin Li int freq[NUM_SYMBOLS] = { 0 };
30*b2055c35SXin Li int q_level[NUM_SYMBOLS] = { 0 };
31*b2055c35SXin Li double inv_q_level[NUM_SYMBOLS] = { 0 };
32*b2055c35SXin Li int min_s = 255, max_s = 0;
33*b2055c35SXin Li const size_t data_size = height * width;
34*b2055c35SXin Li int i, num_levels_in, iter;
35*b2055c35SXin Li double last_err = 1.e38, err = 0.;
36*b2055c35SXin Li const double err_threshold = ERROR_THRESHOLD * data_size;
37*b2055c35SXin Li
38*b2055c35SXin Li if (data == NULL) {
39*b2055c35SXin Li return 0;
40*b2055c35SXin Li }
41*b2055c35SXin Li
42*b2055c35SXin Li if (width <= 0 || height <= 0) {
43*b2055c35SXin Li return 0;
44*b2055c35SXin Li }
45*b2055c35SXin Li
46*b2055c35SXin Li if (num_levels < 2 || num_levels > 256) {
47*b2055c35SXin Li return 0;
48*b2055c35SXin Li }
49*b2055c35SXin Li
50*b2055c35SXin Li {
51*b2055c35SXin Li size_t n;
52*b2055c35SXin Li num_levels_in = 0;
53*b2055c35SXin Li for (n = 0; n < data_size; ++n) {
54*b2055c35SXin Li num_levels_in += (freq[data[n]] == 0);
55*b2055c35SXin Li if (min_s > data[n]) min_s = data[n];
56*b2055c35SXin Li if (max_s < data[n]) max_s = data[n];
57*b2055c35SXin Li ++freq[data[n]];
58*b2055c35SXin Li }
59*b2055c35SXin Li }
60*b2055c35SXin Li
61*b2055c35SXin Li if (num_levels_in <= num_levels) goto End; // nothing to do!
62*b2055c35SXin Li
63*b2055c35SXin Li // Start with uniformly spread centroids.
64*b2055c35SXin Li for (i = 0; i < num_levels; ++i) {
65*b2055c35SXin Li inv_q_level[i] = min_s + (double)(max_s - min_s) * i / (num_levels - 1);
66*b2055c35SXin Li }
67*b2055c35SXin Li
68*b2055c35SXin Li // Fixed values. Won't be changed.
69*b2055c35SXin Li q_level[min_s] = 0;
70*b2055c35SXin Li q_level[max_s] = num_levels - 1;
71*b2055c35SXin Li assert(inv_q_level[0] == min_s);
72*b2055c35SXin Li assert(inv_q_level[num_levels - 1] == max_s);
73*b2055c35SXin Li
74*b2055c35SXin Li // k-Means iterations.
75*b2055c35SXin Li for (iter = 0; iter < MAX_ITER; ++iter) {
76*b2055c35SXin Li double q_sum[NUM_SYMBOLS] = { 0 };
77*b2055c35SXin Li double q_count[NUM_SYMBOLS] = { 0 };
78*b2055c35SXin Li int s, slot = 0;
79*b2055c35SXin Li
80*b2055c35SXin Li // Assign classes to representatives.
81*b2055c35SXin Li for (s = min_s; s <= max_s; ++s) {
82*b2055c35SXin Li // Keep track of the nearest neighbour 'slot'
83*b2055c35SXin Li while (slot < num_levels - 1 &&
84*b2055c35SXin Li 2 * s > inv_q_level[slot] + inv_q_level[slot + 1]) {
85*b2055c35SXin Li ++slot;
86*b2055c35SXin Li }
87*b2055c35SXin Li if (freq[s] > 0) {
88*b2055c35SXin Li q_sum[slot] += s * freq[s];
89*b2055c35SXin Li q_count[slot] += freq[s];
90*b2055c35SXin Li }
91*b2055c35SXin Li q_level[s] = slot;
92*b2055c35SXin Li }
93*b2055c35SXin Li
94*b2055c35SXin Li // Assign new representatives to classes.
95*b2055c35SXin Li if (num_levels > 2) {
96*b2055c35SXin Li for (slot = 1; slot < num_levels - 1; ++slot) {
97*b2055c35SXin Li const double count = q_count[slot];
98*b2055c35SXin Li if (count > 0.) {
99*b2055c35SXin Li inv_q_level[slot] = q_sum[slot] / count;
100*b2055c35SXin Li }
101*b2055c35SXin Li }
102*b2055c35SXin Li }
103*b2055c35SXin Li
104*b2055c35SXin Li // Compute convergence error.
105*b2055c35SXin Li err = 0.;
106*b2055c35SXin Li for (s = min_s; s <= max_s; ++s) {
107*b2055c35SXin Li const double error = s - inv_q_level[q_level[s]];
108*b2055c35SXin Li err += freq[s] * error * error;
109*b2055c35SXin Li }
110*b2055c35SXin Li
111*b2055c35SXin Li // Check for convergence: we stop as soon as the error is no
112*b2055c35SXin Li // longer improving.
113*b2055c35SXin Li if (last_err - err < err_threshold) break;
114*b2055c35SXin Li last_err = err;
115*b2055c35SXin Li }
116*b2055c35SXin Li
117*b2055c35SXin Li // Remap the alpha plane to quantized values.
118*b2055c35SXin Li {
119*b2055c35SXin Li // double->int rounding operation can be costly, so we do it
120*b2055c35SXin Li // once for all before remapping. We also perform the data[] -> slot
121*b2055c35SXin Li // mapping, while at it (avoid one indirection in the final loop).
122*b2055c35SXin Li uint8_t map[NUM_SYMBOLS];
123*b2055c35SXin Li int s;
124*b2055c35SXin Li size_t n;
125*b2055c35SXin Li for (s = min_s; s <= max_s; ++s) {
126*b2055c35SXin Li const int slot = q_level[s];
127*b2055c35SXin Li map[s] = (uint8_t)(inv_q_level[slot] + .5);
128*b2055c35SXin Li }
129*b2055c35SXin Li // Final pass.
130*b2055c35SXin Li for (n = 0; n < data_size; ++n) {
131*b2055c35SXin Li data[n] = map[data[n]];
132*b2055c35SXin Li }
133*b2055c35SXin Li }
134*b2055c35SXin Li End:
135*b2055c35SXin Li // Store sum of squared error if needed.
136*b2055c35SXin Li if (sse != NULL) *sse = (uint64_t)err;
137*b2055c35SXin Li
138*b2055c35SXin Li return 1;
139*b2055c35SXin Li }
140*b2055c35SXin Li
141