xref: /aosp_15_r20/external/webp/src/utils/quant_levels_utils.c (revision b2055c353e87c8814eb2b6b1b11112a1562253bd)
1*b2055c35SXin Li // Copyright 2011 Google Inc. All Rights Reserved.
2*b2055c35SXin Li //
3*b2055c35SXin Li // Use of this source code is governed by a BSD-style license
4*b2055c35SXin Li // that can be found in the COPYING file in the root of the source
5*b2055c35SXin Li // tree. An additional intellectual property rights grant can be found
6*b2055c35SXin Li // in the file PATENTS. All contributing project authors may
7*b2055c35SXin Li // be found in the AUTHORS file in the root of the source tree.
8*b2055c35SXin Li // -----------------------------------------------------------------------------
9*b2055c35SXin Li //
10*b2055c35SXin Li // Quantize levels for specified number of quantization-levels ([2, 256]).
11*b2055c35SXin Li // Min and max values are preserved (usual 0 and 255 for alpha plane).
12*b2055c35SXin Li //
13*b2055c35SXin Li // Author: Skal ([email protected])
14*b2055c35SXin Li 
15*b2055c35SXin Li #include <assert.h>
16*b2055c35SXin Li 
17*b2055c35SXin Li #include "src/utils/quant_levels_utils.h"
18*b2055c35SXin Li 
19*b2055c35SXin Li #define NUM_SYMBOLS     256
20*b2055c35SXin Li 
21*b2055c35SXin Li #define MAX_ITER  6             // Maximum number of convergence steps.
22*b2055c35SXin Li #define ERROR_THRESHOLD 1e-4    // MSE stopping criterion.
23*b2055c35SXin Li 
24*b2055c35SXin Li // -----------------------------------------------------------------------------
25*b2055c35SXin Li // Quantize levels.
26*b2055c35SXin Li 
QuantizeLevels(uint8_t * const data,int width,int height,int num_levels,uint64_t * const sse)27*b2055c35SXin Li int QuantizeLevels(uint8_t* const data, int width, int height,
28*b2055c35SXin Li                    int num_levels, uint64_t* const sse) {
29*b2055c35SXin Li   int freq[NUM_SYMBOLS] = { 0 };
30*b2055c35SXin Li   int q_level[NUM_SYMBOLS] = { 0 };
31*b2055c35SXin Li   double inv_q_level[NUM_SYMBOLS] = { 0 };
32*b2055c35SXin Li   int min_s = 255, max_s = 0;
33*b2055c35SXin Li   const size_t data_size = height * width;
34*b2055c35SXin Li   int i, num_levels_in, iter;
35*b2055c35SXin Li   double last_err = 1.e38, err = 0.;
36*b2055c35SXin Li   const double err_threshold = ERROR_THRESHOLD * data_size;
37*b2055c35SXin Li 
38*b2055c35SXin Li   if (data == NULL) {
39*b2055c35SXin Li     return 0;
40*b2055c35SXin Li   }
41*b2055c35SXin Li 
42*b2055c35SXin Li   if (width <= 0 || height <= 0) {
43*b2055c35SXin Li     return 0;
44*b2055c35SXin Li   }
45*b2055c35SXin Li 
46*b2055c35SXin Li   if (num_levels < 2 || num_levels > 256) {
47*b2055c35SXin Li     return 0;
48*b2055c35SXin Li   }
49*b2055c35SXin Li 
50*b2055c35SXin Li   {
51*b2055c35SXin Li     size_t n;
52*b2055c35SXin Li     num_levels_in = 0;
53*b2055c35SXin Li     for (n = 0; n < data_size; ++n) {
54*b2055c35SXin Li       num_levels_in += (freq[data[n]] == 0);
55*b2055c35SXin Li       if (min_s > data[n]) min_s = data[n];
56*b2055c35SXin Li       if (max_s < data[n]) max_s = data[n];
57*b2055c35SXin Li       ++freq[data[n]];
58*b2055c35SXin Li     }
59*b2055c35SXin Li   }
60*b2055c35SXin Li 
61*b2055c35SXin Li   if (num_levels_in <= num_levels) goto End;  // nothing to do!
62*b2055c35SXin Li 
63*b2055c35SXin Li   // Start with uniformly spread centroids.
64*b2055c35SXin Li   for (i = 0; i < num_levels; ++i) {
65*b2055c35SXin Li     inv_q_level[i] = min_s + (double)(max_s - min_s) * i / (num_levels - 1);
66*b2055c35SXin Li   }
67*b2055c35SXin Li 
68*b2055c35SXin Li   // Fixed values. Won't be changed.
69*b2055c35SXin Li   q_level[min_s] = 0;
70*b2055c35SXin Li   q_level[max_s] = num_levels - 1;
71*b2055c35SXin Li   assert(inv_q_level[0] == min_s);
72*b2055c35SXin Li   assert(inv_q_level[num_levels - 1] == max_s);
73*b2055c35SXin Li 
74*b2055c35SXin Li   // k-Means iterations.
75*b2055c35SXin Li   for (iter = 0; iter < MAX_ITER; ++iter) {
76*b2055c35SXin Li     double q_sum[NUM_SYMBOLS] = { 0 };
77*b2055c35SXin Li     double q_count[NUM_SYMBOLS] = { 0 };
78*b2055c35SXin Li     int s, slot = 0;
79*b2055c35SXin Li 
80*b2055c35SXin Li     // Assign classes to representatives.
81*b2055c35SXin Li     for (s = min_s; s <= max_s; ++s) {
82*b2055c35SXin Li       // Keep track of the nearest neighbour 'slot'
83*b2055c35SXin Li       while (slot < num_levels - 1 &&
84*b2055c35SXin Li              2 * s > inv_q_level[slot] + inv_q_level[slot + 1]) {
85*b2055c35SXin Li         ++slot;
86*b2055c35SXin Li       }
87*b2055c35SXin Li       if (freq[s] > 0) {
88*b2055c35SXin Li         q_sum[slot] += s * freq[s];
89*b2055c35SXin Li         q_count[slot] += freq[s];
90*b2055c35SXin Li       }
91*b2055c35SXin Li       q_level[s] = slot;
92*b2055c35SXin Li     }
93*b2055c35SXin Li 
94*b2055c35SXin Li     // Assign new representatives to classes.
95*b2055c35SXin Li     if (num_levels > 2) {
96*b2055c35SXin Li       for (slot = 1; slot < num_levels - 1; ++slot) {
97*b2055c35SXin Li         const double count = q_count[slot];
98*b2055c35SXin Li         if (count > 0.) {
99*b2055c35SXin Li           inv_q_level[slot] = q_sum[slot] / count;
100*b2055c35SXin Li         }
101*b2055c35SXin Li       }
102*b2055c35SXin Li     }
103*b2055c35SXin Li 
104*b2055c35SXin Li     // Compute convergence error.
105*b2055c35SXin Li     err = 0.;
106*b2055c35SXin Li     for (s = min_s; s <= max_s; ++s) {
107*b2055c35SXin Li       const double error = s - inv_q_level[q_level[s]];
108*b2055c35SXin Li       err += freq[s] * error * error;
109*b2055c35SXin Li     }
110*b2055c35SXin Li 
111*b2055c35SXin Li     // Check for convergence: we stop as soon as the error is no
112*b2055c35SXin Li     // longer improving.
113*b2055c35SXin Li     if (last_err - err < err_threshold) break;
114*b2055c35SXin Li     last_err = err;
115*b2055c35SXin Li   }
116*b2055c35SXin Li 
117*b2055c35SXin Li   // Remap the alpha plane to quantized values.
118*b2055c35SXin Li   {
119*b2055c35SXin Li     // double->int rounding operation can be costly, so we do it
120*b2055c35SXin Li     // once for all before remapping. We also perform the data[] -> slot
121*b2055c35SXin Li     // mapping, while at it (avoid one indirection in the final loop).
122*b2055c35SXin Li     uint8_t map[NUM_SYMBOLS];
123*b2055c35SXin Li     int s;
124*b2055c35SXin Li     size_t n;
125*b2055c35SXin Li     for (s = min_s; s <= max_s; ++s) {
126*b2055c35SXin Li       const int slot = q_level[s];
127*b2055c35SXin Li       map[s] = (uint8_t)(inv_q_level[slot] + .5);
128*b2055c35SXin Li     }
129*b2055c35SXin Li     // Final pass.
130*b2055c35SXin Li     for (n = 0; n < data_size; ++n) {
131*b2055c35SXin Li       data[n] = map[data[n]];
132*b2055c35SXin Li     }
133*b2055c35SXin Li   }
134*b2055c35SXin Li  End:
135*b2055c35SXin Li   // Store sum of squared error if needed.
136*b2055c35SXin Li   if (sse != NULL) *sse = (uint64_t)err;
137*b2055c35SXin Li 
138*b2055c35SXin Li   return 1;
139*b2055c35SXin Li }
140*b2055c35SXin Li 
141