1 /* NOLINT(build/header_guard) */ 2 /* Copyright 2013 Google Inc. All Rights Reserved. 3 4 Distributed under MIT license. 5 See file LICENSE for detail or copy at https://opensource.org/licenses/MIT 6 */ 7 8 /* template parameters: FN */ 9 10 #define HistogramType FN(Histogram) 11 12 double FN(BrotliPopulationCost)(const HistogramType* histogram) { 13 static const double kOneSymbolHistogramCost = 12; 14 static const double kTwoSymbolHistogramCost = 20; 15 static const double kThreeSymbolHistogramCost = 28; 16 static const double kFourSymbolHistogramCost = 37; 17 const size_t data_size = FN(HistogramDataSize)(); 18 int count = 0; 19 size_t s[5]; 20 double bits = 0.0; 21 size_t i; 22 if (histogram->total_count_ == 0) { 23 return kOneSymbolHistogramCost; 24 } 25 for (i = 0; i < data_size; ++i) { 26 if (histogram->data_[i] > 0) { 27 s[count] = i; 28 ++count; 29 if (count > 4) break; 30 } 31 } 32 if (count == 1) { 33 return kOneSymbolHistogramCost; 34 } 35 if (count == 2) { 36 return (kTwoSymbolHistogramCost + (double)histogram->total_count_); 37 } 38 if (count == 3) { 39 const uint32_t histo0 = histogram->data_[s[0]]; 40 const uint32_t histo1 = histogram->data_[s[1]]; 41 const uint32_t histo2 = histogram->data_[s[2]]; 42 const uint32_t histomax = 43 BROTLI_MAX(uint32_t, histo0, BROTLI_MAX(uint32_t, histo1, histo2)); 44 return (kThreeSymbolHistogramCost + 45 2 * (histo0 + histo1 + histo2) - histomax); 46 } 47 if (count == 4) { 48 uint32_t histo[4]; 49 uint32_t h23; 50 uint32_t histomax; 51 for (i = 0; i < 4; ++i) { 52 histo[i] = histogram->data_[s[i]]; 53 } 54 /* Sort */ 55 for (i = 0; i < 4; ++i) { 56 size_t j; 57 for (j = i + 1; j < 4; ++j) { 58 if (histo[j] > histo[i]) { 59 BROTLI_SWAP(uint32_t, histo, j, i); 60 } 61 } 62 } 63 h23 = histo[2] + histo[3]; 64 histomax = BROTLI_MAX(uint32_t, h23, histo[0]); 65 return (kFourSymbolHistogramCost + 66 3 * h23 + 2 * (histo[0] + histo[1]) - histomax); 67 } 68 69 { 70 /* In this loop we compute the entropy of the histogram and simultaneously 71 build a simplified histogram of the code length codes where we use the 72 zero repeat code 17, but we don't use the non-zero repeat code 16. */ 73 size_t max_depth = 1; 74 uint32_t depth_histo[BROTLI_CODE_LENGTH_CODES] = { 0 }; 75 const double log2total = FastLog2(histogram->total_count_); 76 for (i = 0; i < data_size;) { 77 if (histogram->data_[i] > 0) { 78 /* Compute -log2(P(symbol)) = -log2(count(symbol)/total_count) = 79 = log2(total_count) - log2(count(symbol)) */ 80 double log2p = log2total - FastLog2(histogram->data_[i]); 81 /* Approximate the bit depth by round(-log2(P(symbol))) */ 82 size_t depth = (size_t)(log2p + 0.5); 83 bits += histogram->data_[i] * log2p; 84 if (depth > 15) { 85 depth = 15; 86 } 87 if (depth > max_depth) { 88 max_depth = depth; 89 } 90 ++depth_histo[depth]; 91 ++i; 92 } else { 93 /* Compute the run length of zeros and add the appropriate number of 0 94 and 17 code length codes to the code length code histogram. */ 95 uint32_t reps = 1; 96 size_t k; 97 for (k = i + 1; k < data_size && histogram->data_[k] == 0; ++k) { 98 ++reps; 99 } 100 i += reps; 101 if (i == data_size) { 102 /* Don't add any cost for the last zero run, since these are encoded 103 only implicitly. */ 104 break; 105 } 106 if (reps < 3) { 107 depth_histo[0] += reps; 108 } else { 109 reps -= 2; 110 while (reps > 0) { 111 ++depth_histo[BROTLI_REPEAT_ZERO_CODE_LENGTH]; 112 /* Add the 3 extra bits for the 17 code length code. */ 113 bits += 3; 114 reps >>= 3; 115 } 116 } 117 } 118 } 119 /* Add the estimated encoding cost of the code length code histogram. */ 120 bits += (double)(18 + 2 * max_depth); 121 /* Add the entropy of the code length code histogram. */ 122 bits += BitsEntropy(depth_histo, BROTLI_CODE_LENGTH_CODES); 123 } 124 return bits; 125 } 126 127 #undef HistogramType 128