metablock.c 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663
  1. /* Copyright 2015 Google Inc. All Rights Reserved.
  2. Distributed under MIT license.
  3. See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
  4. */
  5. /* Algorithms for distributing the literals and commands of a metablock between
  6. block types and contexts. */
  7. #include "./metablock.h"
  8. #include "../common/constants.h"
  9. #include "../common/context.h"
  10. #include "../common/platform.h"
  11. #include <brotli/types.h>
  12. #include "./bit_cost.h"
  13. #include "./block_splitter.h"
  14. #include "./cluster.h"
  15. #include "./entropy_encode.h"
  16. #include "./histogram.h"
  17. #include "./memory.h"
  18. #include "./quality.h"
  19. #if defined(__cplusplus) || defined(c_plusplus)
  20. extern "C" {
  21. #endif
  22. void BrotliInitDistanceParams(BrotliEncoderParams* params,
  23. uint32_t npostfix, uint32_t ndirect) {
  24. BrotliDistanceParams* dist_params = &params->dist;
  25. uint32_t alphabet_size_max;
  26. uint32_t alphabet_size_limit;
  27. uint32_t max_distance;
  28. dist_params->distance_postfix_bits = npostfix;
  29. dist_params->num_direct_distance_codes = ndirect;
  30. alphabet_size_max = BROTLI_DISTANCE_ALPHABET_SIZE(
  31. npostfix, ndirect, BROTLI_MAX_DISTANCE_BITS);
  32. alphabet_size_limit = alphabet_size_max;
  33. max_distance = ndirect + (1U << (BROTLI_MAX_DISTANCE_BITS + npostfix + 2)) -
  34. (1U << (npostfix + 2));
  35. if (params->large_window) {
  36. BrotliDistanceCodeLimit limit = BrotliCalculateDistanceCodeLimit(
  37. BROTLI_MAX_ALLOWED_DISTANCE, npostfix, ndirect);
  38. alphabet_size_max = BROTLI_DISTANCE_ALPHABET_SIZE(
  39. npostfix, ndirect, BROTLI_LARGE_MAX_DISTANCE_BITS);
  40. alphabet_size_limit = limit.max_alphabet_size;
  41. max_distance = limit.max_distance;
  42. }
  43. dist_params->alphabet_size_max = alphabet_size_max;
  44. dist_params->alphabet_size_limit = alphabet_size_limit;
  45. dist_params->max_distance = max_distance;
  46. }
  47. static void RecomputeDistancePrefixes(Command* cmds,
  48. size_t num_commands,
  49. const BrotliDistanceParams* orig_params,
  50. const BrotliDistanceParams* new_params) {
  51. size_t i;
  52. if (orig_params->distance_postfix_bits == new_params->distance_postfix_bits &&
  53. orig_params->num_direct_distance_codes ==
  54. new_params->num_direct_distance_codes) {
  55. return;
  56. }
  57. for (i = 0; i < num_commands; ++i) {
  58. Command* cmd = &cmds[i];
  59. if (CommandCopyLen(cmd) && cmd->cmd_prefix_ >= 128) {
  60. PrefixEncodeCopyDistance(CommandRestoreDistanceCode(cmd, orig_params),
  61. new_params->num_direct_distance_codes,
  62. new_params->distance_postfix_bits,
  63. &cmd->dist_prefix_,
  64. &cmd->dist_extra_);
  65. }
  66. }
  67. }
  68. static BROTLI_BOOL ComputeDistanceCost(const Command* cmds,
  69. size_t num_commands,
  70. const BrotliDistanceParams* orig_params,
  71. const BrotliDistanceParams* new_params,
  72. double* cost) {
  73. size_t i;
  74. BROTLI_BOOL equal_params = BROTLI_FALSE;
  75. uint16_t dist_prefix;
  76. uint32_t dist_extra;
  77. double extra_bits = 0.0;
  78. HistogramDistance histo;
  79. HistogramClearDistance(&histo);
  80. if (orig_params->distance_postfix_bits == new_params->distance_postfix_bits &&
  81. orig_params->num_direct_distance_codes ==
  82. new_params->num_direct_distance_codes) {
  83. equal_params = BROTLI_TRUE;
  84. }
  85. for (i = 0; i < num_commands; i++) {
  86. const Command* cmd = &cmds[i];
  87. if (CommandCopyLen(cmd) && cmd->cmd_prefix_ >= 128) {
  88. if (equal_params) {
  89. dist_prefix = cmd->dist_prefix_;
  90. } else {
  91. uint32_t distance = CommandRestoreDistanceCode(cmd, orig_params);
  92. if (distance > new_params->max_distance) {
  93. return BROTLI_FALSE;
  94. }
  95. PrefixEncodeCopyDistance(distance,
  96. new_params->num_direct_distance_codes,
  97. new_params->distance_postfix_bits,
  98. &dist_prefix,
  99. &dist_extra);
  100. }
  101. HistogramAddDistance(&histo, dist_prefix & 0x3FF);
  102. extra_bits += dist_prefix >> 10;
  103. }
  104. }
  105. *cost = BrotliPopulationCostDistance(&histo) + extra_bits;
  106. return BROTLI_TRUE;
  107. }
  108. void BrotliBuildMetaBlock(MemoryManager* m,
  109. const uint8_t* ringbuffer,
  110. const size_t pos,
  111. const size_t mask,
  112. BrotliEncoderParams* params,
  113. uint8_t prev_byte,
  114. uint8_t prev_byte2,
  115. Command* cmds,
  116. size_t num_commands,
  117. ContextType literal_context_mode,
  118. MetaBlockSplit* mb) {
  119. /* Histogram ids need to fit in one byte. */
  120. static const size_t kMaxNumberOfHistograms = 256;
  121. HistogramDistance* distance_histograms;
  122. HistogramLiteral* literal_histograms;
  123. ContextType* literal_context_modes = NULL;
  124. size_t literal_histograms_size;
  125. size_t distance_histograms_size;
  126. size_t i;
  127. size_t literal_context_multiplier = 1;
  128. uint32_t npostfix;
  129. uint32_t ndirect_msb = 0;
  130. BROTLI_BOOL check_orig = BROTLI_TRUE;
  131. double best_dist_cost = 1e99;
  132. BrotliEncoderParams orig_params = *params;
  133. BrotliEncoderParams new_params = *params;
  134. for (npostfix = 0; npostfix <= BROTLI_MAX_NPOSTFIX; npostfix++) {
  135. for (; ndirect_msb < 16; ndirect_msb++) {
  136. uint32_t ndirect = ndirect_msb << npostfix;
  137. BROTLI_BOOL skip;
  138. double dist_cost;
  139. BrotliInitDistanceParams(&new_params, npostfix, ndirect);
  140. if (npostfix == orig_params.dist.distance_postfix_bits &&
  141. ndirect == orig_params.dist.num_direct_distance_codes) {
  142. check_orig = BROTLI_FALSE;
  143. }
  144. skip = !ComputeDistanceCost(
  145. cmds, num_commands,
  146. &orig_params.dist, &new_params.dist, &dist_cost);
  147. if (skip || (dist_cost > best_dist_cost)) {
  148. break;
  149. }
  150. best_dist_cost = dist_cost;
  151. params->dist = new_params.dist;
  152. }
  153. if (ndirect_msb > 0) ndirect_msb--;
  154. ndirect_msb /= 2;
  155. }
  156. if (check_orig) {
  157. double dist_cost;
  158. ComputeDistanceCost(cmds, num_commands,
  159. &orig_params.dist, &orig_params.dist, &dist_cost);
  160. if (dist_cost < best_dist_cost) {
  161. /* NB: currently unused; uncomment when more param tuning is added. */
  162. /* best_dist_cost = dist_cost; */
  163. params->dist = orig_params.dist;
  164. }
  165. }
  166. RecomputeDistancePrefixes(cmds, num_commands,
  167. &orig_params.dist, &params->dist);
  168. BrotliSplitBlock(m, cmds, num_commands,
  169. ringbuffer, pos, mask, params,
  170. &mb->literal_split,
  171. &mb->command_split,
  172. &mb->distance_split);
  173. if (BROTLI_IS_OOM(m)) return;
  174. if (!params->disable_literal_context_modeling) {
  175. literal_context_multiplier = 1 << BROTLI_LITERAL_CONTEXT_BITS;
  176. literal_context_modes =
  177. BROTLI_ALLOC(m, ContextType, mb->literal_split.num_types);
  178. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(literal_context_modes)) return;
  179. for (i = 0; i < mb->literal_split.num_types; ++i) {
  180. literal_context_modes[i] = literal_context_mode;
  181. }
  182. }
  183. literal_histograms_size =
  184. mb->literal_split.num_types * literal_context_multiplier;
  185. literal_histograms =
  186. BROTLI_ALLOC(m, HistogramLiteral, literal_histograms_size);
  187. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(literal_histograms)) return;
  188. ClearHistogramsLiteral(literal_histograms, literal_histograms_size);
  189. distance_histograms_size =
  190. mb->distance_split.num_types << BROTLI_DISTANCE_CONTEXT_BITS;
  191. distance_histograms =
  192. BROTLI_ALLOC(m, HistogramDistance, distance_histograms_size);
  193. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(distance_histograms)) return;
  194. ClearHistogramsDistance(distance_histograms, distance_histograms_size);
  195. BROTLI_DCHECK(mb->command_histograms == 0);
  196. mb->command_histograms_size = mb->command_split.num_types;
  197. mb->command_histograms =
  198. BROTLI_ALLOC(m, HistogramCommand, mb->command_histograms_size);
  199. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->command_histograms)) return;
  200. ClearHistogramsCommand(mb->command_histograms, mb->command_histograms_size);
  201. BrotliBuildHistogramsWithContext(cmds, num_commands,
  202. &mb->literal_split, &mb->command_split, &mb->distance_split,
  203. ringbuffer, pos, mask, prev_byte, prev_byte2, literal_context_modes,
  204. literal_histograms, mb->command_histograms, distance_histograms);
  205. BROTLI_FREE(m, literal_context_modes);
  206. BROTLI_DCHECK(mb->literal_context_map == 0);
  207. mb->literal_context_map_size =
  208. mb->literal_split.num_types << BROTLI_LITERAL_CONTEXT_BITS;
  209. mb->literal_context_map =
  210. BROTLI_ALLOC(m, uint32_t, mb->literal_context_map_size);
  211. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->literal_context_map)) return;
  212. BROTLI_DCHECK(mb->literal_histograms == 0);
  213. mb->literal_histograms_size = mb->literal_context_map_size;
  214. mb->literal_histograms =
  215. BROTLI_ALLOC(m, HistogramLiteral, mb->literal_histograms_size);
  216. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->literal_histograms)) return;
  217. BrotliClusterHistogramsLiteral(m, literal_histograms, literal_histograms_size,
  218. kMaxNumberOfHistograms, mb->literal_histograms,
  219. &mb->literal_histograms_size, mb->literal_context_map);
  220. if (BROTLI_IS_OOM(m)) return;
  221. BROTLI_FREE(m, literal_histograms);
  222. if (params->disable_literal_context_modeling) {
  223. /* Distribute assignment to all contexts. */
  224. for (i = mb->literal_split.num_types; i != 0;) {
  225. size_t j = 0;
  226. i--;
  227. for (; j < (1 << BROTLI_LITERAL_CONTEXT_BITS); j++) {
  228. mb->literal_context_map[(i << BROTLI_LITERAL_CONTEXT_BITS) + j] =
  229. mb->literal_context_map[i];
  230. }
  231. }
  232. }
  233. BROTLI_DCHECK(mb->distance_context_map == 0);
  234. mb->distance_context_map_size =
  235. mb->distance_split.num_types << BROTLI_DISTANCE_CONTEXT_BITS;
  236. mb->distance_context_map =
  237. BROTLI_ALLOC(m, uint32_t, mb->distance_context_map_size);
  238. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->distance_context_map)) return;
  239. BROTLI_DCHECK(mb->distance_histograms == 0);
  240. mb->distance_histograms_size = mb->distance_context_map_size;
  241. mb->distance_histograms =
  242. BROTLI_ALLOC(m, HistogramDistance, mb->distance_histograms_size);
  243. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->distance_histograms)) return;
  244. BrotliClusterHistogramsDistance(m, distance_histograms,
  245. mb->distance_context_map_size,
  246. kMaxNumberOfHistograms,
  247. mb->distance_histograms,
  248. &mb->distance_histograms_size,
  249. mb->distance_context_map);
  250. if (BROTLI_IS_OOM(m)) return;
  251. BROTLI_FREE(m, distance_histograms);
  252. }
  253. #define FN(X) X ## Literal
  254. #include "./metablock_inc.h" /* NOLINT(build/include) */
  255. #undef FN
  256. #define FN(X) X ## Command
  257. #include "./metablock_inc.h" /* NOLINT(build/include) */
  258. #undef FN
  259. #define FN(X) X ## Distance
  260. #include "./metablock_inc.h" /* NOLINT(build/include) */
  261. #undef FN
  262. #define BROTLI_MAX_STATIC_CONTEXTS 13
  263. /* Greedy block splitter for one block category (literal, command or distance).
  264. Gathers histograms for all context buckets. */
  265. typedef struct ContextBlockSplitter {
  266. /* Alphabet size of particular block category. */
  267. size_t alphabet_size_;
  268. size_t num_contexts_;
  269. size_t max_block_types_;
  270. /* We collect at least this many symbols for each block. */
  271. size_t min_block_size_;
  272. /* We merge histograms A and B if
  273. entropy(A+B) < entropy(A) + entropy(B) + split_threshold_,
  274. where A is the current histogram and B is the histogram of the last or the
  275. second last block type. */
  276. double split_threshold_;
  277. size_t num_blocks_;
  278. BlockSplit* split_; /* not owned */
  279. HistogramLiteral* histograms_; /* not owned */
  280. size_t* histograms_size_; /* not owned */
  281. /* The number of symbols that we want to collect before deciding on whether
  282. or not to merge the block with a previous one or emit a new block. */
  283. size_t target_block_size_;
  284. /* The number of symbols in the current histogram. */
  285. size_t block_size_;
  286. /* Offset of the current histogram. */
  287. size_t curr_histogram_ix_;
  288. /* Offset of the histograms of the previous two block types. */
  289. size_t last_histogram_ix_[2];
  290. /* Entropy of the previous two block types. */
  291. double last_entropy_[2 * BROTLI_MAX_STATIC_CONTEXTS];
  292. /* The number of times we merged the current block with the last one. */
  293. size_t merge_last_count_;
  294. } ContextBlockSplitter;
  295. static void InitContextBlockSplitter(
  296. MemoryManager* m, ContextBlockSplitter* self, size_t alphabet_size,
  297. size_t num_contexts, size_t min_block_size, double split_threshold,
  298. size_t num_symbols, BlockSplit* split, HistogramLiteral** histograms,
  299. size_t* histograms_size) {
  300. size_t max_num_blocks = num_symbols / min_block_size + 1;
  301. size_t max_num_types;
  302. BROTLI_DCHECK(num_contexts <= BROTLI_MAX_STATIC_CONTEXTS);
  303. self->alphabet_size_ = alphabet_size;
  304. self->num_contexts_ = num_contexts;
  305. self->max_block_types_ = BROTLI_MAX_NUMBER_OF_BLOCK_TYPES / num_contexts;
  306. self->min_block_size_ = min_block_size;
  307. self->split_threshold_ = split_threshold;
  308. self->num_blocks_ = 0;
  309. self->split_ = split;
  310. self->histograms_size_ = histograms_size;
  311. self->target_block_size_ = min_block_size;
  312. self->block_size_ = 0;
  313. self->curr_histogram_ix_ = 0;
  314. self->merge_last_count_ = 0;
  315. /* We have to allocate one more histogram than the maximum number of block
  316. types for the current histogram when the meta-block is too big. */
  317. max_num_types =
  318. BROTLI_MIN(size_t, max_num_blocks, self->max_block_types_ + 1);
  319. BROTLI_ENSURE_CAPACITY(m, uint8_t,
  320. split->types, split->types_alloc_size, max_num_blocks);
  321. BROTLI_ENSURE_CAPACITY(m, uint32_t,
  322. split->lengths, split->lengths_alloc_size, max_num_blocks);
  323. if (BROTLI_IS_OOM(m)) return;
  324. split->num_blocks = max_num_blocks;
  325. if (BROTLI_IS_OOM(m)) return;
  326. BROTLI_DCHECK(*histograms == 0);
  327. *histograms_size = max_num_types * num_contexts;
  328. *histograms = BROTLI_ALLOC(m, HistogramLiteral, *histograms_size);
  329. self->histograms_ = *histograms;
  330. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(*histograms)) return;
  331. /* Clear only current histogram. */
  332. ClearHistogramsLiteral(&self->histograms_[0], num_contexts);
  333. self->last_histogram_ix_[0] = self->last_histogram_ix_[1] = 0;
  334. }
  335. /* Does either of three things:
  336. (1) emits the current block with a new block type;
  337. (2) emits the current block with the type of the second last block;
  338. (3) merges the current block with the last block. */
  339. static void ContextBlockSplitterFinishBlock(
  340. ContextBlockSplitter* self, MemoryManager* m, BROTLI_BOOL is_final) {
  341. BlockSplit* split = self->split_;
  342. const size_t num_contexts = self->num_contexts_;
  343. double* last_entropy = self->last_entropy_;
  344. HistogramLiteral* histograms = self->histograms_;
  345. if (self->block_size_ < self->min_block_size_) {
  346. self->block_size_ = self->min_block_size_;
  347. }
  348. if (self->num_blocks_ == 0) {
  349. size_t i;
  350. /* Create first block. */
  351. split->lengths[0] = (uint32_t)self->block_size_;
  352. split->types[0] = 0;
  353. for (i = 0; i < num_contexts; ++i) {
  354. last_entropy[i] =
  355. BitsEntropy(histograms[i].data_, self->alphabet_size_);
  356. last_entropy[num_contexts + i] = last_entropy[i];
  357. }
  358. ++self->num_blocks_;
  359. ++split->num_types;
  360. self->curr_histogram_ix_ += num_contexts;
  361. if (self->curr_histogram_ix_ < *self->histograms_size_) {
  362. ClearHistogramsLiteral(
  363. &self->histograms_[self->curr_histogram_ix_], self->num_contexts_);
  364. }
  365. self->block_size_ = 0;
  366. } else if (self->block_size_ > 0) {
  367. /* Try merging the set of histograms for the current block type with the
  368. respective set of histograms for the last and second last block types.
  369. Decide over the split based on the total reduction of entropy across
  370. all contexts. */
  371. double entropy[BROTLI_MAX_STATIC_CONTEXTS];
  372. HistogramLiteral* combined_histo =
  373. BROTLI_ALLOC(m, HistogramLiteral, 2 * num_contexts);
  374. double combined_entropy[2 * BROTLI_MAX_STATIC_CONTEXTS];
  375. double diff[2] = { 0.0 };
  376. size_t i;
  377. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(combined_histo)) return;
  378. for (i = 0; i < num_contexts; ++i) {
  379. size_t curr_histo_ix = self->curr_histogram_ix_ + i;
  380. size_t j;
  381. entropy[i] = BitsEntropy(histograms[curr_histo_ix].data_,
  382. self->alphabet_size_);
  383. for (j = 0; j < 2; ++j) {
  384. size_t jx = j * num_contexts + i;
  385. size_t last_histogram_ix = self->last_histogram_ix_[j] + i;
  386. combined_histo[jx] = histograms[curr_histo_ix];
  387. HistogramAddHistogramLiteral(&combined_histo[jx],
  388. &histograms[last_histogram_ix]);
  389. combined_entropy[jx] = BitsEntropy(
  390. &combined_histo[jx].data_[0], self->alphabet_size_);
  391. diff[j] += combined_entropy[jx] - entropy[i] - last_entropy[jx];
  392. }
  393. }
  394. if (split->num_types < self->max_block_types_ &&
  395. diff[0] > self->split_threshold_ &&
  396. diff[1] > self->split_threshold_) {
  397. /* Create new block. */
  398. split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
  399. split->types[self->num_blocks_] = (uint8_t)split->num_types;
  400. self->last_histogram_ix_[1] = self->last_histogram_ix_[0];
  401. self->last_histogram_ix_[0] = split->num_types * num_contexts;
  402. for (i = 0; i < num_contexts; ++i) {
  403. last_entropy[num_contexts + i] = last_entropy[i];
  404. last_entropy[i] = entropy[i];
  405. }
  406. ++self->num_blocks_;
  407. ++split->num_types;
  408. self->curr_histogram_ix_ += num_contexts;
  409. if (self->curr_histogram_ix_ < *self->histograms_size_) {
  410. ClearHistogramsLiteral(
  411. &self->histograms_[self->curr_histogram_ix_], self->num_contexts_);
  412. }
  413. self->block_size_ = 0;
  414. self->merge_last_count_ = 0;
  415. self->target_block_size_ = self->min_block_size_;
  416. } else if (diff[1] < diff[0] - 20.0) {
  417. /* Combine this block with second last block. */
  418. split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
  419. split->types[self->num_blocks_] = split->types[self->num_blocks_ - 2];
  420. BROTLI_SWAP(size_t, self->last_histogram_ix_, 0, 1);
  421. for (i = 0; i < num_contexts; ++i) {
  422. histograms[self->last_histogram_ix_[0] + i] =
  423. combined_histo[num_contexts + i];
  424. last_entropy[num_contexts + i] = last_entropy[i];
  425. last_entropy[i] = combined_entropy[num_contexts + i];
  426. HistogramClearLiteral(&histograms[self->curr_histogram_ix_ + i]);
  427. }
  428. ++self->num_blocks_;
  429. self->block_size_ = 0;
  430. self->merge_last_count_ = 0;
  431. self->target_block_size_ = self->min_block_size_;
  432. } else {
  433. /* Combine this block with last block. */
  434. split->lengths[self->num_blocks_ - 1] += (uint32_t)self->block_size_;
  435. for (i = 0; i < num_contexts; ++i) {
  436. histograms[self->last_histogram_ix_[0] + i] = combined_histo[i];
  437. last_entropy[i] = combined_entropy[i];
  438. if (split->num_types == 1) {
  439. last_entropy[num_contexts + i] = last_entropy[i];
  440. }
  441. HistogramClearLiteral(&histograms[self->curr_histogram_ix_ + i]);
  442. }
  443. self->block_size_ = 0;
  444. if (++self->merge_last_count_ > 1) {
  445. self->target_block_size_ += self->min_block_size_;
  446. }
  447. }
  448. BROTLI_FREE(m, combined_histo);
  449. }
  450. if (is_final) {
  451. *self->histograms_size_ = split->num_types * num_contexts;
  452. split->num_blocks = self->num_blocks_;
  453. }
  454. }
  455. /* Adds the next symbol to the current block type and context. When the
  456. current block reaches the target size, decides on merging the block. */
  457. static void ContextBlockSplitterAddSymbol(
  458. ContextBlockSplitter* self, MemoryManager* m,
  459. size_t symbol, size_t context) {
  460. HistogramAddLiteral(&self->histograms_[self->curr_histogram_ix_ + context],
  461. symbol);
  462. ++self->block_size_;
  463. if (self->block_size_ == self->target_block_size_) {
  464. ContextBlockSplitterFinishBlock(self, m, /* is_final = */ BROTLI_FALSE);
  465. if (BROTLI_IS_OOM(m)) return;
  466. }
  467. }
  468. static void MapStaticContexts(MemoryManager* m,
  469. size_t num_contexts,
  470. const uint32_t* static_context_map,
  471. MetaBlockSplit* mb) {
  472. size_t i;
  473. BROTLI_DCHECK(mb->literal_context_map == 0);
  474. mb->literal_context_map_size =
  475. mb->literal_split.num_types << BROTLI_LITERAL_CONTEXT_BITS;
  476. mb->literal_context_map =
  477. BROTLI_ALLOC(m, uint32_t, mb->literal_context_map_size);
  478. if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->literal_context_map)) return;
  479. for (i = 0; i < mb->literal_split.num_types; ++i) {
  480. uint32_t offset = (uint32_t)(i * num_contexts);
  481. size_t j;
  482. for (j = 0; j < (1u << BROTLI_LITERAL_CONTEXT_BITS); ++j) {
  483. mb->literal_context_map[(i << BROTLI_LITERAL_CONTEXT_BITS) + j] =
  484. offset + static_context_map[j];
  485. }
  486. }
  487. }
  488. static BROTLI_INLINE void BrotliBuildMetaBlockGreedyInternal(
  489. MemoryManager* m, const uint8_t* ringbuffer, size_t pos, size_t mask,
  490. uint8_t prev_byte, uint8_t prev_byte2, ContextLut literal_context_lut,
  491. const size_t num_contexts, const uint32_t* static_context_map,
  492. const Command* commands, size_t n_commands, MetaBlockSplit* mb) {
  493. union {
  494. BlockSplitterLiteral plain;
  495. ContextBlockSplitter ctx;
  496. } lit_blocks;
  497. BlockSplitterCommand cmd_blocks;
  498. BlockSplitterDistance dist_blocks;
  499. size_t num_literals = 0;
  500. size_t i;
  501. for (i = 0; i < n_commands; ++i) {
  502. num_literals += commands[i].insert_len_;
  503. }
  504. if (num_contexts == 1) {
  505. InitBlockSplitterLiteral(m, &lit_blocks.plain, 256, 512, 400.0,
  506. num_literals, &mb->literal_split, &mb->literal_histograms,
  507. &mb->literal_histograms_size);
  508. } else {
  509. InitContextBlockSplitter(m, &lit_blocks.ctx, 256, num_contexts, 512, 400.0,
  510. num_literals, &mb->literal_split, &mb->literal_histograms,
  511. &mb->literal_histograms_size);
  512. }
  513. if (BROTLI_IS_OOM(m)) return;
  514. InitBlockSplitterCommand(m, &cmd_blocks, BROTLI_NUM_COMMAND_SYMBOLS, 1024,
  515. 500.0, n_commands, &mb->command_split, &mb->command_histograms,
  516. &mb->command_histograms_size);
  517. if (BROTLI_IS_OOM(m)) return;
  518. InitBlockSplitterDistance(m, &dist_blocks, 64, 512, 100.0, n_commands,
  519. &mb->distance_split, &mb->distance_histograms,
  520. &mb->distance_histograms_size);
  521. if (BROTLI_IS_OOM(m)) return;
  522. for (i = 0; i < n_commands; ++i) {
  523. const Command cmd = commands[i];
  524. size_t j;
  525. BlockSplitterAddSymbolCommand(&cmd_blocks, cmd.cmd_prefix_);
  526. for (j = cmd.insert_len_; j != 0; --j) {
  527. uint8_t literal = ringbuffer[pos & mask];
  528. if (num_contexts == 1) {
  529. BlockSplitterAddSymbolLiteral(&lit_blocks.plain, literal);
  530. } else {
  531. size_t context =
  532. BROTLI_CONTEXT(prev_byte, prev_byte2, literal_context_lut);
  533. ContextBlockSplitterAddSymbol(&lit_blocks.ctx, m, literal,
  534. static_context_map[context]);
  535. if (BROTLI_IS_OOM(m)) return;
  536. }
  537. prev_byte2 = prev_byte;
  538. prev_byte = literal;
  539. ++pos;
  540. }
  541. pos += CommandCopyLen(&cmd);
  542. if (CommandCopyLen(&cmd)) {
  543. prev_byte2 = ringbuffer[(pos - 2) & mask];
  544. prev_byte = ringbuffer[(pos - 1) & mask];
  545. if (cmd.cmd_prefix_ >= 128) {
  546. BlockSplitterAddSymbolDistance(&dist_blocks, cmd.dist_prefix_ & 0x3FF);
  547. }
  548. }
  549. }
  550. if (num_contexts == 1) {
  551. BlockSplitterFinishBlockLiteral(
  552. &lit_blocks.plain, /* is_final = */ BROTLI_TRUE);
  553. } else {
  554. ContextBlockSplitterFinishBlock(
  555. &lit_blocks.ctx, m, /* is_final = */ BROTLI_TRUE);
  556. if (BROTLI_IS_OOM(m)) return;
  557. }
  558. BlockSplitterFinishBlockCommand(&cmd_blocks, /* is_final = */ BROTLI_TRUE);
  559. BlockSplitterFinishBlockDistance(&dist_blocks, /* is_final = */ BROTLI_TRUE);
  560. if (num_contexts > 1) {
  561. MapStaticContexts(m, num_contexts, static_context_map, mb);
  562. }
  563. }
  564. void BrotliBuildMetaBlockGreedy(MemoryManager* m,
  565. const uint8_t* ringbuffer,
  566. size_t pos,
  567. size_t mask,
  568. uint8_t prev_byte,
  569. uint8_t prev_byte2,
  570. ContextLut literal_context_lut,
  571. size_t num_contexts,
  572. const uint32_t* static_context_map,
  573. const Command* commands,
  574. size_t n_commands,
  575. MetaBlockSplit* mb) {
  576. if (num_contexts == 1) {
  577. BrotliBuildMetaBlockGreedyInternal(m, ringbuffer, pos, mask, prev_byte,
  578. prev_byte2, literal_context_lut, 1, NULL, commands, n_commands, mb);
  579. } else {
  580. BrotliBuildMetaBlockGreedyInternal(m, ringbuffer, pos, mask, prev_byte,
  581. prev_byte2, literal_context_lut, num_contexts, static_context_map,
  582. commands, n_commands, mb);
  583. }
  584. }
  585. void BrotliOptimizeHistograms(uint32_t num_distance_codes,
  586. MetaBlockSplit* mb) {
  587. uint8_t good_for_rle[BROTLI_NUM_COMMAND_SYMBOLS];
  588. size_t i;
  589. for (i = 0; i < mb->literal_histograms_size; ++i) {
  590. BrotliOptimizeHuffmanCountsForRle(256, mb->literal_histograms[i].data_,
  591. good_for_rle);
  592. }
  593. for (i = 0; i < mb->command_histograms_size; ++i) {
  594. BrotliOptimizeHuffmanCountsForRle(BROTLI_NUM_COMMAND_SYMBOLS,
  595. mb->command_histograms[i].data_,
  596. good_for_rle);
  597. }
  598. for (i = 0; i < mb->distance_histograms_size; ++i) {
  599. BrotliOptimizeHuffmanCountsForRle(num_distance_codes,
  600. mb->distance_histograms[i].data_,
  601. good_for_rle);
  602. }
  603. }
  604. #if defined(__cplusplus) || defined(c_plusplus)
  605. } /* extern "C" */
  606. #endif