| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262 |
- // File: huffman_codes.cpp
- // See Copyright Notice and license at the end of include/lzham.h
- #include "lzham_core.h"
- #include "lzham_huffman_codes.h"
- namespace lzham
- {
- struct sym_freq
- {
- uint m_freq;
- uint16 m_left;
- uint16 m_right;
- inline bool operator< (const sym_freq& other) const
- {
- return m_freq > other.m_freq;
- }
- };
-
- static inline sym_freq* radix_sort_syms(uint num_syms, sym_freq* syms0, sym_freq* syms1)
- {
- const uint cMaxPasses = 2;
- uint hist[256 * cMaxPasses];
-
- memset(hist, 0, sizeof(hist[0]) * 256 * cMaxPasses);
- {
- sym_freq* p = syms0;
- sym_freq* q = syms0 + (num_syms >> 1) * 2;
- for ( ; p != q; p += 2)
- {
- const uint freq0 = p[0].m_freq;
- const uint freq1 = p[1].m_freq;
- hist[ freq0 & 0xFF]++;
- hist[256 + ((freq0 >> 8) & 0xFF)]++;
- hist[ freq1 & 0xFF]++;
- hist[256 + ((freq1 >> 8) & 0xFF)]++;
- }
-
- if (num_syms & 1)
- {
- const uint freq = p->m_freq;
- hist[ freq & 0xFF]++;
- hist[256 + ((freq >> 8) & 0xFF)]++;
- }
- }
-
- sym_freq* pCur_syms = syms0;
- sym_freq* pNew_syms = syms1;
-
- const uint total_passes = (hist[256] == num_syms) ? 1 : cMaxPasses;
- for (uint pass = 0; pass < total_passes; pass++)
- {
- const uint* pHist = &hist[pass << 8];
- uint offsets[256];
- uint cur_ofs = 0;
- for (uint i = 0; i < 256; i += 2)
- {
- offsets[i] = cur_ofs;
- cur_ofs += pHist[i];
- offsets[i+1] = cur_ofs;
- cur_ofs += pHist[i+1];
- }
- const uint pass_shift = pass << 3;
- sym_freq* p = pCur_syms;
- sym_freq* q = pCur_syms + (num_syms >> 1) * 2;
- for ( ; p != q; p += 2)
- {
- uint c0 = p[0].m_freq;
- uint c1 = p[1].m_freq;
-
- if (pass)
- {
- c0 >>= 8;
- c1 >>= 8;
- }
-
- c0 &= 0xFF;
- c1 &= 0xFF;
- if (c0 == c1)
- {
- uint dst_offset0 = offsets[c0];
- offsets[c0] = dst_offset0 + 2;
- pNew_syms[dst_offset0] = p[0];
- pNew_syms[dst_offset0 + 1] = p[1];
- }
- else
- {
- uint dst_offset0 = offsets[c0]++;
- uint dst_offset1 = offsets[c1]++;
- pNew_syms[dst_offset0] = p[0];
- pNew_syms[dst_offset1] = p[1];
- }
- }
- if (num_syms & 1)
- {
- uint c = ((p->m_freq) >> pass_shift) & 0xFF;
- uint dst_offset = offsets[c];
- offsets[c] = dst_offset + 1;
- pNew_syms[dst_offset] = *p;
- }
- sym_freq* t = pCur_syms;
- pCur_syms = pNew_syms;
- pNew_syms = t;
- }
- #if LZHAM_ASSERTS_ENABLED
- uint prev_freq = 0;
- for (uint i = 0; i < num_syms; i++)
- {
- LZHAM_ASSERT(!(pCur_syms[i].m_freq < prev_freq));
- prev_freq = pCur_syms[i].m_freq;
- }
- #endif
-
- return pCur_syms;
- }
-
- struct huffman_work_tables
- {
- enum { cMaxInternalNodes = cHuffmanMaxSupportedSyms };
-
- sym_freq syms0[cHuffmanMaxSupportedSyms + 1 + cMaxInternalNodes];
- sym_freq syms1[cHuffmanMaxSupportedSyms + 1 + cMaxInternalNodes];
- #if !USE_CALCULATE_MINIMUM_REDUNDANCY
- uint16 queue[cMaxInternalNodes];
- #endif
- };
-
- uint get_generate_huffman_codes_table_size()
- {
- return sizeof(huffman_work_tables);
- }
- // calculate_minimum_redundancy() written by Alistair Moffat, [email protected], Jyrki Katajainen, [email protected] November 1996.
- static void calculate_minimum_redundancy(int A[], int n)
- {
- int root; /* next root node to be used */
- int leaf; /* next leaf to be used */
- int next; /* next value to be assigned */
- int avbl; /* number of available nodes */
- int used; /* number of internal nodes */
- int dpth; /* current depth of leaves */
- /* check for pathological cases */
- if (n==0) { return; }
- if (n==1) { A[0] = 0; return; }
- /* first pass, left to right, setting parent pointers */
- A[0] += A[1]; root = 0; leaf = 2;
- for (next=1; next < n-1; next++) {
- /* select first item for a pairing */
- if (leaf>=n || A[root]<A[leaf]) {
- A[next] = A[root]; A[root++] = next;
- } else
- A[next] = A[leaf++];
- /* add on the second item */
- if (leaf>=n || (root<next && A[root]<A[leaf])) {
- A[next] += A[root]; A[root++] = next;
- } else
- A[next] += A[leaf++];
- }
- /* second pass, right to left, setting internal depths */
- A[n-2] = 0;
- for (next=n-3; next>=0; next--)
- A[next] = A[A[next]]+1;
- /* third pass, right to left, setting leaf depths */
- avbl = 1; used = dpth = 0; root = n-2; next = n-1;
- while (avbl>0) {
- while (root>=0 && A[root]==dpth) {
- used++; root--;
- }
- while (avbl>used) {
- A[next--] = dpth; avbl--;
- }
- avbl = 2*used; dpth++; used = 0;
- }
- }
- bool generate_huffman_codes(void* pContext, uint num_syms, const uint16* pFreq, uint8* pCodesizes, uint& max_code_size, uint& total_freq_ret)
- {
- if ((!num_syms) || (num_syms > cHuffmanMaxSupportedSyms))
- return false;
-
- huffman_work_tables& state = *static_cast<huffman_work_tables*>(pContext);;
-
- uint max_freq = 0;
- uint total_freq = 0;
-
- uint num_used_syms = 0;
- for (uint i = 0; i < num_syms; i++)
- {
- uint freq = pFreq[i];
-
- if (!freq)
- pCodesizes[i] = 0;
- else
- {
- total_freq += freq;
- max_freq = math::maximum(max_freq, freq);
-
- sym_freq& sf = state.syms0[num_used_syms];
- sf.m_left = (uint16)i;
- sf.m_right = UINT16_MAX;
- sf.m_freq = freq;
- num_used_syms++;
- }
- }
-
- total_freq_ret = total_freq;
- if (num_used_syms == 1)
- {
- pCodesizes[state.syms0[0].m_left] = 1;
- return true;
- }
- sym_freq* syms = radix_sort_syms(num_used_syms, state.syms0, state.syms1);
-
- int x[cHuffmanMaxSupportedSyms];
- for (uint i = 0; i < num_used_syms; i++)
- x[i] = syms[i].m_freq;
-
- calculate_minimum_redundancy(x, num_used_syms);
-
- uint max_len = 0;
- for (uint i = 0; i < num_used_syms; i++)
- {
- uint len = x[i];
- max_len = math::maximum(len, max_len);
- pCodesizes[syms[i].m_left] = static_cast<uint8>(len);
- }
- max_code_size = max_len;
-
- return true;
- }
- } // namespace lzham
|