DynamicHuffmanDecoder.hpp 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226
  1. /* Copyright (C) Teemu Suutari */
  2. #ifndef DYNAMICHUFFMANDECODER_HPP
  3. #define DYNAMICHUFFMANDECODER_HPP
  4. #include <cstddef>
  5. #include <cstdint>
  6. // For exception
  7. #include "Decompressor.hpp"
  8. namespace ancient::internal
  9. {
  10. template<uint32_t maxCount>
  11. class DynamicHuffmanDecoder
  12. {
  13. public:
  14. DynamicHuffmanDecoder(uint32_t initialCount=maxCount) :
  15. _initialCount(initialCount)
  16. {
  17. if (_initialCount>maxCount) throw Decompressor::DecompressionError();
  18. reset();
  19. }
  20. ~DynamicHuffmanDecoder()
  21. {
  22. // nothing needed
  23. }
  24. void reset()
  25. {
  26. _count=_initialCount;
  27. if (!_count) return;
  28. for (uint32_t i=0;i<_count;i++)
  29. {
  30. _nodes[i].frequency=1;
  31. _nodes[i].index=i+(maxCount-_count)*2;
  32. _nodes[i].parent=maxCount*2-_count+(i>>1);
  33. _nodes[i].leaves[0]=0;
  34. _nodes[i].leaves[1]=0;
  35. _codeMap[i+(maxCount-_count)*2]=i;
  36. }
  37. for (uint32_t i=maxCount*2-_count,j=0;i<maxCount*2-1;i++,j+=2)
  38. {
  39. uint32_t l=(j>=_count)?j+(maxCount-_count)*2:j;
  40. uint32_t r=(j+1>=_count)?j+1+(maxCount-_count)*2:(j+1);
  41. _nodes[i].frequency=_nodes[l].frequency+_nodes[r].frequency;
  42. _nodes[i].index=i;
  43. _nodes[i].parent=maxCount+(i>>1);
  44. _nodes[i].leaves[0]=l;
  45. _nodes[i].leaves[1]=r;
  46. _codeMap[i]=i;
  47. }
  48. }
  49. template<typename F>
  50. uint32_t decode(F bitReader) const
  51. {
  52. if (!_count) throw Decompressor::DecompressionError();
  53. if (_count==1) return 0;
  54. uint32_t code=maxCount*2-2;
  55. while (code>=maxCount)
  56. code=_nodes[code].leaves[bitReader()?1:0];
  57. return code;
  58. }
  59. void update(uint32_t code)
  60. {
  61. if (code>=_count) throw Decompressor::DecompressionError();
  62. // this is a bug in LH2. Nobody else uses this codepath, so we can let it be...
  63. if (_count==1)
  64. {
  65. _nodes[0].frequency=1;
  66. return;
  67. }
  68. while (code!=maxCount*2-2)
  69. {
  70. _nodes[code].frequency++;
  71. uint32_t index=_nodes[code].index;
  72. uint32_t destIndex=index;
  73. uint32_t freq=_nodes[code].frequency;
  74. while (destIndex!=maxCount*2-2 && freq>_nodes[_codeMap[destIndex+1]].frequency) destIndex++;
  75. if (index!=destIndex)
  76. {
  77. auto getParentLeaf=[&](uint32_t currentCode)->uint32_t&
  78. {
  79. Node &parent=_nodes[_nodes[currentCode].parent];
  80. return parent.leaves[(parent.leaves[0]==currentCode)?0:1];
  81. };
  82. uint32_t destCode=_codeMap[destIndex];
  83. std::swap(_nodes[code].index,_nodes[destCode].index);
  84. std::swap(_codeMap[index],_codeMap[destIndex]);
  85. std::swap(getParentLeaf(code),getParentLeaf(destCode));
  86. std::swap(_nodes[code].parent,_nodes[destCode].parent);
  87. }
  88. code=_nodes[code].parent;
  89. }
  90. _nodes[code].frequency++;
  91. }
  92. // halve the frequencies rounding upwards
  93. void halve()
  94. {
  95. if (!_count) return;
  96. else if (_count==1)
  97. {
  98. _nodes[0].frequency=(_nodes[0].frequency+1)>>1;
  99. return;
  100. }
  101. for (uint32_t i=(maxCount-_count)*2,j=(maxCount-_count)*2;i<maxCount*2-1&&j<maxCount*2-_count;i++)
  102. if (_codeMap[i]<maxCount) _nodes[_codeMap[i]].index=j++;
  103. for (uint32_t i=0;i<_count;i++)
  104. {
  105. _nodes[i].frequency=(_nodes[i].frequency+1)>>1;
  106. _nodes[i].parent=maxCount+(_nodes[i].index>>1);
  107. _codeMap[_nodes[i].index]=i;
  108. }
  109. for (uint32_t i=maxCount*2-_count,j=(maxCount-_count)*2;i<maxCount*2-1;i++,j+=2)
  110. {
  111. uint32_t l=_codeMap[j];
  112. uint32_t r=_codeMap[j+1];
  113. uint32_t freq=_nodes[l].frequency+_nodes[r].frequency;
  114. _nodes[i].frequency=freq;
  115. _nodes[i].index=i;
  116. _nodes[i].parent=maxCount+(i>>1);
  117. _nodes[i].leaves[0]=l;
  118. _nodes[i].leaves[1]=r;
  119. _codeMap[i]=i;
  120. for (uint32_t k=i;freq<_nodes[_codeMap[k-1]].frequency;k--)
  121. {
  122. uint32_t &code=_codeMap[k];
  123. uint32_t &destCode=_codeMap[k-1];
  124. std::swap(_nodes[code].index,_nodes[destCode].index);
  125. std::swap(_nodes[code].parent,_nodes[destCode].parent);
  126. std::swap(code,destCode);
  127. }
  128. }
  129. }
  130. // Defined as in LH2
  131. void addCode()
  132. {
  133. if (_count>=maxCount) throw Decompressor::DecompressionError();
  134. uint32_t newIndex=(maxCount-_count-1)*2;
  135. if (!_count)
  136. {
  137. _nodes[0].frequency=0;
  138. _nodes[0].index=newIndex-1;
  139. _nodes[0].parent=maxCount*2-2;
  140. _nodes[0].leaves[0]=0;
  141. _nodes[0].leaves[1]=0;
  142. _codeMap[newIndex-1]=0;
  143. _count++;
  144. } else {
  145. _nodes[_count].frequency=0;
  146. _nodes[_count].index=newIndex;
  147. _nodes[_count].parent=maxCount*2-_count-1;
  148. _nodes[_count].leaves[0]=0;
  149. _nodes[_count].leaves[1]=0;
  150. _codeMap[newIndex]=_count;
  151. uint32_t insertIndex=newIndex+2;
  152. uint32_t repNode;
  153. uint32_t parentNode;
  154. uint32_t insertNode=maxCount*2-_count-1;
  155. if (_count>1)
  156. {
  157. _codeMap[insertIndex-1]=_codeMap[insertIndex];
  158. _nodes[_codeMap[insertIndex-1]].index--;
  159. repNode=_codeMap[(maxCount-_count)*2];
  160. parentNode=_nodes[repNode].parent;
  161. _nodes[parentNode].leaves[(_nodes[parentNode].leaves[0]==repNode)?0:1]=insertNode;
  162. _nodes[repNode].parent=insertNode;
  163. } else {
  164. repNode=0;
  165. parentNode=maxCount*2-1;
  166. }
  167. _nodes[insertNode].frequency=_nodes[repNode].frequency;
  168. _nodes[insertNode].index=insertIndex;
  169. _nodes[insertNode].parent=parentNode;
  170. _nodes[insertNode].leaves[0]=_count;
  171. _nodes[insertNode].leaves[1]=repNode;
  172. _codeMap[insertIndex]=insertNode;
  173. Node &parent=_nodes[parentNode];
  174. if (_count>1 && _nodes[parent.leaves[0]].index>_nodes[parent.leaves[1]].index)
  175. std::swap(parent.leaves[0],parent.leaves[1]);
  176. _count++;
  177. }
  178. }
  179. uint32_t getMaxFrequency() const
  180. {
  181. return _nodes[maxCount*2-2].frequency;
  182. }
  183. private:
  184. struct Node
  185. {
  186. uint32_t frequency;
  187. uint32_t index;
  188. uint32_t parent;
  189. uint32_t leaves[2];
  190. };
  191. uint32_t _initialCount;
  192. uint32_t _count;
  193. Node _nodes[maxCount*2-1];
  194. uint32_t _codeMap[maxCount*2-1];
  195. };
  196. }
  197. #endif