all repos — mgba @ b1d915abbc8924613bea12ae37e3a39d35d8c08f

mGBA Game Boy Advance Emulator

src/third-party/lzma/Bcj2Enc.c (view raw)

  1/* Bcj2Enc.c -- BCJ2 Encoder (Converter for x86 code)
  22014-11-10 : Igor Pavlov : Public domain */
  3
  4#include "Precomp.h"
  5
  6/* #define SHOW_STAT */
  7
  8#ifdef SHOW_STAT
  9#include <stdio.h>
 10#define PRF(x) x
 11#else
 12#define PRF(x)
 13#endif
 14
 15#include <windows.h>
 16#include <string.h>
 17
 18#include "Bcj2.h"
 19#include "CpuArch.h"
 20
 21#define CProb UInt16
 22
 23#define kTopValue ((UInt32)1 << 24)
 24#define kNumModelBits 11
 25#define kBitModelTotal (1 << kNumModelBits)
 26#define kNumMoveBits 5
 27
 28void Bcj2Enc_Init(CBcj2Enc *p)
 29{
 30  unsigned i;
 31
 32  p->state = BCJ2_ENC_STATE_OK;
 33  p->finishMode = BCJ2_ENC_FINISH_MODE_CONTINUE;
 34
 35  p->prevByte = 0;
 36
 37  p->cache = 0;
 38  p->range = 0xFFFFFFFF;
 39  p->low = 0;
 40  p->cacheSize = 1;
 41
 42  p->ip = 0;
 43
 44  p->fileIp = 0;
 45  p->fileSize = 0;
 46  p->relatLimit = BCJ2_RELAT_LIMIT;
 47
 48  p->tempPos = 0;
 49
 50  p->flushPos = 0;
 51
 52  for (i = 0; i < sizeof(p->probs) / sizeof(p->probs[0]); i++)
 53    p->probs[i] = kBitModelTotal >> 1;
 54}
 55
 56static Bool MY_FAST_CALL RangeEnc_ShiftLow(CBcj2Enc *p)
 57{
 58  if ((UInt32)p->low < (UInt32)0xFF000000 || (UInt32)(p->low >> 32) != 0)
 59  {
 60    Byte *buf = p->bufs[BCJ2_STREAM_RC];
 61    do
 62    {
 63      if (buf == p->lims[BCJ2_STREAM_RC])
 64      {
 65        p->state = BCJ2_STREAM_RC;
 66        p->bufs[BCJ2_STREAM_RC] = buf;
 67        return True;
 68      }
 69      *buf++ = (Byte)(p->cache + (Byte)(p->low >> 32));
 70      p->cache = 0xFF;
 71    }
 72    while (--p->cacheSize);
 73    p->bufs[BCJ2_STREAM_RC] = buf;
 74    p->cache = (Byte)((UInt32)p->low >> 24);
 75  }
 76  p->cacheSize++;
 77  p->low = (UInt32)p->low << 8;
 78  return False;
 79}
 80
 81static void Bcj2Enc_Encode_2(CBcj2Enc *p)
 82{
 83  if (BCJ2_IS_32BIT_STREAM(p->state))
 84  {
 85    Byte *cur = p->bufs[p->state];
 86    if (cur == p->lims[p->state])
 87      return;
 88    SetBe32(cur, p->tempTarget);
 89    p->bufs[p->state] = cur + 4;
 90  }
 91
 92  p->state = BCJ2_ENC_STATE_ORIG;
 93
 94  for (;;)
 95  {
 96    if (p->range < kTopValue)
 97    {
 98      if (RangeEnc_ShiftLow(p))
 99        return;
100      p->range <<= 8;
101    }
102
103    {
104      {
105        const Byte *src = p->src;
106        const Byte *srcLim;
107        Byte *dest;
108        SizeT num = p->srcLim - src;
109
110        if (p->finishMode == BCJ2_ENC_FINISH_MODE_CONTINUE)
111        {
112          if (num <= 4)
113            return;
114          num -= 4;
115        }
116        else if (num == 0)
117          break;
118
119        dest = p->bufs[BCJ2_STREAM_MAIN];
120        if (num > (SizeT)(p->lims[BCJ2_STREAM_MAIN] - dest))
121        {
122          num = p->lims[BCJ2_STREAM_MAIN] - dest;
123          if (num == 0)
124          {
125            p->state = BCJ2_STREAM_MAIN;
126            return;
127          }
128        }
129       
130        srcLim = src + num;
131
132        if (p->prevByte == 0x0F && (src[0] & 0xF0) == 0x80)
133          *dest = src[0];
134        else for (;;)
135        {
136          Byte b = *src;
137          *dest = b;
138          if (b != 0x0F)
139          {
140            if ((b & 0xFE) == 0xE8)
141              break;
142            dest++;
143            if (++src != srcLim)
144              continue;
145            break;
146          }
147          dest++;
148          if (++src == srcLim)
149            break;
150          if ((*src & 0xF0) != 0x80)
151            continue;
152          *dest = *src;
153          break;
154        }
155        
156        num = src - p->src;
157        
158        if (src == srcLim)
159        {
160          p->prevByte = src[-1];
161          p->bufs[BCJ2_STREAM_MAIN] = dest;
162          p->src = src;
163          p->ip += (UInt32)num;
164          continue;
165        }
166 
167        {
168          Byte context = (Byte)(num == 0 ? p->prevByte : src[-1]);
169          Bool needConvert;
170
171          p->bufs[BCJ2_STREAM_MAIN] = dest + 1;
172          p->ip += (UInt32)num + 1;
173          src++;
174          
175          needConvert = False;
176
177          if ((SizeT)(p->srcLim - src) >= 4)
178          {
179            UInt32 relatVal = GetUi32(src);
180            if ((p->fileSize == 0 || (UInt32)(p->ip + 4 + relatVal - p->fileIp) < p->fileSize)
181                && ((relatVal + p->relatLimit) >> 1) < p->relatLimit)
182              needConvert = True;
183          }
184
185          {
186            UInt32 bound;
187            unsigned ttt;
188            Byte b = src[-1];
189            CProb *prob = p->probs + (unsigned)(b == 0xE8 ? 2 + (unsigned)context : (b == 0xE9 ? 1 : 0));
190
191            ttt = *prob;
192            bound = (p->range >> kNumModelBits) * ttt;
193            
194            if (!needConvert)
195            {
196              p->range = bound;
197              *prob = (CProb)(ttt + ((kBitModelTotal - ttt) >> kNumMoveBits));
198              p->src = src;
199              p->prevByte = b;
200              continue;
201            }
202            
203            p->low += bound;
204            p->range -= bound;
205            *prob = (CProb)(ttt - (ttt >> kNumMoveBits));
206
207            {
208              UInt32 relatVal = GetUi32(src);
209              UInt32 absVal;
210              p->ip += 4;
211              absVal = p->ip + relatVal;
212              p->prevByte = src[3];
213              src += 4;
214              p->src = src;
215              {
216                unsigned cj = (b == 0xE8) ? BCJ2_STREAM_CALL : BCJ2_STREAM_JUMP;
217                Byte *cur = p->bufs[cj];
218                if (cur == p->lims[cj])
219                {
220                  p->state = cj;
221                  p->tempTarget = absVal;
222                  return;
223                }
224                SetBe32(cur, absVal);
225                p->bufs[cj] = cur + 4;
226              }
227            }
228          }
229        }
230      }
231    }
232  }
233
234  if (p->finishMode != BCJ2_ENC_FINISH_MODE_END_STREAM)
235    return;
236
237  for (; p->flushPos < 5; p->flushPos++)
238    if (RangeEnc_ShiftLow(p))
239      return;
240  p->state = BCJ2_ENC_STATE_OK;
241}
242
243
244void Bcj2Enc_Encode(CBcj2Enc *p)
245{
246  PRF(printf("\n"));
247  PRF(printf("---- ip = %8d   tempPos = %8d   src = %8d\n", p->ip, p->tempPos, p->srcLim - p->src));
248
249  if (p->tempPos != 0)
250  {
251    unsigned extra = 0;
252   
253    for (;;)
254    {
255      const Byte *src = p->src;
256      const Byte *srcLim = p->srcLim;
257      unsigned finishMode = p->finishMode;
258      
259      p->src = p->temp;
260      p->srcLim = p->temp + p->tempPos;
261      if (src != srcLim)
262        p->finishMode = BCJ2_ENC_FINISH_MODE_CONTINUE;
263      
264      PRF(printf("     ip = %8d   tempPos = %8d   src = %8d\n", p->ip, p->tempPos, p->srcLim - p->src));
265
266      Bcj2Enc_Encode_2(p);
267      
268      {
269        unsigned num = (unsigned)(p->src - p->temp);
270        unsigned tempPos = p->tempPos - num;
271        unsigned i;
272        p->tempPos = tempPos;
273        for (i = 0; i < tempPos; i++)
274          p->temp[i] = p->temp[i + num];
275      
276        p->src = src;
277        p->srcLim = srcLim;
278        p->finishMode = finishMode;
279        
280        if (p->state != BCJ2_ENC_STATE_ORIG || src == srcLim)
281          return;
282        
283        if (extra >= tempPos)
284        {
285          p->src = src - tempPos;
286          p->tempPos = 0;
287          break;
288        }
289        
290        p->temp[tempPos] = src[0];
291        p->tempPos = tempPos + 1;
292        p->src = src + 1;
293        extra++;
294      }
295    }
296  }
297
298  PRF(printf("++++ ip = %8d   tempPos = %8d   src = %8d\n", p->ip, p->tempPos, p->srcLim - p->src));
299
300  Bcj2Enc_Encode_2(p);
301  
302  if (p->state == BCJ2_ENC_STATE_ORIG)
303  {
304    const Byte *src = p->src;
305    unsigned rem = (unsigned)(p->srcLim - src);
306    unsigned i;
307    for (i = 0; i < rem; i++)
308      p->temp[i] = src[i];
309    p->tempPos = rem;
310    p->src = src + rem;
311  }
312}