all repos — mgba @ b2d406a411b31acce5bbf0246af32a80c22ca834

mGBA Game Boy Advance Emulator

src/third-party/lzma/Bcj2Enc.c (view raw)

  1/* Bcj2Enc.c -- BCJ2 Encoder (Converter for x86 code)
  22019-02-02 : Igor Pavlov : Public domain */
  3
  4#include "Precomp.h"
  5
  6/* #define SHOW_STAT */
  7
  8#ifdef SHOW_STAT
  9#include <stdio.h>
 10#define PRF(x) x
 11#else
 12#define PRF(x)
 13#endif
 14
 15#include <string.h>
 16
 17#include "Bcj2.h"
 18#include "CpuArch.h"
 19
 20#define CProb UInt16
 21
 22#define kTopValue ((UInt32)1 << 24)
 23#define kNumModelBits 11
 24#define kBitModelTotal (1 << kNumModelBits)
 25#define kNumMoveBits 5
 26
 27void Bcj2Enc_Init(CBcj2Enc *p)
 28{
 29  unsigned i;
 30
 31  p->state = BCJ2_ENC_STATE_OK;
 32  p->finishMode = BCJ2_ENC_FINISH_MODE_CONTINUE;
 33
 34  p->prevByte = 0;
 35
 36  p->cache = 0;
 37  p->range = 0xFFFFFFFF;
 38  p->low = 0;
 39  p->cacheSize = 1;
 40
 41  p->ip = 0;
 42
 43  p->fileIp = 0;
 44  p->fileSize = 0;
 45  p->relatLimit = BCJ2_RELAT_LIMIT;
 46
 47  p->tempPos = 0;
 48
 49  p->flushPos = 0;
 50
 51  for (i = 0; i < sizeof(p->probs) / sizeof(p->probs[0]); i++)
 52    p->probs[i] = kBitModelTotal >> 1;
 53}
 54
 55static BoolInt MY_FAST_CALL RangeEnc_ShiftLow(CBcj2Enc *p)
 56{
 57  if ((UInt32)p->low < (UInt32)0xFF000000 || (UInt32)(p->low >> 32) != 0)
 58  {
 59    Byte *buf = p->bufs[BCJ2_STREAM_RC];
 60    do
 61    {
 62      if (buf == p->lims[BCJ2_STREAM_RC])
 63      {
 64        p->state = BCJ2_STREAM_RC;
 65        p->bufs[BCJ2_STREAM_RC] = buf;
 66        return True;
 67      }
 68      *buf++ = (Byte)(p->cache + (Byte)(p->low >> 32));
 69      p->cache = 0xFF;
 70    }
 71    while (--p->cacheSize);
 72    p->bufs[BCJ2_STREAM_RC] = buf;
 73    p->cache = (Byte)((UInt32)p->low >> 24);
 74  }
 75  p->cacheSize++;
 76  p->low = (UInt32)p->low << 8;
 77  return False;
 78}
 79
 80static void Bcj2Enc_Encode_2(CBcj2Enc *p)
 81{
 82  if (BCJ2_IS_32BIT_STREAM(p->state))
 83  {
 84    Byte *cur = p->bufs[p->state];
 85    if (cur == p->lims[p->state])
 86      return;
 87    SetBe32(cur, p->tempTarget);
 88    p->bufs[p->state] = cur + 4;
 89  }
 90
 91  p->state = BCJ2_ENC_STATE_ORIG;
 92
 93  for (;;)
 94  {
 95    if (p->range < kTopValue)
 96    {
 97      if (RangeEnc_ShiftLow(p))
 98        return;
 99      p->range <<= 8;
100    }
101
102    {
103      {
104        const Byte *src = p->src;
105        const Byte *srcLim;
106        Byte *dest;
107        SizeT num = p->srcLim - src;
108
109        if (p->finishMode == BCJ2_ENC_FINISH_MODE_CONTINUE)
110        {
111          if (num <= 4)
112            return;
113          num -= 4;
114        }
115        else if (num == 0)
116          break;
117
118        dest = p->bufs[BCJ2_STREAM_MAIN];
119        if (num > (SizeT)(p->lims[BCJ2_STREAM_MAIN] - dest))
120        {
121          num = p->lims[BCJ2_STREAM_MAIN] - dest;
122          if (num == 0)
123          {
124            p->state = BCJ2_STREAM_MAIN;
125            return;
126          }
127        }
128       
129        srcLim = src + num;
130
131        if (p->prevByte == 0x0F && (src[0] & 0xF0) == 0x80)
132          *dest = src[0];
133        else for (;;)
134        {
135          Byte b = *src;
136          *dest = b;
137          if (b != 0x0F)
138          {
139            if ((b & 0xFE) == 0xE8)
140              break;
141            dest++;
142            if (++src != srcLim)
143              continue;
144            break;
145          }
146          dest++;
147          if (++src == srcLim)
148            break;
149          if ((*src & 0xF0) != 0x80)
150            continue;
151          *dest = *src;
152          break;
153        }
154        
155        num = src - p->src;
156        
157        if (src == srcLim)
158        {
159          p->prevByte = src[-1];
160          p->bufs[BCJ2_STREAM_MAIN] = dest;
161          p->src = src;
162          p->ip += (UInt32)num;
163          continue;
164        }
165 
166        {
167          Byte context = (Byte)(num == 0 ? p->prevByte : src[-1]);
168          BoolInt needConvert;
169
170          p->bufs[BCJ2_STREAM_MAIN] = dest + 1;
171          p->ip += (UInt32)num + 1;
172          src++;
173          
174          needConvert = False;
175
176          if ((SizeT)(p->srcLim - src) >= 4)
177          {
178            UInt32 relatVal = GetUi32(src);
179            if ((p->fileSize == 0 || (UInt32)(p->ip + 4 + relatVal - p->fileIp) < p->fileSize)
180                && ((relatVal + p->relatLimit) >> 1) < p->relatLimit)
181              needConvert = True;
182          }
183
184          {
185            UInt32 bound;
186            unsigned ttt;
187            Byte b = src[-1];
188            CProb *prob = p->probs + (unsigned)(b == 0xE8 ? 2 + (unsigned)context : (b == 0xE9 ? 1 : 0));
189
190            ttt = *prob;
191            bound = (p->range >> kNumModelBits) * ttt;
192            
193            if (!needConvert)
194            {
195              p->range = bound;
196              *prob = (CProb)(ttt + ((kBitModelTotal - ttt) >> kNumMoveBits));
197              p->src = src;
198              p->prevByte = b;
199              continue;
200            }
201            
202            p->low += bound;
203            p->range -= bound;
204            *prob = (CProb)(ttt - (ttt >> kNumMoveBits));
205
206            {
207              UInt32 relatVal = GetUi32(src);
208              UInt32 absVal;
209              p->ip += 4;
210              absVal = p->ip + relatVal;
211              p->prevByte = src[3];
212              src += 4;
213              p->src = src;
214              {
215                unsigned cj = (b == 0xE8) ? BCJ2_STREAM_CALL : BCJ2_STREAM_JUMP;
216                Byte *cur = p->bufs[cj];
217                if (cur == p->lims[cj])
218                {
219                  p->state = cj;
220                  p->tempTarget = absVal;
221                  return;
222                }
223                SetBe32(cur, absVal);
224                p->bufs[cj] = cur + 4;
225              }
226            }
227          }
228        }
229      }
230    }
231  }
232
233  if (p->finishMode != BCJ2_ENC_FINISH_MODE_END_STREAM)
234    return;
235
236  for (; p->flushPos < 5; p->flushPos++)
237    if (RangeEnc_ShiftLow(p))
238      return;
239  p->state = BCJ2_ENC_STATE_OK;
240}
241
242
243void Bcj2Enc_Encode(CBcj2Enc *p)
244{
245  PRF(printf("\n"));
246  PRF(printf("---- ip = %8d   tempPos = %8d   src = %8d\n", p->ip, p->tempPos, p->srcLim - p->src));
247
248  if (p->tempPos != 0)
249  {
250    unsigned extra = 0;
251   
252    for (;;)
253    {
254      const Byte *src = p->src;
255      const Byte *srcLim = p->srcLim;
256      EBcj2Enc_FinishMode finishMode = p->finishMode;
257      
258      p->src = p->temp;
259      p->srcLim = p->temp + p->tempPos;
260      if (src != srcLim)
261        p->finishMode = BCJ2_ENC_FINISH_MODE_CONTINUE;
262      
263      PRF(printf("     ip = %8d   tempPos = %8d   src = %8d\n", p->ip, p->tempPos, p->srcLim - p->src));
264
265      Bcj2Enc_Encode_2(p);
266      
267      {
268        unsigned num = (unsigned)(p->src - p->temp);
269        unsigned tempPos = p->tempPos - num;
270        unsigned i;
271        p->tempPos = tempPos;
272        for (i = 0; i < tempPos; i++)
273          p->temp[i] = p->temp[(size_t)i + num];
274      
275        p->src = src;
276        p->srcLim = srcLim;
277        p->finishMode = finishMode;
278        
279        if (p->state != BCJ2_ENC_STATE_ORIG || src == srcLim)
280          return;
281        
282        if (extra >= tempPos)
283        {
284          p->src = src - tempPos;
285          p->tempPos = 0;
286          break;
287        }
288        
289        p->temp[tempPos] = src[0];
290        p->tempPos = tempPos + 1;
291        p->src = src + 1;
292        extra++;
293      }
294    }
295  }
296
297  PRF(printf("++++ ip = %8d   tempPos = %8d   src = %8d\n", p->ip, p->tempPos, p->srcLim - p->src));
298
299  Bcj2Enc_Encode_2(p);
300  
301  if (p->state == BCJ2_ENC_STATE_ORIG)
302  {
303    const Byte *src = p->src;
304    unsigned rem = (unsigned)(p->srcLim - src);
305    unsigned i;
306    for (i = 0; i < rem; i++)
307      p->temp[i] = src[i];
308    p->tempPos = rem;
309    p->src = src + rem;
310  }
311}