187 lines
4.7 KiB
C
187 lines
4.7 KiB
C
#include <stdlib.h>
|
|
#include <stdint.h>
|
|
#include <string.h>
|
|
|
|
uint32_t RabinKarp(uint8_t*, int, int, uint32_t*);
|
|
uint32_t findBest(uint8_t*, int, int, uint32_t*, uint32_t*, uint32_t*, uint8_t*);
|
|
int yaz0_internal(uint8_t*, int, uint8_t*);
|
|
void yaz0_encode(uint8_t*, int, uint8_t*, int*);
|
|
|
|
uint32_t RabinKarp(uint8_t* src, int srcSize, int srcPos, uint32_t* matchPos)
|
|
{
|
|
int startPos, smp, i;
|
|
uint32_t hash, curHash, curSize;
|
|
uint32_t bestSize, bestPos;
|
|
|
|
smp = srcSize - srcPos;
|
|
startPos = srcPos - 0x1000;
|
|
bestPos = bestSize = 0;
|
|
|
|
/* If available size is too small, return */
|
|
if(smp < 3)
|
|
return(0);
|
|
|
|
/* If available size is too big, reduce it */
|
|
if(smp > 0x111)
|
|
smp = 0x111;
|
|
|
|
/* If start position is negative, make it 0 */
|
|
if(startPos < 0)
|
|
startPos = 0;
|
|
|
|
/* Generate "hash" by converting to an int */
|
|
hash = bSwap32(*(int*)(src + srcPos));
|
|
hash = hash >> 8;
|
|
curHash = bSwap32(*(int*)(src + startPos));
|
|
curHash = curHash >> 8;
|
|
|
|
/* Search through data */
|
|
for(i = startPos; i < srcPos; i++)
|
|
{
|
|
/* If 3 bytes match, check for more */
|
|
if(curHash == hash)
|
|
{
|
|
for(curSize = 3; curSize < smp; curSize++)
|
|
if(src[i + curSize] != src[srcPos + curSize])
|
|
break;
|
|
|
|
/* Uodate best if needed */
|
|
if(curSize > bestSize)
|
|
{
|
|
bestSize = curSize;
|
|
bestPos = i;
|
|
if(bestSize == 0x111)
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* Scoot over 1 byte */
|
|
curHash = (curHash << 8 | src[i + 3]) & 0x00FFFFFF;
|
|
}
|
|
|
|
/* Set match position, return the size of the match */
|
|
*matchPos = bestPos;
|
|
return(bestSize);
|
|
}
|
|
|
|
uint32_t findBest(uint8_t* src, int srcSize, int srcPos, uint32_t* matchPos, uint32_t* pMatch, uint32_t* pSize, uint8_t* pFlag)
|
|
{
|
|
int rv;
|
|
|
|
/* Check to see if this location was found by a look-ahead */
|
|
if(*pFlag == 1)
|
|
{
|
|
*pFlag = 0;
|
|
return(*pSize);
|
|
}
|
|
|
|
/* Find best match */
|
|
*pFlag = 0;
|
|
rv = RabinKarp(src, srcSize, srcPos, matchPos);
|
|
|
|
/* Look-ahead */
|
|
if(rv >= 3)
|
|
{
|
|
/* Find best match if current one were to be a 1 byte copy */
|
|
*pSize = RabinKarp(src, srcSize, srcPos+1, pMatch);
|
|
if(*pSize >= rv+2)
|
|
{
|
|
rv = *pFlag = 1;
|
|
*matchPos = *pMatch;
|
|
}
|
|
}
|
|
|
|
return(rv);
|
|
}
|
|
|
|
int yaz0_internal(uint8_t* src, int srcSize, uint8_t* dst)
|
|
{
|
|
int dstPos, srcPos, codeBytePos;
|
|
uint32_t numBytes, matchPos, dist, pMatch, pSize;
|
|
uint8_t codeByte, bitmask, pFlag;
|
|
|
|
srcPos = codeBytePos = 0;
|
|
dstPos = codeBytePos + 1;
|
|
bitmask = 0x80;
|
|
codeByte = pFlag = 0;
|
|
|
|
/* Go through all of src */
|
|
while(srcPos < srcSize)
|
|
{
|
|
/* Try to find matching bytes for compressing */
|
|
numBytes = findBest(src, srcSize, srcPos, &matchPos, &pMatch, &pSize, &pFlag);
|
|
|
|
/* Single byte copy */
|
|
if(numBytes < 3)
|
|
{
|
|
dst[dstPos++] = src[srcPos++];
|
|
codeByte |= bitmask;
|
|
}
|
|
|
|
/* Three byte encoding */
|
|
else if (numBytes > 0x11)
|
|
{
|
|
dist = srcPos - matchPos - 1;
|
|
|
|
/* Copy over 0R RR */
|
|
dst[dstPos++] = dist >> 8;
|
|
dst[dstPos++] = dist & 0xFF;
|
|
|
|
/* Reduce N if needed, copy over NN */
|
|
if(numBytes > 0x111)
|
|
numBytes = 0x111;
|
|
dst[dstPos++] = (numBytes - 0x12) & 0xFF;
|
|
|
|
srcPos += numBytes;
|
|
}
|
|
|
|
/* Two byte encoding */
|
|
else
|
|
{
|
|
dist = srcPos - matchPos - 1;
|
|
|
|
/* Copy over NR RR */
|
|
dst[dstPos++] = ((numBytes - 2) << 4) | (dist >> 8);
|
|
dst[dstPos++] = dist & 0xFF;
|
|
|
|
srcPos += numBytes;
|
|
}
|
|
|
|
/* Move bitmask to next byte */
|
|
bitmask = bitmask >> 1;
|
|
|
|
/* If all 8 bytes were used, write and move to the next one */
|
|
if(bitmask == 0)
|
|
{
|
|
dst[codeBytePos] = codeByte;
|
|
codeBytePos = dstPos;
|
|
if(srcPos < srcSize)
|
|
dstPos++;
|
|
codeByte = 0;
|
|
bitmask = 0x80;
|
|
}
|
|
}
|
|
|
|
/* Copy over last byte if it hasn't already */
|
|
if(bitmask != 0)
|
|
dst[codeBytePos] = codeByte;
|
|
|
|
/* Return size of dst */
|
|
return(dstPos);
|
|
}
|
|
|
|
void yaz0_encode(uint8_t* src, int srcSize, uint8_t* dst, int* dstSize)
|
|
{
|
|
int temp;
|
|
|
|
/* Write Yaz0 header */
|
|
temp = bSwap32(srcSize);
|
|
memcpy(dst, "Yaz0", 4);
|
|
memcpy(dst + 4, &temp, 4);
|
|
|
|
/* Encode, adjust dstSize */
|
|
temp = yaz0_internal(src, srcSize, dst + 16);
|
|
*dstSize = (temp + 31) & -16;
|
|
return;
|
|
}
|