123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693 |
- #include "stdafx.h"
- #include "Lzari.h"
- LZARI::LZARI()
- {
- infile = NULL;
- outfile = NULL;
- textsize = 0;
- codesize = 0;
- printcount = 0;
- low = 0;
- high = Q4;
- value = 0;
- shifts = 0;
-
- m_bMem = FALSE;
- m_pInBuffer = NULL;
- m_nInLength = 0;
- m_nInCur = 0;
-
- m_nOutLength = 0;
- buffer_putbit = 0;
- mask_putbit = 128;
- buffer_getbit = 0;
- mask_getbit = 0;
- }
- LZARI::~LZARI()
- {
- Release();
- }
- void LZARI::Error(char *message)
- {
- #ifdef _OUTPUT_STATUS
- printf("\n%s\n", message);
- #endif
-
- int e = 1;
- throw e;
- }
- void LZARI::PutBit(int bit)
- {
- if (bit) buffer_putbit |= mask_putbit;
- if ((mask_putbit >>= 1) == 0)
- {
- if (!m_bMem)
- {
- if (putc(buffer_putbit, outfile) == EOF) Error("Write Error");
- }
- else
- {
-
-
- m_OutBuffer.push_back(buffer_putbit);
-
- }
- buffer_putbit = 0;
- mask_putbit = 128;
- codesize++;
- }
- }
- void LZARI::FlushBitBuffer(void)
- {
- int i;
-
- for (i = 0; i < 7; i++) PutBit(0);
- }
- int LZARI::GetBit(void)
- {
- if ((mask_getbit >>= 1) == 0)
- {
- if (!m_bMem)
- buffer_getbit = getc(infile);
- else
- buffer_getbit = m_pInBuffer[m_nInCur++];
- mask_getbit = 128;
- }
- return ((buffer_getbit & mask_getbit) != 0);
- }
- void LZARI::InitTree(void)
- {
- int i;
-
- for (i = N + 1; i <= N + 256; i++) rson[i] = NIL;
- for (i = 0; i < N; i++) dad[i] = NIL;
- }
- void LZARI::InsertNode(int r)
-
- {
- int i, p, cmp, temp;
- unsigned char *key;
- cmp = 1; key = &text_buf[r]; p = N + 1 + key[0];
- rson[r] = lson[r] = NIL; match_length = 0;
- for ( ; ; )
- {
- if (cmp >= 0)
- {
- if (rson[p] != NIL) p = rson[p];
- else { rson[p] = r; dad[r] = p; return; }
- } else
- {
- if (lson[p] != NIL) p = lson[p];
- else { lson[p] = r; dad[r] = p; return; }
- }
- for (i = 1; i < F; i++)
- if ((cmp = key[i] - text_buf[p + i]) != 0) break;
- if (i > THRESHOLD)
- {
- if (i > match_length)
- {
- match_position = (r - p) & (N - 1);
- if ((match_length = i) >= F) break;
- } else if (i == match_length)
- {
- if ((temp = (r - p) & (N - 1)) < match_position)
- match_position = temp;
- }
- }
- }
- dad[r] = dad[p]; lson[r] = lson[p]; rson[r] = rson[p];
- dad[lson[p]] = r; dad[rson[p]] = r;
- if (rson[dad[p]] == p) rson[dad[p]] = r;
- else lson[dad[p]] = r;
- dad[p] = NIL;
- }
- void LZARI::DeleteNode(int p)
- {
- int q;
-
- if (dad[p] == NIL) return;
- if (rson[p] == NIL) q = lson[p];
- else if (lson[p] == NIL) q = rson[p];
- else
- {
- q = lson[p];
- if (rson[q] != NIL)
- {
- do { q = rson[q]; } while (rson[q] != NIL);
- rson[dad[q]] = lson[q]; dad[lson[q]] = dad[q];
- lson[q] = lson[p]; dad[lson[p]] = q;
- }
- rson[q] = rson[p]; dad[rson[p]] = q;
- }
- dad[q] = dad[p];
- if (rson[dad[p]] == p) rson[dad[p]] = q;
- else lson[dad[p]] = q;
- dad[p] = NIL;
- }
-
- void LZARI::StartModel(void)
- {
- int ch, sym, i;
-
- sym_cum[N_CHAR] = 0;
- for (sym = N_CHAR; sym >= 1; sym--)
- {
- ch = sym - 1;
- char_to_sym[ch] = sym; sym_to_char[sym] = ch;
- sym_freq[sym] = 1;
- sym_cum[sym - 1] = sym_cum[sym] + sym_freq[sym];
- }
- sym_freq[0] = 0;
- position_cum[N] = 0;
- for (i = N; i >= 1; i--)
- position_cum[i - 1] = position_cum[i] + 10000 / (i + 200);
-
-
- }
- void LZARI::UpdateModel(int sym)
- {
- int i, c, ch_i, ch_sym;
-
- if (sym_cum[0] >= MAX_CUM)
- {
- c = 0;
- for (i = N_CHAR; i > 0; i--)
- {
- sym_cum[i] = c;
- c += (sym_freq[i] = (sym_freq[i] + 1) >> 1);
- }
- sym_cum[0] = c;
- }
- for (i = sym; sym_freq[i] == sym_freq[i - 1]; i--) ;
- if (i < sym)
- {
- ch_i = sym_to_char[i]; ch_sym = sym_to_char[sym];
- sym_to_char[i] = ch_sym; sym_to_char[sym] = ch_i;
- char_to_sym[ch_i] = sym; char_to_sym[ch_sym] = i;
- }
- sym_freq[i]++;
- while (--i >= 0) sym_cum[i]++;
- }
- void LZARI::Output(int bit)
- {
- PutBit(bit);
- for ( ; shifts > 0; shifts--) PutBit(! bit);
- }
- void LZARI::EncodeChar(int ch)
- {
- int sym;
- unsigned long int range;
- sym = char_to_sym[ch];
- range = high - low;
- high = low + (range * sym_cum[sym - 1]) / sym_cum[0];
- low += (range * sym_cum[sym ]) / sym_cum[0];
- for ( ; ; )
- {
- if (high <= Q2) Output(0);
- else if (low >= Q2)
- {
- Output(1); low -= Q2; high -= Q2;
- }
- else if (low >= Q1 && high <= Q3)
- {
- shifts++; low -= Q1; high -= Q1;
- }
- else break;
- low += low;
- high += high;
- }
- UpdateModel(sym);
- }
- void LZARI::EncodePosition(int position)
- {
- unsigned long int range;
- range = high - low;
- high = low + (range * position_cum[position ]) / position_cum[0];
- low += (range * position_cum[position + 1]) / position_cum[0];
- for ( ; ; )
- {
- if (high <= Q2) Output(0);
- else if (low >= Q2)
- {
- Output(1); low -= Q2; high -= Q2;
- }
- else if (low >= Q1 && high <= Q3)
- {
- shifts++; low -= Q1; high -= Q1;
- }
- else break;
- low += low;
- high += high;
- }
- }
- void LZARI::EncodeEnd(void)
- {
- shifts++;
- if (low < Q1) Output(0); else Output(1);
- FlushBitBuffer();
- }
- int LZARI::BinarySearchSym(unsigned int x)
-
- {
- int i, j, k;
-
- i = 1; j = N_CHAR;
- while (i < j)
- {
- k = (i + j) / 2;
- if (sym_cum[k] > x) i = k + 1; else j = k;
- }
- return i;
- }
- int LZARI::BinarySearchPos(unsigned int x)
-
- {
- int i, j, k;
-
- i = 1; j = N;
- while (i < j)
- {
- k = (i + j) / 2;
- if (position_cum[k] > x) i = k + 1; else j = k;
- }
- return i - 1;
- }
- void LZARI::StartDecode(void)
- {
- int i;
- for (i = 0; i < M + 2; i++)
- value = 2 * value + GetBit();
- }
- int LZARI::DecodeChar(void)
- {
- int sym, ch;
- unsigned long int range;
-
- range = high - low;
- sym = BinarySearchSym((unsigned int)
- (((value - low + 1) * sym_cum[0] - 1) / range));
- high = low + (range * sym_cum[sym - 1]) / sym_cum[0];
- low += (range * sym_cum[sym ]) / sym_cum[0];
- for ( ; ; ) {
- if (low >= Q2) {
- value -= Q2; low -= Q2; high -= Q2;
- } else if (low >= Q1 && high <= Q3) {
- value -= Q1; low -= Q1; high -= Q1;
- } else if (high > Q2) break;
- low += low; high += high;
- value = 2 * value + GetBit();
- }
- ch = sym_to_char[sym];
- UpdateModel(sym);
- return ch;
- }
- int LZARI::DecodePosition(void)
- {
- int position;
- unsigned long int range;
-
- range = high - low;
- position = BinarySearchPos((unsigned int)
- (((value - low + 1) * position_cum[0] - 1) / range));
- high = low + (range * position_cum[position ]) / position_cum[0];
- low += (range * position_cum[position + 1]) / position_cum[0];
- for ( ; ; ) {
- if (low >= Q2) {
- value -= Q2; low -= Q2; high -= Q2;
- } else if (low >= Q1 && high <= Q3) {
- value -= Q1; low -= Q1; high -= Q1;
- } else if (high > Q2) break;
- low += low; high += high;
- value = 2 * value + GetBit();
- }
- return position;
- }
- void LZARI::Encode(void)
- {
- int i, c, len, r, s, last_match_length;
-
- if(!m_bMem)
- {
- fseek(infile, 0L, SEEK_END);
- textsize = ftell(infile);
- if (fwrite(&textsize, sizeof textsize, 1, outfile) < 1)
- Error("Write Error");
- codesize += sizeof textsize;
- if (textsize == 0) return;
- rewind(infile);
- textsize = 0;
- }
- else
- {
- textsize = m_nInLength;
- m_OutBuffer.resize(sizeof textsize);
- memcpy(&m_OutBuffer[0],&textsize,sizeof textsize);
-
- codesize += sizeof textsize;
- if(textsize == 0) return;
- m_nInCur = 0;
- textsize = 0;
- }
-
- StartModel();
- InitTree();
- s = 0; r = N - F;
- for (i = s; i < r; i++) text_buf[i] = ' ';
- if(!m_bMem)
- for (len = 0; len < F && (c = getc(infile)) != EOF; len++) text_buf[r + len] = c;
- else
- for (len = 0; len < F && m_nInCur < m_nInLength ; len++)
- {
- c = m_pInBuffer[m_nInCur++];
- text_buf[r + len] = c;
- }
-
- textsize = len;
- for (i = 1; i <= F; i++) InsertNode(r - i);
-
- InsertNode(r);
-
- do {
- if (match_length > len) match_length = len;
- if (match_length <= THRESHOLD)
- {
- match_length = 1; EncodeChar(text_buf[r]);
- }
- else
- {
- EncodeChar(255 - THRESHOLD + match_length);
- EncodePosition(match_position - 1);
- }
- last_match_length = match_length;
- if(!m_bMem)
- {
- for (i = 0; i < last_match_length && (c = getc(infile)) != EOF; i++)
- {
- DeleteNode(s); text_buf[s] = c;
- if (s < F - 1) text_buf[s + N] = c;
- s = (s + 1) & (N - 1);
- r = (r + 1) & (N - 1);
- InsertNode(r);
- }
- }
- else
- {
- for (i = 0; i < last_match_length && m_nInCur < m_nInLength ; i++)
- {
- c = m_pInBuffer[m_nInCur++];
- DeleteNode(s);
- text_buf[s] = c;
- if (s < F - 1) text_buf[s + N] = c;
- s = (s + 1) & (N - 1);
- r = (r + 1) & (N - 1);
- InsertNode(r);
- }
- }
- if ((textsize += i) > printcount)
- {
- #ifdef _OUTPUT_STATUS
- printf("%12ld\r", textsize);
- #endif
- printcount += 1024;
- }
- while (i++ < last_match_length)
- {
- DeleteNode(s);
- s = (s + 1) & (N - 1);
- r = (r + 1) & (N - 1);
- if (--len) InsertNode(r);
- }
- } while (len > 0);
-
- EncodeEnd();
- #ifdef _OUTPUT_STATUS
- printf("In : %lu bytes\n", textsize);
- printf("Out: %lu bytes\n", codesize);
- printf("Out/In: %.3f\n", (double)codesize / textsize);
- #endif
- }
- void LZARI::Decode(void)
- {
- int i, j, k, r, c;
- unsigned long int count;
- if (!m_bMem)
- {
- if (fread(&textsize, sizeof textsize, 1, infile) < 1)
- Error("Read Error");
- }
- else
- {
- if(m_nInLength < sizeof textsize)
- Error("Read Error");
- memcpy(&textsize,m_pInBuffer + m_nInCur,sizeof textsize);
-
-
- m_nOutLength = textsize;
-
-
- m_nInCur += sizeof textsize;
- }
-
- if (textsize == 0) return;
-
- StartDecode();
- StartModel();
-
- for (i = 0; i < N - F; i++) text_buf[i] = ' ';
- r = N - F;
- for (count = 0; count < textsize; )
- {
- c = DecodeChar();
- if (c < 256)
- {
- if(!m_bMem)
- putc(c, outfile);
- else
- {
-
- m_OutBuffer.push_back(c);
-
- }
- text_buf[r++] = c;
- r &= (N - 1);
- count++;
- }
- else
- {
- i = (r - DecodePosition() - 1) & (N - 1);
- j = c - 255 + THRESHOLD;
- for (k = 0; k < j; k++)
- {
- c = text_buf[(i + k) & (N - 1)];
- if(!m_bMem)
- putc(c, outfile);
- else
- {
-
- m_OutBuffer.push_back(c);
-
- }
- text_buf[r++] = c;
- r &= (N - 1);
- count++;
- }
- }
- if (count > printcount)
- {
- #ifdef _OUTPUT_STATUS
- printf("%12lu\r", count);
- #endif
- printcount += 1024;
- }
- }
- #ifdef _OUTPUT_STATUS
- printf("%12lu\n", count);
- #endif
- }
- void LZARI::Compress(const char *lpszInfile,const char *lpszOutfile)
- {
- m_bMem = FALSE;
-
- infile = fopen(lpszInfile,"rb");
- outfile = fopen(lpszOutfile,"wb");
- if(infile && outfile)
- {
- Encode();
- fclose(infile);
- fclose(outfile);
- infile = NULL;
- outfile = NULL;
- }
- }
- void LZARI::UnCompress(const char *lpszInfile,const char *lpszOutfile)
- {
- m_bMem = FALSE;
- infile = fopen(lpszInfile,"rb");
- outfile = fopen(lpszOutfile,"wb");
- if(infile && outfile)
- {
- Decode();
- fclose(infile);
- fclose(outfile);
- infile = NULL;
- outfile = NULL;
- }
- }
- void LZARI::Compress(const BYTE *pInBuffer,int nInLength,const BYTE *&pOutBuffer ,int &nOutLength)
- {
- m_pInBuffer = pInBuffer;
- m_nInLength = nInLength;
- m_nInCur = 0;
- m_bMem = TRUE;
- Encode();
- pOutBuffer = &m_OutBuffer[0];
- nOutLength = m_OutBuffer.size();
- }
- void LZARI::Release()
- {
- if(!m_OutBuffer.empty())
- {
- infile = NULL;
- outfile = NULL;
-
- textsize = 0;
- codesize = 0;
- printcount = 0;
-
- low = 0;
- high = Q4;
- value = 0;
- shifts = 0;
-
- m_bMem = FALSE;
-
- m_pInBuffer = NULL;
- m_nInLength = 0;
- m_nInCur = 0;
-
- m_OutBuffer.clear();
- m_nOutLength = 0;
- buffer_putbit = 0;
- mask_putbit = 128;
-
- buffer_getbit = 0;
- mask_getbit = 0;
- }
- }
- void LZARI::UnCompress(const BYTE *pInBuffer,int nInLength,const BYTE *&pOutBuffer ,int &nOutLength)
- {
- m_pInBuffer = pInBuffer;
- m_nInLength = nInLength;
- m_nInCur = 0;
- m_bMem = TRUE;
- Decode();
- pOutBuffer = &m_OutBuffer[0];
- nOutLength = m_OutBuffer.size();
- m_OutBuffer.push_back(0);
- }
|