mirror of
https://github.com/ventoy/Ventoy.git
synced 2025-01-09 22:13:24 -05:00
208 lines
5.3 KiB
C
208 lines
5.3 KiB
C
|
/*
|
||
|
* Copyright (C) 2014 Michael Brown <mbrown@fensystems.co.uk>.
|
||
|
*
|
||
|
* This program is free software; you can redistribute it and/or
|
||
|
* modify it under the terms of the GNU General Public License as
|
||
|
* published by the Free Software Foundation; either version 2 of the
|
||
|
* License, or (at your option) any later version.
|
||
|
*
|
||
|
* This program is distributed in the hope that it will be useful, but
|
||
|
* WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||
|
* General Public License for more details.
|
||
|
*
|
||
|
* You should have received a copy of the GNU General Public License
|
||
|
* along with this program; if not, write to the Free Software
|
||
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
|
||
|
* 02110-1301, USA.
|
||
|
*/
|
||
|
|
||
|
/**
|
||
|
* @file
|
||
|
*
|
||
|
* Huffman alphabets
|
||
|
*
|
||
|
*/
|
||
|
|
||
|
#include "wimboot.h"
|
||
|
#include "huffman.h"
|
||
|
|
||
|
/**
 * Transcribe binary value (for debugging)
 *
 * @v value		Value
 * @v bits		Length of value (in bits)
 * @ret string		Transcribed value
 *
 * The least significant @c bits bits of @c value are written as a
 * string of '0' and '1' characters, most significant bit first.
 *
 * The result is held in a single static buffer, so each call
 * overwrites the string returned by the previous call.
 */
const char * huffman_bin ( unsigned long value, unsigned int bits ) {
	static char buf[ ( 8 * sizeof ( value ) ) + 1 /* NUL */ ];
	char *out = buf;

	/* Sanity check: the digits plus the NUL must fit in the buffer */
	assert ( bits < sizeof ( buf ) );

	/* Transcribe value.  The mask is built from an unsigned long
	 * so that every bit position of the value can be tested; a
	 * plain int constant would be shifted beyond its own width
	 * for the upper bits.
	 */
	while ( bits-- )
		*(out++) = ( ( value & ( 1UL << bits ) ) ? '1' : '0' );
	*out = '\0';

	return buf;
}
|
||
|
|
||
|
/**
|
||
|
* Dump Huffman alphabet (for debugging)
|
||
|
*
|
||
|
* @v alphabet Huffman alphabet
|
||
|
*/
|
||
|
static void __attribute__ (( unused ))
|
||
|
huffman_dump_alphabet ( struct huffman_alphabet *alphabet ) {
|
||
|
struct huffman_symbols *sym;
|
||
|
unsigned int bits;
|
||
|
unsigned int huf;
|
||
|
unsigned int i;
|
||
|
|
||
|
(void)huf;
|
||
|
|
||
|
/* Dump symbol table for each utilised length */
|
||
|
for ( bits = 1 ; bits <= ( sizeof ( alphabet->huf ) /
|
||
|
sizeof ( alphabet->huf[0] ) ) ; bits++ ) {
|
||
|
sym = &alphabet->huf[ bits - 1 ];
|
||
|
if ( sym->freq == 0 )
|
||
|
continue;
|
||
|
huf = ( sym->start >> sym->shift );
|
||
|
DBG ( "Huffman length %d start \"%s\" freq %d:", bits,
|
||
|
huffman_bin ( huf, sym->bits ), sym->freq );
|
||
|
for ( i = 0 ; i < sym->freq ; i++ ) {
|
||
|
DBG ( " %03x", sym->raw[ huf + i ] );
|
||
|
}
|
||
|
DBG ( "\n" );
|
||
|
}
|
||
|
|
||
|
/* Dump quick lookup table */
|
||
|
DBG ( "Huffman quick lookup:" );
|
||
|
for ( i = 0 ; i < ( sizeof ( alphabet->lookup ) /
|
||
|
sizeof ( alphabet->lookup[0] ) ) ; i++ ) {
|
||
|
DBG ( " %d", ( alphabet->lookup[i] + 1 ) );
|
||
|
}
|
||
|
DBG ( "\n" );
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* Construct Huffman alphabet
|
||
|
*
|
||
|
* @v alphabet Huffman alphabet
|
||
|
* @v lengths Symbol length table
|
||
|
* @v count Number of symbols
|
||
|
* @ret rc Return status code
|
||
|
*/
|
||
|
int huffman_alphabet ( struct huffman_alphabet *alphabet,
|
||
|
uint8_t *lengths, unsigned int count ) {
|
||
|
struct huffman_symbols *sym;
|
||
|
unsigned int huf;
|
||
|
unsigned int cum_freq;
|
||
|
unsigned int bits;
|
||
|
unsigned int raw;
|
||
|
unsigned int adjustment;
|
||
|
unsigned int prefix;
|
||
|
int empty;
|
||
|
int complete;
|
||
|
|
||
|
/* Clear symbol table */
|
||
|
memset ( alphabet->huf, 0, sizeof ( alphabet->huf ) );
|
||
|
|
||
|
/* Count number of symbols with each Huffman-coded length */
|
||
|
empty = 1;
|
||
|
for ( raw = 0 ; raw < count ; raw++ ) {
|
||
|
bits = lengths[raw];
|
||
|
if ( bits ) {
|
||
|
alphabet->huf[ bits - 1 ].freq++;
|
||
|
empty = 0;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* In the degenerate case of having no symbols (i.e. an unused
|
||
|
* alphabet), generate a trivial alphabet with exactly two
|
||
|
* single-bit codes. This allows callers to avoid having to
|
||
|
* check for this special case.
|
||
|
*/
|
||
|
if ( empty )
|
||
|
alphabet->huf[0].freq = 2;
|
||
|
|
||
|
/* Populate Huffman-coded symbol table */
|
||
|
huf = 0;
|
||
|
cum_freq = 0;
|
||
|
for ( bits = 1 ; bits <= ( sizeof ( alphabet->huf ) /
|
||
|
sizeof ( alphabet->huf[0] ) ) ; bits++ ) {
|
||
|
sym = &alphabet->huf[ bits - 1 ];
|
||
|
sym->bits = bits;
|
||
|
sym->shift = ( HUFFMAN_BITS - bits );
|
||
|
sym->start = ( huf << sym->shift );
|
||
|
sym->raw = &alphabet->raw[cum_freq];
|
||
|
huf += sym->freq;
|
||
|
if ( huf > ( 1U << bits ) ) {
|
||
|
DBG ( "Huffman alphabet has too many symbols with "
|
||
|
"lengths <=%d\n", bits );
|
||
|
return -1;
|
||
|
}
|
||
|
huf <<= 1;
|
||
|
cum_freq += sym->freq;
|
||
|
}
|
||
|
complete = ( huf == ( 1U << bits ) );
|
||
|
|
||
|
/* Populate raw symbol table */
|
||
|
for ( raw = 0 ; raw < count ; raw++ ) {
|
||
|
bits = lengths[raw];
|
||
|
if ( bits ) {
|
||
|
sym = &alphabet->huf[ bits - 1 ];
|
||
|
*(sym->raw++) = raw;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* Adjust Huffman-coded symbol table raw pointers and populate
|
||
|
* quick lookup table.
|
||
|
*/
|
||
|
for ( bits = 1 ; bits <= ( sizeof ( alphabet->huf ) /
|
||
|
sizeof ( alphabet->huf[0] ) ) ; bits++ ) {
|
||
|
sym = &alphabet->huf[ bits - 1 ];
|
||
|
|
||
|
/* Adjust raw pointer */
|
||
|
sym->raw -= sym->freq; /* Reset to first symbol */
|
||
|
adjustment = ( sym->start >> sym->shift );
|
||
|
sym->raw -= adjustment; /* Adjust for quick indexing */
|
||
|
|
||
|
/* Populate quick lookup table */
|
||
|
for ( prefix = ( sym->start >> HUFFMAN_QL_SHIFT ) ;
|
||
|
prefix < ( 1 << HUFFMAN_QL_BITS ) ; prefix++ ) {
|
||
|
alphabet->lookup[prefix] = ( bits - 1 );
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* Check that there are no invalid codes */
|
||
|
if ( ! complete ) {
|
||
|
DBG ( "Huffman alphabet is incomplete\n" );
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* Get Huffman symbol set
|
||
|
*
|
||
|
* @v alphabet Huffman alphabet
|
||
|
* @v huf Raw input value (normalised to HUFFMAN_BITS bits)
|
||
|
* @ret sym Huffman symbol set
|
||
|
*/
|
||
|
struct huffman_symbols * huffman_sym ( struct huffman_alphabet *alphabet,
|
||
|
unsigned int huf ) {
|
||
|
struct huffman_symbols *sym;
|
||
|
unsigned int lookup_index;
|
||
|
|
||
|
/* Find symbol set for this length */
|
||
|
lookup_index = ( huf >> HUFFMAN_QL_SHIFT );
|
||
|
sym = &alphabet->huf[ alphabet->lookup[ lookup_index ] ];
|
||
|
while ( huf < sym->start )
|
||
|
sym--;
|
||
|
return sym;
|
||
|
}
|