// brotli/enc/literal_cost.rs
use core::cmp::min;
use super::util::{floatX, FastLog2f64};
use crate::enc::utf8_util::is_mostly_utf8;
// Ratio handed to `is_mostly_utf8` by `BrotliEstimateBitCostsForLiterals` when it
// chooses between the UTF-8 aware estimator and the plain byte-histogram one.
// NOTE(review): presumably the minimum share of the input that must look like
// UTF-8 -- confirm against `is_mostly_utf8`.
static kMinUTF8Ratio: floatX = 0.75;
/// Classifies the byte that follows `c` into a context slot (0, 1 or 2).
///
/// * `last`  - the byte that preceded `c`.
/// * `c`     - the most recently seen byte.
/// * `clamp` - upper bound applied to the non-zero results, so callers can
///   restrict the classification to fewer slots.
///
/// Returns 0 when `c` is below 0x80, `min(1, clamp)` when `c` is 0xC0 or
/// above, and otherwise (`c` in 0x80..=0xBF) 0 if `last` is below 0xE0 or
/// `min(2, clamp)` if it is not.
fn UTF8Position(last: usize, c: usize, clamp: usize) -> usize {
    // Single-byte range: whatever follows starts over in slot 0.
    if c < 0x80 {
        return 0;
    }
    // 0xC0 and above: the following byte is counted in slot 1.
    if c >= 0xc0 {
        return min(1, clamp);
    }
    // `c` is in 0x80..=0xBF; the byte before it decides between slot 0 and 2.
    if last < 0xe0 {
        0
    } else {
        min(2, clamp)
    }
}
fn DecideMultiByteStatsLevel(pos: usize, len: usize, mask: usize, data: &[u8]) -> usize {
let mut counts = [0usize; 3];
let mut max_utf8: usize = 1;
let mut last_c: usize = 0usize;
let mut i: usize;
i = 0usize;
while i < len {
{
let c: usize = data[(pos.wrapping_add(i) & mask)] as usize;
{
let _rhs = 1;
let _lhs = &mut counts[UTF8Position(last_c, c, 2usize)];
*_lhs = (*_lhs).wrapping_add(_rhs as usize);
}
last_c = c;
}
i = i.wrapping_add(1);
}
if counts[2] < 500usize {
max_utf8 = 1;
}
if counts[1].wrapping_add(counts[2]) < 25usize {
max_utf8 = 0usize;
}
max_utf8
}
fn EstimateBitCostsForLiteralsUTF8(
pos: usize,
len: usize,
mask: usize,
data: &[u8],
cost: &mut [floatX],
) {
let max_utf8: usize = DecideMultiByteStatsLevel(pos, len, mask, data);
let mut histogram = [[0usize; 256]; 3];
let window_half: usize = 495usize;
let in_window: usize = min(window_half, len);
let mut in_window_utf8 = [0usize; 3];
let mut i: usize;
{
let mut last_c: usize = 0usize;
let mut utf8_pos: usize = 0usize;
i = 0usize;
while i < in_window {
{
let c: usize = data[(pos.wrapping_add(i) & mask)] as usize;
{
let _rhs = 1;
let _lhs = &mut histogram[utf8_pos][c];
*_lhs = (*_lhs).wrapping_add(_rhs as usize);
}
{
let _rhs = 1;
let _lhs = &mut in_window_utf8[utf8_pos];
*_lhs = (*_lhs).wrapping_add(_rhs as usize);
}
utf8_pos = UTF8Position(last_c, c, max_utf8);
last_c = c;
}
i = i.wrapping_add(1);
}
}
i = 0usize;
while i < len {
{
if i >= window_half {
let c: usize = (if i < window_half.wrapping_add(1) {
0i32
} else {
data[(pos
.wrapping_add(i)
.wrapping_sub(window_half)
.wrapping_sub(1)
& mask)] as i32
}) as usize;
let last_c: usize = (if i < window_half.wrapping_add(2) {
0i32
} else {
data[(pos
.wrapping_add(i)
.wrapping_sub(window_half)
.wrapping_sub(2)
& mask)] as i32
}) as usize;
let utf8_pos2: usize = UTF8Position(last_c, c, max_utf8);
{
let _rhs = 1;
let _lhs = &mut histogram[utf8_pos2]
[data[(pos.wrapping_add(i).wrapping_sub(window_half) & mask)] as usize];
*_lhs = (*_lhs).wrapping_sub(_rhs as usize);
}
{
let _rhs = 1;
let _lhs = &mut in_window_utf8[utf8_pos2];
*_lhs = (*_lhs).wrapping_sub(_rhs as usize);
}
}
if i.wrapping_add(window_half) < len {
let c: usize = data[(pos
.wrapping_add(i)
.wrapping_add(window_half)
.wrapping_sub(1)
& mask)] as usize;
let last_c: usize = data[(pos
.wrapping_add(i)
.wrapping_add(window_half)
.wrapping_sub(2)
& mask)] as usize;
let utf8_pos2: usize = UTF8Position(last_c, c, max_utf8);
{
let _rhs = 1;
let _lhs = &mut histogram[utf8_pos2]
[data[(pos.wrapping_add(i).wrapping_add(window_half) & mask)] as usize];
*_lhs = (*_lhs).wrapping_add(_rhs as usize);
}
{
let _rhs = 1;
let _lhs = &mut in_window_utf8[utf8_pos2];
*_lhs = (*_lhs).wrapping_add(_rhs as usize);
}
}
{
let c: usize = (if i < 1 {
0i32
} else {
data[(pos.wrapping_add(i).wrapping_sub(1) & mask)] as i32
}) as usize;
let last_c: usize = (if i < 2usize {
0i32
} else {
data[(pos.wrapping_add(i).wrapping_sub(2) & mask)] as i32
}) as usize;
let utf8_pos: usize = UTF8Position(last_c, c, max_utf8);
let masked_pos: usize = pos.wrapping_add(i) & mask;
let mut histo: usize = histogram[utf8_pos][data[masked_pos] as usize];
let mut lit_cost: f64;
if histo == 0usize {
histo = 1;
}
lit_cost = FastLog2f64(in_window_utf8[utf8_pos] as u64) as f64
- FastLog2f64(histo as u64) as f64;
lit_cost += 0.02905;
if lit_cost < 1.0 {
lit_cost *= 0.5;
lit_cost += 0.5;
}
if i < 2000usize {
lit_cost += (0.7 - (2000usize).wrapping_sub(i) as (f64) / 2000.0 * 0.35);
}
cost[i] = lit_cost as floatX;
}
}
i = i.wrapping_add(1);
}
}
pub fn BrotliEstimateBitCostsForLiterals(
pos: usize,
len: usize,
mask: usize,
data: &[u8],
cost: &mut [floatX],
) {
if is_mostly_utf8(data, pos, mask, len, kMinUTF8Ratio) {
EstimateBitCostsForLiteralsUTF8(pos, len, mask, data, cost);
} else {
let mut histogram: [usize; 256] = [0; 256];
let window_half: usize = 2000usize;
let mut in_window: usize = min(window_half, len);
let mut i: usize;
for i in 0usize..in_window {
let _rhs = 1;
let _lhs = &mut histogram[data[(pos.wrapping_add(i) & mask)] as usize];
*_lhs = (*_lhs).wrapping_add(_rhs as usize);
}
i = 0usize;
while i < len {
{
let mut histo: usize;
if i >= window_half {
{
let _rhs = 1;
let _lhs = &mut histogram
[data[(pos.wrapping_add(i).wrapping_sub(window_half) & mask)] as usize];
*_lhs = (*_lhs).wrapping_sub(_rhs as usize);
}
in_window = in_window.wrapping_sub(1);
}
if i.wrapping_add(window_half) < len {
{
let _rhs = 1;
let _lhs = &mut histogram
[data[(pos.wrapping_add(i).wrapping_add(window_half) & mask)] as usize];
*_lhs = (*_lhs).wrapping_add(_rhs as usize);
}
in_window = in_window.wrapping_add(1);
}
histo = histogram[data[(pos.wrapping_add(i) & mask)] as usize];
if histo == 0usize {
histo = 1;
}
{
let mut lit_cost: f64 =
FastLog2f64(in_window as u64) as f64 - FastLog2f64(histo as u64) as f64;
lit_cost += 0.029;
if lit_cost < 1.0 {
lit_cost *= 0.5;
lit_cost += 0.5;
}
cost[i] = lit_cost as floatX;
}
}
i = i.wrapping_add(1);
}
}
}