2179 lines
72 KiB
C++
2179 lines
72 KiB
C++
// File: crn_comp.cpp
|
|
// See Copyright Notice and license at the end of inc/crnlib.h
|
|
#include "crn_core.h"
|
|
#include "crn_console.h"
|
|
#include "crn_comp.h"
|
|
#include "crn_zeng.h"
|
|
#include "crn_checksum.h"
|
|
|
|
#define CRNLIB_CREATE_DEBUG_IMAGES 0
|
|
#define CRNLIB_ENABLE_DEBUG_MESSAGES 0
|
|
|
|
namespace crnlib
|
|
{
|
|
static const uint cEncodingMapNumChunksPerCode = 3;
|
|
|
|
crn_comp::crn_comp() :
|
|
m_pParams(NULL)
|
|
{
|
|
}
|
|
|
|
crn_comp::~crn_comp()
|
|
{
|
|
}
|
|
|
|
float crn_comp::color_endpoint_similarity_func(uint index_a, uint index_b, void* pContext)
|
|
{
|
|
dxt_hc& hvq = *static_cast<dxt_hc*>(pContext);
|
|
|
|
uint endpoint_a = hvq.get_color_endpoint(index_a);
|
|
uint endpoint_b = hvq.get_color_endpoint(index_b);
|
|
|
|
color_quad_u8 a[2];
|
|
a[0] = dxt1_block::unpack_color((uint16)(endpoint_a & 0xFFFF), true);
|
|
a[1] = dxt1_block::unpack_color((uint16)((endpoint_a >> 16) & 0xFFFF), true);
|
|
|
|
color_quad_u8 b[2];
|
|
b[0] = dxt1_block::unpack_color((uint16)(endpoint_b & 0xFFFF), true);
|
|
b[1] = dxt1_block::unpack_color((uint16)((endpoint_b >> 16) & 0xFFFF), true);
|
|
|
|
uint total_error = color::elucidian_distance(a[0], b[0], false) + color::elucidian_distance(a[1], b[1], false);
|
|
|
|
float weight = 1.0f - math::clamp(total_error * 1.0f/8000.0f, 0.0f, 1.0f);
|
|
return weight;
|
|
}
|
|
|
|
float crn_comp::alpha_endpoint_similarity_func(uint index_a, uint index_b, void* pContext)
|
|
{
|
|
dxt_hc& hvq = *static_cast<dxt_hc*>(pContext);
|
|
|
|
uint endpoint_a = hvq.get_alpha_endpoint(index_a);
|
|
int endpoint_a_lo = dxt5_block::unpack_endpoint(endpoint_a, 0);
|
|
int endpoint_a_hi = dxt5_block::unpack_endpoint(endpoint_a, 1);
|
|
|
|
uint endpoint_b = hvq.get_alpha_endpoint(index_b);
|
|
int endpoint_b_lo = dxt5_block::unpack_endpoint(endpoint_b, 0);
|
|
int endpoint_b_hi = dxt5_block::unpack_endpoint(endpoint_b, 1);
|
|
|
|
int total_error = math::square(endpoint_a_lo - endpoint_b_lo) + math::square(endpoint_a_hi - endpoint_b_hi);
|
|
|
|
float weight = 1.0f - math::clamp(total_error * 1.0f/256.0f, 0.0f, 1.0f);
|
|
return weight;
|
|
}
|
|
|
|
void crn_comp::sort_color_endpoint_codebook(crnlib::vector<uint>& remapping, const crnlib::vector<uint>& endpoints)
|
|
{
|
|
remapping.resize(endpoints.size());
|
|
|
|
uint lowest_energy = UINT_MAX;
|
|
uint lowest_energy_index = 0;
|
|
|
|
for (uint i = 0; i < endpoints.size(); i++)
|
|
{
|
|
color_quad_u8 a(dxt1_block::unpack_color(static_cast<uint16>(endpoints[i] & 0xFFFF), true));
|
|
color_quad_u8 b(dxt1_block::unpack_color(static_cast<uint16>((endpoints[i] >> 16) & 0xFFFF), true));
|
|
|
|
uint total = a.r + a.g + a.b + b.r + b.g + b.b;
|
|
|
|
if (total < lowest_energy)
|
|
{
|
|
lowest_energy = total;
|
|
lowest_energy_index = i;
|
|
}
|
|
}
|
|
|
|
uint cur_index = lowest_energy_index;
|
|
|
|
crnlib::vector<bool> chosen_flags(endpoints.size());
|
|
|
|
uint n = 0;
|
|
for ( ; ; )
|
|
{
|
|
chosen_flags[cur_index] = true;
|
|
|
|
remapping[cur_index] = n;
|
|
n++;
|
|
if (n == endpoints.size())
|
|
break;
|
|
|
|
uint lowest_error = UINT_MAX;
|
|
uint lowest_error_index = 0;
|
|
|
|
color_quad_u8 a(dxt1_block::unpack_endpoint(endpoints[cur_index], 0, true));
|
|
color_quad_u8 b(dxt1_block::unpack_endpoint(endpoints[cur_index], 1, true));
|
|
|
|
for (uint i = 0; i < endpoints.size(); i++)
|
|
{
|
|
if (chosen_flags[i])
|
|
continue;
|
|
|
|
color_quad_u8 c(dxt1_block::unpack_endpoint(endpoints[i], 0, true));
|
|
color_quad_u8 d(dxt1_block::unpack_endpoint(endpoints[i], 1, true));
|
|
|
|
uint total = color::elucidian_distance(a, c, false) + color::elucidian_distance(b, d, false);
|
|
|
|
if (total < lowest_error)
|
|
{
|
|
lowest_error = total;
|
|
lowest_error_index = i;
|
|
}
|
|
}
|
|
|
|
cur_index = lowest_error_index;
|
|
}
|
|
}
|
|
|
|
void crn_comp::sort_alpha_endpoint_codebook(crnlib::vector<uint>& remapping, const crnlib::vector<uint>& endpoints)
|
|
{
|
|
remapping.resize(endpoints.size());
|
|
|
|
uint lowest_energy = UINT_MAX;
|
|
uint lowest_energy_index = 0;
|
|
|
|
for (uint i = 0; i < endpoints.size(); i++)
|
|
{
|
|
uint a = dxt5_block::unpack_endpoint(endpoints[i], 0);
|
|
uint b = dxt5_block::unpack_endpoint(endpoints[i], 1);
|
|
|
|
uint total = a + b;
|
|
|
|
if (total < lowest_energy)
|
|
{
|
|
lowest_energy = total;
|
|
lowest_energy_index = i;
|
|
}
|
|
}
|
|
|
|
uint cur_index = lowest_energy_index;
|
|
|
|
crnlib::vector<bool> chosen_flags(endpoints.size());
|
|
|
|
uint n = 0;
|
|
for ( ; ; )
|
|
{
|
|
chosen_flags[cur_index] = true;
|
|
|
|
remapping[cur_index] = n;
|
|
n++;
|
|
if (n == endpoints.size())
|
|
break;
|
|
|
|
uint lowest_error = UINT_MAX;
|
|
uint lowest_error_index = 0;
|
|
|
|
const int a = dxt5_block::unpack_endpoint(endpoints[cur_index], 0);
|
|
const int b = dxt5_block::unpack_endpoint(endpoints[cur_index], 1);
|
|
|
|
for (uint i = 0; i < endpoints.size(); i++)
|
|
{
|
|
if (chosen_flags[i])
|
|
continue;
|
|
|
|
const int c = dxt5_block::unpack_endpoint(endpoints[i], 0);
|
|
const int d = dxt5_block::unpack_endpoint(endpoints[i], 1);
|
|
|
|
uint total = math::square(a - c) + math::square(b - d);
|
|
|
|
if (total < lowest_error)
|
|
{
|
|
lowest_error = total;
|
|
lowest_error_index = i;
|
|
}
|
|
}
|
|
|
|
cur_index = lowest_error_index;
|
|
}
|
|
}
|
|
|
|
// The indices are only used for statistical purposes.
|
|
bool crn_comp::pack_color_endpoints(
|
|
crnlib::vector<uint8>& data,
|
|
const crnlib::vector<uint>& remapping,
|
|
const crnlib::vector<uint>& endpoint_indices,
|
|
uint trial_index)
|
|
{
|
|
trial_index;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("pack_color_endpoints: %u", trial_index);
|
|
#endif
|
|
|
|
crnlib::vector<uint> remapped_endpoints(m_hvq.get_color_endpoint_codebook_size());
|
|
|
|
for (uint i = 0; i < m_hvq.get_color_endpoint_codebook_size(); i++)
|
|
remapped_endpoints[remapping[i]] = m_hvq.get_color_endpoint(i);
|
|
|
|
const uint component_limits[6] = { 31, 63, 31, 31, 63, 31 };
|
|
|
|
symbol_histogram hist[2];
|
|
hist[0].resize(32);
|
|
hist[1].resize(64);
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
image_u8 endpoint_image(2, m_hvq.get_color_endpoint_codebook_size());
|
|
image_u8 endpoint_residual_image(2, m_hvq.get_color_endpoint_codebook_size());
|
|
#endif
|
|
|
|
crnlib::vector<uint> residual_syms;
|
|
residual_syms.reserve(m_hvq.get_color_endpoint_codebook_size()*2*3);
|
|
|
|
color_quad_u8 prev[2];
|
|
prev[0].clear();
|
|
prev[1].clear();
|
|
|
|
int total_residuals = 0;
|
|
|
|
for (uint endpoint_index = 0; endpoint_index < m_hvq.get_color_endpoint_codebook_size(); endpoint_index++)
|
|
{
|
|
const uint endpoint = remapped_endpoints[endpoint_index];
|
|
|
|
color_quad_u8 cur[2];
|
|
cur[0] = dxt1_block::unpack_color((uint16)(endpoint & 0xFFFF), false);
|
|
cur[1] = dxt1_block::unpack_color((uint16)((endpoint >> 16) & 0xFFFF), false);
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
endpoint_image(0, endpoint_index) = dxt1_block::unpack_color((uint16)(endpoint & 0xFFFF), true);
|
|
endpoint_image(1, endpoint_index) = dxt1_block::unpack_color((uint16)((endpoint >> 16) & 0xFFFF), true);
|
|
#endif
|
|
|
|
for (uint j = 0; j < 2; j++)
|
|
{
|
|
for (uint k = 0; k < 3; k++)
|
|
{
|
|
int delta = cur[j][k] - prev[j][k];
|
|
total_residuals += delta*delta;
|
|
|
|
int sym = delta & component_limits[j*3+k];
|
|
int table = (k == 1) ? 1 : 0;
|
|
|
|
hist[table].inc_freq(sym);
|
|
|
|
residual_syms.push_back(sym);
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
endpoint_residual_image(j, endpoint_index)[k] = static_cast<uint8>(sym);
|
|
#endif
|
|
}
|
|
}
|
|
|
|
prev[0] = cur[0];
|
|
prev[1] = cur[1];
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total endpoint residuals: %i", total_residuals);
|
|
#endif
|
|
|
|
if (endpoint_indices.size() > 1)
|
|
{
|
|
uint prev_index = remapping[endpoint_indices[0]];
|
|
int64 total_delta = 0;
|
|
for (uint i = 1; i < endpoint_indices.size(); i++)
|
|
{
|
|
uint cur_index = remapping[endpoint_indices[i]];
|
|
int delta = cur_index - prev_index;
|
|
prev_index = cur_index;
|
|
total_delta += delta * delta;
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total endpoint index delta: " CRNLIB_INT64_FORMAT_SPECIFIER, total_delta);
|
|
#endif
|
|
}
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
image_utils::write_to_file(dynamic_string(cVarArg, "color_endpoint_residuals_%u.tga", trial_index).get_ptr(), endpoint_residual_image);
|
|
image_utils::write_to_file(dynamic_string(cVarArg, "color_endpoints_%u.tga", trial_index).get_ptr(), endpoint_image);
|
|
#endif
|
|
|
|
static_huffman_data_model residual_dm[2];
|
|
|
|
symbol_codec codec;
|
|
codec.start_encoding(1024*1024);
|
|
|
|
// Transmit residuals
|
|
for (uint i = 0; i < 2; i++)
|
|
{
|
|
if (!residual_dm[i].init(true, hist[i], 15))
|
|
return false;
|
|
|
|
if (!codec.encode_transmit_static_huffman_data_model(residual_dm[i], false))
|
|
return false;
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Wrote %u bits for color endpoint residual Huffman tables", codec.encode_get_total_bits_written());
|
|
#endif
|
|
|
|
uint start_bits = codec.encode_get_total_bits_written();
|
|
start_bits;
|
|
|
|
for (uint i = 0; i < residual_syms.size(); i++)
|
|
{
|
|
const uint sym = residual_syms[i];
|
|
const uint table = ((i % 3) == 1) ? 1 : 0;
|
|
codec.encode(sym, residual_dm[table]);
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Wrote %u bits for color endpoint residuals", codec.encode_get_total_bits_written() - start_bits);
|
|
#endif
|
|
|
|
codec.stop_encoding(false);
|
|
|
|
data.swap(codec.get_encoding_buf());
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
{
|
|
console::debug("Wrote a total of %u bits for color endpoint codebook", codec.encode_get_total_bits_written());
|
|
|
|
console::debug("Wrote %f bits per each color endpoint", data.size() * 8.0f / m_hvq.get_color_endpoint_codebook_size());
|
|
}
|
|
#endif
|
|
|
|
return true;
|
|
}
|
|
|
|
// The indices are only used for statistical purposes.
|
|
bool crn_comp::pack_alpha_endpoints(
|
|
crnlib::vector<uint8>& data,
|
|
const crnlib::vector<uint>& remapping,
|
|
const crnlib::vector<uint>& endpoint_indices,
|
|
uint trial_index)
|
|
{
|
|
trial_index;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("pack_alpha_endpoints: %u", trial_index);
|
|
#endif
|
|
|
|
crnlib::vector<uint> remapped_endpoints(m_hvq.get_alpha_endpoint_codebook_size());
|
|
|
|
for (uint i = 0; i < m_hvq.get_alpha_endpoint_codebook_size(); i++)
|
|
remapped_endpoints[remapping[i]] = m_hvq.get_alpha_endpoint(i);
|
|
|
|
symbol_histogram hist;
|
|
hist.resize(256);
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
image_u8 endpoint_image(2, m_hvq.get_alpha_endpoint_codebook_size());
|
|
image_u8 endpoint_residual_image(2, m_hvq.get_alpha_endpoint_codebook_size());
|
|
#endif
|
|
|
|
crnlib::vector<uint> residual_syms;
|
|
residual_syms.reserve(m_hvq.get_alpha_endpoint_codebook_size()*2*3);
|
|
|
|
uint prev[2];
|
|
utils::zero_object(prev);
|
|
|
|
int total_residuals = 0;
|
|
|
|
for (uint endpoint_index = 0; endpoint_index < m_hvq.get_alpha_endpoint_codebook_size(); endpoint_index++)
|
|
{
|
|
const uint endpoint = remapped_endpoints[endpoint_index];
|
|
|
|
uint cur[2];
|
|
cur[0] = dxt5_block::unpack_endpoint(endpoint, 0);
|
|
cur[1] = dxt5_block::unpack_endpoint(endpoint, 1);
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
endpoint_image(0, endpoint_index) = cur[0];
|
|
endpoint_image(1, endpoint_index) = cur[1];
|
|
#endif
|
|
|
|
for (uint j = 0; j < 2; j++)
|
|
{
|
|
int delta = cur[j] - prev[j];
|
|
total_residuals += delta*delta;
|
|
|
|
int sym = delta & 255;
|
|
|
|
hist.inc_freq(sym);
|
|
|
|
residual_syms.push_back(sym);
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
endpoint_residual_image(j, endpoint_index) = static_cast<uint8>(sym);
|
|
#endif
|
|
}
|
|
|
|
prev[0] = cur[0];
|
|
prev[1] = cur[1];
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total endpoint residuals: %i", total_residuals);
|
|
#endif
|
|
|
|
if (endpoint_indices.size() > 1)
|
|
{
|
|
uint prev_index = remapping[endpoint_indices[0]];
|
|
int64 total_delta = 0;
|
|
for (uint i = 1; i < endpoint_indices.size(); i++)
|
|
{
|
|
uint cur_index = remapping[endpoint_indices[i]];
|
|
int delta = cur_index - prev_index;
|
|
prev_index = cur_index;
|
|
total_delta += delta * delta;
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total endpoint index delta: " CRNLIB_INT64_FORMAT_SPECIFIER, total_delta);
|
|
#endif
|
|
}
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
image_utils::write_to_file(dynamic_string(cVarArg, "alpha_endpoint_residuals_%u.tga", trial_index).get_ptr(), endpoint_residual_image);
|
|
image_utils::write_to_file(dynamic_string(cVarArg, "alpha_endpoints_%u.tga", trial_index).get_ptr(), endpoint_image);
|
|
#endif
|
|
|
|
static_huffman_data_model residual_dm;
|
|
|
|
symbol_codec codec;
|
|
codec.start_encoding(1024*1024);
|
|
|
|
// Transmit residuals
|
|
if (!residual_dm.init(true, hist, 15))
|
|
return false;
|
|
|
|
if (!codec.encode_transmit_static_huffman_data_model(residual_dm, false))
|
|
return false;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Wrote %u bits for alpha endpoint residual Huffman tables", codec.encode_get_total_bits_written());
|
|
#endif
|
|
|
|
uint start_bits = codec.encode_get_total_bits_written();
|
|
start_bits;
|
|
|
|
for (uint i = 0; i < residual_syms.size(); i++)
|
|
{
|
|
const uint sym = residual_syms[i];
|
|
codec.encode(sym, residual_dm);
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Wrote %u bits for alpha endpoint residuals", codec.encode_get_total_bits_written() - start_bits);
|
|
#endif
|
|
|
|
codec.stop_encoding(false);
|
|
|
|
data.swap(codec.get_encoding_buf());
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
{
|
|
console::debug("Wrote a total of %u bits for alpha endpoint codebook", codec.encode_get_total_bits_written());
|
|
|
|
console::debug("Wrote %f bits per each alpha endpoint", data.size() * 8.0f / m_hvq.get_alpha_endpoint_codebook_size());
|
|
}
|
|
#endif
|
|
|
|
return true;
|
|
}
|
|
|
|
float crn_comp::color_selector_similarity_func(uint index_a, uint index_b, void* pContext)
|
|
{
|
|
const crnlib::vector<dxt_hc::selectors>& selectors = *static_cast< const crnlib::vector<dxt_hc::selectors>* >(pContext);
|
|
|
|
const dxt_hc::selectors& selectors_a = selectors[index_a];
|
|
const dxt_hc::selectors& selectors_b = selectors[index_b];
|
|
|
|
int total = 0;
|
|
for (uint i = 0; i < 16; i++)
|
|
{
|
|
int a = g_dxt1_to_linear[selectors_a.get_by_index(i)];
|
|
int b = g_dxt1_to_linear[selectors_b.get_by_index(i)];
|
|
|
|
int delta = a - b;
|
|
total += delta*delta;
|
|
}
|
|
|
|
float weight = 1.0f - math::clamp(total * 1.0f/20.0f, 0.0f, 1.0f);
|
|
return weight;
|
|
}
|
|
|
|
float crn_comp::alpha_selector_similarity_func(uint index_a, uint index_b, void* pContext)
|
|
{
|
|
const crnlib::vector<dxt_hc::selectors>& selectors = *static_cast< const crnlib::vector<dxt_hc::selectors>* >(pContext);
|
|
|
|
const dxt_hc::selectors& selectors_a = selectors[index_a];
|
|
const dxt_hc::selectors& selectors_b = selectors[index_b];
|
|
|
|
int total = 0;
|
|
for (uint i = 0; i < 16; i++)
|
|
{
|
|
int a = g_dxt5_to_linear[selectors_a.get_by_index(i)];
|
|
int b = g_dxt5_to_linear[selectors_b.get_by_index(i)];
|
|
|
|
int delta = a - b;
|
|
total += delta*delta;
|
|
}
|
|
|
|
float weight = 1.0f - math::clamp(total * 1.0f/100.0f, 0.0f, 1.0f);
|
|
return weight;
|
|
}
|
|
|
|
void crn_comp::sort_selector_codebook(crnlib::vector<uint>& remapping, const crnlib::vector<dxt_hc::selectors>& selectors, const uint8* pTo_linear)
|
|
{
|
|
remapping.resize(selectors.size());
|
|
|
|
uint lowest_energy = UINT_MAX;
|
|
uint lowest_energy_index = 0;
|
|
|
|
for (uint i = 0; i < selectors.size(); i++)
|
|
{
|
|
uint total = 0;
|
|
for (uint j = 0; j < 16; j++)
|
|
{
|
|
int a = pTo_linear[selectors[i].get_by_index(j)];
|
|
|
|
total += a*a;
|
|
}
|
|
|
|
if (total < lowest_energy)
|
|
{
|
|
lowest_energy = total;
|
|
lowest_energy_index = i;
|
|
}
|
|
}
|
|
|
|
uint cur_index = lowest_energy_index;
|
|
|
|
crnlib::vector<bool> chosen_flags(selectors.size());
|
|
|
|
uint n = 0;
|
|
for ( ; ; )
|
|
{
|
|
chosen_flags[cur_index] = true;
|
|
|
|
remapping[cur_index] = n;
|
|
n++;
|
|
if (n == selectors.size())
|
|
break;
|
|
|
|
uint lowest_error = UINT_MAX;
|
|
uint lowest_error_index = 0;
|
|
|
|
for (uint i = 0; i < selectors.size(); i++)
|
|
{
|
|
if (chosen_flags[i])
|
|
continue;
|
|
|
|
uint total = 0;
|
|
for (uint j = 0; j < 16; j++)
|
|
{
|
|
int a = pTo_linear[selectors[cur_index].get_by_index(j)];
|
|
int b = pTo_linear[selectors[i].get_by_index(j)];
|
|
|
|
int delta = a - b;
|
|
total += delta*delta;
|
|
}
|
|
|
|
if (total < lowest_error)
|
|
{
|
|
lowest_error = total;
|
|
lowest_error_index = i;
|
|
}
|
|
}
|
|
|
|
cur_index = lowest_error_index;
|
|
}
|
|
}
|
|
|
|
// The indices are only used for statistical purposes.
|
|
bool crn_comp::pack_selectors(
|
|
crnlib::vector<uint8>& packed_data,
|
|
const crnlib::vector<uint>& selector_indices,
|
|
const crnlib::vector<dxt_hc::selectors>& selectors,
|
|
const crnlib::vector<uint>& remapping,
|
|
uint max_selector_value,
|
|
const uint8* pTo_linear,
|
|
uint trial_index)
|
|
{
|
|
trial_index;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("pack_selectors: %u", trial_index);
|
|
#endif
|
|
|
|
crnlib::vector<dxt_hc::selectors> remapped_selectors(selectors.size());
|
|
|
|
for (uint i = 0; i < selectors.size(); i++)
|
|
remapped_selectors[remapping[i]] = selectors[i];
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
image_u8 residual_image(16, selectors.size());;
|
|
image_u8 selector_image(16, selectors.size());;
|
|
#endif
|
|
|
|
crnlib::vector<uint> residual_syms;
|
|
residual_syms.reserve(selectors.size() * 8);
|
|
|
|
const uint num_baised_selector_values = (max_selector_value * 2 + 1);
|
|
symbol_histogram hist(num_baised_selector_values * num_baised_selector_values);
|
|
|
|
dxt_hc::selectors prev_selectors;
|
|
utils::zero_object(prev_selectors);
|
|
int total_residuals = 0;
|
|
for (uint selector_index = 0; selector_index < selectors.size(); selector_index++)
|
|
{
|
|
const dxt_hc::selectors& s = remapped_selectors[selector_index];
|
|
|
|
uint prev_sym = 0;
|
|
for (uint i = 0; i < 16; i++)
|
|
{
|
|
int p = pTo_linear[crnlib_assert_range_incl<uint>(prev_selectors.get_by_index(i), max_selector_value)];
|
|
|
|
int r = pTo_linear[crnlib_assert_range_incl<uint>(s.get_by_index(i), max_selector_value)] - p;
|
|
|
|
total_residuals += r*r;
|
|
|
|
uint sym = r + max_selector_value;
|
|
|
|
CRNLIB_ASSERT(sym < num_baised_selector_values);
|
|
if (i & 1)
|
|
{
|
|
uint paired_sym = (sym * num_baised_selector_values) + prev_sym;
|
|
residual_syms.push_back(paired_sym);
|
|
hist.inc_freq(paired_sym);
|
|
}
|
|
else
|
|
prev_sym = sym;
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
selector_image(i, selector_index) = (pTo_linear[crnlib_assert_range_incl<uint>(s.get_by_index(i), max_selector_value)] * 255) / max_selector_value;
|
|
residual_image(i, selector_index) = sym;
|
|
#endif
|
|
}
|
|
|
|
prev_selectors = s;
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total selector endpoint residuals: %u", total_residuals);
|
|
#endif
|
|
|
|
if (selector_indices.size() > 1)
|
|
{
|
|
uint prev_index = remapping[selector_indices[1]];
|
|
int64 total_delta = 0;
|
|
for (uint i = 1; i < selector_indices.size(); i++)
|
|
{
|
|
uint cur_index = remapping[selector_indices[i]];
|
|
int delta = cur_index - prev_index;
|
|
prev_index = cur_index;
|
|
total_delta += delta * delta;
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total selector index delta: " CRNLIB_INT64_FORMAT_SPECIFIER, total_delta);
|
|
#endif
|
|
}
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
image_utils::write_to_file(dynamic_string(cVarArg, "selectors_%u_%u.tga", trial_index, max_selector_value).get_ptr(), selector_image);
|
|
image_utils::write_to_file(dynamic_string(cVarArg, "selector_residuals_%u_%u.tga", trial_index, max_selector_value).get_ptr(), residual_image);
|
|
#endif
|
|
|
|
static_huffman_data_model residual_dm;
|
|
|
|
symbol_codec codec;
|
|
codec.start_encoding(1024*1024);
|
|
|
|
// Transmit residuals
|
|
if (!residual_dm.init(true, hist, 15))
|
|
return false;
|
|
|
|
if (!codec.encode_transmit_static_huffman_data_model(residual_dm, false))
|
|
return false;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Wrote %u bits for selector residual Huffman tables", codec.encode_get_total_bits_written());
|
|
#endif
|
|
|
|
uint start_bits = codec.encode_get_total_bits_written();
|
|
start_bits;
|
|
|
|
for (uint i = 0; i < residual_syms.size(); i++)
|
|
{
|
|
const uint sym = residual_syms[i];
|
|
codec.encode(sym, residual_dm);
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Wrote %u bits for selector residuals", codec.encode_get_total_bits_written() - start_bits);
|
|
#endif
|
|
|
|
codec.stop_encoding(false);
|
|
|
|
packed_data.swap(codec.get_encoding_buf());
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
{
|
|
console::debug("Wrote a total of %u bits for selector codebook", codec.encode_get_total_bits_written());
|
|
|
|
console::debug("Wrote %f bits per each selector codebook entry", packed_data.size() * 8.0f / selectors.size());
|
|
}
|
|
#endif
|
|
|
|
return true;
|
|
}
|
|
|
|
bool crn_comp::pack_chunks(
|
|
uint first_chunk, uint num_chunks,
|
|
bool clear_histograms,
|
|
symbol_codec* pCodec,
|
|
const crnlib::vector<uint>* pColor_endpoint_remap,
|
|
const crnlib::vector<uint>* pColor_selector_remap,
|
|
const crnlib::vector<uint>* pAlpha_endpoint_remap,
|
|
const crnlib::vector<uint>* pAlpha_selector_remap)
|
|
{
|
|
if (!pCodec)
|
|
{
|
|
m_chunk_encoding_hist.resize(1 << (3 * cEncodingMapNumChunksPerCode));
|
|
if (clear_histograms)
|
|
m_chunk_encoding_hist.set_all(0);
|
|
|
|
if (pColor_endpoint_remap)
|
|
{
|
|
CRNLIB_ASSERT(pColor_endpoint_remap->size() == m_hvq.get_color_endpoint_codebook_size());
|
|
m_endpoint_index_hist[0].resize(pColor_endpoint_remap->size());
|
|
if (clear_histograms)
|
|
m_endpoint_index_hist[0].set_all(0);
|
|
}
|
|
|
|
if (pColor_selector_remap)
|
|
{
|
|
CRNLIB_ASSERT(pColor_selector_remap->size() == m_hvq.get_color_selector_codebook_size());
|
|
m_selector_index_hist[0].resize(pColor_selector_remap->size());
|
|
if (clear_histograms)
|
|
m_selector_index_hist[0].set_all(0);
|
|
}
|
|
|
|
if (pAlpha_endpoint_remap)
|
|
{
|
|
CRNLIB_ASSERT(pAlpha_endpoint_remap->size() == m_hvq.get_alpha_endpoint_codebook_size());
|
|
m_endpoint_index_hist[1].resize(pAlpha_endpoint_remap->size());
|
|
if (clear_histograms)
|
|
m_endpoint_index_hist[1].set_all(0);
|
|
}
|
|
|
|
if (pAlpha_selector_remap)
|
|
{
|
|
CRNLIB_ASSERT(pAlpha_selector_remap->size() == m_hvq.get_alpha_selector_codebook_size());
|
|
m_selector_index_hist[1].resize(pAlpha_selector_remap->size());
|
|
if (clear_histograms)
|
|
m_selector_index_hist[1].set_all(0);
|
|
}
|
|
}
|
|
|
|
uint prev_endpoint_index[cNumComps];
|
|
utils::zero_object(prev_endpoint_index);
|
|
|
|
uint prev_selector_index[cNumComps];
|
|
utils::zero_object(prev_selector_index);
|
|
|
|
uint num_encodings_left = 0;
|
|
|
|
for (uint chunk_index = first_chunk; chunk_index < (first_chunk + num_chunks); chunk_index++)
|
|
{
|
|
if (!num_encodings_left)
|
|
{
|
|
uint index = 0;
|
|
for (uint i = 0; i < cEncodingMapNumChunksPerCode; i++)
|
|
if ((chunk_index + i) < (first_chunk + num_chunks))
|
|
index |= (m_hvq.get_chunk_encoding(chunk_index + i).m_encoding_index << (i * 3));
|
|
|
|
if (pCodec)
|
|
pCodec->encode(index, m_chunk_encoding_dm);
|
|
else
|
|
m_chunk_encoding_hist.inc_freq(index);
|
|
|
|
num_encodings_left = cEncodingMapNumChunksPerCode;
|
|
}
|
|
num_encodings_left--;
|
|
|
|
const dxt_hc::chunk_encoding& encoding = m_hvq.get_chunk_encoding(chunk_index);
|
|
const chunk_detail& details = m_chunk_details[chunk_index];
|
|
|
|
const uint comp_order[3] = { cAlpha0, cAlpha1, cColor };
|
|
for (uint c = 0; c < 3; c++)
|
|
{
|
|
const uint comp_index = comp_order[c];
|
|
if (!m_has_comp[comp_index])
|
|
continue;
|
|
|
|
// endpoints
|
|
if (comp_index == cColor)
|
|
{
|
|
if (pColor_endpoint_remap)
|
|
{
|
|
for (uint i = 0; i < encoding.m_num_tiles; i++)
|
|
{
|
|
uint cur_endpoint_index = (*pColor_endpoint_remap)[ m_endpoint_indices[cColor][details.m_first_endpoint_index + i] ];
|
|
int endpoint_delta = cur_endpoint_index - prev_endpoint_index[cColor];
|
|
|
|
int sym = endpoint_delta;
|
|
if (sym < 0)
|
|
sym += pColor_endpoint_remap->size();
|
|
|
|
CRNLIB_ASSERT(sym >= 0 && sym < (int)pColor_endpoint_remap->size());
|
|
|
|
if (!pCodec)
|
|
m_endpoint_index_hist[cColor].inc_freq(sym);
|
|
else
|
|
pCodec->encode(sym, m_endpoint_index_dm[0]);
|
|
|
|
prev_endpoint_index[cColor] = cur_endpoint_index;
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
if (pAlpha_endpoint_remap)
|
|
{
|
|
for (uint i = 0; i < encoding.m_num_tiles; i++)
|
|
{
|
|
uint cur_endpoint_index = (*pAlpha_endpoint_remap)[m_endpoint_indices[comp_index][details.m_first_endpoint_index + i]];
|
|
int endpoint_delta = cur_endpoint_index - prev_endpoint_index[comp_index];
|
|
|
|
int sym = endpoint_delta;
|
|
if (sym < 0)
|
|
sym += pAlpha_endpoint_remap->size();
|
|
|
|
CRNLIB_ASSERT(sym >= 0 && sym < (int)pAlpha_endpoint_remap->size());
|
|
|
|
if (!pCodec)
|
|
m_endpoint_index_hist[1].inc_freq(sym);
|
|
else
|
|
pCodec->encode(sym, m_endpoint_index_dm[1]);
|
|
|
|
prev_endpoint_index[comp_index] = cur_endpoint_index;
|
|
}
|
|
}
|
|
}
|
|
} // c
|
|
|
|
// selectors
|
|
for (uint y = 0; y < 2; y++)
|
|
{
|
|
for (uint x = 0; x < 2; x++)
|
|
{
|
|
for (uint c = 0; c < 3; c++)
|
|
{
|
|
const uint comp_index = comp_order[c];
|
|
if (!m_has_comp[comp_index])
|
|
continue;
|
|
|
|
if (comp_index == cColor)
|
|
{
|
|
if (pColor_selector_remap)
|
|
{
|
|
uint cur_selector_index = (*pColor_selector_remap)[ m_selector_indices[cColor][details.m_first_selector_index + x + y * 2] ];
|
|
int selector_delta = cur_selector_index - prev_selector_index[cColor];
|
|
|
|
int sym = selector_delta;
|
|
if (sym < 0)
|
|
sym += pColor_selector_remap->size();
|
|
|
|
CRNLIB_ASSERT(sym >= 0 && sym < (int)pColor_selector_remap->size());
|
|
|
|
if (!pCodec)
|
|
m_selector_index_hist[cColor].inc_freq(sym);
|
|
else
|
|
pCodec->encode(sym, m_selector_index_dm[cColor]);
|
|
|
|
prev_selector_index[cColor] = cur_selector_index;
|
|
}
|
|
}
|
|
else if (pAlpha_selector_remap)
|
|
{
|
|
uint cur_selector_index = (*pAlpha_selector_remap)[ m_selector_indices[comp_index][details.m_first_selector_index + x + y * 2] ];
|
|
int selector_delta = cur_selector_index - prev_selector_index[comp_index];
|
|
|
|
int sym = selector_delta;
|
|
if (sym < 0)
|
|
sym += pAlpha_selector_remap->size();
|
|
|
|
CRNLIB_ASSERT(sym >= 0 && sym < (int)pAlpha_selector_remap->size());
|
|
|
|
if (!pCodec)
|
|
m_selector_index_hist[1].inc_freq(sym);
|
|
else
|
|
pCodec->encode(sym, m_selector_index_dm[1]);
|
|
|
|
prev_selector_index[comp_index] = cur_selector_index;
|
|
}
|
|
|
|
} // c
|
|
|
|
} // x
|
|
} // y
|
|
|
|
} // chunk_index
|
|
|
|
return true;
|
|
}
|
|
|
|
bool crn_comp::pack_chunks_simulation(
|
|
uint first_chunk, uint num_chunks,
|
|
uint& total_bits,
|
|
const crnlib::vector<uint>* pColor_endpoint_remap,
|
|
const crnlib::vector<uint>* pColor_selector_remap,
|
|
const crnlib::vector<uint>* pAlpha_endpoint_remap,
|
|
const crnlib::vector<uint>* pAlpha_selector_remap)
|
|
{
|
|
if (!pack_chunks(first_chunk, num_chunks, true, NULL, pColor_endpoint_remap, pColor_selector_remap, pAlpha_endpoint_remap, pAlpha_selector_remap))
|
|
return false;
|
|
|
|
symbol_codec codec;
|
|
codec.start_encoding(2*1024*1024);
|
|
codec.encode_enable_simulation(true);
|
|
|
|
m_chunk_encoding_dm.init(true, m_chunk_encoding_hist, 16);
|
|
|
|
for (uint i = 0; i < 2; i++)
|
|
{
|
|
if (m_endpoint_index_hist[i].size())
|
|
{
|
|
m_endpoint_index_dm[i].init(true, m_endpoint_index_hist[i], 16);
|
|
|
|
codec.encode_transmit_static_huffman_data_model(m_endpoint_index_dm[i], false);
|
|
}
|
|
|
|
if (m_selector_index_hist[i].size())
|
|
{
|
|
m_selector_index_dm[i].init(true, m_selector_index_hist[i], 16);
|
|
|
|
codec.encode_transmit_static_huffman_data_model(m_selector_index_dm[i], false);
|
|
}
|
|
}
|
|
|
|
if (!pack_chunks(first_chunk, num_chunks, false, &codec, pColor_endpoint_remap, pColor_selector_remap, pAlpha_endpoint_remap, pAlpha_selector_remap))
|
|
return false;
|
|
|
|
codec.stop_encoding(false);
|
|
|
|
total_bits = codec.encode_get_total_bits_written();
|
|
|
|
return true;
|
|
}
|
|
|
|
void crn_comp::append_vec(crnlib::vector<uint8>& a, const void* p, uint size)
|
|
{
|
|
if (size)
|
|
{
|
|
uint ofs = a.size();
|
|
a.resize(ofs + size);
|
|
|
|
memcpy(&a[ofs], p, size);
|
|
}
|
|
}
|
|
|
|
void crn_comp::append_vec(crnlib::vector<uint8>& a, const crnlib::vector<uint8>& b)
|
|
{
|
|
if (!b.empty())
|
|
{
|
|
uint ofs = a.size();
|
|
a.resize(ofs + b.size());
|
|
|
|
memcpy(&a[ofs], &b[0], b.size());
|
|
}
|
|
}
|
|
|
|
#if 0
|
|
bool crn_comp::init_chunk_encoding_dm()
|
|
{
|
|
symbol_histogram hist(1 << (3 * cEncodingMapNumChunksPerCode));
|
|
|
|
for (uint chunk_index = 0; chunk_index < m_hvq.get_num_chunks(); chunk_index += cEncodingMapNumChunksPerCode)
|
|
{
|
|
uint index = 0;
|
|
for (uint i = 0; i < cEncodingMapNumChunksPerCode; i++)
|
|
{
|
|
if ((chunk_index + i) >= m_hvq.get_num_chunks())
|
|
break;
|
|
const dxt_hc::chunk_encoding& encoding = m_hvq.get_chunk_encoding(chunk_index + i);
|
|
|
|
index |= (encoding.m_encoding_index << (i * 3));
|
|
}
|
|
|
|
hist.inc_freq(index);
|
|
}
|
|
|
|
if (!m_chunk_encoding_dm.init(true, hist, 16))
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
#endif
|
|
|
|
bool crn_comp::alias_images()
|
|
{
|
|
for (uint face_index = 0; face_index < m_pParams->m_faces; face_index++)
|
|
{
|
|
for (uint level_index = 0; level_index < m_pParams->m_levels; level_index++)
|
|
{
|
|
const uint width = math::maximum(1U, m_pParams->m_width >> level_index);
|
|
const uint height = math::maximum(1U, m_pParams->m_height >> level_index);
|
|
|
|
if (!m_pParams->m_pImages[face_index][level_index])
|
|
return false;
|
|
|
|
m_images[face_index][level_index].alias((color_quad_u8*)m_pParams->m_pImages[face_index][level_index], width, height);
|
|
}
|
|
}
|
|
|
|
image_utils::conversion_type conv_type = image_utils::get_image_conversion_type_from_crn_format((crn_format)m_pParams->m_format);
|
|
if (conv_type != image_utils::cConversion_Invalid)
|
|
{
|
|
for (uint face_index = 0; face_index < m_pParams->m_faces; face_index++)
|
|
{
|
|
for (uint level_index = 0; level_index < m_pParams->m_levels; level_index++)
|
|
{
|
|
image_u8 cooked_image(m_images[face_index][level_index]);
|
|
|
|
image_utils::convert_image(cooked_image, conv_type);
|
|
|
|
m_images[face_index][level_index].swap(cooked_image);
|
|
}
|
|
}
|
|
}
|
|
|
|
m_mip_groups.clear();
|
|
m_mip_groups.resize(m_pParams->m_levels);
|
|
|
|
utils::zero_object(m_levels);
|
|
|
|
uint mip_group = 0;
|
|
uint chunk_index = 0;
|
|
uint mip_group_chunk_index = 0; (void)mip_group_chunk_index;
|
|
for (uint level_index = 0; level_index < m_pParams->m_levels; level_index++)
|
|
{
|
|
const uint width = math::maximum(1U, m_pParams->m_width >> level_index);
|
|
const uint height = math::maximum(1U, m_pParams->m_height >> level_index);
|
|
const uint chunk_width = math::align_up_value(width, cChunkPixelWidth) / cChunkPixelWidth;
|
|
const uint chunk_height = math::align_up_value(height, cChunkPixelHeight) / cChunkPixelHeight;
|
|
const uint num_chunks = m_pParams->m_faces * chunk_width * chunk_height;
|
|
|
|
m_mip_groups[mip_group].m_first_chunk = chunk_index;
|
|
mip_group_chunk_index = 0;
|
|
|
|
m_mip_groups[mip_group].m_num_chunks += num_chunks;
|
|
|
|
m_levels[level_index].m_width = width;
|
|
m_levels[level_index].m_height = height;
|
|
m_levels[level_index].m_chunk_width = chunk_width;
|
|
m_levels[level_index].m_chunk_height = chunk_height;
|
|
m_levels[level_index].m_first_chunk = chunk_index;
|
|
m_levels[level_index].m_num_chunks = num_chunks;
|
|
m_levels[level_index].m_group_index = mip_group;
|
|
m_levels[level_index].m_group_first_chunk = 0;
|
|
|
|
chunk_index += num_chunks;
|
|
|
|
mip_group++;
|
|
}
|
|
|
|
m_total_chunks = chunk_index;
|
|
|
|
return true;
|
|
}
|
|
|
|
void crn_comp::append_chunks(const image_u8& img, uint num_chunks_x, uint num_chunks_y, dxt_hc::pixel_chunk_vec& chunks, float weight)
|
|
{
|
|
for (uint y = 0; y < num_chunks_y; y++)
|
|
{
|
|
int x_start = 0;
|
|
int x_end = num_chunks_x;
|
|
int x_dir = 1;
|
|
if (y & 1)
|
|
{
|
|
x_start = num_chunks_x - 1;
|
|
x_end = -1;
|
|
x_dir = -1;
|
|
}
|
|
|
|
for (int x = x_start; x != x_end; x += x_dir)
|
|
{
|
|
chunks.resize(chunks.size() + 1);
|
|
|
|
dxt_hc::pixel_chunk& chunk = chunks.back();
|
|
chunk.m_weight = weight;
|
|
|
|
for (uint cy = 0; cy < cChunkPixelHeight; cy++)
|
|
{
|
|
uint py = y * cChunkPixelHeight + cy;
|
|
py = math::minimum(py, img.get_height() - 1);
|
|
|
|
for (uint cx = 0; cx < cChunkPixelWidth; cx++)
|
|
{
|
|
uint px = x * cChunkPixelWidth + cx;
|
|
px = math::minimum(px, img.get_width() - 1);
|
|
|
|
chunk(cx, cy) = img(px, py);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void crn_comp::create_chunks()
|
|
{
|
|
m_chunks.reserve(m_total_chunks);
|
|
m_chunks.resize(0);
|
|
|
|
for (uint level = 0; level < m_pParams->m_levels; level++)
|
|
{
|
|
for (uint face = 0; face < m_pParams->m_faces; face++)
|
|
{
|
|
if (!face)
|
|
{
|
|
CRNLIB_ASSERT(m_levels[level].m_first_chunk == m_chunks.size());
|
|
}
|
|
|
|
float mip_weight = math::minimum(12.0f, powf( 1.3f, static_cast<float>(level) ) );
|
|
//float mip_weight = 1.0f;
|
|
|
|
append_chunks(m_images[face][level], m_levels[level].m_chunk_width, m_levels[level].m_chunk_height, m_chunks, mip_weight);
|
|
}
|
|
}
|
|
|
|
CRNLIB_ASSERT(m_chunks.size() == m_total_chunks);
|
|
}
|
|
|
|
void crn_comp::clear()
|
|
{
|
|
m_pParams = NULL;
|
|
|
|
for (uint f = 0; f < cCRNMaxFaces; f++)
|
|
for (uint l = 0; l < cCRNMaxLevels; l++)
|
|
m_images[f][l].clear();
|
|
|
|
utils::zero_object(m_levels);
|
|
|
|
m_mip_groups.clear();
|
|
|
|
utils::zero_object(m_has_comp);
|
|
|
|
m_chunk_details.clear();
|
|
|
|
for (uint i = 0; i < cNumComps; i++)
|
|
{
|
|
m_endpoint_indices[i].clear();
|
|
m_selector_indices[i].clear();
|
|
}
|
|
|
|
m_total_chunks = 0;
|
|
|
|
m_chunks.clear();
|
|
|
|
utils::zero_object(m_crn_header);
|
|
|
|
m_comp_data.clear();
|
|
|
|
m_hvq.clear();
|
|
|
|
m_chunk_encoding_hist.clear();
|
|
m_chunk_encoding_dm.clear();
|
|
for (uint i = 0; i < 2; i++)
|
|
{
|
|
m_endpoint_index_hist[i].clear();
|
|
m_endpoint_index_dm[i].clear();
|
|
m_selector_index_hist[i].clear();
|
|
m_selector_index_dm[i].clear();
|
|
}
|
|
|
|
for (uint i = 0; i < cCRNMaxLevels; i++)
|
|
m_packed_chunks[i].clear();
|
|
|
|
m_packed_data_models.clear();
|
|
|
|
m_packed_color_endpoints.clear();
|
|
m_packed_color_selectors.clear();
|
|
m_packed_alpha_endpoints.clear();
|
|
m_packed_alpha_selectors.clear();
|
|
}
|
|
|
|
bool crn_comp::quantize_chunks()
|
|
{
|
|
dxt_hc::params params;
|
|
|
|
params.m_adaptive_tile_alpha_psnr_derating = m_pParams->m_crn_adaptive_tile_alpha_psnr_derating;
|
|
params.m_adaptive_tile_color_psnr_derating = m_pParams->m_crn_adaptive_tile_color_psnr_derating;
|
|
|
|
if (m_pParams->m_flags & cCRNCompFlagManualPaletteSizes)
|
|
{
|
|
params.m_color_endpoint_codebook_size = math::clamp<int>(m_pParams->m_crn_color_endpoint_palette_size, cCRNMinPaletteSize, cCRNMaxPaletteSize);
|
|
params.m_color_selector_codebook_size = math::clamp<int>(m_pParams->m_crn_color_selector_palette_size, cCRNMinPaletteSize, cCRNMaxPaletteSize);
|
|
params.m_alpha_endpoint_codebook_size = math::clamp<int>(m_pParams->m_crn_alpha_endpoint_palette_size, cCRNMinPaletteSize, cCRNMaxPaletteSize);
|
|
params.m_alpha_selector_codebook_size = math::clamp<int>(m_pParams->m_crn_alpha_selector_palette_size, cCRNMinPaletteSize, cCRNMaxPaletteSize);
|
|
}
|
|
else
|
|
{
|
|
uint max_codebook_entries = ((m_pParams->m_width + 3) / 4) * ((m_pParams->m_height + 3) / 4);
|
|
|
|
max_codebook_entries = math::clamp<uint>(max_codebook_entries, cCRNMinPaletteSize, cCRNMaxPaletteSize);
|
|
|
|
float quality = math::clamp<float>((float)m_pParams->m_quality_level / cCRNMaxQualityLevel, 0.0f, 1.0f);
|
|
float color_quality_power_mul = 1.0f;
|
|
float alpha_quality_power_mul = 1.0f;
|
|
if (m_pParams->m_format == cCRNFmtDXT5_CCxY)
|
|
{
|
|
color_quality_power_mul = 3.5f;
|
|
alpha_quality_power_mul = .35f;
|
|
params.m_adaptive_tile_color_psnr_derating = 5.0f;
|
|
}
|
|
else if (m_pParams->m_format == cCRNFmtDXT5)
|
|
color_quality_power_mul = .75f;
|
|
|
|
float color_endpoint_quality = powf(quality, 1.8f * color_quality_power_mul);
|
|
float color_selector_quality = powf(quality, 1.65f * color_quality_power_mul);
|
|
params.m_color_endpoint_codebook_size = math::clamp<uint>(math::float_to_uint(.5f + math::lerp<float>(math::maximum<float>(64, cCRNMinPaletteSize), (float)max_codebook_entries, color_endpoint_quality)), cCRNMinPaletteSize, cCRNMaxPaletteSize);
|
|
params.m_color_selector_codebook_size = math::clamp<uint>(math::float_to_uint(.5f + math::lerp<float>(math::maximum<float>(96, cCRNMinPaletteSize), (float)max_codebook_entries, color_selector_quality)), cCRNMinPaletteSize, cCRNMaxPaletteSize);
|
|
|
|
float alpha_endpoint_quality = powf(quality, 2.1f * alpha_quality_power_mul);
|
|
float alpha_selector_quality = powf(quality, 1.65f * alpha_quality_power_mul);
|
|
params.m_alpha_endpoint_codebook_size = math::clamp<uint>(math::float_to_uint(.5f + math::lerp<float>(math::maximum<float>(24, cCRNMinPaletteSize), (float)max_codebook_entries, alpha_endpoint_quality)), cCRNMinPaletteSize, cCRNMaxPaletteSize);;
|
|
params.m_alpha_selector_codebook_size = math::clamp<uint>(math::float_to_uint(.5f + math::lerp<float>(math::maximum<float>(48, cCRNMinPaletteSize), (float)max_codebook_entries, alpha_selector_quality)), cCRNMinPaletteSize, cCRNMaxPaletteSize);;
|
|
}
|
|
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
{
|
|
console::debug("Color endpoints: %u", params.m_color_endpoint_codebook_size);
|
|
console::debug("Color selectors: %u", params.m_color_selector_codebook_size);
|
|
console::debug("Alpha endpoints: %u", params.m_alpha_endpoint_codebook_size);
|
|
console::debug("Alpha selectors: %u", params.m_alpha_selector_codebook_size);
|
|
}
|
|
|
|
params.m_hierarchical = (m_pParams->m_flags & cCRNCompFlagHierarchical) != 0;
|
|
params.m_perceptual = (m_pParams->m_flags & cCRNCompFlagPerceptual) != 0;
|
|
|
|
params.m_pProgress_func = m_pParams->m_pProgress_func;
|
|
params.m_pProgress_func_data = m_pParams->m_pProgress_func_data;
|
|
|
|
switch (m_pParams->m_format)
|
|
{
|
|
case cCRNFmtDXT1:
|
|
{
|
|
params.m_format = cDXT1;
|
|
m_has_comp[cColor] = true;
|
|
break;
|
|
}
|
|
case cCRNFmtDXT3:
|
|
{
|
|
m_has_comp[cAlpha0] = true;
|
|
return false;
|
|
}
|
|
case cCRNFmtDXT5:
|
|
{
|
|
params.m_format = cDXT5;
|
|
params.m_alpha_component_indices[0] = m_pParams->m_alpha_component;
|
|
m_has_comp[cColor] = true;
|
|
m_has_comp[cAlpha0] = true;
|
|
break;
|
|
}
|
|
case cCRNFmtDXT5_CCxY:
|
|
{
|
|
params.m_format = cDXT5;
|
|
params.m_alpha_component_indices[0] = 3;
|
|
m_has_comp[cColor] = true;
|
|
m_has_comp[cAlpha0] = true;
|
|
params.m_perceptual = false;
|
|
|
|
//params.m_adaptive_tile_color_alpha_weighting_ratio = 1.0f;
|
|
params.m_adaptive_tile_color_alpha_weighting_ratio = 1.5f;
|
|
break;
|
|
}
|
|
case cCRNFmtDXT5_xGBR:
|
|
case cCRNFmtDXT5_AGBR:
|
|
case cCRNFmtDXT5_xGxR:
|
|
{
|
|
params.m_format = cDXT5;
|
|
params.m_alpha_component_indices[0] = 3;
|
|
m_has_comp[cColor] = true;
|
|
m_has_comp[cAlpha0] = true;
|
|
params.m_perceptual = false;
|
|
break;
|
|
}
|
|
case cCRNFmtDXN_XY:
|
|
{
|
|
params.m_format = cDXN_XY;
|
|
params.m_alpha_component_indices[0] = 0;
|
|
params.m_alpha_component_indices[1] = 1;
|
|
m_has_comp[cAlpha0] = true;
|
|
m_has_comp[cAlpha1] = true;
|
|
params.m_perceptual = false;
|
|
break;
|
|
}
|
|
case cCRNFmtDXN_YX:
|
|
{
|
|
params.m_format = cDXN_YX;
|
|
params.m_alpha_component_indices[0] = 1;
|
|
params.m_alpha_component_indices[1] = 0;
|
|
m_has_comp[cAlpha0] = true;
|
|
m_has_comp[cAlpha1] = true;
|
|
params.m_perceptual = false;
|
|
break;
|
|
}
|
|
case cCRNFmtDXT5A:
|
|
{
|
|
params.m_format = cDXT5A;
|
|
params.m_alpha_component_indices[0] = m_pParams->m_alpha_component;
|
|
m_has_comp[cAlpha0] = true;
|
|
params.m_perceptual = false;
|
|
break;
|
|
}
|
|
case cCRNFmtETC1:
|
|
{
|
|
console::warning("crn_comp::quantize_chunks: This class does not support ETC1");
|
|
return false;
|
|
}
|
|
default:
|
|
{
|
|
return false;
|
|
}
|
|
}
|
|
params.m_debugging = (m_pParams->m_flags & cCRNCompFlagDebugging) != 0;
|
|
|
|
params.m_num_levels = m_pParams->m_levels;
|
|
for (uint i = 0; i < m_pParams->m_levels; i++)
|
|
{
|
|
params.m_levels[i].m_first_chunk = m_levels[i].m_first_chunk;
|
|
params.m_levels[i].m_num_chunks = m_levels[i].m_num_chunks;
|
|
}
|
|
|
|
if (!m_hvq.compress(params, m_total_chunks, &m_chunks[0], m_task_pool))
|
|
return false;
|
|
|
|
#if CRNLIB_CREATE_DEBUG_IMAGES
|
|
if (params.m_debugging)
|
|
{
|
|
const dxt_hc::pixel_chunk_vec& pixel_chunks = m_hvq.get_compressed_chunk_pixels_final();
|
|
|
|
image_u8 img;
|
|
dxt_hc::create_debug_image_from_chunks((m_pParams->m_width+7)>>3, (m_pParams->m_height+7)>>3, pixel_chunks, &m_hvq.get_chunk_encoding_vec(), img, true, -1);
|
|
image_utils::write_to_file("quantized_chunks.tga", img);
|
|
}
|
|
#endif
|
|
|
|
return true;
|
|
}
|
|
|
|
void crn_comp::create_chunk_indices()
|
|
{
|
|
m_chunk_details.resize(m_total_chunks);
|
|
|
|
for (uint i = 0; i < cNumComps; i++)
|
|
{
|
|
m_endpoint_indices[i].clear();
|
|
m_selector_indices[i].clear();
|
|
}
|
|
|
|
for (uint chunk_index = 0; chunk_index < m_total_chunks; chunk_index++)
|
|
{
|
|
const dxt_hc::chunk_encoding& chunk_encoding = m_hvq.get_chunk_encoding(chunk_index);
|
|
|
|
for (uint i = 0; i < cNumComps; i++)
|
|
{
|
|
if (m_has_comp[i])
|
|
{
|
|
m_chunk_details[chunk_index].m_first_endpoint_index = m_endpoint_indices[i].size();
|
|
m_chunk_details[chunk_index].m_first_selector_index = m_selector_indices[i].size();
|
|
break;
|
|
}
|
|
}
|
|
|
|
for (uint i = 0; i < cNumComps; i++)
|
|
{
|
|
if (!m_has_comp[i])
|
|
continue;
|
|
|
|
for (uint tile_index = 0; tile_index < chunk_encoding.m_num_tiles; tile_index++)
|
|
m_endpoint_indices[i].push_back(chunk_encoding.m_endpoint_indices[i][tile_index]);
|
|
|
|
for (uint y = 0; y < cChunkBlockHeight; y++)
|
|
for (uint x = 0; x < cChunkBlockWidth; x++)
|
|
m_selector_indices[i].push_back(chunk_encoding.m_selector_indices[i][y][x]);
|
|
}
|
|
}
|
|
}
|
|
|
|
struct optimize_color_endpoint_codebook_params
|
|
{
|
|
crnlib::vector<uint>* m_pTrial_color_endpoint_remap;
|
|
uint m_iter_index;
|
|
uint m_max_iter_index;
|
|
};
|
|
|
|
void crn_comp::optimize_color_endpoint_codebook_task(uint64 data, void* pData_ptr)
|
|
{
|
|
data;
|
|
optimize_color_endpoint_codebook_params* pParams = reinterpret_cast<optimize_color_endpoint_codebook_params*>(pData_ptr);
|
|
|
|
if (pParams->m_iter_index == pParams->m_max_iter_index)
|
|
{
|
|
sort_color_endpoint_codebook(*pParams->m_pTrial_color_endpoint_remap, m_hvq.get_color_endpoint_vec());
|
|
}
|
|
else
|
|
{
|
|
float f = pParams->m_iter_index / static_cast<float>(pParams->m_max_iter_index - 1);
|
|
|
|
create_zeng_reorder_table(
|
|
m_hvq.get_color_endpoint_codebook_size(),
|
|
m_endpoint_indices[cColor].size(),
|
|
&m_endpoint_indices[cColor][0],
|
|
*pParams->m_pTrial_color_endpoint_remap,
|
|
pParams->m_iter_index ? color_endpoint_similarity_func : NULL,
|
|
&m_hvq,
|
|
f);
|
|
}
|
|
|
|
crnlib_delete(pParams);
|
|
}
|
|
|
|
bool crn_comp::optimize_color_endpoint_codebook(crnlib::vector<uint>& remapping)
|
|
{
|
|
if (m_pParams->m_flags & cCRNCompFlagQuick)
|
|
{
|
|
remapping.resize(m_hvq.get_color_endpoint_vec().size());
|
|
for (uint i = 0; i < m_hvq.get_color_endpoint_vec().size(); i++)
|
|
remapping[i] = i;
|
|
|
|
if (!pack_color_endpoints(m_packed_color_endpoints, remapping, m_endpoint_indices[cColor], 0))
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
const uint cMaxEndpointRemapIters = 3;
|
|
|
|
uint best_bits = UINT_MAX;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("----- Begin optimization of color endpoint codebook");
|
|
#endif
|
|
|
|
crnlib::vector<uint> trial_color_endpoint_remaps[cMaxEndpointRemapIters + 1];
|
|
|
|
for (uint i = 0; i <= cMaxEndpointRemapIters; i++)
|
|
{
|
|
optimize_color_endpoint_codebook_params* pParams = crnlib_new<optimize_color_endpoint_codebook_params>();
|
|
pParams->m_iter_index = i;
|
|
pParams->m_max_iter_index = cMaxEndpointRemapIters;
|
|
pParams->m_pTrial_color_endpoint_remap = &trial_color_endpoint_remaps[i];
|
|
|
|
m_task_pool.queue_object_task(this, &crn_comp::optimize_color_endpoint_codebook_task, 0, pParams);
|
|
}
|
|
|
|
m_task_pool.join();
|
|
|
|
for (uint i = 0; i <= cMaxEndpointRemapIters; i++)
|
|
{
|
|
if (!update_progress(20, i, cMaxEndpointRemapIters+1))
|
|
return false;
|
|
|
|
crnlib::vector<uint>& trial_color_endpoint_remap = trial_color_endpoint_remaps[i];
|
|
|
|
crnlib::vector<uint8> packed_data;
|
|
if (!pack_color_endpoints(packed_data, trial_color_endpoint_remap, m_endpoint_indices[cColor], i))
|
|
return false;
|
|
|
|
uint total_packed_chunk_bits;
|
|
if (!pack_chunks_simulation(0, m_total_chunks, total_packed_chunk_bits, &trial_color_endpoint_remap, NULL, NULL, NULL))
|
|
return false;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Pack chunks simulation: %u bits", total_packed_chunk_bits);
|
|
#endif
|
|
|
|
uint total_bits = packed_data.size() * 8 + total_packed_chunk_bits;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total bits: %u", total_bits);
|
|
#endif
|
|
|
|
if (total_bits < best_bits)
|
|
{
|
|
m_packed_color_endpoints.swap(packed_data);
|
|
remapping.swap(trial_color_endpoint_remap);
|
|
best_bits = total_bits;
|
|
}
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("End optimization of color endpoint codebook");
|
|
#endif
|
|
|
|
return true;
|
|
}
|
|
|
|
struct optimize_color_selector_codebook_params
|
|
{
|
|
crnlib::vector<uint>* m_pTrial_color_selector_remap;
|
|
uint m_iter_index;
|
|
uint m_max_iter_index;
|
|
};
|
|
|
|
void crn_comp::optimize_color_selector_codebook_task(uint64 data, void* pData_ptr)
|
|
{
|
|
data;
|
|
optimize_color_selector_codebook_params* pParams = reinterpret_cast<optimize_color_selector_codebook_params*>(pData_ptr);
|
|
|
|
if (pParams->m_iter_index == pParams->m_max_iter_index)
|
|
{
|
|
sort_selector_codebook(*pParams->m_pTrial_color_selector_remap, m_hvq.get_color_selectors_vec(), g_dxt1_to_linear);
|
|
}
|
|
else
|
|
{
|
|
float f = pParams->m_iter_index / static_cast<float>(pParams->m_max_iter_index - 1);
|
|
create_zeng_reorder_table(
|
|
m_hvq.get_color_selector_codebook_size(),
|
|
m_selector_indices[cColor].size(),
|
|
&m_selector_indices[cColor][0],
|
|
*pParams->m_pTrial_color_selector_remap,
|
|
pParams->m_iter_index ? color_selector_similarity_func : NULL,
|
|
(void*)&m_hvq.get_color_selectors_vec(),
|
|
f);
|
|
}
|
|
|
|
crnlib_delete(pParams);
|
|
}
|
|
|
|
bool crn_comp::optimize_color_selector_codebook(crnlib::vector<uint>& remapping)
|
|
{
|
|
if (m_pParams->m_flags & cCRNCompFlagQuick)
|
|
{
|
|
remapping.resize(m_hvq.get_color_selectors_vec().size());
|
|
for (uint i = 0; i < m_hvq.get_color_selectors_vec().size(); i++)
|
|
remapping[i] = i;
|
|
|
|
if (!pack_selectors(
|
|
m_packed_color_selectors,
|
|
m_selector_indices[cColor],
|
|
m_hvq.get_color_selectors_vec(),
|
|
remapping,
|
|
3,
|
|
g_dxt1_to_linear, 0))
|
|
{
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
const uint cMaxSelectorRemapIters = 3;
|
|
|
|
uint best_bits = UINT_MAX;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("----- Begin optimization of color selector codebook");
|
|
#endif
|
|
|
|
crnlib::vector<uint> trial_color_selector_remaps[cMaxSelectorRemapIters + 1];
|
|
|
|
for (uint i = 0; i <= cMaxSelectorRemapIters; i++)
|
|
{
|
|
optimize_color_selector_codebook_params* pParams = crnlib_new<optimize_color_selector_codebook_params>();
|
|
pParams->m_iter_index = i;
|
|
pParams->m_max_iter_index = cMaxSelectorRemapIters;
|
|
pParams->m_pTrial_color_selector_remap = &trial_color_selector_remaps[i];
|
|
|
|
m_task_pool.queue_object_task(this, &crn_comp::optimize_color_selector_codebook_task, 0, pParams);
|
|
}
|
|
|
|
m_task_pool.join();
|
|
|
|
for (uint i = 0; i <= cMaxSelectorRemapIters; i++)
|
|
{
|
|
if (!update_progress(21, i, cMaxSelectorRemapIters+1))
|
|
return false;
|
|
|
|
crnlib::vector<uint>& trial_color_selector_remap = trial_color_selector_remaps[i];
|
|
|
|
crnlib::vector<uint8> packed_data;
|
|
if (!pack_selectors(
|
|
packed_data,
|
|
m_selector_indices[cColor],
|
|
m_hvq.get_color_selectors_vec(),
|
|
trial_color_selector_remap,
|
|
3,
|
|
g_dxt1_to_linear, i))
|
|
{
|
|
return false;
|
|
}
|
|
|
|
uint total_packed_chunk_bits;
|
|
if (!pack_chunks_simulation(0, m_total_chunks, total_packed_chunk_bits, NULL, &trial_color_selector_remap, NULL, NULL))
|
|
return false;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Pack chunks simulation: %u bits", total_packed_chunk_bits);
|
|
#endif
|
|
|
|
uint total_bits = packed_data.size() * 8 + total_packed_chunk_bits;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total bits: %u", total_bits);
|
|
#endif
|
|
if (total_bits < best_bits)
|
|
{
|
|
m_packed_color_selectors.swap(packed_data);
|
|
remapping.swap(trial_color_selector_remap);
|
|
best_bits = total_bits;
|
|
}
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("End optimization of color selector codebook");
|
|
#endif
|
|
|
|
return true;
|
|
}
|
|
|
|
struct optimize_alpha_endpoint_codebook_params
|
|
{
|
|
crnlib::vector<uint>* m_pAlpha_indices;
|
|
crnlib::vector<uint>* m_pTrial_alpha_endpoint_remap;
|
|
uint m_iter_index;
|
|
uint m_max_iter_index;
|
|
};
|
|
|
|
void crn_comp::optimize_alpha_endpoint_codebook_task(uint64 data, void* pData_ptr)
|
|
{
|
|
data;
|
|
optimize_alpha_endpoint_codebook_params* pParams = reinterpret_cast<optimize_alpha_endpoint_codebook_params*>(pData_ptr);
|
|
|
|
if (pParams->m_iter_index == pParams->m_max_iter_index)
|
|
{
|
|
sort_alpha_endpoint_codebook(*pParams->m_pTrial_alpha_endpoint_remap, m_hvq.get_alpha_endpoint_vec());
|
|
}
|
|
else
|
|
{
|
|
float f = pParams->m_iter_index / static_cast<float>(pParams->m_max_iter_index - 1);
|
|
|
|
create_zeng_reorder_table(
|
|
m_hvq.get_alpha_endpoint_codebook_size(),
|
|
pParams->m_pAlpha_indices->size(),
|
|
&(*pParams->m_pAlpha_indices)[0],
|
|
*pParams->m_pTrial_alpha_endpoint_remap,
|
|
pParams->m_iter_index ? alpha_endpoint_similarity_func : NULL,
|
|
&m_hvq,
|
|
f);
|
|
}
|
|
|
|
crnlib_delete(pParams);
|
|
}
|
|
|
|
bool crn_comp::optimize_alpha_endpoint_codebook(crnlib::vector<uint>& remapping)
|
|
{
|
|
crnlib::vector<uint> alpha_indices;
|
|
alpha_indices.reserve(m_endpoint_indices[cAlpha0].size() + m_endpoint_indices[cAlpha1].size());
|
|
for (uint i = 0; i < m_endpoint_indices[cAlpha0].size(); i++)
|
|
alpha_indices.push_back(m_endpoint_indices[cAlpha0][i]);
|
|
for (uint i = 0; i < m_endpoint_indices[cAlpha1].size(); i++)
|
|
alpha_indices.push_back(m_endpoint_indices[cAlpha1][i]);
|
|
|
|
if (m_pParams->m_flags & cCRNCompFlagQuick)
|
|
{
|
|
remapping.resize(m_hvq.get_alpha_endpoint_vec().size());
|
|
for (uint i = 0; i < m_hvq.get_alpha_endpoint_vec().size(); i++)
|
|
remapping[i] = i;
|
|
|
|
if (!pack_alpha_endpoints(m_packed_alpha_endpoints, remapping, alpha_indices, 0))
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
const uint cMaxEndpointRemapIters = 3;
|
|
uint best_bits = UINT_MAX;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("----- Begin optimization of alpha endpoint codebook");
|
|
#endif
|
|
|
|
crnlib::vector<uint> trial_alpha_endpoint_remaps[cMaxEndpointRemapIters + 1];
|
|
|
|
for (uint i = 0; i <= cMaxEndpointRemapIters; i++)
|
|
{
|
|
optimize_alpha_endpoint_codebook_params* pParams = crnlib_new<optimize_alpha_endpoint_codebook_params>();
|
|
pParams->m_pAlpha_indices = &alpha_indices;
|
|
pParams->m_iter_index = i;
|
|
pParams->m_max_iter_index = cMaxEndpointRemapIters;
|
|
pParams->m_pTrial_alpha_endpoint_remap = &trial_alpha_endpoint_remaps[i];
|
|
|
|
m_task_pool.queue_object_task(this, &crn_comp::optimize_alpha_endpoint_codebook_task, 0, pParams);
|
|
}
|
|
|
|
m_task_pool.join();
|
|
|
|
for (uint i = 0; i <= cMaxEndpointRemapIters; i++)
|
|
{
|
|
if (!update_progress(22, i, cMaxEndpointRemapIters+1))
|
|
return false;
|
|
|
|
crnlib::vector<uint>& trial_alpha_endpoint_remap = trial_alpha_endpoint_remaps[i];
|
|
|
|
crnlib::vector<uint8> packed_data;
|
|
if (!pack_alpha_endpoints(packed_data, trial_alpha_endpoint_remap, alpha_indices, i))
|
|
return false;
|
|
|
|
uint total_packed_chunk_bits;
|
|
if (!pack_chunks_simulation(0, m_total_chunks, total_packed_chunk_bits, NULL, NULL, &trial_alpha_endpoint_remap, NULL))
|
|
return false;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Pack chunks simulation: %u bits", total_packed_chunk_bits);
|
|
#endif
|
|
|
|
uint total_bits = packed_data.size() * 8 + total_packed_chunk_bits;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total bits: %u", total_bits);
|
|
#endif
|
|
|
|
if (total_bits < best_bits)
|
|
{
|
|
m_packed_alpha_endpoints.swap(packed_data);
|
|
remapping.swap(trial_alpha_endpoint_remap);
|
|
best_bits = total_bits;
|
|
}
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("End optimization of alpha endpoint codebook");
|
|
#endif
|
|
|
|
return true;
|
|
}
|
|
|
|
struct optimize_alpha_selector_codebook_params
|
|
{
|
|
crnlib::vector<uint>* m_pAlpha_indices;
|
|
crnlib::vector<uint>* m_pTrial_alpha_selector_remap;
|
|
uint m_iter_index;
|
|
uint m_max_iter_index;
|
|
};
|
|
|
|
void crn_comp::optimize_alpha_selector_codebook_task(uint64 data, void* pData_ptr)
|
|
{
|
|
data;
|
|
optimize_alpha_selector_codebook_params* pParams = reinterpret_cast<optimize_alpha_selector_codebook_params*>(pData_ptr);
|
|
|
|
if (pParams->m_iter_index == pParams->m_max_iter_index)
|
|
{
|
|
sort_selector_codebook(*pParams->m_pTrial_alpha_selector_remap, m_hvq.get_alpha_selectors_vec(), g_dxt5_to_linear);
|
|
}
|
|
else
|
|
{
|
|
float f = pParams->m_iter_index / static_cast<float>(pParams->m_max_iter_index - 1);
|
|
create_zeng_reorder_table(
|
|
m_hvq.get_alpha_selector_codebook_size(),
|
|
pParams->m_pAlpha_indices->size(),
|
|
&(*pParams->m_pAlpha_indices)[0],
|
|
*pParams->m_pTrial_alpha_selector_remap,
|
|
pParams->m_iter_index ? alpha_selector_similarity_func : NULL,
|
|
(void*)&m_hvq.get_alpha_selectors_vec(),
|
|
f);
|
|
}
|
|
}
|
|
|
|
bool crn_comp::optimize_alpha_selector_codebook(crnlib::vector<uint>& remapping)
|
|
{
|
|
crnlib::vector<uint> alpha_indices;
|
|
alpha_indices.reserve(m_selector_indices[cAlpha0].size() + m_selector_indices[cAlpha1].size());
|
|
for (uint i = 0; i < m_selector_indices[cAlpha0].size(); i++)
|
|
alpha_indices.push_back(m_selector_indices[cAlpha0][i]);
|
|
for (uint i = 0; i < m_selector_indices[cAlpha1].size(); i++)
|
|
alpha_indices.push_back(m_selector_indices[cAlpha1][i]);
|
|
|
|
if (m_pParams->m_flags & cCRNCompFlagQuick)
|
|
{
|
|
remapping.resize(m_hvq.get_alpha_selectors_vec().size());
|
|
for (uint i = 0; i < m_hvq.get_alpha_selectors_vec().size(); i++)
|
|
remapping[i] = i;
|
|
|
|
if (!pack_selectors(
|
|
m_packed_alpha_selectors,
|
|
alpha_indices,
|
|
m_hvq.get_alpha_selectors_vec(),
|
|
remapping,
|
|
7,
|
|
g_dxt5_to_linear, 0))
|
|
{
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
const uint cMaxSelectorRemapIters = 3;
|
|
|
|
uint best_bits = UINT_MAX;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("----- Begin optimization of alpha selector codebook");
|
|
#endif
|
|
|
|
crnlib::vector<uint> trial_alpha_selector_remaps[cMaxSelectorRemapIters + 1];
|
|
|
|
for (uint i = 0; i <= cMaxSelectorRemapIters; i++)
|
|
{
|
|
optimize_alpha_selector_codebook_params* pParams = crnlib_new<optimize_alpha_selector_codebook_params>();
|
|
pParams->m_pAlpha_indices = &alpha_indices;
|
|
pParams->m_iter_index = i;
|
|
pParams->m_max_iter_index = cMaxSelectorRemapIters;
|
|
pParams->m_pTrial_alpha_selector_remap = &trial_alpha_selector_remaps[i];
|
|
|
|
m_task_pool.queue_object_task(this, &crn_comp::optimize_alpha_selector_codebook_task, 0, pParams);
|
|
}
|
|
|
|
m_task_pool.join();
|
|
|
|
for (uint i = 0; i <= cMaxSelectorRemapIters; i++)
|
|
{
|
|
if (!update_progress(23, i, cMaxSelectorRemapIters+1))
|
|
return false;
|
|
|
|
crnlib::vector<uint>& trial_alpha_selector_remap = trial_alpha_selector_remaps[i];
|
|
|
|
crnlib::vector<uint8> packed_data;
|
|
if (!pack_selectors(
|
|
packed_data,
|
|
alpha_indices,
|
|
m_hvq.get_alpha_selectors_vec(),
|
|
trial_alpha_selector_remap,
|
|
7,
|
|
g_dxt5_to_linear, i))
|
|
{
|
|
return false;
|
|
}
|
|
|
|
uint total_packed_chunk_bits;
|
|
if (!pack_chunks_simulation(0, m_total_chunks, total_packed_chunk_bits, NULL, NULL, NULL, &trial_alpha_selector_remap))
|
|
return false;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Pack chunks simulation: %u bits", total_packed_chunk_bits);
|
|
#endif
|
|
|
|
uint total_bits = packed_data.size() * 8 + total_packed_chunk_bits;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("Total bits: %u", total_bits);
|
|
#endif
|
|
if (total_bits < best_bits)
|
|
{
|
|
m_packed_alpha_selectors.swap(packed_data);
|
|
|
|
remapping.swap(trial_alpha_selector_remap);
|
|
best_bits = total_bits;
|
|
}
|
|
}
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
console::debug("End optimization of alpha selector codebook");
|
|
#endif
|
|
|
|
return true;
|
|
}
|
|
|
|
bool crn_comp::pack_data_models()
|
|
{
|
|
symbol_codec codec;
|
|
codec.start_encoding(1024*1024);
|
|
|
|
if (!codec.encode_transmit_static_huffman_data_model(m_chunk_encoding_dm, false))
|
|
return false;
|
|
|
|
for (uint i = 0; i < 2; i++)
|
|
{
|
|
if (m_endpoint_index_dm[i].get_total_syms())
|
|
{
|
|
if (!codec.encode_transmit_static_huffman_data_model(m_endpoint_index_dm[i], false))
|
|
return false;
|
|
}
|
|
|
|
if (m_selector_index_dm[i].get_total_syms())
|
|
{
|
|
if (!codec.encode_transmit_static_huffman_data_model(m_selector_index_dm[i], false))
|
|
return false;
|
|
}
|
|
}
|
|
|
|
codec.stop_encoding(false);
|
|
|
|
m_packed_data_models.swap(codec.get_encoding_buf());
|
|
|
|
return true;
|
|
}
|
|
|
|
bool crn_comp::create_comp_data()
|
|
{
|
|
utils::zero_object(m_crn_header);
|
|
|
|
m_crn_header.m_width = static_cast<uint16>(m_pParams->m_width);
|
|
m_crn_header.m_height = static_cast<uint16>(m_pParams->m_height);
|
|
m_crn_header.m_levels = static_cast<uint8>(m_pParams->m_levels);
|
|
m_crn_header.m_faces = static_cast<uint8>(m_pParams->m_faces);
|
|
m_crn_header.m_format = static_cast<uint8>(m_pParams->m_format);
|
|
m_crn_header.m_userdata0 = m_pParams->m_userdata0;
|
|
m_crn_header.m_userdata1 = m_pParams->m_userdata1;
|
|
|
|
m_comp_data.clear();
|
|
m_comp_data.reserve(2*1024*1024);
|
|
append_vec(m_comp_data, &m_crn_header, sizeof(m_crn_header));
|
|
// tack on the rest of the variable size m_level_ofs array
|
|
m_comp_data.resize( m_comp_data.size() + sizeof(m_crn_header.m_level_ofs[0]) * (m_pParams->m_levels - 1) );
|
|
|
|
if (m_packed_color_endpoints.size())
|
|
{
|
|
m_crn_header.m_color_endpoints.m_num = static_cast<uint16>(m_hvq.get_color_endpoint_codebook_size());
|
|
m_crn_header.m_color_endpoints.m_size = m_packed_color_endpoints.size();
|
|
m_crn_header.m_color_endpoints.m_ofs = m_comp_data.size();
|
|
append_vec(m_comp_data, m_packed_color_endpoints);
|
|
}
|
|
|
|
if (m_packed_color_selectors.size())
|
|
{
|
|
m_crn_header.m_color_selectors.m_num = static_cast<uint16>(m_hvq.get_color_selector_codebook_size());
|
|
m_crn_header.m_color_selectors.m_size = m_packed_color_selectors.size();
|
|
m_crn_header.m_color_selectors.m_ofs = m_comp_data.size();
|
|
append_vec(m_comp_data, m_packed_color_selectors);
|
|
}
|
|
|
|
if (m_packed_alpha_endpoints.size())
|
|
{
|
|
m_crn_header.m_alpha_endpoints.m_num = static_cast<uint16>(m_hvq.get_alpha_endpoint_codebook_size());
|
|
m_crn_header.m_alpha_endpoints.m_size = m_packed_alpha_endpoints.size();
|
|
m_crn_header.m_alpha_endpoints.m_ofs = m_comp_data.size();
|
|
append_vec(m_comp_data, m_packed_alpha_endpoints);
|
|
}
|
|
|
|
if (m_packed_alpha_selectors.size())
|
|
{
|
|
m_crn_header.m_alpha_selectors.m_num = static_cast<uint16>(m_hvq.get_alpha_selector_codebook_size());
|
|
m_crn_header.m_alpha_selectors.m_size = m_packed_alpha_selectors.size();
|
|
m_crn_header.m_alpha_selectors.m_ofs = m_comp_data.size();
|
|
append_vec(m_comp_data, m_packed_alpha_selectors);
|
|
}
|
|
|
|
m_crn_header.m_tables_ofs = m_comp_data.size();
|
|
m_crn_header.m_tables_size = m_packed_data_models.size();
|
|
append_vec(m_comp_data, m_packed_data_models);
|
|
|
|
uint level_ofs[cCRNMaxLevels];
|
|
for (uint i = 0; i < m_mip_groups.size(); i++)
|
|
{
|
|
level_ofs[i] = m_comp_data.size();
|
|
append_vec(m_comp_data, m_packed_chunks[i]);
|
|
}
|
|
|
|
crnd::crn_header& dst_header = *(crnd::crn_header*)&m_comp_data[0];
|
|
// don't change the m_comp_data vector - or dst_header will be invalidated!
|
|
|
|
memcpy(&dst_header, &m_crn_header, sizeof(dst_header));
|
|
|
|
for (uint i = 0; i < m_mip_groups.size(); i++)
|
|
dst_header.m_level_ofs[i] = level_ofs[i];
|
|
|
|
const uint actual_header_size = sizeof(crnd::crn_header) + sizeof(dst_header.m_level_ofs[0]) * (m_mip_groups.size() - 1);
|
|
|
|
dst_header.m_sig = crnd::crn_header::cCRNSigValue;
|
|
|
|
dst_header.m_data_size = m_comp_data.size();
|
|
dst_header.m_data_crc16 = crc16(&m_comp_data[actual_header_size], m_comp_data.size() - actual_header_size);
|
|
|
|
dst_header.m_header_size = actual_header_size;
|
|
dst_header.m_header_crc16 = crc16(&dst_header.m_data_size, actual_header_size - (uint)((uint8*)&dst_header.m_data_size - (uint8*)&dst_header));
|
|
|
|
return true;
|
|
}
|
|
|
|
bool crn_comp::update_progress(uint phase_index, uint subphase_index, uint subphase_total)
|
|
{
|
|
if (!m_pParams->m_pProgress_func)
|
|
return true;
|
|
|
|
#if CRNLIB_ENABLE_DEBUG_MESSAGES
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
return true;
|
|
#endif
|
|
|
|
return (*m_pParams->m_pProgress_func)(phase_index, cTotalCompressionPhases, subphase_index, subphase_total, m_pParams->m_pProgress_func_data) != 0;
|
|
}
|
|
|
|
bool crn_comp::compress_internal()
|
|
{
|
|
if (!alias_images())
|
|
return false;
|
|
|
|
create_chunks();
|
|
|
|
if (!quantize_chunks())
|
|
return false;
|
|
|
|
create_chunk_indices();
|
|
|
|
crnlib::vector<uint> endpoint_remap[2];
|
|
crnlib::vector<uint> selector_remap[2];
|
|
|
|
if (m_has_comp[cColor])
|
|
{
|
|
if (!optimize_color_endpoint_codebook(endpoint_remap[0]))
|
|
return false;
|
|
if (!optimize_color_selector_codebook(selector_remap[0]))
|
|
return false;
|
|
}
|
|
|
|
if (m_has_comp[cAlpha0])
|
|
{
|
|
if (!optimize_alpha_endpoint_codebook(endpoint_remap[1]))
|
|
return false;
|
|
if (!optimize_alpha_selector_codebook(selector_remap[1]))
|
|
return false;
|
|
}
|
|
|
|
m_chunk_encoding_hist.clear();
|
|
for (uint i = 0; i < 2; i++)
|
|
{
|
|
m_endpoint_index_hist[i].clear();
|
|
m_endpoint_index_dm[i].clear();
|
|
m_selector_index_hist[i].clear();
|
|
m_selector_index_dm[i].clear();
|
|
}
|
|
|
|
for (uint pass = 0; pass < 2; pass++)
|
|
{
|
|
for (uint mip_group = 0; mip_group < m_mip_groups.size(); mip_group++)
|
|
{
|
|
symbol_codec codec;
|
|
codec.start_encoding(2*1024*1024);
|
|
|
|
if (!pack_chunks(
|
|
m_mip_groups[mip_group].m_first_chunk, m_mip_groups[mip_group].m_num_chunks,
|
|
!pass && !mip_group, pass ? &codec : NULL,
|
|
m_has_comp[cColor] ? &endpoint_remap[0] : NULL, m_has_comp[cColor] ? &selector_remap[0] : NULL,
|
|
m_has_comp[cAlpha0] ? &endpoint_remap[1] : NULL, m_has_comp[cAlpha0] ? &selector_remap[1] : NULL))
|
|
{
|
|
return false;
|
|
}
|
|
|
|
codec.stop_encoding(false);
|
|
|
|
if (pass)
|
|
m_packed_chunks[mip_group].swap(codec.get_encoding_buf());
|
|
}
|
|
|
|
if (!pass)
|
|
{
|
|
m_chunk_encoding_dm.init(true, m_chunk_encoding_hist, 16);
|
|
|
|
for (uint i = 0; i < 2; i++)
|
|
{
|
|
if (m_endpoint_index_hist[i].size())
|
|
m_endpoint_index_dm[i].init(true, m_endpoint_index_hist[i], 16);
|
|
|
|
if (m_selector_index_hist[i].size())
|
|
m_selector_index_dm[i].init(true, m_selector_index_hist[i], 16);
|
|
}
|
|
}
|
|
}
|
|
|
|
if (!pack_data_models())
|
|
return false;
|
|
|
|
if (!create_comp_data())
|
|
return false;
|
|
|
|
if (!update_progress(24, 1, 1))
|
|
return false;
|
|
|
|
if (m_pParams->m_flags & cCRNCompFlagDebugging)
|
|
{
|
|
crnlib_print_mem_stats();
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
bool crn_comp::compress_init(const crn_comp_params& params)
|
|
{
|
|
params;
|
|
return true;
|
|
}
|
|
|
|
bool crn_comp::compress_pass(const crn_comp_params& params, float *pEffective_bitrate)
|
|
{
|
|
clear();
|
|
|
|
if (pEffective_bitrate) *pEffective_bitrate = 0.0f;
|
|
|
|
m_pParams = ¶ms;
|
|
|
|
if ((math::minimum(m_pParams->m_width, m_pParams->m_height) < 1) || (math::maximum(m_pParams->m_width, m_pParams->m_height) > cCRNMaxLevelResolution))
|
|
return false;
|
|
|
|
if (!m_task_pool.init(params.m_num_helper_threads))
|
|
return false;
|
|
|
|
bool status = compress_internal();
|
|
|
|
m_task_pool.deinit();
|
|
|
|
if ((status) && (pEffective_bitrate))
|
|
{
|
|
uint total_pixels = 0;
|
|
|
|
for (uint f = 0; f < m_pParams->m_faces; f++)
|
|
for (uint l = 0; l < m_pParams->m_levels; l++)
|
|
total_pixels += m_images[f][l].get_total_pixels();
|
|
|
|
*pEffective_bitrate = (m_comp_data.size() * 8.0f) / total_pixels;
|
|
}
|
|
|
|
return status;
|
|
}
|
|
|
|
void crn_comp::compress_deinit()
|
|
{
|
|
}
|
|
|
|
} // namespace crnlib
|
|
|