mirror of
https://github.com/yuzu-emu/FasTC.git
synced 2024-11-30 21:24:17 +01:00
663caada50
1. Split compression parameter generation and compression parameter packing. This gives a good performance boost, since we don't pack every single time we compress. The error is computed each time, and only the best parameters are packed. 2. Allow the shape selection function to specify up to ten shapes to try for compression. We were already doing this kind of hackily where we allowed both a three and two partition shape. This makes it a little cleaner and exposes it to the user.
237 lines
10 KiB
C++
Executable File
237 lines
10 KiB
C++
Executable File
/* FasTC
|
|
* Copyright (c) 2014 University of North Carolina at Chapel Hill.
|
|
* All rights reserved.
|
|
*
|
|
* Permission to use, copy, modify, and distribute this software and its
|
|
* documentation for educational, research, and non-profit purposes, without
|
|
* fee, and without a written agreement is hereby granted, provided that the
|
|
* above copyright notice, this paragraph, and the following four paragraphs
|
|
* appear in all copies.
|
|
*
|
|
* Permission to incorporate this software into commercial products may be
|
|
* obtained by contacting the authors or the Office of Technology Development
|
|
* at the University of North Carolina at Chapel Hill <otd@unc.edu>.
|
|
*
|
|
* This software program and documentation are copyrighted by the University of
|
|
* North Carolina at Chapel Hill. The software program and documentation are
|
|
* supplied "as is," without any accompanying services from the University of
|
|
* North Carolina at Chapel Hill or the authors. The University of North
|
|
* Carolina at Chapel Hill and the authors do not warrant that the operation of
|
|
* the program will be uninterrupted or error-free. The end-user understands
|
|
* that the program was developed for research purposes and is advised not to
|
|
* rely exclusively on the program for any reason.
|
|
*
|
|
* IN NO EVENT SHALL THE UNIVERSITY OF NORTH CAROLINA AT CHAPEL HILL OR THE
|
|
* AUTHORS BE LIABLE TO ANY PARTY FOR DIRECT, INDIRECT, SPECIAL, INCIDENTAL,
|
|
* OR CONSEQUENTIAL DAMAGES, INCLUDING LOST PROFITS, ARISING OUT OF THE USE OF
|
|
* THIS SOFTWARE AND ITS DOCUMENTATION, EVEN IF THE UNIVERSITY OF NORTH CAROLINA
|
|
* AT CHAPEL HILL OR THE AUTHORS HAVE BEEN ADVISED OF THE POSSIBILITY OF SUCH
|
|
* DAMAGE.
|
|
*
|
|
* THE UNIVERSITY OF NORTH CAROLINA AT CHAPEL HILL AND THE AUTHORS SPECIFICALLY
|
|
* DISCLAIM ANY WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
|
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE AND ANY
|
|
* STATUTORY WARRANTY OF NON-INFRINGEMENT. THE SOFTWARE PROVIDED HEREUNDER IS ON
|
|
* AN "AS IS" BASIS, AND THE UNIVERSITY OF NORTH CAROLINA AT CHAPEL HILL AND
|
|
* THE AUTHORS HAVE NO OBLIGATIONS TO PROVIDE MAINTENANCE, SUPPORT, UPDATES,
|
|
* ENHANCEMENTS, OR MODIFICATIONS.
|
|
*
|
|
* Please send all BUG REPORTS to <pavel@cs.unc.edu>.
|
|
*
|
|
* The authors may be contacted via:
|
|
*
|
|
* Pavel Krajcevski
|
|
* Dept of Computer Science
|
|
* 201 S Columbia St
|
|
* Frederick P. Brooks, Jr. Computer Science Bldg
|
|
* Chapel Hill, NC 27599-3175
|
|
* USA
|
|
*
|
|
* <http://gamma.cs.unc.edu/FasTC/>
|
|
*/
|
|
|
|
// The original license from the code available at the following location:
|
|
// http://software.intel.com/en-us/vcsource/samples/fast-texture-compression
|
|
//
|
|
// This code has been modified significantly from the original.
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Copyright 2011 Intel Corporation
|
|
// All Rights Reserved
|
|
//
|
|
// Permission is granted to use, copy, distribute and prepare derivative works
|
|
// of this software for any purpose and without fee, provided, that the above
|
|
// copyright notice and this statement appear in all copies. Intel makes no
|
|
// representations about the suitability of this software for any purpose. THIS
|
|
// SOFTWARE IS PROVIDED "AS IS." INTEL SPECIFICALLY DISCLAIMS ALL WARRANTIES,
|
|
// EXPRESS OR IMPLIED, AND ALL LIABILITY, INCLUDING CONSEQUENTIAL AND OTHER
|
|
// INDIRECT DAMAGES, FOR THE USE OF THIS SOFTWARE, INCLUDING LIABILITY FOR
|
|
// INFRINGEMENT OF ANY PROPRIETARY RIGHTS, AND INCLUDING THE WARRANTIES OF
|
|
// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. Intel does not assume
|
|
// any responsibility for any errors which may appear in this software nor any
|
|
// responsibility to update it.
|
|
//
|
|
//------------------------------------------------------------------------------
|
|
|
|
#ifndef BPTCENCODER_INCLUDE_BPTCCOMPRESSOR_H_
|
|
#define BPTCENCODER_INCLUDE_BPTCCOMPRESSOR_H_
|
|
|
|
#include "BPTCConfig.h"
|
|
#include "CompressionJob.h"
|
|
|
|
#include <iosfwd>
|
|
|
|
namespace BPTCC {
|
|
// The various available block modes that a BPTC compressor can choose from.
|
|
// The enum is specialized to be power-of-two values so that an EBlockMode
|
|
// variable can be used as a bit mask.
|
|
enum EBlockMode {
|
|
eBlockMode_Zero = 1,
|
|
eBlockMode_One = 2,
|
|
eBlockMode_Two = 4,
|
|
eBlockMode_Three = 8,
|
|
eBlockMode_Four = 16,
|
|
eBlockMode_Five = 32,
|
|
eBlockMode_Six = 64,
|
|
eBlockMode_Seven = 128
|
|
};
|
|
|
|
// This is the error metric that is applied to our error measurement algorithm
|
|
// in order to bias calculation towards results that are more in-line with
|
|
// how the Human Visual System works. Uniform error means that each color
|
|
// channel is treated equally. For a while, the widely accepted non-uniform
|
|
// metric has been to give red 30%, green 59% and blue 11% weight when
|
|
// computing the error between two pixels.
|
|
enum ErrorMetric {
|
|
eErrorMetric_Uniform, // Treats r, g, and b channels equally
|
|
eErrorMetric_Nonuniform, // { 0.3, 0.59, 0.11 }
|
|
|
|
kNumErrorMetrics
|
|
};
|
|
|
|
// A shape consists of an index into the table of shapes and the number
|
|
// of partitions that the index corresponds to. Different BPTC modes
|
|
// interpret the shape differently and some are even illegal (such as
|
|
// having an index >= 16 on mode 0). Hence, each shape corresponds to
|
|
// these two variables.
|
|
struct Shape {
|
|
uint32 m_NumPartitions;
|
|
uint32 m_Index;
|
|
};
|
|
|
|
// A shape selection can influence the results of the compressor by choosing
|
|
// different modes to compress or not compress. The shape index is a value
|
|
// between zero and sixty-four that corresponds to one of the available
|
|
// partitioning schemes defined by the BPTC format.
|
|
struct ShapeSelection {
|
|
// This is the number of indices from which to select the appropriate
|
|
// shapes. I.e. the compressor will try the first m_NumIndices shapes
|
|
uint32 m_NumIndices;
|
|
|
|
// These are the shape indices to use when evaluating two-partition shapes.
|
|
Shape m_Shapes[10];
|
|
|
|
// This is the additional mask to prevent modes once shape selection
|
|
// is done. This value is &-ed with m_BlockModes from CompressionSettings
|
|
// to determine what the final considered blocks are.
|
|
uint32 m_SelectedModes;
|
|
|
|
// Defaults
|
|
ShapeSelection()
|
|
: m_NumIndices(0)
|
|
, m_SelectedModes(static_cast<EBlockMode>(0xFF))
|
|
{ }
|
|
};
|
|
|
|
// A shape selection function is one that selects a BPTC shape from a given
|
|
// block position and pixel array.
|
|
typedef ShapeSelection (*ShapeSelectionFn)
|
|
(uint32 x, uint32 y, const uint32 pixels[16], const void *userData);
|
|
|
|
// Compression parameters used to control the BPTC compressor. Each of the
|
|
// values has a default, so this is not strictly required to perform
|
|
// compression, but some aspects of the compressor can be user-defined or
|
|
// overridden.
|
|
struct CompressionSettings {
|
|
// The shape selection function to use during compression. The default (when
|
|
// this variable is set to NULL) is to use the diagonal of the axis-aligned
|
|
// bounding box of every partition to estimate the error using that
|
|
// partition would accrue. The shape with the least error is then chosen.
|
|
// This procedure is done for both two and three partition shapes, and then
|
|
// every block mode is still available.
|
|
ShapeSelectionFn m_ShapeSelectionFn;
|
|
|
|
// The user data passed to the shape selection function.
|
|
const void *m_ShapeSelectionUserData;
|
|
|
|
// The block modes that the compressor will consider during compression.
|
|
// This variable is a bit mask of EBlockMode values and by default contains
|
|
// every mode. This setting can be used to further restrict the search space
|
|
// and increase compression times.
|
|
uint32 m_BlockModes;
|
|
|
|
// See the description for ErrorMetric.
|
|
ErrorMetric m_ErrorMetric;
|
|
|
|
// The number of simulated annealing steps to perform per refinement
|
|
// iteration. In general, a larger number produces better results. The
|
|
// default is set to 50. This metric works on a logarithmic scale -- twice
|
|
// the value will double the compute time, but only decrease the error by
|
|
// two times a factor.
|
|
uint32 m_NumSimulatedAnnealingSteps;
|
|
|
|
CompressionSettings()
|
|
: m_ShapeSelectionFn(NULL)
|
|
, m_ShapeSelectionUserData(NULL)
|
|
, m_BlockModes(static_cast<EBlockMode>(0xFF))
|
|
, m_ErrorMetric(eErrorMetric_Uniform)
|
|
, m_NumSimulatedAnnealingSteps(50)
|
|
{ }
|
|
};
|
|
|
|
// Retreives a float4 pointer for the r, g, b, a weights for each color
|
|
// channel, in that order.
|
|
const float *GetErrorMetric(ErrorMetric e);
|
|
|
|
// Compress the image given as RGBA data to BPTC format. Width and Height are
|
|
// the dimensions of the image in pixels.
|
|
void Compress(const FasTC::CompressionJob &,
|
|
CompressionSettings settings = CompressionSettings());
|
|
|
|
// Perform a compression while recording all of the choices the compressor
|
|
// made into a list of statistics. We can use this to see whether or not
|
|
// certain heuristics are working, such as whether or not certain modes are
|
|
// being chosen more often than others, etc.
|
|
void CompressWithStats(const FasTC::CompressionJob &, std::ostream *logStream,
|
|
CompressionSettings settings = CompressionSettings());
|
|
|
|
#ifdef HAS_SSE_41
|
|
// Compress the image given as RGBA data to BPTC format using an algorithm
|
|
// optimized for SIMD enabled platforms. Width and Height are the dimensions
|
|
// of the image in pixels.
|
|
void CompressImageBPTCSIMD(const unsigned char* inBuf, unsigned char* outBuf,
|
|
unsigned int width, unsigned int height);
|
|
#endif
|
|
|
|
#ifdef HAS_ATOMICS
|
|
// This is a threadsafe version of the compression function that is designed
|
|
// to compress a list of textures. If this function is called with the same
|
|
// argument from multiple threads, they will work together to compress all of
|
|
// the images in the list.
|
|
void CompressAtomic(FasTC::CompressionJobList &);
|
|
#endif
|
|
|
|
#ifdef FOUND_NVTT_BPTC_EXPORT
|
|
// These functions take the same arguments as Compress and CompressWithStats,
|
|
// but they use the NVTT compressor if it was supplied to CMake.
|
|
void CompressNVTT(const FasTC::CompressionJob &);
|
|
void CompressNVTTWithStats(const FasTC::CompressionJob &,
|
|
std::ostream *logStream);
|
|
#endif
|
|
|
|
// Decompress the image given as BPTC data to R8G8B8A8 format.
|
|
void Decompress(const FasTC::DecompressionJob &);
|
|
} // namespace BPTCC
|
|
|
|
#endif // BPTCENCODER_INCLUDE_BPTCCOMPRESSOR_H_
|