11#include <cuda_runtime.h>
49 "QuantizerConfig must fit in FZM_STAGE_CONFIG_SIZE");
96template<
typename TInput =
float,
typename TCode = u
int16_t>
119 int radius = 32768,
float outlier_cap = 0.05f)
129 const std::vector<void*>& inputs,
130 const std::vector<void*>& outputs,
131 const std::vector<size_t>& sizes
136 std::string
getName()
const override {
return "Quantizer"; }
138 size_t getNumInputs()
const override {
139 if (!is_inverse_)
return 1;
140 return isInplaceMode() ? 1 : 4;
142 size_t getNumOutputs()
const override {
143 if (is_inverse_)
return 1;
144 return isInplaceMode() ? 1 : 4;
148 if (is_inverse_)
return {
"reconstructed"};
149 if (isInplaceMode())
return {
"codes"};
150 return {
"codes",
"outlier_vals",
"outlier_idxs",
"outlier_count"};
154 const std::vector<size_t>& input_sizes
159 std::unordered_map<std::string, size_t> result;
160 for (
size_t i = 0; i < names.size() && i < actual_output_sizes_.size(); i++)
161 result[names[i]] = actual_output_sizes_[i];
165 return (index >= 0 && index <
static_cast<int>(actual_output_sizes_.size()))
166 ? actual_output_sizes_[index] : 0;
169 void setInverse(
bool inverse)
override { is_inverse_ = inverse; }
170 bool isInverse()
const override {
return is_inverse_; }
173 return static_cast<uint16_t
>(StageType::QUANTIZER);
178 if (isInplaceMode())
return static_cast<uint8_t
>(getCodeDataType());
179 switch (output_index) {
180 case 0:
return static_cast<uint8_t
>(getCodeDataType());
182 case 2:
return static_cast<uint8_t
>(DataType::UINT32);
183 case 3:
return static_cast<uint8_t
>(DataType::UINT32);
184 default:
return static_cast<uint8_t
>(DataType::UINT8);
192 size_t serializeHeader(
size_t output_index, uint8_t* buf,
size_t max_size)
const override;
197 saved_config_ = config_;
198 saved_num_elements_ = num_elements_;
199 saved_actual_outlier_count_ = actual_outlier_count_;
200 saved_computed_abs_eb_ = computed_abs_eb_;
201 saved_computed_value_base_ = computed_value_base_;
202 saved_actual_output_sizes_ = actual_output_sizes_;
205 void restoreState()
override {
206 config_ = saved_config_;
207 num_elements_ = saved_num_elements_;
208 actual_outlier_count_ = saved_actual_outlier_count_;
209 computed_abs_eb_ = saved_computed_abs_eb_;
210 computed_value_base_ = saved_computed_value_base_;
211 actual_output_sizes_ = saved_actual_output_sizes_;
214 void setErrorBound(TInput eb) { config_.
error_bound =
static_cast<float>(eb); }
215 void setQuantRadius(
int r) { config_.
quant_radius = r; }
219 void setZigzagCodes(
bool enable) { config_.
zigzag_codes = enable; }
225 TInput getErrorBound()
const {
return static_cast<TInput
>(config_.
error_bound); }
226 int getQuantRadius()
const {
return config_.
quant_radius; }
227 ErrorBoundMode getErrorBoundMode()
const {
return config_.eb_mode; }
230 bool getZigzagCodes()
const {
return config_.
zigzag_codes; }
236 Config saved_config_;
237 std::vector<size_t> actual_output_sizes_;
238 std::vector<size_t> saved_actual_output_sizes_;
239 size_t num_elements_ = 0;
240 size_t saved_num_elements_ = 0;
241 uint32_t actual_outlier_count_= 0;
242 uint32_t saved_actual_outlier_count_ = 0;
243 bool is_inverse_ =
false;
244 TInput computed_abs_eb_ =
static_cast<TInput
>(1e-4);
245 TInput saved_computed_abs_eb_ =
static_cast<TInput
>(1e-4);
246 float computed_value_base_ = 0.0f;
247 float saved_computed_value_base_ = 0.0f;
248 const void* d_outlier_count_ptr_ =
nullptr;
250 bool isInplaceMode()
const {
251 return config_.inplace_outliers
256 if (std::is_same<TInput, float>::value)
return DataType::FLOAT32;
257 if (std::is_same<TInput, double>::value)
return DataType::FLOAT64;
258 return DataType::FLOAT32;
261 if (std::is_same<TCode, uint8_t>::value)
return DataType::UINT8;
262 if (std::is_same<TCode, uint16_t>::value)
return DataType::UINT16;
263 if (std::is_same<TCode, uint32_t>::value)
return DataType::UINT32;
264 return DataType::UINT16;
266 size_t getMaxOutlierCount(
size_t n)
const {
267 return static_cast<size_t>(std::ceil(n * config_.outlier_capacity));
271extern template class QuantizerStage<float, uint16_t>;
272extern template class QuantizerStage<float, uint32_t>;
273extern template class QuantizerStage<double, uint16_t>;
274extern template class QuantizerStage<double, uint32_t>;
Definition quantizer.h:97
void saveState() override
Definition quantizer.h:196
uint8_t getInputDataType(size_t) const override
Definition quantizer.h:188
uint8_t getOutputDataType(size_t output_index) const override
Definition quantizer.h:176
void setInplaceOutliers(bool enable)
ABS/NOA: encode outliers in-place (raw float bits in codes array; no scatter buffers).
Definition quantizer.h:223
std::vector< std::string > getOutputNames() const override
Definition quantizer.h:147
void setInverse(bool inverse) override
Definition quantizer.h:169
void postStreamSync(cudaStream_t stream) override
void deserializeHeader(const uint8_t *buf, size_t size) override
void setOutlierThreshold(float t)
ABS/NOA: |x| >= threshold → lossless outlier regardless of bin (LC reference parameter).
Definition quantizer.h:221
void execute(cudaStream_t stream, MemoryPool *pool, const std::vector< void * > &inputs, const std::vector< void * > &outputs, const std::vector< size_t > &sizes) override
std::string getName() const override
Definition quantizer.h:136
size_t serializeHeader(size_t output_index, uint8_t *buf, size_t max_size) const override
uint16_t getStageTypeId() const override
Definition quantizer.h:172
std::unordered_map< std::string, size_t > getActualOutputSizesByName() const override
Definition quantizer.h:157
std::vector< size_t > estimateOutputSizes(const std::vector< size_t > &input_sizes) const override
size_t getMaxHeaderSize(size_t) const override
Definition quantizer.h:193
size_t getActualOutputSize(int index) const override
Definition quantizer.h:164
Fused Lorenzo predictor and quantizer stage.
Definition fzm_format.h:25
ErrorBoundMode
Definition lorenzo_quant.h:30
@ ABS
Absolute error bound.
@ REL
Global-approximate point-wise relative bound.
constexpr size_t FZM_STAGE_CONFIG_SIZE
Per-stage serialized config slot (bytes)
Definition fzm_format.h:65
DataType
Element data type identifiers used in buffer and stage descriptors.
Definition fzm_format.h:104
Base class interface for all compression stages.
Definition quantizer.h:25
uint8_t inplace_outliers
1 if outliers are encoded in-place in the codes array.
Definition quantizer.h:37
uint8_t eb_mode
ErrorBoundMode cast to uint8_t.
Definition quantizer.h:34
uint32_t outlier_count
Actual number of outliers.
Definition quantizer.h:31
DataType code_type
Quantization code type (1B).
Definition quantizer.h:33
uint8_t zigzag_codes
1 if ABS/NOA codes are zigzag-encoded.
Definition quantizer.h:35
uint32_t num_elements
Total element count.
Definition quantizer.h:30
uint32_t quant_radius
Quantization radius.
Definition quantizer.h:29
float user_error_bound
Original user-specified EB.
Definition quantizer.h:27
DataType input_type
Original input type (1B).
Definition quantizer.h:32
float abs_error_bound
Absolute EB after mode conversion (0 for REL).
Definition quantizer.h:26
uint8_t _pad[3]
Alignment padding — must be zero.
Definition quantizer.h:38
float outlier_threshold
ABS/NOA: |x| >= threshold → forced outlier (inf = disabled).
Definition quantizer.h:36
float value_base
value_range (NOA); 0 for ABS/REL.
Definition quantizer.h:28
Definition quantizer.h:100
float outlier_threshold
ABS/NOA: |x| >= threshold → lossless outlier (LC reference threshold). Default: ∞.
Definition quantizer.h:111
float outlier_capacity
Fraction of input size reserved for outliers.
Definition quantizer.h:103
bool zigzag_codes
Definition quantizer.h:109
float precomputed_value_base
Pre-computed value_base > 0 to skip the NOA data scan; 0 = auto.
Definition quantizer.h:106
bool inplace_outliers
Definition quantizer.h:115
int quant_radius
Quantization radius.
Definition quantizer.h:102
float error_bound
Error bound (interpretation set by eb_mode).
Definition quantizer.h:101