FZGPUModules 2.0
GPU-accelerated modular compression pipelines
Loading...
Searching...
No Matches
fzm_format.h
Go to the documentation of this file.
1#pragma once
2
20#include <cstdint>
21#include <cstring>
22#include <stdexcept>
23#include <string>
24
25namespace fz {
26
/// Magic number identifying an FZM file; FZMHeaderCore::magic must equal it.
/// Read from most- to least-significant byte the value spells ASCII "FMZ2".
constexpr uint32_t FZM_MAGIC = 0x464D5A32;

/// Major component of the format version written by this header.
constexpr uint8_t FZM_VERSION_MAJOR = 3;
/// Minor component of the format version written by this header.
constexpr uint8_t FZM_VERSION_MINOR = 1;
/// Packed format version: major in the high byte, minor in the low byte
/// (3.1 -> 0x0301). This is the value stored in the header's `version` field.
constexpr uint16_t FZM_VERSION =
    (static_cast<uint16_t>(FZM_VERSION_MAJOR) << 8) | static_cast<uint16_t>(FZM_VERSION_MINOR);

/// Size in bytes of the legacy header core.
/// NOTE(review): presumably the 80-byte core minus the two 4-byte checksum
/// fields introduced in v3.1 -- confirm against the reader code.
constexpr size_t FZM_LEGACY_HEADER_CORE_SIZE = 72;

/// Flag bit: the header's data_checksum field is valid.
constexpr uint16_t FZM_FLAG_HAS_DATA_CHECKSUM = 0x0001u;
/// Flag bit: the header's header_checksum field is valid.
constexpr uint16_t FZM_FLAG_HAS_HEADER_CHECKSUM = 0x0002u;
50
/// Extract the major version from a stored 16-bit version field.
///
/// Values that fit in one byte (<= 0xFF) are returned unchanged as the major
/// version; otherwise the major version is the high byte.
/// NOTE(review): the one-byte case presumably covers files written before the
/// packed major/minor encoding existed -- confirm.
///
/// @param v Raw version value.
/// @return  Major version number.
constexpr uint8_t fzmVersionMajor(uint16_t v) {
    return static_cast<uint8_t>((v <= 0xFF) ? v : (v >> 8));
}
/// Extract the minor version from a stored 16-bit version field.
///
/// Values that fit in one byte (<= 0xFF) carry no minor component and yield 0;
/// otherwise the minor version is the low byte.
///
/// @param v Raw version value.
/// @return  Minor version number.
constexpr uint8_t fzmVersionMinor(uint16_t v) {
    // Single explicit cast so both ternary arms share one type and the
    // narrowing to uint8_t is visible rather than implicit.
    return static_cast<uint8_t>((v <= 0xFF) ? 0 : (v & 0xFF));
}
62
/// Maximum pipeline output buffers per file.
constexpr size_t FZM_MAX_BUFFERS = 32;
/// Maximum output port name length (bytes, null-terminated).
constexpr size_t FZM_MAX_NAME_LEN = 64;
/// Per-stage serialized config slot (bytes).
constexpr size_t FZM_STAGE_CONFIG_SIZE = 128;
/// Maximum source stages per pipeline.
constexpr size_t FZM_MAX_SOURCES = 4;
67
68// ─────────────────────────────────────────────────────────────────────────────
69
/// Stage type identifiers written into the FZM header.
///
/// The numeric values are part of the on-disk format, so existing values must
/// never be renumbered.
/// NOTE(review): 8, 9, 13 and 21 are unassigned here -- presumably reserved or
/// retired IDs; confirm before reusing any of them.
enum class StageType : uint16_t {
    UNKNOWN          = 0,
    LORENZO_QUANT    = 1,
    DIFFERENCE       = 2,
    SCALE            = 3,
    PASSTHROUGH      = 4,
    RLE              = 5,
    HUFFMAN          = 6,
    BITPACK          = 7,
    SPLIT            = 10,
    MERGE            = 11,
    LORENZO          = 12,
    QUANTIZER        = 14,
    ZIGZAG           = 15,
    NEGABINARY       = 16,
    BITSHUFFLE       = 17,
    RZE              = 18,
    ADM              = 19,  ///< Adaptive Data Mapping transform (MANS)
    ANS              = 20,  ///< rANS entropy coder (GPU, via dietGPU)
    G_INTERP         = 22,  ///< Spline interpolation predictor + quantizer (cuSZ-Hi G-Interp)
    BITPLANE_RZE     = 23,  ///< Fused bitplane transpose + zero-group RZE (FZ-GPU lossless encoder)
    ADAPTIVE_BITPACK = 24,  ///< Per-block adaptive fixed-rate bit-plane coder (cuSZp plain mode)
    TILED_LORENZO    = 25,  ///< Dimension-aware (tiled separable) Lorenzo predictor (cuSZp3 delta)
    RRE              = 26,  ///< Repetition-Reduction Encoding (LC framework lossless component)
};
101
/// Element data type identifiers used in buffer and stage descriptors.
///
/// Stored as a single byte; 0xFF marks an unknown type.
enum class DataType : uint8_t {
    // Unsigned integers
    UINT8   = 0,
    UINT16  = 1,
    UINT32  = 2,
    UINT64  = 3,
    // Signed integers
    INT8    = 4,
    INT16   = 5,
    INT32   = 6,
    INT64   = 7,
    // Floating point
    FLOAT32 = 8,
    FLOAT64 = 9,
    // Sentinel
    UNKNOWN = 0xFF,
};
122
123// ─────────────────────────────────────────────────────────────────────────────
124
/// Capacity of the per-stage input_buffer_ids array (input ports per stage).
constexpr size_t FZM_MAX_STAGE_INPUTS = 8;
/// Capacity of the per-stage output_buffer_ids array (output ports per stage).
constexpr size_t FZM_MAX_STAGE_OUTPUTS = 8;
127
139 uint16_t stage_version;
140 uint8_t num_inputs;
141 uint8_t num_outputs;
142 uint16_t reserved1;
143
144 uint16_t input_buffer_ids[FZM_MAX_STAGE_INPUTS];
145 uint16_t output_buffer_ids[FZM_MAX_STAGE_OUTPUTS];
146
148 uint32_t config_size;
149
150 uint8_t reserved2[84];
151 // Total: 2+2+1+1+2+16+16+128+4+84 = 256 bytes
152
153 FZMStageInfo() {
154 stage_type = StageType::UNKNOWN;
155 stage_version = 0;
156 num_inputs = 0;
157 num_outputs = 0;
158 reserved1 = 0;
159 memset(input_buffer_ids, 0xFF, sizeof(input_buffer_ids));
160 memset(output_buffer_ids, 0xFF, sizeof(output_buffer_ids));
162 config_size = 0;
163 memset(reserved2, 0, 84);
164 }
165};
166static_assert(sizeof(FZMStageInfo) == 256, "FZMStageInfo must be 256 bytes");
167
178 uint16_t stage_version;
181 uint16_t dag_buffer_id;
183
184 uint64_t data_size;
185 uint64_t allocated_size;
187 uint64_t byte_offset;
188
190 uint32_t config_size;
191
192 uint8_t reserved2[14];
193
195 stage_type = StageType::UNKNOWN;
196 stage_version = 0;
197 data_type = DataType::UINT8;
199 dag_buffer_id = 0xFFFF;
200 memset(name, 0, FZM_MAX_NAME_LEN);
201 data_size = 0;
202 allocated_size = 0;
204 byte_offset = 0;
206 config_size = 0;
207 memset(reserved2, 0, 14);
208 }
209};
210static_assert(sizeof(FZMBufferEntry) == 256, "FZMBufferEntry must be 256 bytes");
211
225 uint32_t magic;
226 uint16_t version;
227 uint16_t num_buffers;
228
231 uint64_t header_size;
232
233 uint32_t num_stages;
234 uint16_t num_sources;
235 uint16_t flags;
236
243
244 uint32_t data_checksum;
246
247 FZMHeaderCore() {
249 version = FZM_VERSION;
250 num_buffers = 0;
252 compressed_size = 0;
253 header_size = sizeof(FZMHeaderCore);
254 num_stages = 0;
255 num_sources = 0;
256 flags = 0;
258 data_checksum = 0;
259 header_checksum = 0;
260 }
261
263 uint64_t computeHeaderSize() const {
264 return sizeof(FZMHeaderCore)
265 + num_stages * sizeof(FZMStageInfo)
266 + num_buffers * sizeof(FZMBufferEntry);
267 }
268};
269static_assert(sizeof(FZMHeaderCore) == 80, "FZMHeaderCore must be 80 bytes");
270
271// ─────────────────────────────────────────────────────────────────────────────
272// Helper functions
273// ─────────────────────────────────────────────────────────────────────────────
274
276inline size_t getDataTypeSize(DataType type) {
277 switch (type) {
278 case DataType::UINT8: case DataType::INT8: return 1;
279 case DataType::UINT16: case DataType::INT16: return 2;
280 case DataType::UINT32: case DataType::INT32: case DataType::FLOAT32: return 4;
281 case DataType::UINT64: case DataType::INT64: case DataType::FLOAT64: return 8;
282 default: throw std::runtime_error("Unknown data type");
283 }
284}
285
287inline std::string dataTypeToString(DataType type) {
288 switch (type) {
289 case DataType::UINT8: return "uint8";
290 case DataType::UINT16: return "uint16";
291 case DataType::UINT32: return "uint32";
292 case DataType::UINT64: return "uint64";
293 case DataType::INT8: return "int8";
294 case DataType::INT16: return "int16";
295 case DataType::INT32: return "int32";
296 case DataType::INT64: return "int64";
297 case DataType::FLOAT32: return "float32";
298 case DataType::FLOAT64: return "float64";
299 default: return "unknown";
300 }
301}
302
304inline std::string stageTypeToString(StageType type) {
305 switch (type) {
306 case StageType::LORENZO_QUANT: return "LorenzoQuant";
307 case StageType::DIFFERENCE: return "Difference";
308 case StageType::SCALE: return "Scale";
309 case StageType::PASSTHROUGH: return "PassThrough";
310 case StageType::RLE: return "RLE";
311 case StageType::HUFFMAN: return "Huffman";
312 case StageType::BITPACK: return "BitPack";
313 case StageType::SPLIT: return "Split";
314 case StageType::MERGE: return "Merge";
315 case StageType::QUANTIZER: return "Quantizer";
316 case StageType::ZIGZAG: return "Zigzag";
317 case StageType::NEGABINARY: return "Negabinary";
318 case StageType::BITSHUFFLE: return "Bitshuffle";
319 case StageType::RZE: return "RZE";
320 case StageType::RRE: return "RRE";
321 case StageType::LORENZO: return "Lorenzo";
322 case StageType::ANS: return "ANS";
323 case StageType::ADM: return "ADM";
324 case StageType::G_INTERP: return "GInterp";
325 case StageType::BITPLANE_RZE: return "BitplaneRZE";
326 case StageType::ADAPTIVE_BITPACK: return "AdaptiveBitpack";
327 case StageType::TILED_LORENZO: return "TiledLorenzo";
328 default: return "Unknown";
329 }
330}
331
332} // namespace fz
Definition fzm_format.h:25
size_t getDataTypeSize(DataType type)
Definition fzm_format.h:276
constexpr uint8_t FZM_VERSION_MAJOR
Definition fzm_format.h:40
std::string dataTypeToString(DataType type)
Definition fzm_format.h:287
std::string stageTypeToString(StageType type)
Definition fzm_format.h:304
constexpr uint8_t fzmVersionMinor(uint16_t v)
Definition fzm_format.h:59
constexpr size_t FZM_MAX_SOURCES
Maximum source stages per pipeline.
Definition fzm_format.h:66
constexpr size_t FZM_STAGE_CONFIG_SIZE
Per-stage serialized config slot (bytes)
Definition fzm_format.h:65
constexpr uint8_t fzmVersionMajor(uint16_t v)
Definition fzm_format.h:55
constexpr uint16_t FZM_FLAG_HAS_DATA_CHECKSUM
data_checksum field is valid
Definition fzm_format.h:48
constexpr uint32_t FZM_MAGIC
Definition fzm_format.h:28
StageType
Stage type identifiers written into the FZM header.
Definition fzm_format.h:76
@ ADAPTIVE_BITPACK
Per-block adaptive fixed-rate bit-plane coder (cuSZp plain mode)
@ ANS
rANS entropy coder (GPU, via dietGPU)
@ RRE
Repetition-Reduction Encoding (LC framework lossless component)
@ ADM
Adaptive Data Mapping transform (MANS)
@ TILED_LORENZO
Dimension-aware (tiled separable) Lorenzo predictor (cuSZp3 delta)
@ BITPLANE_RZE
Fused bitplane transpose + zero-group RZE (FZ-GPU lossless encoder)
@ G_INTERP
Spline interpolation predictor + quantizer (cuSZ-Hi G-Interp)
constexpr uint16_t FZM_FLAG_HAS_HEADER_CHECKSUM
header_checksum field is valid
Definition fzm_format.h:49
DataType
Element data type identifiers used in buffer and stage descriptors.
Definition fzm_format.h:109
constexpr size_t FZM_LEGACY_HEADER_CORE_SIZE
Definition fzm_format.h:46
constexpr size_t FZM_MAX_NAME_LEN
Maximum output port name length (bytes, null-terminated)
Definition fzm_format.h:64
constexpr size_t FZM_MAX_BUFFERS
Maximum pipeline output buffers per file.
Definition fzm_format.h:63
Per-buffer metadata record written into the FZM header (256 bytes).
Definition fzm_format.h:176
StageType stage_type
Producer stage type (2B)
Definition fzm_format.h:177
uint64_t data_size
Actual compressed bytes in this segment (8B)
Definition fzm_format.h:184
uint8_t producer_output_idx
Which output port of the producer (1B)
Definition fzm_format.h:180
uint64_t uncompressed_size
Bytes after fully decompressing this stage's output (8B)
Definition fzm_format.h:186
uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]
Producer stage config, see Stage::serializeHeader() (128B)
Definition fzm_format.h:189
char name[FZM_MAX_NAME_LEN]
Output port name, null-terminated (64B)
Definition fzm_format.h:182
DataType data_type
Element data type in this buffer (1B)
Definition fzm_format.h:179
uint64_t allocated_size
Buffer capacity required for decompression (8B)
Definition fzm_format.h:185
uint8_t reserved2[14]
Reserved for future use (14B)
Definition fzm_format.h:192
uint32_t config_size
Valid bytes in stage_config (4B)
Definition fzm_format.h:190
uint16_t dag_buffer_id
DAG buffer ID used for inverse routing; 0xFFFF = unassigned (2B)
Definition fzm_format.h:181
uint16_t stage_version
Producer stage config version (2B)
Definition fzm_format.h:178
uint64_t byte_offset
Byte offset of this segment within the compressed payload (8B)
Definition fzm_format.h:187
Fixed-size FZM file header core (80 bytes).
Definition fzm_format.h:224
uint64_t computeHeaderSize() const
Definition fzm_format.h:263
uint16_t num_buffers
Number of FZMBufferEntry records (2B)
Definition fzm_format.h:227
uint32_t header_checksum
CRC32 of header bytes (v3.1+; 0 if flag not set) (4B)
Definition fzm_format.h:245
uint16_t flags
Feature flags: FZM_FLAG_* constants (2B)
Definition fzm_format.h:235
uint32_t data_checksum
CRC32 of compressed payload (v3.1+; 0 if flag not set) (4B)
Definition fzm_format.h:244
uint32_t num_stages
Number of FZMStageInfo records (4B)
Definition fzm_format.h:233
uint64_t compressed_size
Total compressed payload size in bytes (8B)
Definition fzm_format.h:230
uint64_t source_uncompressed_sizes[FZM_MAX_SOURCES]
(32B)
Definition fzm_format.h:242
uint16_t version
FZM_VERSION (2B)
Definition fzm_format.h:226
uint64_t uncompressed_size
Sum of all source uncompressed sizes in bytes (8B)
Definition fzm_format.h:229
uint16_t num_sources
Number of source (input) stages in the pipeline (2B)
Definition fzm_format.h:234
uint32_t magic
Must equal FZM_MAGIC (4B)
Definition fzm_format.h:225
uint64_t header_size
Total header size; compressed payload starts at this offset (8B)
Definition fzm_format.h:231
Per-stage metadata record written into the FZM header (256 bytes).
Definition fzm_format.h:137
uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]
Serialized stage config, see Stage::serializeHeader() (128B)
Definition fzm_format.h:147
uint8_t num_inputs
Number of input ports (1B)
Definition fzm_format.h:140
uint8_t num_outputs
Number of output ports (1B)
Definition fzm_format.h:141
StageType stage_type
Stage type (2B)
Definition fzm_format.h:138
uint8_t reserved2[84]
Reserved for future use (84B)
Definition fzm_format.h:150
uint16_t input_buffer_ids[FZM_MAX_STAGE_INPUTS]
Input buffer indices (16B); 0xFFFF = unused.
Definition fzm_format.h:144
uint16_t stage_version
Config format version (2B)
Definition fzm_format.h:139
uint32_t config_size
Valid bytes in stage_config (4B)
Definition fzm_format.h:148
uint16_t reserved1
Padding (2B)
Definition fzm_format.h:142
uint16_t output_buffer_ids[FZM_MAX_STAGE_OUTPUTS]
Output buffer indices (16B); 0xFFFF = unused.
Definition fzm_format.h:145