FZGPUModules 2.0
GPU-accelerated modular compression pipelines
Loading...
Searching...
No Matches
fzm_format.h
Go to the documentation of this file.
1#pragma once
2
20#include <cstdint>
21#include <cstring>
22#include <stdexcept>
23#include <string>
24
25namespace fz {
26
/// File magic number. Read most-significant byte first, the literal's bytes
/// are 0x46 0x4D 0x5A 0x32, i.e. ASCII 'F' 'M' 'Z' '2'.
constexpr uint32_t FZM_MAGIC{0x464D5A32};

/// Format version. The packed 16-bit form keeps the major number in the high
/// byte and the minor number in the low byte (3.1 -> 0x0301).
constexpr uint8_t FZM_VERSION_MAJOR{3};
constexpr uint8_t FZM_VERSION_MINOR{1};
constexpr uint16_t FZM_VERSION =
    static_cast<uint16_t>((FZM_VERSION_MAJOR << 8) | FZM_VERSION_MINOR);

/// Size in bytes of the legacy header core.
/// NOTE(review): presumably the 80-byte core minus the two 4-byte checksum
/// fields — confirm against the reader code.
constexpr size_t FZM_LEGACY_HEADER_CORE_SIZE{72};

/// Feature flag bits for the header `flags` field.
constexpr uint16_t FZM_FLAG_HAS_DATA_CHECKSUM   = static_cast<uint16_t>(1u << 0);  ///< data_checksum field is valid
constexpr uint16_t FZM_FLAG_HAS_HEADER_CHECKSUM = static_cast<uint16_t>(1u << 1);  ///< header_checksum field is valid
50
/// Extracts the major version number from a 16-bit version field.
///
/// A value that fits in one byte (<= 0xFF) is returned unchanged as the major
/// number; any larger value is read as (major << 8) | minor and its high byte
/// is returned.
/// NOTE(review): the single-byte form looks like an older version encoding —
/// confirm.
constexpr uint8_t fzmVersionMajor(uint16_t v) {
    return static_cast<uint8_t>(v > 0xFF ? (v >> 8) : v);
}
/// Extracts the minor version number from a 16-bit version field.
///
/// A value that fits in one byte (<= 0xFF) carries no minor component and
/// yields 0; any larger value is read as (major << 8) | minor and its low byte
/// is returned.
constexpr uint8_t fzmVersionMinor(uint16_t v) {
    return static_cast<uint8_t>(v > 0xFF ? (v & 0xFF) : 0);
}
62
/// Fixed capacities used by the header records.
constexpr size_t FZM_MAX_BUFFERS{32};         ///< Maximum pipeline output buffers per file
constexpr size_t FZM_MAX_NAME_LEN{64};        ///< Maximum output port name length (bytes, null-terminated)
constexpr size_t FZM_STAGE_CONFIG_SIZE{128};  ///< Per-stage serialized config slot (bytes)
constexpr size_t FZM_MAX_SOURCES{4};          ///< Maximum source stages per pipeline
67
68// ─────────────────────────────────────────────────────────────────────────────
69
/// Stage type identifiers written into the FZM header.
///
/// Every enumerator has an explicit 16-bit value. Entries are listed in
/// ascending numeric order; the values 8, 9 and 13 are not assigned here.
enum class StageType : uint16_t {
    UNKNOWN       = 0,
    LORENZO_QUANT = 1,
    DIFFERENCE    = 2,
    SCALE         = 3,
    PASSTHROUGH   = 4,
    RLE           = 5,
    HUFFMAN       = 6,
    BITPACK       = 7,
    SPLIT         = 10,
    MERGE         = 11,
    LORENZO       = 12,
    QUANTIZER     = 14,
    ZIGZAG        = 15,
    NEGABINARY    = 16,
    BITSHUFFLE    = 17,
    RZE           = 18,
    ADM           = 19,  ///< Adaptive Data Mapping transform (MANS)
    ANS           = 20,  ///< rANS entropy coder (GPU, via dietGPU)
};
96
/// Element data type identifiers used in buffer and stage descriptors.
///
/// Stored as a single byte. Values 0-3 are the unsigned integers, 4-7 the
/// signed integers and 8-9 the floating-point types, each group in order of
/// increasing width; 0xFF marks an unknown type.
enum class DataType : uint8_t {
    // Unsigned integers
    UINT8   = 0,
    UINT16  = 1,
    UINT32  = 2,
    UINT64  = 3,
    // Signed integers
    INT8    = 4,
    INT16   = 5,
    INT32   = 6,
    INT64   = 7,
    // Floating point
    FLOAT32 = 8,
    FLOAT64 = 9,
    // Sentinel
    UNKNOWN = 0xFF,
};
117
118// ─────────────────────────────────────────────────────────────────────────────
119
/// Number of slots in the per-stage input / output buffer-id arrays.
constexpr size_t FZM_MAX_STAGE_INPUTS{8};
constexpr size_t FZM_MAX_STAGE_OUTPUTS{8};
122
// FZMStageInfo: per-stage metadata record written into the FZM header
// (256 bytes, enforced by the static_assert below).
// NOTE(review): this listing is missing source lines 132-133 (the struct
// header and the `StageType stage_type` member, 2B), line 142
// (`uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]`, 128B) and line 156 of the
// constructor — consult the real header before editing.

// Config format version (2B).
134 uint16_t stage_version;
// Number of input ports (1B).
135 uint8_t num_inputs;
// Number of output ports (1B).
136 uint8_t num_outputs;
// Padding (2B).
137 uint16_t reserved1;
138
// Input / output buffer indices (16B each); 0xFFFF marks an unused slot.
139 uint16_t input_buffer_ids[FZM_MAX_STAGE_INPUTS];
140 uint16_t output_buffer_ids[FZM_MAX_STAGE_OUTPUTS];
141
// Number of valid bytes in stage_config (4B).
143 uint32_t config_size;
144
// Reserved for future use (84B).
145 uint8_t reserved2[84];
146 // Total: 2+2+1+1+2+16+16+128+4+84 = 256 bytes
147
// Default constructor: type UNKNOWN, zero counts and sizes, all buffer-id
// slots unused, reserved bytes zeroed.
148 FZMStageInfo() {
149 stage_type = StageType::UNKNOWN;
150 stage_version = 0;
151 num_inputs = 0;
152 num_outputs = 0;
153 reserved1 = 0;
// Filling every byte with 0xFF makes each uint16_t slot read as 0xFFFF,
// the "unused" marker.
154 memset(input_buffer_ids, 0xFF, sizeof(input_buffer_ids));
155 memset(output_buffer_ids, 0xFF, sizeof(output_buffer_ids));
// NOTE(review): source line 156 is absent from this listing; presumably it
// clears stage_config — verify.
157 config_size = 0;
158 memset(reserved2, 0, 84);
159 }
160};
// Compile-time guard on the record size.
161static_assert(sizeof(FZMStageInfo) == 256, "FZMStageInfo must be 256 bytes");
162
// FZMBufferEntry: per-buffer metadata record written into the FZM header
// (256 bytes, enforced by the static_assert below).
// NOTE(review): this listing is missing source lines 171-172 (struct header,
// `StageType stage_type`), 174-175 (`DataType data_type`,
// `uint8_t producer_output_idx`), 177 (`char name[FZM_MAX_NAME_LEN]`),
// 181 (`uint64_t uncompressed_size`), 184 (`uint8_t stage_config[...]`),
// 189 (constructor header) and constructor lines 193, 198 and 200 — consult
// the real header before editing.

// Producer stage config version (2B).
173 uint16_t stage_version;
// DAG buffer ID used for inverse routing; 0xFFFF = unassigned (2B).
176 uint16_t dag_buffer_id;
178
// Actual compressed bytes in this segment (8B).
179 uint64_t data_size;
// Buffer capacity required for decompression (8B).
180 uint64_t allocated_size;
// Byte offset of this segment within the compressed payload (8B).
182 uint64_t byte_offset;
183
// Number of valid bytes in stage_config (4B).
185 uint32_t config_size;
186
// Reserved for future use (14B).
187 uint8_t reserved2[14];
188
// Body of the default constructor (its opening line is not in this listing):
// type UNKNOWN, data type UINT8, unassigned DAG id, empty name, zero sizes and
// offset, reserved bytes zeroed.
190 stage_type = StageType::UNKNOWN;
191 stage_version = 0;
192 data_type = DataType::UINT8;
194 dag_buffer_id = 0xFFFF;
195 memset(name, 0, FZM_MAX_NAME_LEN);
196 data_size = 0;
197 allocated_size = 0;
199 byte_offset = 0;
201 config_size = 0;
202 memset(reserved2, 0, 14);
203 }
204};
// Compile-time guard on the record size.
205static_assert(sizeof(FZMBufferEntry) == 256, "FZMBufferEntry must be 256 bytes");
206
// FZMHeaderCore: fixed-size FZM file header core (80 bytes, enforced by the
// static_assert below).
// NOTE(review): this listing is missing source lines 219 (struct header),
// 224-225 (`uint64_t uncompressed_size`, `uint64_t compressed_size`),
// 237 (`uint64_t source_uncompressed_sizes[FZM_MAX_SOURCES]`),
// 240 (`uint32_t header_checksum`) and constructor lines 243, 246 and 252 —
// consult the real header before editing.

// Must equal FZM_MAGIC (4B).
220 uint32_t magic;
// FZM_VERSION (2B).
221 uint16_t version;
// Number of FZMBufferEntry records (2B).
222 uint16_t num_buffers;
223
// Total header size; the compressed payload starts at this offset (8B).
226 uint64_t header_size;
227
// Number of FZMStageInfo records (4B).
228 uint32_t num_stages;
// Number of source (input) stages in the pipeline (2B).
229 uint16_t num_sources;
// Feature flags: FZM_FLAG_* constants (2B).
230 uint16_t flags;
231
238
// CRC32 of the compressed payload (v3.1+; 0 if the flag is not set) (4B).
239 uint32_t data_checksum;
241
// Default constructor: current format version, zero counts, flags and
// checksums; header_size starts as the size of the core alone.
242 FZMHeaderCore() {
244 version = FZM_VERSION;
245 num_buffers = 0;
247 compressed_size = 0;
248 header_size = sizeof(FZMHeaderCore);
249 num_stages = 0;
250 num_sources = 0;
251 flags = 0;
253 data_checksum = 0;
254 header_checksum = 0;
255 }
256
// Returns the core size plus one FZMStageInfo per stage and one
// FZMBufferEntry per buffer, in bytes.
// NOTE(review): the sum is evaluated in size_t before widening to uint64_t;
// where size_t is 32 bits, a large num_stages could wrap — confirm whether
// such targets matter.
258 uint64_t computeHeaderSize() const {
259 return sizeof(FZMHeaderCore)
260 + num_stages * sizeof(FZMStageInfo)
261 + num_buffers * sizeof(FZMBufferEntry);
262 }
263};
// Compile-time guard on the core size.
264static_assert(sizeof(FZMHeaderCore) == 80, "FZMHeaderCore must be 80 bytes");
265
266// ─────────────────────────────────────────────────────────────────────────────
267// Helper functions
268// ─────────────────────────────────────────────────────────────────────────────
269
271inline size_t getDataTypeSize(DataType type) {
272 switch (type) {
273 case DataType::UINT8: case DataType::INT8: return 1;
274 case DataType::UINT16: case DataType::INT16: return 2;
275 case DataType::UINT32: case DataType::INT32: case DataType::FLOAT32: return 4;
276 case DataType::UINT64: case DataType::INT64: case DataType::FLOAT64: return 8;
277 default: throw std::runtime_error("Unknown data type");
278 }
279}
280
282inline std::string dataTypeToString(DataType type) {
283 switch (type) {
284 case DataType::UINT8: return "uint8";
285 case DataType::UINT16: return "uint16";
286 case DataType::UINT32: return "uint32";
287 case DataType::UINT64: return "uint64";
288 case DataType::INT8: return "int8";
289 case DataType::INT16: return "int16";
290 case DataType::INT32: return "int32";
291 case DataType::INT64: return "int64";
292 case DataType::FLOAT32: return "float32";
293 case DataType::FLOAT64: return "float64";
294 default: return "unknown";
295 }
296}
297
299inline std::string stageTypeToString(StageType type) {
300 switch (type) {
301 case StageType::LORENZO_QUANT: return "LorenzoQuant";
302 case StageType::DIFFERENCE: return "Difference";
303 case StageType::SCALE: return "Scale";
304 case StageType::PASSTHROUGH: return "PassThrough";
305 case StageType::RLE: return "RLE";
306 case StageType::HUFFMAN: return "Huffman";
307 case StageType::BITPACK: return "BitPack";
308 case StageType::SPLIT: return "Split";
309 case StageType::MERGE: return "Merge";
310 case StageType::QUANTIZER: return "Quantizer";
311 case StageType::ZIGZAG: return "Zigzag";
312 case StageType::NEGABINARY: return "Negabinary";
313 case StageType::BITSHUFFLE: return "Bitshuffle";
314 case StageType::RZE: return "RZE";
315 case StageType::LORENZO: return "Lorenzo";
316 case StageType::ANS: return "ANS";
317 case StageType::ADM: return "ADM";
318 default: return "Unknown";
319 }
320}
321
322} // namespace fz
Definition fzm_format.h:25
size_t getDataTypeSize(DataType type)
Definition fzm_format.h:271
constexpr uint8_t FZM_VERSION_MAJOR
Definition fzm_format.h:40
std::string dataTypeToString(DataType type)
Definition fzm_format.h:282
std::string stageTypeToString(StageType type)
Definition fzm_format.h:299
constexpr uint8_t fzmVersionMinor(uint16_t v)
Definition fzm_format.h:59
constexpr size_t FZM_MAX_SOURCES
Maximum source stages per pipeline.
Definition fzm_format.h:66
constexpr size_t FZM_STAGE_CONFIG_SIZE
Per-stage serialized config slot (bytes)
Definition fzm_format.h:65
constexpr uint8_t fzmVersionMajor(uint16_t v)
Definition fzm_format.h:55
constexpr uint16_t FZM_FLAG_HAS_DATA_CHECKSUM
data_checksum field is valid
Definition fzm_format.h:48
constexpr uint32_t FZM_MAGIC
Definition fzm_format.h:28
StageType
Stage type identifiers written into the FZM header.
Definition fzm_format.h:76
@ ANS
rANS entropy coder (GPU, via dietGPU)
@ ADM
Adaptive Data Mapping transform (MANS)
constexpr uint16_t FZM_FLAG_HAS_HEADER_CHECKSUM
header_checksum field is valid
Definition fzm_format.h:49
DataType
Element data type identifiers used in buffer and stage descriptors.
Definition fzm_format.h:104
constexpr size_t FZM_LEGACY_HEADER_CORE_SIZE
Definition fzm_format.h:46
constexpr size_t FZM_MAX_NAME_LEN
Maximum output port name length (bytes, null-terminated)
Definition fzm_format.h:64
constexpr size_t FZM_MAX_BUFFERS
Maximum pipeline output buffers per file.
Definition fzm_format.h:63
Per-buffer metadata record written into the FZM header (256 bytes).
Definition fzm_format.h:171
StageType stage_type
Producer stage type (2B)
Definition fzm_format.h:172
uint64_t data_size
Actual compressed bytes in this segment (8B)
Definition fzm_format.h:179
uint8_t producer_output_idx
Which output port of the producer (1B)
Definition fzm_format.h:175
uint64_t uncompressed_size
Bytes after fully decompressing this stage's output (8B)
Definition fzm_format.h:181
uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]
Producer stage config, see Stage::serializeHeader() (128B)
Definition fzm_format.h:184
char name[FZM_MAX_NAME_LEN]
Output port name, null-terminated (64B)
Definition fzm_format.h:177
DataType data_type
Element data type in this buffer (1B)
Definition fzm_format.h:174
uint64_t allocated_size
Buffer capacity required for decompression (8B)
Definition fzm_format.h:180
uint8_t reserved2[14]
Reserved for future use (14B)
Definition fzm_format.h:187
uint32_t config_size
Valid bytes in stage_config (4B)
Definition fzm_format.h:185
uint16_t dag_buffer_id
DAG buffer ID used for inverse routing; 0xFFFF = unassigned (2B)
Definition fzm_format.h:176
uint16_t stage_version
Producer stage config version (2B)
Definition fzm_format.h:173
uint64_t byte_offset
Byte offset of this segment within the compressed payload (8B)
Definition fzm_format.h:182
Fixed-size FZM file header core (80 bytes).
Definition fzm_format.h:219
uint64_t computeHeaderSize() const
Definition fzm_format.h:258
uint16_t num_buffers
Number of FZMBufferEntry records (2B)
Definition fzm_format.h:222
uint32_t header_checksum
CRC32 of header bytes (v3.1+; 0 if flag not set) (4B)
Definition fzm_format.h:240
uint16_t flags
Feature flags: FZM_FLAG_* constants (2B)
Definition fzm_format.h:230
uint32_t data_checksum
CRC32 of compressed payload (v3.1+; 0 if flag not set) (4B)
Definition fzm_format.h:239
uint32_t num_stages
Number of FZMStageInfo records (4B)
Definition fzm_format.h:228
uint64_t compressed_size
Total compressed payload size in bytes (8B)
Definition fzm_format.h:225
uint64_t source_uncompressed_sizes[FZM_MAX_SOURCES]
(32B)
Definition fzm_format.h:237
uint16_t version
FZM_VERSION (2B)
Definition fzm_format.h:221
uint64_t uncompressed_size
Sum of all source uncompressed sizes in bytes (8B)
Definition fzm_format.h:224
uint16_t num_sources
Number of source (input) stages in the pipeline (2B)
Definition fzm_format.h:229
uint32_t magic
Must equal FZM_MAGIC (4B)
Definition fzm_format.h:220
uint64_t header_size
Total header size; compressed payload starts at this offset (8B)
Definition fzm_format.h:226
Per-stage metadata record written into the FZM header (256 bytes).
Definition fzm_format.h:132
uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]
Serialized stage config, see Stage::serializeHeader() (128B)
Definition fzm_format.h:142
uint8_t num_inputs
Number of input ports (1B)
Definition fzm_format.h:135
uint8_t num_outputs
Number of output ports (1B)
Definition fzm_format.h:136
StageType stage_type
Stage type (2B)
Definition fzm_format.h:133
uint8_t reserved2[84]
Reserved for future use (84B)
Definition fzm_format.h:145
uint16_t input_buffer_ids[FZM_MAX_STAGE_INPUTS]
Input buffer indices (16B); 0xFFFF = unused.
Definition fzm_format.h:139
uint16_t stage_version
Config format version (2B)
Definition fzm_format.h:134
uint32_t config_size
Valid bytes in stage_config (4B)
Definition fzm_format.h:143
uint16_t reserved1
Padding (2B)
Definition fzm_format.h:137
uint16_t output_buffer_ids[FZM_MAX_STAGE_OUTPUTS]
Output buffer indices (16B); 0xFFFF = unused.
Definition fzm_format.h:140