FZGPUModules 2.0
GPU-accelerated modular compression pipelines
Loading...
Searching...
No Matches
fzm_format.h
Go to the documentation of this file.
1#pragma once
2
20#include <cstdint>
21#include <cstring>
22#include <stdexcept>
23#include <string>
24
25namespace fz {
26
/// File magic; FZMHeaderCore::magic must equal this value.
/// The four bytes 0x46 0x4D 0x5A 0x32 are ASCII 'F', 'M', 'Z', '2'.
constexpr uint32_t FZM_MAGIC = 0x464D5A32;

/// Current format version, stored in the header as (major << 8) | minor.
constexpr uint8_t FZM_VERSION_MAJOR = 3;
constexpr uint8_t FZM_VERSION_MINOR = 1;
constexpr uint16_t FZM_VERSION =
    (static_cast<uint16_t>(FZM_VERSION_MAJOR) << 8) | static_cast<uint16_t>(FZM_VERSION_MINOR);

/// NOTE(review): by its name this is the header-core size of an older format
/// revision (the current FZMHeaderCore is asserted to be 80 bytes) — confirm
/// against the reader code before relying on it.
constexpr size_t FZM_LEGACY_HEADER_CORE_SIZE = 72;

/// FZMHeaderCore::flags bit: the data_checksum field is valid.
constexpr uint16_t FZM_FLAG_HAS_DATA_CHECKSUM = 0x0001u;
/// FZMHeaderCore::flags bit: the header_checksum field is valid.
constexpr uint16_t FZM_FLAG_HAS_HEADER_CHECKSUM = 0x0002u;
50
/// Extract the major version from a 16-bit version field.
///
/// Values that fit in one byte (<= 0xFF) are treated as a bare major number;
/// anything larger is read as (major << 8) | minor and the high byte is returned.
constexpr uint8_t fzmVersionMajor(uint16_t v) {
    return static_cast<uint8_t>((v <= 0xFF) ? v : (v >> 8));
}
/// Extract the minor version from a 16-bit version field.
///
/// Values that fit in one byte (<= 0xFF) carry no minor component and yield 0;
/// anything larger is read as (major << 8) | minor and the low byte is returned.
constexpr uint8_t fzmVersionMinor(uint16_t v) {
    // Both arms are uint8_t so the result is not silently narrowed from unsigned int.
    return (v <= 0xFF) ? uint8_t{0} : static_cast<uint8_t>(v & 0xFF);
}
62
/// Maximum pipeline output buffers per file.
constexpr size_t FZM_MAX_BUFFERS = 32;
/// Maximum output port name length (bytes, null-terminated).
constexpr size_t FZM_MAX_NAME_LEN = 64;
/// Per-stage serialized config slot (bytes).
constexpr size_t FZM_STAGE_CONFIG_SIZE = 128;
/// Maximum source stages per pipeline.
constexpr size_t FZM_MAX_SOURCES = 4;
67
68// ─────────────────────────────────────────────────────────────────────────────
69
/// Stage type identifiers written into the FZM header.
///
/// The numeric values are part of the on-disk format, so existing values must
/// never be renumbered. 8, 9 and 13 are not assigned in this enum.
enum class StageType : uint16_t {
    UNKNOWN       = 0,
    LORENZO_QUANT = 1,
    DIFFERENCE    = 2,
    SCALE         = 3,
    PASSTHROUGH   = 4,
    RLE           = 5,
    HUFFMAN       = 6,
    BITPACK       = 7,
    SPLIT         = 10,
    MERGE         = 11,
    LORENZO       = 12,
    QUANTIZER     = 14,
    ZIGZAG        = 15,
    NEGABINARY    = 16,
    BITSHUFFLE    = 17,
    RZE           = 18,
};
94
/// Element data type identifiers used in buffer and stage descriptors.
///
/// Stored as a single byte; the numeric values are part of the on-disk format.
enum class DataType : uint8_t {
    UINT8   = 0,
    UINT16  = 1,
    UINT32  = 2,
    UINT64  = 3,
    INT8    = 4,
    INT16   = 5,
    INT32   = 6,
    INT64   = 7,
    FLOAT32 = 8,
    FLOAT64 = 9,
    UNKNOWN = 0xFF,
};
115
116// ─────────────────────────────────────────────────────────────────────────────
117
/// Number of slots in FZMStageInfo::input_buffer_ids.
constexpr size_t FZM_MAX_STAGE_INPUTS = 8;
/// Number of slots in FZMStageInfo::output_buffer_ids.
constexpr size_t FZM_MAX_STAGE_OUTPUTS = 8;
120
// Fragment of FZMStageInfo: per-stage metadata record written into the FZM header (256 bytes).
// NOTE(review): this listing skips original lines 130, 131, 140 and 154. Per the member
// index further down this page, 130 is the struct definition, 131 is
// `StageType stage_type` and 140 is `uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]`.
// Line 154 is not shown anywhere (presumably it clears stage_config — confirm
// against the real header before rebuilding this struct).
// Config format version (2B).
132 uint16_t stage_version;
// Number of input ports (1B).
133 uint8_t num_inputs;
// Number of output ports (1B).
134 uint8_t num_outputs;
// Padding (2B).
135 uint16_t reserved1;
136
// Input / output buffer indices (16B each); 0xFFFF marks an unused slot.
137 uint16_t input_buffer_ids[FZM_MAX_STAGE_INPUTS];
138 uint16_t output_buffer_ids[FZM_MAX_STAGE_OUTPUTS];
139
// Valid bytes in stage_config (4B).
141 uint32_t config_size;
142
// Reserved for future use (84B).
143 uint8_t reserved2[84];
144 // Total: 2+2+1+1+2+16+16+128+4+84 = 256 bytes
145
// Default state: UNKNOWN stage type, zero counts and sizes, every buffer-id slot unused.
146 FZMStageInfo() {
147 stage_type = StageType::UNKNOWN;
148 stage_version = 0;
149 num_inputs = 0;
150 num_outputs = 0;
151 reserved1 = 0;
// Filling every byte with 0xFF makes each uint16_t slot read as 0xFFFF (unused).
152 memset(input_buffer_ids, 0xFF, sizeof(input_buffer_ids));
153 memset(output_buffer_ids, 0xFF, sizeof(output_buffer_ids));
155 config_size = 0;
156 memset(reserved2, 0, 84);
157 }
158};
// The record size is fixed by the file format; fail the build if the layout drifts.
159static_assert(sizeof(FZMStageInfo) == 256, "FZMStageInfo must be 256 bytes");
160
// Fragment of FZMBufferEntry: per-buffer metadata record written into the FZM header (256 bytes).
// NOTE(review): this listing skips several original lines. Per the member index further
// down this page they are: 169 struct definition, 170 `StageType stage_type`,
// 172 `DataType data_type`, 173 `uint8_t producer_output_idx`,
// 175 `char name[FZM_MAX_NAME_LEN]`, 179 `uint64_t uncompressed_size`,
// 182 `uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]`. Lines 187, 191, 196 and 198
// (constructor head and three of its statements) are not shown anywhere —
// restore them from the real header before rebuilding this struct.
// Producer stage config version (2B).
171 uint16_t stage_version;
// DAG buffer ID used for inverse routing; 0xFFFF = unassigned (2B).
174 uint16_t dag_buffer_id;
176
// Actual compressed bytes in this segment (8B).
177 uint64_t data_size;
// Buffer capacity required for decompression (8B).
178 uint64_t allocated_size;
// Byte offset of this segment within the compressed payload (8B).
180 uint64_t byte_offset;
181
// Valid bytes in stage_config (4B).
183 uint32_t config_size;
184
// Reserved for future use (14B).
185 uint8_t reserved2[14];
186
// Constructor body (its opening line is missing from this listing): UNKNOWN stage type,
// UINT8 element type, unassigned DAG id, empty name, zero sizes and offset.
188 stage_type = StageType::UNKNOWN;
189 stage_version = 0;
190 data_type = DataType::UINT8;
192 dag_buffer_id = 0xFFFF;
193 memset(name, 0, FZM_MAX_NAME_LEN);
194 data_size = 0;
195 allocated_size = 0;
197 byte_offset = 0;
199 config_size = 0;
200 memset(reserved2, 0, 14);
201 }
202};
// The record size is fixed by the file format; fail the build if the layout drifts.
203static_assert(sizeof(FZMBufferEntry) == 256, "FZMBufferEntry must be 256 bytes");
204
// Fragment of FZMHeaderCore: fixed-size FZM file header core (80 bytes).
// NOTE(review): this listing skips several original lines. Per the member index further
// down this page they are: 217 struct definition, 222 `uint64_t uncompressed_size`,
// 223 `uint64_t compressed_size`, 235 `uint64_t source_uncompressed_sizes[FZM_MAX_SOURCES]`,
// 238 `uint32_t header_checksum`. Constructor lines 241, 244 and 250 are not shown
// anywhere — restore them from the real header before rebuilding this struct.
// Must equal FZM_MAGIC (4B).
218 uint32_t magic;
// FZM_VERSION (2B).
219 uint16_t version;
// Number of FZMBufferEntry records (2B).
220 uint16_t num_buffers;
221
// Total header size; compressed payload starts at this offset (8B).
224 uint64_t header_size;
225
// Number of FZMStageInfo records (4B).
226 uint32_t num_stages;
// Number of source (input) stages in the pipeline (2B).
227 uint16_t num_sources;
// Feature flags: FZM_FLAG_* constants (2B).
228 uint16_t flags;
229
236
// CRC32 of compressed payload (v3.1+; 0 if flag not set) (4B).
237 uint32_t data_checksum;
239
// Default state: current FZM_VERSION, no stages/buffers/sources, no flags, zero checksums,
// and header_size covering only this core struct.
240 FZMHeaderCore() {
242 version = FZM_VERSION;
243 num_buffers = 0;
245 compressed_size = 0;
246 header_size = sizeof(FZMHeaderCore);
247 num_stages = 0;
248 num_sources = 0;
249 flags = 0;
251 data_checksum = 0;
252 header_checksum = 0;
253 }
254
// Size of this core plus num_stages FZMStageInfo records plus num_buffers FZMBufferEntry records.
256 uint64_t computeHeaderSize() const {
257 return sizeof(FZMHeaderCore)
258 + num_stages * sizeof(FZMStageInfo)
259 + num_buffers * sizeof(FZMBufferEntry);
260 }
261};
// The core size is fixed by the file format; fail the build if the layout drifts.
262static_assert(sizeof(FZMHeaderCore) == 80, "FZMHeaderCore must be 80 bytes");
263
264// ─────────────────────────────────────────────────────────────────────────────
265// Helper functions
266// ─────────────────────────────────────────────────────────────────────────────
267
269inline size_t getDataTypeSize(DataType type) {
270 switch (type) {
271 case DataType::UINT8: case DataType::INT8: return 1;
272 case DataType::UINT16: case DataType::INT16: return 2;
273 case DataType::UINT32: case DataType::INT32: case DataType::FLOAT32: return 4;
274 case DataType::UINT64: case DataType::INT64: case DataType::FLOAT64: return 8;
275 default: throw std::runtime_error("Unknown data type");
276 }
277}
278
280inline std::string dataTypeToString(DataType type) {
281 switch (type) {
282 case DataType::UINT8: return "uint8";
283 case DataType::UINT16: return "uint16";
284 case DataType::UINT32: return "uint32";
285 case DataType::UINT64: return "uint64";
286 case DataType::INT8: return "int8";
287 case DataType::INT16: return "int16";
288 case DataType::INT32: return "int32";
289 case DataType::INT64: return "int64";
290 case DataType::FLOAT32: return "float32";
291 case DataType::FLOAT64: return "float64";
292 default: return "unknown";
293 }
294}
295
297inline std::string stageTypeToString(StageType type) {
298 switch (type) {
299 case StageType::LORENZO_QUANT: return "LorenzoQuant";
300 case StageType::DIFFERENCE: return "Difference";
301 case StageType::SCALE: return "Scale";
302 case StageType::PASSTHROUGH: return "PassThrough";
303 case StageType::RLE: return "RLE";
304 case StageType::HUFFMAN: return "Huffman";
305 case StageType::BITPACK: return "BitPack";
306 case StageType::SPLIT: return "Split";
307 case StageType::MERGE: return "Merge";
308 case StageType::QUANTIZER: return "Quantizer";
309 case StageType::ZIGZAG: return "Zigzag";
310 case StageType::NEGABINARY: return "Negabinary";
311 case StageType::BITSHUFFLE: return "Bitshuffle";
312 case StageType::RZE: return "RZE";
313 case StageType::LORENZO: return "Lorenzo";
314 default: return "Unknown";
315 }
316}
317
318} // namespace fz
size_t getDataTypeSize(DataType type)
Definition fzm_format.h:269
constexpr uint8_t FZM_VERSION_MAJOR
Definition fzm_format.h:40
std::string dataTypeToString(DataType type)
Definition fzm_format.h:280
std::string stageTypeToString(StageType type)
Definition fzm_format.h:297
constexpr uint8_t fzmVersionMinor(uint16_t v)
Definition fzm_format.h:59
constexpr size_t FZM_MAX_SOURCES
Maximum source stages per pipeline.
Definition fzm_format.h:66
constexpr size_t FZM_STAGE_CONFIG_SIZE
Per-stage serialized config slot (bytes)
Definition fzm_format.h:65
constexpr uint8_t fzmVersionMajor(uint16_t v)
Definition fzm_format.h:55
constexpr uint16_t FZM_FLAG_HAS_DATA_CHECKSUM
data_checksum field is valid
Definition fzm_format.h:48
constexpr uint32_t FZM_MAGIC
Definition fzm_format.h:28
StageType
Stage type identifiers written into the FZM header.
Definition fzm_format.h:76
constexpr uint16_t FZM_FLAG_HAS_HEADER_CHECKSUM
header_checksum field is valid
Definition fzm_format.h:49
DataType
Element data type identifiers used in buffer and stage descriptors.
Definition fzm_format.h:102
constexpr size_t FZM_LEGACY_HEADER_CORE_SIZE
Definition fzm_format.h:46
constexpr size_t FZM_MAX_NAME_LEN
Maximum output port name length (bytes, null-terminated)
Definition fzm_format.h:64
constexpr size_t FZM_MAX_BUFFERS
Maximum pipeline output buffers per file.
Definition fzm_format.h:63
FZMBufferEntry
Per-buffer metadata record written into the FZM header (256 bytes).
Definition fzm_format.h:169
StageType stage_type
Producer stage type (2B)
Definition fzm_format.h:170
uint64_t data_size
Actual compressed bytes in this segment (8B)
Definition fzm_format.h:177
uint8_t producer_output_idx
Which output port of the producer (1B)
Definition fzm_format.h:173
uint64_t uncompressed_size
Bytes after fully decompressing this stage's output (8B)
Definition fzm_format.h:179
uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]
Producer stage config, see Stage::serializeHeader() (128B)
Definition fzm_format.h:182
char name[FZM_MAX_NAME_LEN]
Output port name, null-terminated (64B)
Definition fzm_format.h:175
DataType data_type
Element data type in this buffer (1B)
Definition fzm_format.h:172
uint64_t allocated_size
Buffer capacity required for decompression (8B)
Definition fzm_format.h:178
uint8_t reserved2[14]
Reserved for future use (14B)
Definition fzm_format.h:185
uint32_t config_size
Valid bytes in stage_config (4B)
Definition fzm_format.h:183
uint16_t dag_buffer_id
DAG buffer ID used for inverse routing; 0xFFFF = unassigned (2B)
Definition fzm_format.h:174
uint16_t stage_version
Producer stage config version (2B)
Definition fzm_format.h:171
uint64_t byte_offset
Byte offset of this segment within the compressed payload (8B)
Definition fzm_format.h:180
FZMHeaderCore
Fixed-size FZM file header core (80 bytes).
Definition fzm_format.h:217
uint64_t computeHeaderSize() const
Definition fzm_format.h:256
uint16_t num_buffers
Number of FZMBufferEntry records (2B)
Definition fzm_format.h:220
uint32_t header_checksum
CRC32 of header bytes (v3.1+; 0 if flag not set) (4B)
Definition fzm_format.h:238
uint16_t flags
Feature flags: FZM_FLAG_* constants (2B)
Definition fzm_format.h:228
uint32_t data_checksum
CRC32 of compressed payload (v3.1+; 0 if flag not set) (4B)
Definition fzm_format.h:237
uint32_t num_stages
Number of FZMStageInfo records (4B)
Definition fzm_format.h:226
uint64_t compressed_size
Total compressed payload size in bytes (8B)
Definition fzm_format.h:223
uint64_t source_uncompressed_sizes[FZM_MAX_SOURCES]
Uncompressed size in bytes of each source, one slot per FZM_MAX_SOURCES (32B)
Definition fzm_format.h:235
uint16_t version
FZM_VERSION (2B)
Definition fzm_format.h:219
uint64_t uncompressed_size
Sum of all source uncompressed sizes in bytes (8B)
Definition fzm_format.h:222
uint16_t num_sources
Number of source (input) stages in the pipeline (2B)
Definition fzm_format.h:227
uint32_t magic
Must equal FZM_MAGIC (4B)
Definition fzm_format.h:218
uint64_t header_size
Total header size; compressed payload starts at this offset (8B)
Definition fzm_format.h:224
FZMStageInfo
Per-stage metadata record written into the FZM header (256 bytes).
Definition fzm_format.h:130
uint8_t stage_config[FZM_STAGE_CONFIG_SIZE]
Serialized stage config, see Stage::serializeHeader() (128B)
Definition fzm_format.h:140
uint8_t num_inputs
Number of input ports (1B)
Definition fzm_format.h:133
uint8_t num_outputs
Number of output ports (1B)
Definition fzm_format.h:134
StageType stage_type
Stage type (2B)
Definition fzm_format.h:131
uint8_t reserved2[84]
Reserved for future use (84B)
Definition fzm_format.h:143
uint16_t input_buffer_ids[FZM_MAX_STAGE_INPUTS]
Input buffer indices (16B); 0xFFFF = unused.
Definition fzm_format.h:137
uint16_t stage_version
Config format version (2B)
Definition fzm_format.h:132
uint32_t config_size
Valid bytes in stage_config (4B)
Definition fzm_format.h:141
uint16_t reserved1
Padding (2B)
Definition fzm_format.h:135
uint16_t output_buffer_ids[FZM_MAX_STAGE_OUTPUTS]
Output buffer indices (16B); 0xFFFF = unused.
Definition fzm_format.h:138