FZGPUModules 2.0
GPU-accelerated modular compression pipelines
Loading...
Searching...
No Matches
stage.h
Go to the documentation of this file.
1
5#pragma once
6
7#include "fzm_format.h"
8#include <array>
9#include <cuda_runtime.h>
10#include <cstdint>
11#include <stdexcept>
12#include <string>
13#include <unordered_map>
14#include <vector>
15
16namespace fz {
17
18// Forward declaration — avoids requiring mempool.h in every stage header
19class MemoryPool;
20
30class Stage {
31public:
32 virtual ~Stage() = default;
33
35 virtual void execute(
36 cudaStream_t stream,
37 MemoryPool* pool,
38 const std::vector<void*>& inputs,
39 const std::vector<void*>& outputs,
40 const std::vector<size_t>& sizes
41 ) = 0;
42
44 virtual std::string getName() const = 0;
45
46 virtual size_t getNumInputs() const = 0;
47 virtual size_t getNumOutputs() const = 0;
48
55 virtual size_t getRequiredInputAlignment() const { return 1; }
56
61 virtual std::vector<std::string> getOutputNames() const {
62 return {"output"};
63 }
64
66 int getOutputIndex(const std::string& name) const {
67 auto names = getOutputNames();
68 for (size_t i = 0; i < names.size(); i++) {
69 if (names[i] == name) return static_cast<int>(i);
70 }
71 return -1;
72 }
73
79 virtual std::vector<size_t> estimateOutputSizes(
80 const std::vector<size_t>& input_sizes
81 ) const = 0;
82
84 virtual std::unordered_map<std::string, size_t> getActualOutputSizesByName() const = 0;
85
92 virtual size_t getActualOutputSize(int index) const {
93 auto names = getOutputNames();
94 if (index < 0 || index >= static_cast<int>(names.size())) return 0;
96 auto it = m.find(names[index]);
97 return (it != m.end()) ? it->second : 0;
98 }
99
104 virtual void setInverse(bool inverse) { (void)inverse; }
105 virtual bool isInverse() const { return false; }
106
108 virtual uint16_t getStageTypeId() const = 0;
109
111 virtual uint8_t getOutputDataType(size_t output_index) const = 0;
112
122 virtual uint8_t getInputDataType(size_t /*input_index*/) const {
123 return static_cast<uint8_t>(DataType::UNKNOWN);
124 }
125
130 virtual size_t serializeHeader(size_t output_index, uint8_t* header_buffer, size_t max_size) const {
131 (void)output_index; (void)header_buffer; (void)max_size;
132 return 0;
133 }
134
136 virtual void deserializeHeader(const uint8_t* header_buffer, size_t size) {
137 (void)header_buffer; (void)size;
138 }
139
146 virtual void saveState() {}
147 virtual void restoreState() {}
148
154 virtual void setDims(const std::array<size_t, 3>& dims) { (void)dims; }
155
162 virtual void postStreamSync(cudaStream_t stream) { (void)stream; }
163
165 virtual size_t getMaxHeaderSize(size_t output_index) const {
166 (void)output_index;
167 return 0;
168 }
169
182 virtual bool isGraphCompatible() const { return true; }
183
192 virtual size_t estimateScratchBytes(const std::vector<size_t>& input_sizes) const {
193 (void)input_sizes;
194 return 0;
195 }
196};
197
198} // namespace fz
Definition mempool.h:66
Definition stage.h:30
virtual uint8_t getInputDataType(size_t) const
Definition stage.h:122
virtual std::string getName() const =0
virtual std::vector< std::string > getOutputNames() const
Definition stage.h:61
virtual void saveState()
Definition stage.h:146
virtual bool isGraphCompatible() const
Definition stage.h:182
virtual void postStreamSync(cudaStream_t stream)
Definition stage.h:162
virtual size_t getActualOutputSize(int index) const
Definition stage.h:92
virtual std::vector< size_t > estimateOutputSizes(const std::vector< size_t > &input_sizes) const =0
virtual void setInverse(bool inverse)
Definition stage.h:104
virtual uint16_t getStageTypeId() const =0
virtual size_t serializeHeader(size_t output_index, uint8_t *header_buffer, size_t max_size) const
Definition stage.h:130
virtual uint8_t getOutputDataType(size_t output_index) const =0
virtual void deserializeHeader(const uint8_t *header_buffer, size_t size)
Definition stage.h:136
virtual size_t getRequiredInputAlignment() const
Definition stage.h:55
virtual std::unordered_map< std::string, size_t > getActualOutputSizesByName() const =0
virtual void execute(cudaStream_t stream, MemoryPool *pool, const std::vector< void * > &inputs, const std::vector< void * > &outputs, const std::vector< size_t > &sizes)=0
int getOutputIndex(const std::string &name) const
Definition stage.h:66
virtual size_t estimateScratchBytes(const std::vector< size_t > &input_sizes) const
Definition stage.h:192
virtual size_t getMaxHeaderSize(size_t output_index) const
Definition stage.h:165
virtual void setDims(const std::array< size_t, 3 > &dims)
Definition stage.h:154
FZM binary file format definitions — structs, enums, and helpers.