5#include <cuda_runtime.h>
9#include <unordered_map>
30 virtual ~Stage() =
default;
36 const std::vector<void*>& inputs,
37 const std::vector<void*>& outputs,
38 const std::vector<size_t>& sizes
44 virtual size_t getNumInputs()
const = 0;
45 virtual size_t getNumOutputs()
const = 0;
66 for (
size_t i = 0; i < names.size(); i++) {
67 if (names[i] == name)
return static_cast<int>(i);
78 const std::vector<size_t>& input_sizes
92 if (index < 0 || index >=
static_cast<int>(names.size()))
return 0;
94 auto it = m.find(names[index]);
95 return (it != m.end()) ? it->second : 0;
103 virtual bool isInverse()
const {
return false; }
128 virtual size_t serializeHeader(
size_t output_index, uint8_t* header_buffer,
size_t max_size)
const {
129 (void)output_index; (void)header_buffer; (void)max_size;
135 (void)header_buffer; (void)size;
145 virtual void restoreState() {}
152 virtual void setDims(
const std::array<size_t, 3>& dims) { (void)dims; }
virtual uint8_t getInputDataType(size_t) const
Definition stage.h:120
virtual std::string getName() const =0
virtual std::vector< std::string > getOutputNames() const
Definition stage.h:59
virtual void saveState()
Definition stage.h:144
virtual bool isGraphCompatible() const
Definition stage.h:180
virtual void postStreamSync(cudaStream_t stream)
Definition stage.h:160
virtual size_t getActualOutputSize(int index) const
Definition stage.h:90
virtual std::vector< size_t > estimateOutputSizes(const std::vector< size_t > &input_sizes) const =0
virtual void setInverse(bool inverse)
Definition stage.h:102
virtual uint16_t getStageTypeId() const =0
virtual size_t serializeHeader(size_t output_index, uint8_t *header_buffer, size_t max_size) const
Definition stage.h:128
virtual uint8_t getOutputDataType(size_t output_index) const =0
virtual void deserializeHeader(const uint8_t *header_buffer, size_t size)
Definition stage.h:134
virtual size_t getRequiredInputAlignment() const
Definition stage.h:53
virtual std::unordered_map< std::string, size_t > getActualOutputSizesByName() const =0
virtual void execute(cudaStream_t stream, MemoryPool *pool, const std::vector< void * > &inputs, const std::vector< void * > &outputs, const std::vector< size_t > &sizes)=0
int getOutputIndex(const std::string &name) const
Definition stage.h:64
virtual size_t estimateScratchBytes(const std::vector< size_t > &input_sizes) const
Definition stage.h:190
virtual size_t getMaxHeaderSize(size_t output_index) const
Definition stage.h:163
virtual void setDims(const std::array< size_t, 3 > &dims)
Definition stage.h:152
Definition fzm_format.h:25
@ UNKNOWN
Byte-transparent stages: skip type checking at finalize()