FullyConnected_fb_io_block() : FullyConnectedKernelBase("fully_connected_gpu_fb_io_block_fp16") {}
KernelsData GetKernelsData(const Params& params, const optional_params& options) const override;
- ParamsKey GetSupportedKey() const override;
protected:
- struct DispatchData : public FullyConnectedKernelBase::DispatchData
- {
- DispatchData(const FullyConnectedKernelBase::DispatchData& base_dispatch_data)
- : FullyConnectedKernelBase::DispatchData(base_dispatch_data),
- unit_byte_size(0), chunk_type(nullptr), chunk_byte_size(0), units_per_chunk(0),
- bytes_per_sg_read(0), units_per_sg_read(0), last_rg_size(0), rg_count(0)
- {}
-
- uint32_t unit_byte_size;
- const char *chunk_type;
- uint32_t chunk_byte_size;
- uint32_t units_per_chunk;
- uint32_t bytes_per_sg_read;
- uint32_t units_per_sg_read;
- uint32_t last_rg_size;
- uint32_t rg_count;
- };
-
+ ParamsKey GetSupportedKey() const override;
bool Validate(const Params& p, const optional_params& o) const override;
JitConstants GetJitConstants(const fully_connected_params& params, const FullyConnectedKernelBase::DispatchData& kd) const override;
- std::unique_ptr<FullyConnectedKernelBase::DispatchData> SetDefault(const fully_connected_params& arg) const override;
+ DispatchData SetDefault(const fully_connected_params& arg, int autoTuneIndex = -1) const override;
};
-}
\ No newline at end of file
+}