diff --git a/csrc/runtime/fusion_executor_cache.h b/csrc/runtime/fusion_executor_cache.h
index 6ec0435bbd0..57cf6ce9c15 100644
--- a/csrc/runtime/fusion_executor_cache.h
+++ b/csrc/runtime/fusion_executor_cache.h
@@ -140,12 +140,6 @@ class FusionExecutorCache {
       std::optional<PrimDataType> forced_index_type = std::nullopt,
       std::optional<int8_t> selected_device = std::nullopt);
 
-  //! Converts inputs from IValue to KernelArgumentHolder, also handles cache
-  //! lookup
-  KernelArgumentHolder prepareInputs(
-      const at::ArrayRef<c10::IValue>& inputs,
-      std::optional<int8_t> selected_device = std::nullopt);
-
   //! query if there's a kernel ready to go for given inputs
   NVF_API bool isCompiled(
       const at::ArrayRef<c10::IValue>& inputs,
@@ -241,6 +235,12 @@ class FusionExecutorCache {
   void deserialize(const serde::FusionExecutorCache* buffer, int64_t fusion_id);
 
  private:
+  //! Converts inputs from IValue to KernelArgumentHolder, also handles cache
+  //! lookup
+  KernelArgumentHolder prepareInputs(
+      const at::ArrayRef<c10::IValue>& inputs,
+      std::optional<int8_t> selected_device = std::nullopt);
+
   //! evict cached short cut entry in `code_to_fe_lookup_` as well as cached
   //! entry in `FusionExecutor`
   void evictCache(size_t cache_id);