Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Move fusion executor files to their own directory #2756

Merged
merged 21 commits into from
Sep 9, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
21 commits
Select commit Hold shift + click to select a range
d74a8bf
Minor cleanup in executor.cpp
csarofeen Aug 2, 2024
11df23a
Apply suggestions from code review
csarofeen Aug 3, 2024
78ca610
Merge branch 'main' of https://github.com/NVIDIA/Fuser into executor_…
csarofeen Aug 4, 2024
75543ce
Merge branch 'executor_cleanup' of https://github.com/NVIDIA/Fuser in…
csarofeen Aug 4, 2024
549d150
Merge branch 'main' of https://github.com/NVIDIA/Fuser into executor_…
csarofeen Aug 5, 2024
3f1036b
Merge branch 'main' of https://github.com/NVIDIA/Fuser into executor_…
csarofeen Aug 6, 2024
f23b40b
Merge branch 'main' of https://github.com/NVIDIA/Fuser into executor_…
csarofeen Aug 28, 2024
453e44f
Merge branch 'main' of https://github.com/NVIDIA/Fuser into executor_…
csarofeen Aug 28, 2024
9943152
Improve error message in expression evaluator when propagating consta…
csarofeen Aug 28, 2024
97ef121
Apply suggestions from code review
csarofeen Aug 31, 2024
5826645
Merge branch 'main' of https://github.com/NVIDIA/Fuser into executor_…
csarofeen Sep 2, 2024
9bc2af8
PR Feedback.
csarofeen Sep 2, 2024
8029b1b
Merge branch 'executor_cleanup' of https://github.com/NVIDIA/Fuser in…
csarofeen Sep 2, 2024
8ecc5e7
Merge branch 'main' of https://github.com/NVIDIA/Fuser into executor_…
csarofeen Sep 6, 2024
1db8e06
resolve bad conflict resolution.
csarofeen Sep 6, 2024
8f3ff98
Minor fix.
csarofeen Sep 6, 2024
64d22bd
Move fusion executor files to their own directory.
csarofeen Aug 4, 2024
ae5ec7c
Empty-Commit
csarofeen Aug 4, 2024
6080d46
Empty-Commit
csarofeen Aug 4, 2024
d9ae359
Merge branch 'main' of https://github.com/NVIDIA/Fuser into move_exec…
csarofeen Sep 8, 2024
90ce5b1
one more header
csarofeen Sep 8, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 4 additions & 4 deletions CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -123,13 +123,13 @@ list(APPEND NVFUSER_SRCS
${NVFUSER_SRCS_DIR}/dynamic_transform.cpp
${NVFUSER_SRCS_DIR}/evaluator_common.cpp
${NVFUSER_SRCS_DIR}/exceptions.cpp
-${NVFUSER_SRCS_DIR}/executor.cpp
-${NVFUSER_SRCS_DIR}/executor_kernel_arg.cpp
-${NVFUSER_SRCS_DIR}/executor_params.cpp
-${NVFUSER_SRCS_DIR}/executor_utils.cpp
${NVFUSER_SRCS_DIR}/expr_evaluator.cpp
${NVFUSER_SRCS_DIR}/expr_simplifier.cpp
${NVFUSER_SRCS_DIR}/fusion.cpp
+${NVFUSER_SRCS_DIR}/fusion_executor/executor.cpp
+${NVFUSER_SRCS_DIR}/fusion_executor/executor_kernel_arg.cpp
+${NVFUSER_SRCS_DIR}/fusion_executor/executor_params.cpp
+${NVFUSER_SRCS_DIR}/fusion_executor/executor_utils.cpp
${NVFUSER_SRCS_DIR}/fusion_segmenter.cpp
${NVFUSER_SRCS_DIR}/global_allocator.cpp
${NVFUSER_SRCS_DIR}/grouped_reduction.cpp
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/batch_norm_channels_first.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/batch_norm_channels_first_backward.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/batch_norm_channels_last.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/batch_norm_channels_last_backward.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/bert.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -6,8 +6,8 @@
*/
// clang-format on
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/broadcast.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -6,8 +6,8 @@
*/
// clang-format on
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/utils.h>
#include <ops/arith.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/gelu_backward.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -9,8 +9,8 @@
// Based on NVFuserTest.FusionBiasGeluBwd_CUDA

#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/builder.h>
#include <ops/arith.h>
#include <scheduler/all_schedulers.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/gelu_backward_reduction.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -6,8 +6,8 @@
*/
// clang-format on
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/utils.h>
#include <ops/arith.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/heuristic_cache.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/heuristic_lookup.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/indexselect.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -9,8 +9,8 @@
// Based on NVFuserTest.FusionBiasGeluBwd_CUDA

#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/builder.h>
#include <ops/arith.h>
#include <scheduler/all_schedulers.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/instance_norm.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/builder.h>
#include <ops/all_ops.h>
#include <scheduler/all_schedulers.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/layer_norm.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/layer_norm_backward.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/layer_norm_fused.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/lstm_cell.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -6,8 +6,8 @@
*/
// clang-format on
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ops/all_ops.h>
#include <scheduler/all_schedulers.h>

Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/matmul.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/analysis/bank_conflict.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/utils.h>
#include <ops/all_ops.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/reduction.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -6,8 +6,8 @@
*/
// clang-format on
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/utils.h>
#include <ops/arith.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/rms_norm.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/rms_norm_backward.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/scale_bias_relu.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ops/arith.h>
#include <scheduler/all_schedulers.h>

Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/shape_inference.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/softmax.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/utils.h>
#include <ops/all_ops.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/softmax_backward.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/utils.h>
#include <ops/all_ops.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/softmax_dropout.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,8 @@
// clang-format on
#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>
#include <ir/utils.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/timm.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,8 @@
* SPDX-License-Identifier: BSD-3-Clause
*/
// clang-format on
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/builder.h>

Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/transpose.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -6,8 +6,8 @@
*/
// clang-format on
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/utils.h>
#include <ops/all_ops.h>
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/cpp/utils.h
Original file line number Diff line number Diff line change
Expand Up @@ -9,8 +9,8 @@

#include <csrc/exceptions.h>
#include <device_lower/lower2device.h>
-#include <executor.h>
#include <fusion.h>
+#include <fusion_executor/executor.h>
#include <ir/all_nodes.h>
#include <ir/utils.h>
#include <kernel_cache.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/device_lower/analysis/bank_conflict.h
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@
#pragma once

#include <exceptions.h>
-#include <executor_params.h>
+#include <fusion_executor/executor_params.h>
#include <ir/base_nodes.h>
#include <kernel.h>
#include <polymorphic_value.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/device_lower/lower2device.h
Original file line number Diff line number Diff line change
Expand Up @@ -23,8 +23,8 @@
#include <device_lower/pass/scalar_hoist.h>
#include <device_lower/pass/warp_reduce.h>
#include <exceptions.h>
-#include <executor_params.h>
#include <expr_simplifier.h>
+#include <fusion_executor/executor_params.h>
#include <id_model/id_model.h>
#include <id_model/indexing.h>
#include <ir/all_nodes.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/device_lower/pass/loop_rotation.h
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@
#pragma once

#include <exceptions.h>
-#include <executor_params.h>
+#include <fusion_executor/executor_params.h>
#include <ir/all_nodes.h>

namespace nvfuser {
Expand Down
4 changes: 2 additions & 2 deletions csrc/dynamic_transform.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7,10 +7,10 @@
// clang-format on
#include <device_lower/utils.h>
#include <dynamic_transform.h>
-#include <executor_kernel_arg.h>
-#include <executor_utils.h>
#include <expr_evaluator.h>
#include <fusion.h>
+#include <fusion_executor/executor_kernel_arg.h>
+#include <fusion_executor/executor_utils.h>
#include <ir/cloner.h>
#include <ir/utils.h>
#include <logical_domain_map.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/evaluator_common.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -9,8 +9,8 @@

#include <debug.h>
#include <device_lower/lower2device.h>
-#include <executor_kernel_arg.h>
#include <expr_evaluator.h>
+#include <fusion_executor/executor_kernel_arg.h>
#include <instrumentation.h>
#include <ir/utils.h>
#include <tensor_metadata.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/evaluator_common.h
Original file line number Diff line number Diff line change
Expand Up @@ -8,8 +8,8 @@
#pragma once
#include <device_lower/lower2device.h>
#include <exceptions.h>
-#include <executor_params.h>
#include <fusion.h>
+#include <fusion_executor/executor_params.h>
#include <ir/all_nodes.h>
#include <polymorphic_value.h>
#include <utils.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/fusion.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -10,8 +10,8 @@
#include <device_lower/analysis/bank_conflict.h>
#include <device_lower/lower2device.h>
#include <disjoint_set.h>
-#include <executor_params.h>
#include <fusion.h>
+#include <fusion_executor/executor_params.h>
#include <fusion_segmenter.h>
#include <host_ir/container.h>
#include <instrumentation.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/fusion.h
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@
#include <exceptions.h>

#include <debug.h>
-#include <executor_params.h>
+#include <fusion_executor/executor_params.h>
#include <ir/base_nodes.h>
#include <ir/container.h>
#include <iter_visitor.h>
Expand Down
6 changes: 3 additions & 3 deletions csrc/executor.cpp → csrc/fusion_executor/executor.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -6,14 +6,14 @@
*/
// clang-format on

-#include <executor.h>
+#include <fusion_executor/executor.h>

#include <codegen.h>
#include <debug.h>
#include <device_lower/analysis/bank_conflict.h>
#include <driver_api.h>
-#include <executor_kernel_arg.h>
-#include <executor_utils.h>
+#include <fusion_executor/executor_kernel_arg.h>
+#include <fusion_executor/executor_utils.h>
#include <fusion_profiler.h>
#include <global_allocator.h>
#include <instrumentation.h>
Expand Down
Loading
Loading