Skip to content

Commit

Permalink
TL/MLX5: minor clean and profiler
Browse files: browse the repository at this point in the history
  • Loading branch information
samnordmann committed Jan 2, 2025
1 parent 73651ea commit f99208f
Show file tree
Hide file tree
Showing 2 changed files with 12 additions and 4 deletions.
12 changes: 10 additions & 2 deletions src/components/tl/mlx5/alltoall/alltoall_coll.c
Original file line number Diff line number Diff line change
Expand Up @@ -243,6 +243,10 @@ static ucc_status_t ucc_tl_mlx5_fanout_start(ucc_coll_task_t *coll_task)
tl_debug(UCC_TASK_LIB(task), "fanout start");
/* start task if completion event received */
UCC_TL_MLX5_PROFILE_REQUEST_EVENT(task, "mlx5_alltoall_fanout_start", 0);
if (team->a2a->node.sbgp->group_rank == team->a2a->node.asr_rank) {
UCC_TL_MLX5_PROFILE_REQUEST_EVENT(
task, "mlx5_alltoall_wait-on-data_start", 0);
}
/* Start fanout */
ucc_progress_enqueue(UCC_TL_CORE_CTX(team)->pq, coll_task);
return UCC_OK;
Expand All @@ -265,6 +269,8 @@ static void ucc_tl_mlx5_fanout_progress(ucc_coll_task_t *coll_task)
coll_task->status = UCC_INPROGRESS;
return;
}
UCC_TL_MLX5_PROFILE_REQUEST_EVENT(
task, "mlx5_alltoall_wait-on-data_complete, fanout_start", 0);
}

if (UCC_OK == ucc_tl_mlx5_node_fanout(team, task)) {
Expand Down Expand Up @@ -342,12 +348,14 @@ static ucc_status_t ucc_tl_mlx5_asr_barrier_start(ucc_coll_task_t *coll_task)
status = send_done(team, i);
}
if (status != UCC_OK) {
tl_error(UCC_TASK_LIB(task), "failed sending barrier notice");
tl_error(UCC_TASK_LIB(task), "failed sending barrier notice");
return status;
}
UCC_TL_MLX5_PROFILE_REQUEST_EVENT(
task, "mlx5_alltoall_barrier_send_posted", 0);
}
coll_task->status = UCC_OK;
UCC_TL_MLX5_PROFILE_REQUEST_EVENT(task, "mlx5_alltoall_barreir_done",
UCC_TL_MLX5_PROFILE_REQUEST_EVENT(task, "mlx5_alltoall_barrier_done",
0);
return ucc_task_complete(coll_task);
}
Expand Down
4 changes: 2 additions & 2 deletions src/components/tl/mlx5/tl_mlx5_team.c
Original file line number Diff line number Diff line change
Expand Up @@ -117,7 +117,7 @@ ucc_status_t ucc_tl_mlx5_team_destroy(ucc_base_team_t *tl_team)
return UCC_OK;
}

static inline ucc_status_t ucc_tl_mlx5_a2a_team_test(ucc_base_team_t *team)
static inline ucc_status_t ucc_tl_mlx5_alltoall_team_test(ucc_base_team_t *team)
{
ucc_tl_mlx5_team_t *tl_team = ucc_derived_of(team, ucc_tl_mlx5_team_t);

Expand Down Expand Up @@ -253,7 +253,7 @@ ucc_status_t ucc_tl_mlx5_team_create_test(ucc_base_team_t *team)
goto initial_sync_post;
}

a2a_status = ucc_tl_mlx5_a2a_team_test(team);
a2a_status = ucc_tl_mlx5_alltoall_team_test(team);
if (a2a_status < 0) {
tl_warn(team->context->lib, "ALLTOALL tl team: %p creation failed %d",
team, a2a_status);
Expand Down

0 comments on commit f99208f

Please sign in to comment.