Skip to content

Commit

Permalink
fix mem fence (#2030)
Browse files (browse the repository at this point in the history)
Co-authored-by: yuzhai <[email protected]>
  • Loading branch information
yzhaiustc and yuzhai authored Jan 8, 2025
1 parent 7494a18 commit c506e16
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions include/cutlass/pipeline/sm90_pipeline.hpp
Original file line number | Diff line number | Diff line change
@@ -316,6 +316,7 @@ class PipelineTmaAsync {
cutlass::arch::detail::initialize_barrier_array_pair_aligned<decltype(storage.full_barrier_), decltype(storage.empty_barrier_), Stages>(
storage.full_barrier_, storage.empty_barrier_, producer_arv_cnt, multicast_consumer_arrival_count);
}
cutlass::arch::fence_barrier_init();
}

template<class ClusterShape, class InitBarriers, class InitMasks>
@@ -757,6 +758,7 @@ class PipelineTransactionAsync {
cutlass::arch::detail::initialize_barrier_array_pair_aligned<decltype(full_barrier_ptr), decltype(empty_barrier_ptr), Stages>(
full_barrier_ptr, empty_barrier_ptr, params.producer_arv_count, params.consumer_arv_count);
}
cutlass::arch::fence_barrier_init();
}

// Constructor
@@ -993,6 +995,7 @@ class PipelineAsync {
cutlass::arch::detail::initialize_barrier_array_pair_aligned<decltype(storage.full_barrier_), decltype(storage.empty_barrier_), Stages>(
storage.full_barrier_, storage.empty_barrier_, params.producer_arv_count, params.consumer_arv_count);
}
cutlass::arch::fence_barrier_init();
}

template<class InitBarriers>
@@ -1249,6 +1252,7 @@ class OrderedSequenceBarrier {
}
}
}
cutlass::arch::fence_barrier_init();
}

// Wait on a stage to be unlocked
Expand Down

0 comments on commit c506e16

Please sign in to comment.