@@ -1740,6 +1740,26 @@ c10::intrusive_ptr<Work> ProcessGroupXCCL::reduce_scatter_tensor_coalesced(
1740
1740
std::vector<at::Tensor>& outputs,
1741
1741
std::vector<at::Tensor>& inputs,
1742
1742
const ReduceScatterOptions& opts) {
1743
+
1744
+ RECORD_PARAM_COMMS_DATA_WITH_LOG (
1745
+ std::make_tuple (
1746
+ static_cast <int64_t >(seqCollective_) + 1 ,
1747
+ false ), // seq + 1 to match collective and assume only one collective
1748
+ // in coalesced range
1749
+ std::make_tuple (pg_uid_, pg_desc_), // PG name tuple
1750
+ inputs, // inputTensors
1751
+ outputs, // outputTensors
1752
+ rank_, // rank
1753
+ " reduce_scatter_tensor_coalesced" , // collective name
1754
+ getTensorsNumel (inputs), // inNelems
1755
+ getTensorsNumel (outputs), // outNelems
1756
+ inputs[0 ].scalar_type (), // dType
1757
+ std::vector<int64_t >(), // inSplitSizes
1758
+ std::vector<int64_t >(), // outSplitSizes
1759
+ -1 , // globalRankStart
1760
+ -1 , // globalRankStride
1761
+ this ->getSize ()); // worldSize
1762
+
1743
1763
return collectiveCoalesced (
1744
1764
inputs,
1745
1765
outputs,
0 commit comments