@@ -268,7 +268,7 @@ void DataChannelTCP::allGather(
268
268
memcpy (
269
269
output[group_rank].data_ptr (),
270
270
input.data_ptr (),
271
- input.type (). elementSizeInBytes () * input.numel ());
271
+ input.element_size () * input.numel ());
272
272
273
273
auto j = group_rank, jnext = left;
274
274
for (rank_type i = 0 ; i < group.size (); ++i) {
@@ -315,7 +315,7 @@ void DataChannelTCP::gather(
315
315
memcpy (
316
316
output.at (i).data_ptr (),
317
317
input.data_ptr (),
318
- input.numel () * input.type (). elementSizeInBytes ());
318
+ input.numel () * input.element_size ());
319
319
}
320
320
}
321
321
}
@@ -355,7 +355,7 @@ void DataChannelTCP::scatter(
355
355
memcpy (
356
356
output.data_ptr (),
357
357
input.at (i).data_ptr (),
358
- output.numel () * output.type (). elementSizeInBytes ());
358
+ output.numel () * output.element_size ());
359
359
}
360
360
}
361
361
}
@@ -389,7 +389,7 @@ void DataChannelTCP::allReduce(
389
389
if (!exists)
390
390
return ;
391
391
392
- uint64_t tensor_bytes = data.type (). elementSizeInBytes () * data.numel ();
392
+ uint64_t tensor_bytes = data.element_size () * data.numel ();
393
393
auto tmp_tensor = data.clone ();
394
394
395
395
auto pof2 = pow2 (group.size ());
@@ -489,7 +489,7 @@ void DataChannelTCP::reduce(
489
489
std::memcpy (
490
490
data.data_ptr (),
491
491
result_tensor.data_ptr (),
492
- data.type (). elementSizeInBytes () * data.numel ());
492
+ data.element_size () * data.numel ());
493
493
}
494
494
495
495
void DataChannelTCP::broadcast (
@@ -703,7 +703,7 @@ void DataChannelTCP::_send(const at::Tensor& data, rank_type dst_rank) {
703
703
throw std::logic_error (" tensor to send is not contiguous" );
704
704
705
705
// send size of tensor data in bytes
706
- uint64_t tensor_bytes = data.type (). elementSizeInBytes () * data.numel ();
706
+ uint64_t tensor_bytes = data.element_size () * data.numel ();
707
707
send_bytes<uint64_t >(process_dst.socket , &tensor_bytes, 1 , true );
708
708
709
709
// send data (bytes)
@@ -759,7 +759,7 @@ void DataChannelTCP::_receive(const at::Tensor& data, rank_type src_rank) {
759
759
recv_bytes<uint64_t >(process_src.socket , &tensor_bytes, 1 );
760
760
761
761
uint64_t actual_tensor_bytes =
762
- data.type (). elementSizeInBytes () * data.numel ();
762
+ data.element_size () * data.numel ();
763
763
if (actual_tensor_bytes == tensor_bytes) {
764
764
recv_bytes<std::uint8_t >(
765
765
process_src.socket ,
0 commit comments