Skip to content

Commit d0c67bd

Browse files
[pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
1 parent 81ededa commit d0c67bd

4 files changed

Lines changed: 192 additions & 204 deletions

File tree

tests/cpp/operator/test_cast_mxfp8_grouped.cu

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -266,7 +266,7 @@ void performTest_x1(const ProcessingMethod processing_method,
266266
std::vector<OutputType> out_data_colwise_h(colwise ? elts_num : 0);
267267
std::vector<fp8e8m0> out_scales_rowwise_h(rowwise ? sfs_num : 0);
268268
std::vector<fp8e8m0> out_scales_colwise_h(colwise ? sfs_num : 0);
269-
269+
270270
std::vector<OutputType> out_data_rowwise_ref(rowwise ? elts_num : 0);
271271
std::vector<OutputType> out_data_colwise_ref(colwise ? elts_num : 0);
272272
std::vector<fp8e8m0> out_scales_rowwise_ref(rowwise ? sfs_num : 0);
@@ -328,7 +328,7 @@ void performTest_x1(const ProcessingMethod processing_method,
328328
cudaMalloc((void**)&first_dims_d, first_dims_size);
329329
cudaMalloc((void**)&last_dims_d, last_dims_size);
330330
cudaMalloc((void**)&offsets_d, offsets_size);
331-
331+
332332
cudaMemcpy(in_data_d, in_data.data(), in_data_size, cudaMemcpyHostToDevice);
333333
cudaMemcpy(first_dims_d, first_dims_h.data(), first_dims_size, cudaMemcpyHostToDevice);
334334
cudaMemcpy(last_dims_d, last_dims_h.data(), last_dims_size, cudaMemcpyHostToDevice);
@@ -411,7 +411,7 @@ void performTest_x1(const ProcessingMethod processing_method,
411411
OutputType* const out_data_colwise_ptr = out_data_colwise_ref.data() + data_offset;
412412
fp8e8m0* const out_scales_rowwise_ptr = out_scales_rowwise_ref.data() + sfs_offset;
413413
fp8e8m0* const out_scales_colwise_ptr = out_scales_colwise_ref.data() + sfs_offset;
414-
414+
415415
compute_ref<InputType, OutputType>(
416416
processing_method, OP, rowwise, colwise, in_ptr, /*grad=*/ nullptr,
417417
out_data_rowwise_ptr, out_data_colwise_ptr,
@@ -539,7 +539,7 @@ TEST_P(GroupedFusedCastMXFP8TestSuite, Test) {
539539

540540
using namespace transformer_engine;
541541
using namespace test;
542-
542+
543543
const ProcessingMethod processing_method = std::get<0>(GetParam());
544544
const ActivationKind activation = std::get<1>(GetParam());
545545
const ScalingDirection scaling_direction = std::get<2>(GetParam());

transformer_engine/common/cast/cast.cu

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -27,7 +27,8 @@ void nvte_quantize(const NVTETensor input, NVTETensor output, cudaStream_t strea
2727
// dispatch::quantize_fwd_helper<IS_ACT, Empty, nullptr>(input, output, nullptr, stream);
2828
}
2929

30-
void nvte_quantize_grouped(const NVTEGroupedTensor input, NVTEGroupedTensor output, cudaStream_t stream) {
30+
void nvte_quantize_grouped(const NVTEGroupedTensor input, NVTEGroupedTensor output,
31+
cudaStream_t stream) {
3132
NVTE_API_CALL(nvte_quantize_grouped);
3233
using namespace transformer_engine;
3334

transformer_engine/common/cast/dispatch/quantize_grouped.cuh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -59,7 +59,8 @@ void quantize_grouped_fwd_helper(const NVTEGroupedTensor input, NVTEGroupedTenso
5959
GroupedTensor *workspace_tensor = convertNVTEGroupedTensor(workspace);
6060

6161
mxfp8::quantize_grouped</*IS_DBIAS=*/false, /*IS_DACT=*/false, IS_ACT, ParamOP, OP>(
62-
input_tensor, activations_tensor, noop_tensor, output_tensor, dbias_tensor, workspace_tensor, stream);
62+
input_tensor, activations_tensor, noop_tensor, output_tensor, dbias_tensor,
63+
workspace_tensor, stream);
6364
break;
6465
}
6566
default:

0 commit comments

Comments
 (0)