From f83f1dd30ca64a41518180f66040d6626a30c3d1 Mon Sep 17 00:00:00 2001 From: co63oc <4617245+co63oc@users.noreply.github.com> Date: Tue, 21 Apr 2026 10:08:28 +0800 Subject: [PATCH 1/2] update iluvatar_gpu kernels --- .../cuda_kernels/abs_grad_kernel_register.cc | 8 +- .../cuda_kernels/abs_kernel_register.cc | 4 +- .../kernels/cuda_kernels/accuracy_kernel.cu | 4 +- .../activation_grad_kernel_register.cc | 216 +++++++++--------- .../activation_kernel_register.cc | 184 +++++++-------- .../cuda_kernels/adadelta_kernel_register.cu | 2 +- .../cuda_kernels/adagrad_kernel_register.cu | 2 +- .../cuda_kernels/adam_kernel_register.cu | 8 +- .../cuda_kernels/adamax_kernel_register.cu | 2 +- .../cuda_kernels/adamw_kernel_register.cc | 4 +- .../cuda_kernels/adamw_kernel_row_register.cc | 2 +- .../cuda_kernels/add_n_kernel_register.cu | 8 +- .../addmm_grad_kernel_register.cc | 4 +- .../cuda_kernels/addmm_kernel_register.cc | 4 +- .../all_gather_kernel_register.cu | 2 +- .../all_reduce_kernel_register.cu | 6 +- .../all_to_all_kernel_register.cu | 6 +- .../cuda_kernels/allclose_kernel_register.cu | 2 +- .../cuda_kernels/amp_kernel_register.cc | 8 +- .../angle_grad_kernel_register.cu | 4 +- .../cuda_kernels/angle_kernel_register.cu | 4 +- .../cuda_kernels/ap_facade_kernel_register.cu | 4 +- ...ap_trivial_fusion_begin_kernel_register.cu | 4 +- .../ap_trivial_fusion_end_kernel_register.cu | 4 +- .../ap_variadic_kernel_register.cu | 6 +- ...apply_per_channel_scale_kernel_register.cu | 4 +- .../cuda_kernels/arange_kernel_register.cc | 8 +- .../arg_min_max_kernel_register.cc | 8 +- .../argsort_grad_kernel_register.cc | 4 +- .../cuda_kernels/argsort_kernel_register.cc | 4 +- .../array_grad_kernel_register.cc | 2 +- .../cuda_kernels/array_kernel_register.cu | 24 +- .../cuda_kernels/asgd_kernel_register.cu | 4 +- .../cuda_kernels/assign_kernel_register.cc | 4 +- .../atan2_grad_kernel_register.cu | 4 +- .../cuda_kernels/atan2_kernel_register.cu | 4 +- .../baddbmm_grad_kernel_register.cu | 4 +- .../cuda_kernels/baddbmm_kernel_register.cu | 4 +- .../batch_norm_grad_kernel_register.cc | 6 +- .../batch_norm_kernel_register.cc | 8 +- .../bce_loss_grad_kernel_register.cu | 2 +- .../cuda_kernels/bce_loss_kernel_register.cu | 2 +- .../beam_search_decode_kernel_register.cu | 2 +- .../cuda_kernels/bernoulli_kernel_register.cu | 4 +- .../cuda_kernels/binomial_kernel_register.cu | 4 +- .../cuda_kernels/bmm_grad_kernel_register.cc | 4 +- .../cuda_kernels/bmm_kernel_register.cc | 4 +- .../cuda_kernels/broadcast_kernel_register.cu | 6 +- .../broadcast_tensors_grad_kernel_register.cu | 4 +- .../broadcast_tensors_kernel_register.cu | 4 +- .../cuda_kernels/c_concat_kernel_register.cu | 2 +- .../c_embedding_grad_kernel_register.cc | 4 +- .../c_embedding_kernel_register.cc | 4 +- .../c_identity_kernel_register.cc | 4 +- .../cuda_kernels/c_scatter_kernel_register.cu | 2 +- ...with_cross_entropy_grad_kernel_register.cc | 2 +- .../cuda_kernels/c_split_kernel_register.cu | 6 +- .../cuda_kernels/cast_kernel_register.cc | 4 +- .../channel_shuffle_grad_kernel_register.cu | 4 +- .../channel_shuffle_kernel_register.cu | 4 +- .../check_memory_continue_kernel_register.cc | 2 +- .../check_numerics_kernel_register.cu | 4 +- .../clip_by_norm_kernel_register.cu | 4 +- .../cuda_kernels/clip_grad_kernel_register.cc | 4 +- .../cuda_kernels/clip_kernel_register.cc | 4 +- .../cuda_kernels/coalesce_kernel_register.cu | 2 +- .../coalesce_tensor_kernel_register.cc | 4 +- .../compare_kernel_legacy_register.cu | 8 +- .../cuda_kernels/compare_kernel_register.cc | 8 +- .../cuda_kernels/complex_kernel_register.cu | 4 +- .../concat_grad_kernel_register.cc | 4 +- .../cuda_kernels/concat_kernel_register.cc | 4 +- .../contiguous_kernel_register.cc | 4 +- .../conv_dnn_grad_kernel_register.cu | 20 +- .../cuda_kernels/conv_dnn_kernel_register.cu | 8 +- .../conv_transpose_grad_kernel_register.cu | 6 +- .../conv_transpose_kernel_register.cu | 4 +- .../cross_entropy2_grad_kernel_register.cu | 4 +- .../cross_entropy2_kernel_register.cu | 4 +- .../cross_entropy_grad_kernel_register.cu | 4 +- .../cross_entropy_kernel_register.cu | 4 +- .../cross_grad_kernel_register.cu | 4 +- .../cuda_kernels/cross_kernel_register.cu | 4 +- .../cuda_kernels/cum_grad_kernel_register.cc | 4 +- .../cuda_kernels/cum_kernel_register.cc | 8 +- .../cumprod_grad_kernel_register.cu | 4 +- .../cuda_kernels/cumprod_kernel_register.cu | 4 +- .../debug_tools_kernel_register.cu | 4 +- .../cuda_kernels/depend_kernel_register.cu | 2 +- .../depthwise_conv_grad_kernel_register.cu | 4 +- .../depthwise_conv_kernel_register.cu | 4 +- .../cuda_kernels/diag_grad_kernel_register.cu | 4 +- .../cuda_kernels/diag_kernel_register.cu | 4 +- .../diagonal_grad_kernel_register.cu | 4 +- .../cuda_kernels/diagonal_kernel_register.cu | 4 +- .../digamma_grad_kernel_register.cu | 4 +- .../cuda_kernels/digamma_kernel_register.cu | 4 +- .../cuda_kernels/dist_grad_kernel_register.cc | 4 +- .../cuda_kernels/dist_kernel_register.cu | 4 +- .../cuda_kernels/dot_grad_kernel_register.cu | 4 +- .../cuda_kernels/dot_kernel_register.cu | 4 +- .../dropout_grad_kernel_register.cc | 8 +- .../cuda_kernels/dropout_kernel_register.cc | 8 +- .../einsum_grad_kernel_register.cu | 4 +- .../cuda_kernels/einsum_kernel_register.cc | 8 +- .../elementwise_grad_kernel_register.cc | 72 +++--- .../elementwise_kernel_register.cc | 4 +- .../cuda_kernels/elementwise_legacy_kernel.cu | 4 +- .../elementwise_multiply_kernel_register.cc | 4 +- .../embedding_grad_kernel_register.cc | 8 +- .../cuda_kernels/embedding_kernel_register.cc | 4 +- ...th_scaled_gradient_grad_kernel_register.cu | 4 +- .../cuda_kernels/empty_kernel_register.cc | 8 +- .../cuda_kernels/erf_grad_kernel_register.cu | 4 +- .../cuda_kernels/erf_kernel_register.cu | 4 +- .../erfinv_grad_kernel_register.cu | 4 +- .../cuda_kernels/erfinv_kernel_register.cu | 4 +- .../expand_as_grad_kernel_register.cu | 2 +- .../cuda_kernels/expand_as_kernel_register.cu | 2 +- .../expand_grad_kernel_register.cu | 4 +- .../cuda_kernels/expand_kernel_register.cc | 4 +- .../exponential_kernel_register.cu | 4 +- .../cuda_kernels/eye_kernel_register.cu | 4 +- .../fake_dequantize_kernel_register.cu | 4 +- .../fake_quantize_kernel_register.cu | 12 +- .../cuda_kernels/fc_kernel_register.cc | 8 +- .../fetch_barrier_kernel_register.cu | 2 +- .../fill_diagonal_grad_kernel_register.cc | 2 +- .../fill_diagonal_kernel_register.cc | 2 +- ...ll_diagonal_tensor_grad_kernel_register.cc | 4 +- .../fill_diagonal_tensor_kernel_register.cc | 4 +- .../cuda_kernels/fill_grad_kernel_register.cu | 4 +- .../cuda_kernels/fill_kernel_register.cc | 4 +- .../cuda_kernels/flash_attn_grad_kernel.cu | 20 +- .../kernels/cuda_kernels/flash_attn_kernel.cu | 20 +- .../flatten_grad_kernel_register.cc | 4 +- .../cuda_kernels/flatten_kernel_register.cc | 8 +- .../cuda_kernels/flip_kernel_register.cc | 4 +- .../frame_grad_kernel_register.cu | 4 +- .../cuda_kernels/frame_kernel_register.cu | 4 +- .../cuda_kernels/full_kernel_register.cc | 12 +- .../fused_adam_kernel_register.cu | 4 +- ...bias_residual_layernorm_kernel_register.cu | 4 +- .../fused_conv2d_add_act_kernel_register.cu | 2 +- .../fused_rope_grad_kernel_register.cu | 4 +- .../fused_rope_kernel_register.cu | 4 +- ...fused_softmax_mask_grad_kernel_register.cu | 2 +- .../fused_softmax_mask_kernel_register.cu | 2 +- ...max_mask_upper_triangle_kernel_register.cu | 4 +- ...d_stack_transpose_quant_kernel_register.cu | 2 +- ...d_transpose_split_quant_kernel_register.cu | 2 +- ...nspose_wlch_split_quant_kernel_register.cu | 2 +- .../fusion_group_kernel_register.cu | 2 +- .../cuda_kernels/gammaln_kernel_register.cu | 4 +- .../gather_grad_kernel_register.cc | 4 +- .../cuda_kernels/gather_kernel_register.cc | 4 +- .../gather_nd_grad_kernel_register.cc | 4 +- .../cuda_kernels/gather_nd_kernel_register.cc | 4 +- .../gaussian_inplace_grad_kernel_register.cu | 4 +- .../cuda_kernels/gaussian_kernel_register.cc | 8 +- .../cuda_kernels/gelu_grad_kernel_register.cc | 4 +- .../cuda_kernels/gelu_kernel_register.cc | 4 +- .../global_gather_kernel_register.cu | 2 +- .../global_scatter_kernel_register.cu | 2 +- .../group_norm_grad_kernel_register.cu | 4 +- .../group_norm_kernel_register.cu | 8 +- .../gumbel_softmax_grad_kernel_register.cu | 2 +- .../gumbel_softmax_kernel_register.cu | 2 +- .../huber_loss_grad_kernel_register.cu | 4 +- .../huber_loss_kernel_register.cu | 4 +- .../index_add_grad_kernel_register.cu | 4 +- .../cuda_kernels/index_add_kernel_register.cu | 4 +- ...ex_elementwise_get_grad_kernel_register.cu | 4 +- .../index_elementwise_get_kernel_register.cu | 4 +- .../index_put_grad_kernel_register.cu | 4 +- .../cuda_kernels/index_put_kernel_register.cc | 4 +- .../index_sample_grad_kernel_register.cu | 4 +- .../index_sample_kernel_register.cu | 4 +- .../index_select_grad_kernel_register.cu | 4 +- .../index_select_kernel_register.cu | 4 +- .../interpolate_grad_kernel_register.cu | 28 +-- .../interpolate_kernel_register.cc | 28 +-- .../cuda_kernels/isclose_kernel_register.cu | 2 +- .../cuda_kernels/isfinite_kernel_register.cc | 2 +- .../cuda_kernels/isfinite_kernel_register.cu | 12 +- .../cuda_kernels/kron_grad_kernel_register.cu | 4 +- .../cuda_kernels/kron_kernel_register.cu | 4 +- .../kthvalue_grad_kernel_register.cu | 4 +- .../cuda_kernels/kthvalue_kernel_register.cu | 4 +- .../label_smooth_grad_kernel_register.cu | 4 +- .../label_smooth_kernel_register.cu | 4 +- .../cuda_kernels/lamb_kernel_register.cu | 4 +- .../cuda_kernels/layer_norm_grad_kernel.cu | 4 +- .../kernels/cuda_kernels/layer_norm_kernel.cu | 4 +- .../legacy_expand_grad_kernel_register.cu | 2 +- .../kernels/cuda_kernels/lerp_grad_kernel.cu | 4 +- .../kernels/cuda_kernels/lerp_kernel.cu | 4 +- .../lgamma_grad_kernel_register.cu | 4 +- .../cuda_kernels/lgamma_kernel_register.cu | 4 +- .../cuda_kernels/linspace_kernel_register.cu | 4 +- .../log_softmax_grad_kernel_register.cu | 4 +- .../log_softmax_kernel_register.cu | 4 +- .../logcumsumexp_grad_kernel_register.cu | 4 +- .../cuda_kernels/logical_kernel_register.cc | 4 +- .../cuda_kernels/logspace_kernel_register.cu | 4 +- .../logsumexp_grad_kernel_register.cu | 4 +- .../cuda_kernels/logsumexp_kernel_register.cc | 4 +- .../lookup_table_grad_kernel_register.cu | 4 +- .../lookup_table_kernel_register.cu | 2 +- ...rgin_cross_entropy_grad_kernel_register.cu | 4 +- .../margin_cross_entropy_kernel_register.cu | 4 +- .../cuda_kernels/mask_grad_kernel_register.cu | 4 +- .../cuda_kernels/mask_kernel_register.cu | 6 +- .../masked_fill_grad_kernel_register.cu | 4 +- .../masked_fill_kernel_register.cu | 4 +- ...ked_multihead_attention_kernel_register.cu | 2 +- .../masked_select_grad_kernel_register.cu | 4 +- .../cuda_kernels/masked_select_kernel.cu | 4 +- .../matmul_grad_kernel_register.cc | 18 +- .../cuda_kernels/matmul_kernel_register.cc | 10 +- .../maxout_grad_kernel_register.cu | 2 +- .../cuda_kernels/maxout_kernel_register.cu | 2 +- .../mean_all_grad_kernel_register.cc | 2 +- .../cuda_kernels/mean_all_kernel_register.cc | 2 +- .../merged_momentum_kernel_register.cu | 2 +- .../meshgrid_grad_kernel_register.cc | 4 +- .../cuda_kernels/meshgrid_kernel_register.cc | 4 +- .../cuda_kernels/mode_grad_kernel_register.cu | 4 +- .../cuda_kernels/mode_kernel_register.cu | 4 +- .../moe_combine_no_weight_kernel_register.cu | 4 +- .../moe_permute_kernel_register.cu | 2 +- .../moe_unpermute_kernel_register.cu | 2 +- .../cuda_kernels/momentum_kernel_register.cu | 4 +- ...g_average_abs_max_scale_kernel_register.cu | 2 +- .../mp_allreduce_sum_kernel_register.cu | 2 +- .../multinomial_kernel_register.cc | 4 +- .../cuda_kernels/nadam_kernel_register.cu | 2 +- .../nanmedian_grad_kernel_register.cu | 4 +- .../cuda_kernels/nanmedian_kernel_register.cu | 4 +- .../cuda_kernels/nonzero_kernel_register.cc | 4 +- .../cuda_kernels/nop_kernel_register.cu | 4 +- .../cuda_kernels/norm_grad_kernel_register.cu | 4 +- .../cuda_kernels/norm_kernel_register.cu | 4 +- .../npu_identity_kernel_register.cc | 2 +- .../cuda_kernels/numel_kernel_register.cc | 4 +- .../overlap_add_grad_kernel_register.cu | 4 +- .../overlap_add_kernel_register.cu | 4 +- .../p_norm_grad_kernel_register.cc | 4 +- .../cuda_kernels/p_norm_kernel_register.cc | 4 +- .../cuda_kernels/p_recv_kernel_register.cu | 2 +- .../cuda_kernels/p_send_kernel_register.cu | 2 +- .../pad3d_grad_kernel_register.cu | 4 +- .../cuda_kernels/pad3d_kernel_register.cu | 4 +- .../cuda_kernels/pad_grad_kernel_register.cc | 4 +- .../cuda_kernels/pad_kernel_register.cc | 4 +- .../partial_allgather_kernel_register.cu | 6 +- .../partial_concat_grad_kernel_register.cu | 2 +- .../partial_concat_kernel_register.cu | 2 +- .../partial_recv_kernel_register.cu | 6 +- .../partial_send_kernel_register.cu | 6 +- .../pixel_shuffle_grad_kernel_register.cu | 4 +- .../pixel_shuffle_kernel_register.cu | 4 +- .../pixel_unshuffle_kernel_register.cu | 4 +- .../poisson_grad_kernel_register.cu | 4 +- .../cuda_kernels/poisson_kernel_register.cu | 4 +- .../cuda_kernels/pool_grad_kernel_register.cc | 28 +-- .../cuda_kernels/pool_kernel_register.cc | 28 +-- .../prelu_grad_kernel_register.cu | 4 +- .../cuda_kernels/prelu_kernel_register.cu | 4 +- .../cuda_kernels/prod_grad_kernel_register.cu | 4 +- .../cuda_kernels/prod_kernel_register.cc | 4 +- .../put_along_axis_grad_kernel_register.cu | 4 +- .../put_along_axis_kernel_register.cc | 4 +- .../qkv_unpack_mha_kernel_register.cu | 2 +- .../quant_linear_kernel_register.cu | 2 +- .../quantize_linear_kernel_register.cu | 10 +- .../cuda_kernels/radam_kernel_register.cu | 2 +- .../random_routing_kernel_register.cu | 2 +- .../cuda_kernels/randperm_kernel_register.cu | 4 +- .../reduce_as_grad_kernel_register.cu | 4 +- .../cuda_kernels/reduce_as_kernel_register.cu | 4 +- .../reduce_kernel_kps_register.cc | 18 +- .../cuda_kernels/reduce_kernel_register.cc | 20 +- .../reduce_max_kernel_register.cc | 4 +- .../reduce_mean_kernel_register.cc | 4 +- .../kernels/cuda_kernels/reduce_min_kernel.cc | 4 +- .../reduce_scatter_kernel_register.cu | 6 +- .../reduce_sum_kernel_register.cc | 4 +- .../repeat_interleave_grad_kernel_register.cu | 4 +- .../repeat_interleave_kernel_register.cu | 4 +- .../rms_norm_grad_kernel_register.cc | 4 +- .../cuda_kernels/rms_norm_kernel_register.cc | 4 +- .../cuda_kernels/rmsprop_kernel_register.cu | 4 +- .../cuda_kernels/roll_grad_kernel_register.cu | 4 +- .../cuda_kernels/roll_kernel_register.cu | 4 +- .../cuda_kernels/rprop_kernel_register.cu | 6 +- .../rrelu_grad_kernel_register.cu | 4 +- .../cuda_kernels/rrelu_kernel_register.cu | 4 +- .../cuda_kernels/scale_kernel_register.cc | 4 +- .../scatter_grad_kernel_register.cc | 4 +- .../cuda_kernels/scatter_kernel_register.cc | 4 +- .../scatter_nd_add_grad_kernel_register.cc | 4 +- .../scatter_nd_add_kernel_register.cc | 4 +- .../searchsorted_kernel_register.cu | 4 +- .../segment_pool_grad_kernel_register.cu | 4 +- .../segment_pool_kernel_register.cu | 4 +- .../cuda_kernels/selu_grad_kernel_register.cu | 4 +- .../send_u_recv_grad_kernel_register.cu | 2 +- .../send_u_recv_kernel_register.cu | 2 +- .../send_ue_recv_grad_kernel_register.cu | 2 +- .../send_ue_recv_kernel_register.cu | 2 +- .../send_uv_grad_kernel_register.cu | 2 +- .../cuda_kernels/send_uv_kernel_register.cu | 2 +- .../cuda_kernels/set_kernel_register.cc | 4 +- .../set_value_grad_kernel_register.cc | 8 +- .../cuda_kernels/set_value_kernel_register.cc | 8 +- .../cuda_kernels/sgd_kernel_register.cu | 10 +- .../cuda_kernels/shape_kernel_register.cc | 8 +- .../share_data_kernel_register.cu | 4 +- ...ntropy_with_logits_grad_kernel_register.cu | 2 +- ...oss_entropy_with_logits_kernel_register.cu | 2 +- .../cuda_kernels/sign_kernel_register.cc | 4 +- .../slice_grad_kernel_register.cc | 12 +- .../cuda_kernels/slice_kernel_register.cc | 12 +- .../soft_relu_grad_kernel_register.cu | 4 +- .../cuda_kernels/soft_relu_kernel_register.cu | 8 +- .../softmax_grad_kernel_register.cu | 4 +- .../cuda_kernels/softmax_kernel_register.cu | 4 +- .../sparse_momentum_kernel_register.cu | 2 +- .../sparse_utils_kernel_register.cu | 2 +- .../cuda_kernels/split_kernel_register.cc | 8 +- .../squared_l2_norm_grad_kernel_register.cu | 4 +- .../squared_l2_norm_kernel_register.cc | 4 +- .../squeeze_grad_kernel_register.cc | 4 +- .../cuda_kernels/squeeze_kernel_register.cc | 8 +- .../stack_grad_kernel_register.cu | 4 +- .../cuda_kernels/stack_kernel_register.cc | 4 +- ..._through_estimator_grad_kernel_register.cu | 2 +- .../strided_copy_kernel_register.cc | 4 +- .../strided_slice_grad_kernel_register.cc | 4 +- .../strided_slice_kernel_register.cc | 4 +- .../swiglu_grad_kernel_register.cc | 4 +- .../cuda_kernels/swiglu_kernel_register.cc | 4 +- .../sync_batch_norm_grad_kernel_register.cu | 2 +- .../sync_batch_norm_kernel_register.cu | 8 +- .../sync_calc_stream_kernel_register.cu | 4 +- .../take_along_axis_grad_kernel_register.cu | 4 +- .../take_along_axis_kernel_register.cc | 4 +- .../temporal_shift_grad_kernel_register.cu | 4 +- .../temporal_shift_kernel_register.cu | 4 +- .../cuda_kernels/tile_grad_kernel_register.cc | 4 +- .../cuda_kernels/tile_kernel_register.cc | 4 +- .../kernels/cuda_kernels/top_k_grad_kernel.cu | 8 +- .../kernels/cuda_kernels/top_k_kernel.cu | 8 +- .../trace_grad_kernel_register.cu | 4 +- .../cuda_kernels/trace_kernel_register.cu | 4 +- .../transpose_grad_kernel_register.cc | 8 +- .../cuda_kernels/transpose_kernel_register.cc | 4 +- .../tril_triu_grad_kernel_register.cu | 12 +- .../cuda_kernels/tril_triu_kernel_register.cc | 12 +- .../trunc_grad_kernel_register.cu | 4 +- .../cuda_kernels/trunc_kernel_register.cu | 4 +- .../unary_grad_kernel_register.cu | 12 +- .../cuda_kernels/unary_kernel_register.cu | 16 +- .../cuda_kernels/unbind_kernel_register.cc | 4 +- .../unfold_grad_kernel_register.cu | 4 +- .../cuda_kernels/unfold_kernel_register.cu | 4 +- .../uniform_inplace_grad_kernel_register.cu | 4 +- .../uniform_inplace_kernel_register.cu | 4 +- .../cuda_kernels/uniform_kernel_register.cc | 4 +- .../unsqueeze_grad_kernel_register.cc | 4 +- .../cuda_kernels/unsqueeze_kernel_register.cc | 8 +- .../unstack_grad_kernel_register.cu | 4 +- .../cuda_kernels/unstack_kernel_register.cu | 4 +- .../cuda_kernels/weight_only_linear_kernel.cu | 8 +- .../cuda_kernels/weight_quantize_kernel.cu | 4 +- .../where_grad_kernel_register.cu | 4 +- .../cuda_kernels/where_kernel_register.cc | 4 +- 378 files changed, 1144 insertions(+), 1148 deletions(-) diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/abs_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/abs_grad_kernel_register.cc index c8c72b6b039..409be40469f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/abs_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/abs_grad_kernel_register.cc @@ -25,8 +25,8 @@ PD_CUSTOM_KERNEL_REGISTER(abs_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, complex) { kernel->InputAt(1).SetDataType(phi::dtype::ToReal(kernel_key.dtype())); } @@ -38,8 +38,8 @@ PD_CUSTOM_KERNEL_REGISTER(abs_double_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, complex) { kernel->InputAt(1).SetDataType(phi::dtype::ToReal(kernel_key.dtype())); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/abs_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/abs_kernel_register.cc index 2427f983abe..09d391b1d16 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/abs_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/abs_kernel_register.cc @@ -23,8 +23,8 @@ PD_CUSTOM_KERNEL_REGISTER(abs, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) { kernel->OutputAt(0).SetDataType(phi::dtype::ToReal(kernel_key.dtype())); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/accuracy_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/accuracy_kernel.cu index 15dc2ee1505..1928a27568f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/accuracy_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/accuracy_kernel.cu @@ -135,8 +135,8 @@ PD_CUSTOM_KERNEL_REGISTER(accuracy, iluvatar_gpu, ALL_LAYOUT, phi::AccuracyKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float) { kernel->InputAt(1).SetDataType(phi::DataType::INT32); kernel->InputAt(2).SetDataType(phi::DataType::INT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/activation_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/activation_grad_kernel_register.cc index f9339a78bda..4161d869b2c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/activation_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/activation_grad_kernel_register.cc @@ -20,224 +20,224 @@ PD_CUSTOM_KERNEL_REGISTER(relu_grad, ALL_LAYOUT, phi::ReluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sin_grad, iluvatar_gpu, ALL_LAYOUT, phi::SinGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sin_double_grad, iluvatar_gpu, ALL_LAYOUT, phi::SinDoubleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sin_triple_grad, iluvatar_gpu, ALL_LAYOUT, phi::SinTripleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(cos_grad, iluvatar_gpu, ALL_LAYOUT, phi::CosGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(cos_double_grad, iluvatar_gpu, ALL_LAYOUT, phi::CosDoubleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(cos_triple_grad, iluvatar_gpu, ALL_LAYOUT, phi::CosTripleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(tan_grad, iluvatar_gpu, ALL_LAYOUT, phi::TanGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(acos_grad, iluvatar_gpu, ALL_LAYOUT, phi::AcosGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(asin_grad, iluvatar_gpu, ALL_LAYOUT, phi::AsinGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(atan_grad, iluvatar_gpu, ALL_LAYOUT, phi::AtanGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sinh_grad, iluvatar_gpu, ALL_LAYOUT, phi::SinhGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(cosh_grad, iluvatar_gpu, ALL_LAYOUT, phi::CoshGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(asinh_grad, iluvatar_gpu, ALL_LAYOUT, phi::AsinhGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(acosh_grad, iluvatar_gpu, ALL_LAYOUT, phi::AcoshGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(atanh_grad, iluvatar_gpu, ALL_LAYOUT, phi::AtanhGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(tanh_grad, iluvatar_gpu, ALL_LAYOUT, phi::TanhGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(tanh_double_grad, iluvatar_gpu, ALL_LAYOUT, phi::TanhDoubleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(hardtanh_grad, iluvatar_gpu, ALL_LAYOUT, phi::HardTanhGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(thresholded_relu_grad, iluvatar_gpu, ALL_LAYOUT, phi::ThresholdedReluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(relu6_grad, iluvatar_gpu, ALL_LAYOUT, phi::Relu6GradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(leaky_relu_grad, iluvatar_gpu, ALL_LAYOUT, phi::LeakyReluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(mish_grad, iluvatar_gpu, ALL_LAYOUT, phi::MishGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(stanh_grad, iluvatar_gpu, ALL_LAYOUT, phi::STanhGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(reciprocal_grad, iluvatar_gpu, ALL_LAYOUT, phi::ReciprocalGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sqrt_grad, iluvatar_gpu, ALL_LAYOUT, phi::SqrtGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(rsqrt_grad, iluvatar_gpu, ALL_LAYOUT, phi::RsqrtGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(softplus_grad, iluvatar_gpu, ALL_LAYOUT, phi::SoftplusGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(exp_grad, iluvatar_gpu, @@ -246,8 +246,8 @@ PD_CUSTOM_KERNEL_REGISTER(exp_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(expm1_grad, iluvatar_gpu, @@ -256,8 +256,8 @@ PD_CUSTOM_KERNEL_REGISTER(expm1_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(square_grad, iluvatar_gpu, @@ -266,144 +266,144 @@ PD_CUSTOM_KERNEL_REGISTER(square_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(hard_shrink_grad, iluvatar_gpu, ALL_LAYOUT, phi::HardShrinkGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(softshrink_grad, iluvatar_gpu, ALL_LAYOUT, phi::SoftShrinkGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(tanh_shrink_grad, iluvatar_gpu, ALL_LAYOUT, phi::TanhShrinkGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(elu_grad, iluvatar_gpu, ALL_LAYOUT, phi::EluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(silu_grad, iluvatar_gpu, ALL_LAYOUT, phi::SiluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(softsign_grad, iluvatar_gpu, ALL_LAYOUT, phi::SoftsignGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sigmoid_grad, iluvatar_gpu, ALL_LAYOUT, phi::SigmoidGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sigmoid_double_grad, iluvatar_gpu, ALL_LAYOUT, phi::SigmoidDoubleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sigmoid_triple_grad, iluvatar_gpu, ALL_LAYOUT, phi::SigmoidTripleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(logsigmoid_grad, iluvatar_gpu, ALL_LAYOUT, phi::LogSigmoidGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(hardsigmoid_grad, iluvatar_gpu, ALL_LAYOUT, phi::HardSigmoidGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(hardswish_grad, iluvatar_gpu, ALL_LAYOUT, phi::HardSwishGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(swish_grad, iluvatar_gpu, ALL_LAYOUT, phi::SwishGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(round_grad, iluvatar_gpu, ALL_LAYOUT, phi::RoundGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(floor_grad, iluvatar_gpu, ALL_LAYOUT, phi::FloorGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(ceil_grad, iluvatar_gpu, ALL_LAYOUT, phi::CeilGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(celu_grad, iluvatar_gpu, ALL_LAYOUT, phi::CeluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(log_grad, iluvatar_gpu, @@ -412,8 +412,8 @@ PD_CUSTOM_KERNEL_REGISTER(log_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(log2_grad, iluvatar_gpu, @@ -422,8 +422,8 @@ PD_CUSTOM_KERNEL_REGISTER(log2_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(log10_grad, iluvatar_gpu, @@ -432,8 +432,8 @@ PD_CUSTOM_KERNEL_REGISTER(log10_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(log1p_grad, iluvatar_gpu, @@ -442,8 +442,8 @@ PD_CUSTOM_KERNEL_REGISTER(log1p_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(pow_grad, iluvatar_gpu, @@ -452,8 +452,8 @@ PD_CUSTOM_KERNEL_REGISTER(pow_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(pow_double_grad, iluvatar_gpu, @@ -462,5 +462,5 @@ PD_CUSTOM_KERNEL_REGISTER(pow_double_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/activation_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/activation_kernel_register.cc index 497036bb89e..4837fe97270 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/activation_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/activation_kernel_register.cc @@ -20,24 +20,24 @@ PD_CUSTOM_KERNEL_REGISTER(relu, ALL_LAYOUT, phi::ReluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sin, iluvatar_gpu, ALL_LAYOUT, phi::SinKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(cos, iluvatar_gpu, ALL_LAYOUT, phi::CosKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(tan, @@ -45,160 +45,160 @@ PD_CUSTOM_KERNEL_REGISTER(tan, ALL_LAYOUT, phi::TanKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(acos, iluvatar_gpu, ALL_LAYOUT, phi::AcosKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(asin, iluvatar_gpu, ALL_LAYOUT, phi::AsinKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(atan, iluvatar_gpu, ALL_LAYOUT, phi::AtanKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sinh, iluvatar_gpu, ALL_LAYOUT, phi::SinhKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(cosh, iluvatar_gpu, ALL_LAYOUT, phi::CoshKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(asinh, iluvatar_gpu, ALL_LAYOUT, phi::AsinhKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(acosh, iluvatar_gpu, ALL_LAYOUT, phi::AcoshKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(atanh, iluvatar_gpu, ALL_LAYOUT, phi::AtanhKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(tanh, iluvatar_gpu, ALL_LAYOUT, phi::TanhKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(hardtanh, iluvatar_gpu, ALL_LAYOUT, phi::HardTanhKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(thresholded_relu, iluvatar_gpu, ALL_LAYOUT, phi::ThresholdedReluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(relu6, iluvatar_gpu, ALL_LAYOUT, phi::Relu6Kernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(leaky_relu, iluvatar_gpu, ALL_LAYOUT, phi::LeakyReluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(mish, iluvatar_gpu, ALL_LAYOUT, phi::MishKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(stanh, iluvatar_gpu, ALL_LAYOUT, phi::StanhKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(reciprocal, iluvatar_gpu, ALL_LAYOUT, phi::ReciprocalKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sqrt, iluvatar_gpu, ALL_LAYOUT, phi::SqrtKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(rsqrt, iluvatar_gpu, ALL_LAYOUT, phi::RsqrtKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(softplus, iluvatar_gpu, ALL_LAYOUT, phi::SoftplusKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(exp, iluvatar_gpu, @@ -207,8 +207,8 @@ PD_CUSTOM_KERNEL_REGISTER(exp, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(expm1, iluvatar_gpu, @@ -217,8 +217,8 @@ PD_CUSTOM_KERNEL_REGISTER(expm1, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(square, iluvatar_gpu, @@ -227,128 +227,128 @@ PD_CUSTOM_KERNEL_REGISTER(square, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(hard_shrink, iluvatar_gpu, ALL_LAYOUT, phi::HardShrinkKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(softshrink, iluvatar_gpu, ALL_LAYOUT, phi::SoftShrinkKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(tanh_shrink, iluvatar_gpu, ALL_LAYOUT, phi::TanhShrinkKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(elu, iluvatar_gpu, ALL_LAYOUT, phi::EluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(silu, iluvatar_gpu, ALL_LAYOUT, phi::SiluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(softsign, iluvatar_gpu, ALL_LAYOUT, phi::SoftsignKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sigmoid, iluvatar_gpu, ALL_LAYOUT, phi::SigmoidKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(logsigmoid, iluvatar_gpu, ALL_LAYOUT, phi::LogSigmoidKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(hardsigmoid, iluvatar_gpu, ALL_LAYOUT, phi::HardSigmoidKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(hardswish, iluvatar_gpu, ALL_LAYOUT, phi::HardSwishKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(swish, iluvatar_gpu, ALL_LAYOUT, phi::SwishKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(round, iluvatar_gpu, ALL_LAYOUT, phi::RoundKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(floor, iluvatar_gpu, ALL_LAYOUT, phi::FloorKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(ceil, iluvatar_gpu, ALL_LAYOUT, phi::CeilKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(celu, iluvatar_gpu, ALL_LAYOUT, phi::CeluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(log, iluvatar_gpu, @@ -357,8 +357,8 @@ PD_CUSTOM_KERNEL_REGISTER(log, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(log2, iluvatar_gpu, @@ -367,8 +367,8 @@ PD_CUSTOM_KERNEL_REGISTER(log2, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(log10, iluvatar_gpu, @@ -377,8 +377,8 @@ PD_CUSTOM_KERNEL_REGISTER(log10, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(log1p, iluvatar_gpu, @@ -387,8 +387,8 @@ PD_CUSTOM_KERNEL_REGISTER(log1p, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(pow, iluvatar_gpu, @@ -397,5 +397,5 @@ PD_CUSTOM_KERNEL_REGISTER(pow, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/adadelta_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/adadelta_kernel_register.cu index dabbc081842..1422cede8f8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/adadelta_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/adadelta_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(adadelta, phi::AdadeltaKernel, float, double, - phi::dtype::float16) { + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/adagrad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/adagrad_kernel_register.cu index c56274a8654..d3936fd6f44 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/adagrad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/adagrad_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(adagrad, phi::AdagradDenseKernel, float, double, - phi::dtype::float16) { + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/adam_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/adam_kernel_register.cu index e85e558abe4..d7e54b68da8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/adam_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/adam_kernel_register.cu @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(adam, ALL_LAYOUT, phi::AdamDenseKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { // Skip beta1_pow, beta2_pow, skip_update data transform kernel->InputAt(6).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(7).SetBackend(phi::Backend::ALL_BACKEND); @@ -46,8 +46,8 @@ PD_CUSTOM_KERNEL_REGISTER(merged_adam, ALL_LAYOUT, phi::MergedAdamKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { // Skip beta1_pow, beta2_pow data transform kernel->InputAt(6).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(7).SetBackend(phi::Backend::ALL_BACKEND); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/adamax_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/adamax_kernel_register.cu index 526d7bee53a..27ac3146292 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/adamax_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/adamax_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(adamax, phi::AdamaxKernel, float, double, - phi::dtype::float16) { + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/adamw_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/adamw_kernel_register.cc index 5779c633d08..4a8441a4cc8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/adamw_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/adamw_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(adamw, ALL_LAYOUT, phi::AdamwDenseKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { // Skip beta1_pow, beta2_pow, skip_update data transform kernel->InputAt(6).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(7).SetBackend(phi::Backend::ALL_BACKEND); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/adamw_kernel_row_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/adamw_kernel_row_register.cc index 54eea57dc23..63bdae52b5a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/adamw_kernel_row_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/adamw_kernel_row_register.cc @@ -19,7 +19,7 @@ PD_CUSTOM_KERNEL_REGISTER(adamw_dense_param_sparse_grad, ALL_LAYOUT, phi::sr::AdamwDenseParamSparseGradKernel, float, - phi::dtype::float16) { + phi::float16) { // Skip beta1_pow, beta2_pow, skip_update data transform kernel->InputAt(6).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(7).SetBackend(phi::Backend::ALL_BACKEND); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/add_n_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/add_n_kernel_register.cu index 5623175eebe..dfcbb5cf1e7 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/add_n_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/add_n_kernel_register.cu @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(add_n, phi::AddNKernel, float, int, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, int64_t, phi::dtype::complex) {} @@ -31,7 +31,7 @@ PD_CUSTOM_KERNEL_REGISTER(add_n_array, phi::AddNArrayKernel, float, int, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, int64_t, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/addmm_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/addmm_grad_kernel_register.cc index 863d71ba501..4dc8b3a14b3 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/addmm_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/addmm_grad_kernel_register.cc @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(addmm_grad, ALL_LAYOUT, phi::AddmmGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/addmm_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/addmm_kernel_register.cc index 2f27a6f094c..b4cbe2f12b9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/addmm_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/addmm_kernel_register.cc @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(addmm, ALL_LAYOUT, phi::AddmmKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/all_gather_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/all_gather_kernel_register.cu index 47669596921..2b62a0b27ba 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/all_gather_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/all_gather_kernel_register.cu @@ -30,6 +30,6 @@ PD_CUSTOM_KERNEL_REGISTER(all_gather, int16_t, int64_t, bool, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/all_reduce_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/all_reduce_kernel_register.cu index 05707873293..478fe205ed4 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/all_reduce_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/all_reduce_kernel_register.cu @@ -31,8 +31,8 @@ PD_CUSTOM_KERNEL_REGISTER(all_reduce, uint8_t, int16_t, int64_t, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} #else PD_CUSTOM_KERNEL_REGISTER(all_reduce, iluvatar_gpu, @@ -46,5 +46,5 @@ PD_CUSTOM_KERNEL_REGISTER(all_reduce, uint8_t, int16_t, int64_t, - phi::dtype::float16) {} + phi::float16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/all_to_all_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/all_to_all_kernel_register.cu index ab1e0390a5b..1d78ee5f7f6 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/all_to_all_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/all_to_all_kernel_register.cu @@ -32,8 +32,8 @@ PD_CUSTOM_KERNEL_REGISTER(all_to_all, int16_t, int64_t, bool, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} #else PD_CUSTOM_KERNEL_REGISTER(all_to_all, iluvatar_gpu, @@ -47,5 +47,5 @@ PD_CUSTOM_KERNEL_REGISTER(all_to_all, int16_t, int64_t, bool, - phi::dtype::float16) {} + phi::float16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/allclose_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/allclose_kernel_register.cu index 92c631702d6..9bdbb51c99c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/allclose_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/allclose_kernel_register.cu @@ -25,6 +25,6 @@ PD_CUSTOM_KERNEL_REGISTER(allclose, bool, int, int64_t, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(0).SetDataType(phi::DataType::BOOL); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/amp_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/amp_kernel_register.cc index 612317c883e..cf7f7c78a8e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/amp_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/amp_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(check_finite_and_unscale, ALL_LAYOUT, phi::CheckFiniteAndUnscaleKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::DataType::BOOL); } @@ -30,8 +30,8 @@ PD_CUSTOM_KERNEL_REGISTER(update_loss_scaling, ALL_LAYOUT, phi::UpdateLossScalingKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); if (kernel_key.dtype() == phi::DataType::FLOAT16 || kernel_key.dtype() == phi::DataType::BFLOAT16) { diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/angle_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/angle_grad_kernel_register.cu index c9cded31ab9..fd0fb51aaaa 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/angle_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/angle_grad_kernel_register.cu @@ -22,8 +22,8 @@ PD_CUSTOM_KERNEL_REGISTER(angle_grad, phi::AngleGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) { kernel->InputAt(1).SetDataType(phi::dtype::ToReal(kernel_key.dtype())); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/angle_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/angle_kernel_register.cu index c0da2fdf288..48ac5877269 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/angle_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/angle_kernel_register.cu @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(angle, phi::AngleKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/ap_facade_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/ap_facade_kernel_register.cu index c472d594036..148de38ce59 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/ap_facade_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/ap_facade_kernel_register.cu @@ -22,8 +22,8 @@ PD_CUSTOM_KERNEL_REGISTER(ap_facade, float, double, int, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, int64_t, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/ap_trivial_fusion_begin_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/ap_trivial_fusion_begin_kernel_register.cu index 6f21217e939..d40c350fa28 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/ap_trivial_fusion_begin_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/ap_trivial_fusion_begin_kernel_register.cu @@ -22,8 +22,8 @@ PD_CUSTOM_KERNEL_REGISTER(ap_trivial_fusion_begin, float, double, int, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, int64_t, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/ap_trivial_fusion_end_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/ap_trivial_fusion_end_kernel_register.cu index 6452f845d64..b04b66c04c2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/ap_trivial_fusion_end_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/ap_trivial_fusion_end_kernel_register.cu @@ -22,8 +22,8 @@ PD_CUSTOM_KERNEL_REGISTER(ap_trivial_fusion_end, float, double, int, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, int64_t, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/ap_variadic_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/ap_variadic_kernel_register.cu index e625f7afa7f..b2b159ca8b1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/ap_variadic_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/ap_variadic_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(ap_variadic, phi::ApVariadicKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} #else PD_CUSTOM_KERNEL_REGISTER(ap_variadic, iluvatar_gpu, @@ -31,6 +31,6 @@ PD_CUSTOM_KERNEL_REGISTER(ap_variadic, phi::ApVariadicKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/apply_per_channel_scale_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/apply_per_channel_scale_kernel_register.cu index 078671d181f..a4590bc0288 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/apply_per_channel_scale_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/apply_per_channel_scale_kernel_register.cu @@ -19,5 +19,5 @@ PD_CUSTOM_KERNEL_REGISTER(apply_per_channel_scale, iluvatar_gpu, ALL_LAYOUT, phi::ApplyPerChannelScaleKernel, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/arange_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/arange_kernel_register.cc index ec7e34e8469..7cfabe98908 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/arange_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/arange_kernel_register.cc @@ -22,8 +22,8 @@ PD_CUSTOM_KERNEL_REGISTER(arange_tensor, float, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(0).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); @@ -36,5 +36,5 @@ PD_CUSTOM_KERNEL_REGISTER(arange, float, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/arg_min_max_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/arg_min_max_kernel_register.cc index cb8d5e978e1..19cb977428b 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/arg_min_max_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/arg_min_max_kernel_register.cc @@ -18,8 +18,8 @@ PD_CUSTOM_KERNEL_REGISTER(argmin, iluvatar_gpu, ALL_LAYOUT, phi::ArgMinKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, int32_t, int64_t, @@ -32,8 +32,8 @@ PD_CUSTOM_KERNEL_REGISTER(argmax, iluvatar_gpu, ALL_LAYOUT, phi::ArgMaxKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, int32_t, int64_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/argsort_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/argsort_grad_kernel_register.cc index fd4e8736671..7a3d5d999b1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/argsort_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/argsort_grad_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(argsort_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/argsort_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/argsort_kernel_register.cc index 38f33ca290b..15ef55a1864 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/argsort_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/argsort_kernel_register.cc @@ -22,7 +22,7 @@ PD_CUSTOM_KERNEL_REGISTER(argsort, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/array_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/array_grad_kernel_register.cc index 5a9801a5c8f..a3db7773717 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/array_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/array_grad_kernel_register.cc @@ -24,6 +24,6 @@ PD_CUSTOM_KERNEL_REGISTER(tensor_to_array, int64_t, float, double, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/array_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/array_kernel_register.cu index 1f435a5fd2a..27a6b333170 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/array_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/array_kernel_register.cu @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(create_array, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} @@ -40,8 +40,8 @@ PD_CUSTOM_KERNEL_REGISTER(create_array_like, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} @@ -54,8 +54,8 @@ PD_CUSTOM_KERNEL_REGISTER(array_read, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} @@ -68,8 +68,8 @@ PD_CUSTOM_KERNEL_REGISTER(array_write, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} @@ -82,8 +82,8 @@ PD_CUSTOM_KERNEL_REGISTER(array_to_tensor, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} @@ -96,7 +96,7 @@ PD_CUSTOM_KERNEL_REGISTER(array_pop, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/asgd_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/asgd_kernel_register.cu index 0426c1a31a4..4b672edd7ca 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/asgd_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/asgd_kernel_register.cu @@ -18,7 +18,7 @@ PD_CUSTOM_KERNEL_REGISTER(asgd, iluvatar_gpu, ALL_LAYOUT, phi::ASGDKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/assign_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/assign_kernel_register.cc index 1c1b38e15fe..47996ae6b96 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/assign_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/assign_kernel_register.cc @@ -38,6 +38,6 @@ PD_CUSTOM_KERNEL_REGISTER(assign_value, float, int8_t, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/atan2_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/atan2_grad_kernel_register.cu index 8bd284a5b5f..ceaaa3135c6 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/atan2_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/atan2_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(atan2_grad, phi::Atan2GradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/atan2_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/atan2_kernel_register.cu index 1b920e0ac78..6c77f92b067 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/atan2_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/atan2_kernel_register.cu @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(atan2, phi::Atan2Kernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/baddbmm_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/baddbmm_grad_kernel_register.cu index a61d29d9319..03486eeb8b2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/baddbmm_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/baddbmm_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(baddbmm_grad, phi::BaddbmmGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/baddbmm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/baddbmm_kernel_register.cu index 2be49c429eb..5ed55f8a4d7 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/baddbmm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/baddbmm_kernel_register.cu @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(baddbmm, phi::BaddbmmKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/batch_norm_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/batch_norm_grad_kernel_register.cc index 5185743eeb8..80bcb28b41a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/batch_norm_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/batch_norm_grad_kernel_register.cc @@ -22,7 +22,7 @@ PD_CUSTOM_KERNEL_REGISTER(batch_norm_coo_grad, phi::sparse::BatchNormCooGradKernel, float, double, - phi::dtype::float16) { + phi::float16) { kernel->InputAt(0).SetDataLayout(phi::DataLayout::SPARSE_COO); if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->OutputAt(0).SetDataType(phi::DataType::FLOAT32); // x_grad @@ -36,8 +36,8 @@ PD_CUSTOM_KERNEL_REGISTER(batch_norm_grad, ALL_LAYOUT, phi::BatchNormGradKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16 || kernel_key.dtype() == phi::DataType::BFLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); // scale_grad diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/batch_norm_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/batch_norm_kernel_register.cc index eacc440ad68..c19e597d2d3 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/batch_norm_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/batch_norm_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(batch_norm_infer, ALL_LAYOUT, phi::BatchNormInferKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16 || kernel_key.dtype() == phi::DataType::BFLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); @@ -34,8 +34,8 @@ PD_CUSTOM_KERNEL_REGISTER(batch_norm, ALL_LAYOUT, phi::BatchNormKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16 || kernel_key.dtype() == phi::DataType::BFLOAT16) { kernel->InputAt(1).SetDataType(phi::DataType::FLOAT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/bce_loss_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/bce_loss_grad_kernel_register.cu index 511bd9ed702..2b141704fb5 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/bce_loss_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/bce_loss_grad_kernel_register.cu @@ -20,4 +20,4 @@ PD_CUSTOM_KERNEL_REGISTER(bce_loss_grad, phi::BCELossGradKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/bce_loss_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/bce_loss_kernel_register.cu index 5e071e194e2..f5048b561c2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/bce_loss_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/bce_loss_kernel_register.cu @@ -20,4 +20,4 @@ PD_CUSTOM_KERNEL_REGISTER(bce_loss, phi::BCELossKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/beam_search_decode_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/beam_search_decode_kernel_register.cu index f3d84ff3d0a..6edc6f6afa8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/beam_search_decode_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/beam_search_decode_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(beam_search_decode, phi::BeamSearchDecodeOpKernel, float, double, - phi::dtype::float16, + phi::float16, int, int64_t) { kernel->OutputAt(0).SetDataType(phi::DataType::INT64); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/bernoulli_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/bernoulli_kernel_register.cu index 261dc6997c6..c26ed39b716 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/bernoulli_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/bernoulli_kernel_register.cu @@ -19,7 +19,7 @@ PD_CUSTOM_KERNEL_REGISTER(bernoulli, iluvatar_gpu, ALL_LAYOUT, phi::BernoulliKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/binomial_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/binomial_kernel_register.cu index d0384d112f8..c78bd81ec71 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/binomial_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/binomial_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(binomial, phi::BinomialKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(0).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/bmm_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/bmm_grad_kernel_register.cc index f963c30b789..050ef2d0fc1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/bmm_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/bmm_grad_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(bmm_grad, ALL_LAYOUT, phi::BmmGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/bmm_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/bmm_kernel_register.cc index bc1c9dff029..4609471f3fc 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/bmm_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/bmm_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(bmm, ALL_LAYOUT, phi::BmmKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_kernel_register.cu index c45719d09c9..00b652c37b9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_kernel_register.cu @@ -22,14 +22,14 @@ PD_CUSTOM_KERNEL_REGISTER(broadcast, phi::BroadcastKernel, float, double, - phi::dtype::bfloat16, + phi::bfloat16, int, bool, int8_t, uint8_t, int16_t, int64_t, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} #else @@ -45,7 +45,7 @@ PD_CUSTOM_KERNEL_REGISTER(broadcast, uint8_t, int16_t, int64_t, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_tensors_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_tensors_grad_kernel_register.cu index 305d8a4a5a4..bcbba855b4f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_tensors_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_tensors_grad_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(broadcast_tensors_grad, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_tensors_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_tensors_kernel_register.cu index 34fa9030695..d9082427144 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_tensors_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/broadcast_tensors_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(broadcast_tensors, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/c_concat_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/c_concat_kernel_register.cu index 8e2961321a9..6c8b33af852 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/c_concat_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/c_concat_kernel_register.cu @@ -23,4 +23,4 @@ PD_CUSTOM_KERNEL_REGISTER(c_concat, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/c_embedding_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/c_embedding_grad_kernel_register.cc index 3040e711f63..c57c2db5906 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/c_embedding_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/c_embedding_grad_kernel_register.cc @@ -20,6 +20,6 @@ PD_CUSTOM_KERNEL_REGISTER(c_embedding_grad, ALL_LAYOUT, phi::CEmbeddingGradKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/c_embedding_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/c_embedding_kernel_register.cc index bf57d2e3b39..ffb99b75583 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/c_embedding_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/c_embedding_kernel_register.cc @@ -20,6 +20,6 @@ PD_CUSTOM_KERNEL_REGISTER(c_embedding, ALL_LAYOUT, phi::CEmbeddingKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/c_identity_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/c_identity_kernel_register.cc index 38d1e402bde..e9eedd92889 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/c_identity_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/c_identity_kernel_register.cc @@ -24,5 +24,5 @@ PD_CUSTOM_KERNEL_REGISTER(c_identity, float, int, int64_t, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/c_scatter_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/c_scatter_kernel_register.cu index fe6c5eba253..3fe91a83023 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/c_scatter_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/c_scatter_kernel_register.cu @@ -23,4 +23,4 @@ PD_CUSTOM_KERNEL_REGISTER(c_scatter, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/c_softmax_with_cross_entropy_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/c_softmax_with_cross_entropy_grad_kernel_register.cc index 05dc0d7acbd..f54d63be38d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/c_softmax_with_cross_entropy_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/c_softmax_with_cross_entropy_grad_kernel_register.cc @@ -20,4 +20,4 @@ PD_CUSTOM_KERNEL_REGISTER(c_softmax_with_cross_entropy_grad, ALL_LAYOUT, phi::CSoftmaxWithCrossEntropyGradKernel, float, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/c_split_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/c_split_kernel_register.cu index db327af7380..80592897183 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/c_split_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/c_split_kernel_register.cu @@ -25,8 +25,8 @@ PD_CUSTOM_KERNEL_REGISTER(c_split, double, int, int64_t, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} #else PD_CUSTOM_KERNEL_REGISTER(c_split, iluvatar_gpu, @@ -36,5 +36,5 @@ PD_CUSTOM_KERNEL_REGISTER(c_split, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cast_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/cast_kernel_register.cc index 294775dca37..e28dffe28d4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cast_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cast_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(cast, bool, int8_t, uint8_t, - phi::dtype::float16, + phi::float16, phi::dtype::complex, - phi::dtype::bfloat16) { + phi::bfloat16) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/channel_shuffle_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/channel_shuffle_grad_kernel_register.cu index a90a67052fc..0a4cfeed297 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/channel_shuffle_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/channel_shuffle_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(channel_shuffle_grad, phi::ChannelShuffleGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/channel_shuffle_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/channel_shuffle_kernel_register.cu index c4e18964676..42ad4354f6e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/channel_shuffle_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/channel_shuffle_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(channel_shuffle, phi::ChannelShuffleKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/check_memory_continue_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/check_memory_continue_kernel_register.cc index c3558dfee5c..01d3e70263b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/check_memory_continue_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/check_memory_continue_kernel_register.cc @@ -19,7 +19,7 @@ PD_CUSTOM_KERNEL_REGISTER(check_memory_continue, iluvatar_gpu, ALL_LAYOUT, phi::CheckMemoryContinueKernel, - phi::dtype::float16, + phi::float16, int, float, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/check_numerics_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/check_numerics_kernel_register.cu index 4717e65c6ea..88b80dc94cc 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/check_numerics_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/check_numerics_kernel_register.cu @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(check_numerics, phi::CheckNumericsKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex, phi::dtype::float8_e4m3fn, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/clip_by_norm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/clip_by_norm_kernel_register.cu index 9af5f441c34..4d6b0aa62b2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/clip_by_norm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/clip_by_norm_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(clip_by_norm, ALL_LAYOUT, phi::ClipByNormKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/clip_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/clip_grad_kernel_register.cc index e7c870b0340..a8fb8d75037 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/clip_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/clip_grad_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(clip_grad, float, int, int64_t, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/clip_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/clip_kernel_register.cc index 99ad6a49fc7..fff31fb8041 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/clip_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/clip_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(clip, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/coalesce_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/coalesce_kernel_register.cu index bce4ab1c7c4..88f62ad5023 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/coalesce_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/coalesce_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(coalesce_coo, phi::sparse::CoalesceCooKernel, float, double, - phi::dtype::float16, + phi::float16, uint8_t, int16_t, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/coalesce_tensor_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/coalesce_tensor_kernel_register.cc index 5980180cfdd..855a3859412 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/coalesce_tensor_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/coalesce_tensor_kernel_register.cc @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(coalesce_tensor, iluvatar_gpu, ALL_LAYOUT, phi::CoalesceTensorKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, float, double) { diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/compare_kernel_legacy_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/compare_kernel_legacy_register.cu index 0dcfdd6b980..1cc743f409e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/compare_kernel_legacy_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/compare_kernel_legacy_register.cu @@ -32,8 +32,8 @@ PD_CUSTOM_KERNEL_REGISTER(less_than_raw, phi::dtype::complex, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(0).SetDataType(phi::DataType::BOOL); } @@ -52,8 +52,8 @@ PD_CUSTOM_KERNEL_REGISTER(less_than_raw, phi::dtype::complex, \ float, \ double, \ - phi::dtype::float16, \ - phi::dtype::bfloat16) { \ + phi::float16, \ + phi::bfloat16) { \ kernel->OutputAt(0).SetDataType(phi::DataType::BOOL); \ } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/compare_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/compare_kernel_register.cc index 760542dc0b2..20c82a2973a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/compare_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/compare_kernel_register.cc @@ -38,8 +38,8 @@ PD_CUSTOM_KERNEL_REGISTER(equal_all, int16_t, \ int64_t, \ float, \ - phi::dtype::float16, \ - phi::dtype::bfloat16) { \ + phi::float16, \ + phi::bfloat16) { \ kernel->OutputAt(0).SetDataType(phi::DataType::BOOL); \ } @@ -56,8 +56,8 @@ PD_CUSTOM_KERNEL_REGISTER(equal_all, int64_t, \ phi::dtype::complex, \ float, \ - phi::dtype::float16, \ - phi::dtype::bfloat16) { \ + phi::float16, \ + phi::bfloat16) { \ kernel->OutputAt(0).SetDataType(phi::DataType::BOOL); \ } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/complex_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/complex_kernel_register.cu index b9dafdf489c..d329ab83504 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/complex_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/complex_kernel_register.cu @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(conj, iluvatar_gpu, ALL_LAYOUT, phi::ConjKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex, float, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/concat_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/concat_grad_kernel_register.cc index 61ffaf3e540..47b891d73c5 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/concat_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/concat_grad_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(concat_grad, uint8_t, int8_t, int16_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/concat_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/concat_kernel_register.cc index 9fd78f85fa8..3ddc102b854 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/concat_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/concat_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(concat, uint8_t, int8_t, int16_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/contiguous_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/contiguous_kernel_register.cc index 0d6c3bb8a73..60fe09a404e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/contiguous_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/contiguous_kernel_register.cc @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(contiguous, int32_t, int64_t, float, - ::phi::dtype::float16, - ::phi::dtype::bfloat16, + ::phi::float16, + ::phi::bfloat16, ::phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/conv_dnn_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/conv_dnn_grad_kernel_register.cu index 2f65f91ece5..afd9ea4c0bc 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/conv_dnn_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/conv_dnn_grad_kernel_register.cu @@ -20,37 +20,37 @@ PD_CUSTOM_KERNEL_REGISTER(conv2d_grad, ALL_LAYOUT, phi::ConvCudnnGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(conv3d_grad, GPUDNN, ALL_LAYOUT, phi::Conv3DCudnnGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(conv2d_double_grad, GPUDNN, ALL_LAYOUT, phi::ConvCudnnGradGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(conv3d_double_grad, GPUDNN, ALL_LAYOUT, phi::Conv3DCudnnDoubleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(depthwise_conv2d_double_grad, GPUDNN, ALL_LAYOUT, phi::DepthwiseConvDoubleGradGPUDNNKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/conv_dnn_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/conv_dnn_kernel_register.cu index b51d661ed08..859a3b7ac54 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/conv_dnn_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/conv_dnn_kernel_register.cu @@ -20,13 +20,13 @@ PD_CUSTOM_KERNEL_REGISTER(conv2d, ALL_LAYOUT, phi::ConvCudnnKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(conv3d, GPUDNN, ALL_LAYOUT, phi::Conv3DCudnnKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/conv_transpose_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/conv_transpose_grad_kernel_register.cu index bf939e1ab45..bbbb4a68556 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/conv_transpose_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/conv_transpose_grad_kernel_register.cu @@ -21,18 +21,18 @@ PD_CUSTOM_KERNEL_REGISTER(conv2d_transpose_grad, phi::Conv2dTransposeGradGPUDNNKernel, float, float16, - phi::dtype::bfloat16) {} + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(conv2d_transpose_double_grad, iluvatar_gpu, ALL_LAYOUT, phi::Conv2dTransposeDoubleGradGPUDNNKernel, float, float16, - phi::dtype::bfloat16) {} + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(conv3d_transpose_grad, iluvatar_gpu, ALL_LAYOUT, phi::Conv3dTransposeGradGPUDNNKernel, float, float16, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/conv_transpose_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/conv_transpose_kernel_register.cu index f2850e1fd24..05bea6e9eb1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/conv_transpose_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/conv_transpose_kernel_register.cu @@ -21,11 +21,11 @@ PD_CUSTOM_KERNEL_REGISTER(conv2d_transpose, phi::Conv2dTransposeGPUDNNKernel, float, float16, - phi::dtype::bfloat16) {} + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(conv3d_transpose, iluvatar_gpu, ALL_LAYOUT, phi::Conv3dTransposeGPUDNNKernel, float, float16, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy2_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy2_grad_kernel_register.cu index a3f7884c19c..62d22f13116 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy2_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy2_grad_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(cross_entropy_grad, phi::CrossEntropyGradientOpKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(cross_entropy_grad2, iluvatar_gpu, @@ -29,6 +29,6 @@ PD_CUSTOM_KERNEL_REGISTER(cross_entropy_grad2, phi::CrossEntropyGradientOpKernel2, float, double, - phi::dtype::float16) { + phi::float16) { kernel->InputAt(1).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy2_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy2_kernel_register.cu index dd384ffffec..1abe2496f6f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy2_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy2_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(cross_entropy, phi::CrossEntropyOpKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(cross_entropy2, iluvatar_gpu, @@ -29,4 +29,4 @@ PD_CUSTOM_KERNEL_REGISTER(cross_entropy2, phi::CrossEntropyOpKernel2, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy_grad_kernel_register.cu index 233022e2fe1..7b6e5494195 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(cross_entropy_with_softmax_grad, ALL_LAYOUT, phi::CrossEntropyWithSoftmaxGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy_kernel_register.cu index ed9992fa8d8..61981e9d6f0 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_entropy_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(cross_entropy_with_softmax, ALL_LAYOUT, phi::CrossEntropyWithSoftmaxKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_grad_kernel_register.cu index 23a3a729162..4ec40a64311 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_grad_kernel_register.cu @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(cross_grad, iluvatar_gpu, ALL_LAYOUT, phi::CrossGradKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_kernel_register.cu index eb838e9c7ce..3df53576d02 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cross_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cross_kernel_register.cu @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(cross, iluvatar_gpu, ALL_LAYOUT, phi::CrossKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cum_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/cum_grad_kernel_register.cc index cec9a1c7efa..bff301f7f4b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cum_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cum_grad_kernel_register.cc @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(cumsum_grad, int16_t, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cum_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/cum_kernel_register.cc index c13773c2701..54dfe102f51 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cum_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cum_kernel_register.cc @@ -23,13 +23,13 @@ PD_CUSTOM_KERNEL_REGISTER(cumsum, int16_t, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(logcumsumexp, iluvatar_gpu, ALL_LAYOUT, phi::LogcumsumexpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cumprod_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/cumprod_grad_kernel_register.cu index 6ff77374bae..181b7af85f1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cumprod_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cumprod_grad_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(cumprod_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/cumprod_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/cumprod_kernel_register.cu index cd209d7b5b6..e69355d7898 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/cumprod_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/cumprod_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(cumprod, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/debug_tools_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/debug_tools_kernel_register.cu index 7873d99f81d..a7fd884dfdd 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/debug_tools_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/debug_tools_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(check_model_nan_inf, double, int32_t, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/depend_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/depend_kernel_register.cu index 784f9255d26..8042d85d84a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/depend_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/depend_kernel_register.cu @@ -24,6 +24,6 @@ PD_CUSTOM_KERNEL_REGISTER(depend, double, int, int64_t, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/depthwise_conv_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/depthwise_conv_grad_kernel_register.cu index 29f32924036..95155929705 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/depthwise_conv_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/depthwise_conv_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(depthwise_conv2d_grad, ALL_LAYOUT, phi::DepthwiseConvGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/depthwise_conv_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/depthwise_conv_kernel_register.cu index 219b475bf11..fef05331190 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/depthwise_conv_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/depthwise_conv_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(depthwise_conv2d, ALL_LAYOUT, phi::DepthwiseConvKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/diag_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/diag_grad_kernel_register.cu index 7f019983058..cc7a4282c96 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/diag_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/diag_grad_kernel_register.cu @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(diag_grad, iluvatar_gpu, ALL_LAYOUT, phi::DiagGradKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t, float, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/diag_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/diag_kernel_register.cu index f8d538a73bb..1359ea8a387 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/diag_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/diag_kernel_register.cu @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(diag, iluvatar_gpu, ALL_LAYOUT, phi::DiagKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t, float, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/diagonal_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/diagonal_grad_kernel_register.cu index df9e4dad95d..c099cbf089d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/diagonal_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/diagonal_grad_kernel_register.cu @@ -26,7 +26,7 @@ PD_CUSTOM_KERNEL_REGISTER(diagonal_grad, int, int64_t, bool, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/diagonal_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/diagonal_kernel_register.cu index dc58ceb7074..90652d0447e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/diagonal_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/diagonal_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(diagonal, int, int64_t, bool, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/digamma_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/digamma_grad_kernel_register.cu index fc439b26cbb..fc3db113b73 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/digamma_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/digamma_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(digamma_grad, phi::DigammaGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/digamma_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/digamma_kernel_register.cu index 1ff0588ca10..62549182b87 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/digamma_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/digamma_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(digamma, phi::DigammaKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/dist_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/dist_grad_kernel_register.cc index d6100c700b1..a7810256d46 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/dist_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/dist_grad_kernel_register.cc @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(dist_grad, phi::DistGradKernel, float, double, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/dist_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/dist_kernel_register.cu index 428319116db..a6c451f7b0c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/dist_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/dist_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(dist, phi::DistKernel, float, double, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/dot_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/dot_grad_kernel_register.cu index 13d3c81dbb4..96adb3fbd64 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/dot_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/dot_grad_kernel_register.cu @@ -25,5 +25,5 @@ PD_CUSTOM_KERNEL_REGISTER(dot_grad, int64_t, phi::dtype::complex, phi::dtype::complex, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/dot_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/dot_kernel_register.cu index 7ab9bd39666..123accc32e4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/dot_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/dot_kernel_register.cu @@ -29,5 +29,5 @@ PD_CUSTOM_KERNEL_REGISTER(dot, int64_t, complex64, complex128, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/dropout_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/dropout_grad_kernel_register.cc index e64e389ae56..73a794a7363 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/dropout_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/dropout_grad_kernel_register.cc @@ -20,13 +20,13 @@ PD_CUSTOM_KERNEL_REGISTER(dropout_grad, ALL_LAYOUT, phi::DropoutGradRawKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(dropout_nd_grad, iluvatar_gpu, ALL_LAYOUT, phi::DropoutNdGradKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/dropout_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/dropout_kernel_register.cc index ace70aff999..986e97a1b6e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/dropout_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/dropout_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(dropout, ALL_LAYOUT, phi::DropoutRawKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->OutputAt(1).SetDataType(phi::DataType::UINT8); } @@ -31,8 +31,8 @@ PD_CUSTOM_KERNEL_REGISTER(dropout_nd, ALL_LAYOUT, phi::DropoutNdKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->OutputAt(1).SetDataType(phi::DataType::UINT8); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/einsum_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/einsum_grad_kernel_register.cu index 16ef62b5ff9..c5027ec309d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/einsum_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/einsum_grad_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(einsum_grad, phi::EinsumGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/einsum_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/einsum_kernel_register.cc index 10ad2ea912f..6f7a220b1d3 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/einsum_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/einsum_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(einsum, ALL_LAYOUT, phi::EinsumKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(einsum_infer, @@ -29,6 +29,6 @@ PD_CUSTOM_KERNEL_REGISTER(einsum_infer, ALL_LAYOUT, phi::EinsumInferKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_grad_kernel_register.cc index 18dbda76b64..4a22eb00028 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_grad_kernel_register.cc @@ -25,8 +25,8 @@ PD_CUSTOM_KERNEL_REGISTER(fmax_grad, phi::ElementwiseFMaxGradKernel, float, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int64_t) {} PD_CUSTOM_KERNEL_REGISTER(fmin_grad, @@ -35,8 +35,8 @@ PD_CUSTOM_KERNEL_REGISTER(fmin_grad, phi::ElementwiseFMinGradKernel, float, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int64_t) {} PD_CUSTOM_KERNEL_REGISTER(maximum_grad, @@ -46,8 +46,8 @@ PD_CUSTOM_KERNEL_REGISTER(maximum_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(minimum_grad, iluvatar_gpu, @@ -56,8 +56,8 @@ PD_CUSTOM_KERNEL_REGISTER(minimum_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(remainder_grad, iluvatar_gpu, @@ -66,8 +66,8 @@ PD_CUSTOM_KERNEL_REGISTER(remainder_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(heaviside_grad, iluvatar_gpu, @@ -75,8 +75,8 @@ PD_CUSTOM_KERNEL_REGISTER(heaviside_grad, phi::HeavisideGradKernel, float, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int64_t) {} PD_CUSTOM_KERNEL_REGISTER(elementwise_pow_grad, @@ -85,8 +85,8 @@ PD_CUSTOM_KERNEL_REGISTER(elementwise_pow_grad, phi::ElementwisePowGradKernel, float, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int64_t) {} PD_CUSTOM_KERNEL_REGISTER(add_grad, @@ -96,8 +96,8 @@ PD_CUSTOM_KERNEL_REGISTER(add_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(add_double_grad, @@ -107,8 +107,8 @@ PD_CUSTOM_KERNEL_REGISTER(add_double_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(add_triple_grad, @@ -118,8 +118,8 @@ PD_CUSTOM_KERNEL_REGISTER(add_triple_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(divide_grad, @@ -127,8 +127,8 @@ PD_CUSTOM_KERNEL_REGISTER(divide_grad, ALL_LAYOUT, phi::DivideGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int8_t, uint8_t, int16_t, @@ -142,8 +142,8 @@ PD_CUSTOM_KERNEL_REGISTER(divide_double_grad, ALL_LAYOUT, phi::DivideDoubleGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t, bool, @@ -154,11 +154,11 @@ PD_CUSTOM_KERNEL_REGISTER(multiply_grad, ALL_LAYOUT, phi::MultiplyGradKernel, float, - phi::dtype::float16, + phi::float16, int, int64_t, bool, - phi::dtype::bfloat16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(multiply_double_grad, @@ -166,12 +166,12 @@ PD_CUSTOM_KERNEL_REGISTER(multiply_double_grad, ALL_LAYOUT, phi::MultiplyDoubleGradKernel, float, - phi::dtype::float16, + phi::float16, double, int, int64_t, bool, - phi::dtype::bfloat16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(multiply_triple_grad, @@ -179,11 +179,11 @@ PD_CUSTOM_KERNEL_REGISTER(multiply_triple_grad, ALL_LAYOUT, phi::MultiplyTripleGradKernel, float, - phi::dtype::float16, + phi::float16, int, int64_t, bool, - phi::dtype::bfloat16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(subtract_grad, @@ -193,8 +193,8 @@ PD_CUSTOM_KERNEL_REGISTER(subtract_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(subtract_double_grad, @@ -204,8 +204,8 @@ PD_CUSTOM_KERNEL_REGISTER(subtract_double_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(copysign_grad, @@ -219,5 +219,5 @@ PD_CUSTOM_KERNEL_REGISTER(copysign_grad, int, int64_t, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_kernel_register.cc index ef794ef1936..f0b57a43d95 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_kernel_register.cc @@ -15,8 +15,8 @@ #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/kernels/kps/elementwise_kernel.cu" // NOLINT -using float16 = phi::dtype::float16; -using bfloat16 = phi::dtype::bfloat16; +using float16 = phi::float16; +using bfloat16 = phi::bfloat16; using complex64 = ::phi::dtype::complex; PD_CUSTOM_KERNEL_REGISTER(maximum, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_legacy_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_legacy_kernel.cu index 0ee2a272f7b..4a29ddc9b79 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_legacy_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_legacy_kernel.cu @@ -46,8 +46,8 @@ PD_REGISTER_KERNEL( } #else -using float16 = phi::dtype::float16; -using bfloat16 = phi::dtype::bfloat16; +using float16 = phi::float16; +using bfloat16 = phi::bfloat16; using complex64 = ::phi::dtype::complex; using complex128 = ::phi::dtype::complex; diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_multiply_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_multiply_kernel_register.cc index a4abbbce360..f98a7356103 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_multiply_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/elementwise_multiply_kernel_register.cc @@ -28,7 +28,7 @@ PD_CUSTOM_KERNEL_REGISTER(multiply_raw_sr, int, int64_t, bool, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, complex64, complex128) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_grad_kernel_register.cc index 09d980e00ad..30dd5a8b9f1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_grad_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(embedding_grad, ALL_LAYOUT, phi::EmbeddingGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(embedding_sparse_grad, @@ -29,6 +29,6 @@ PD_CUSTOM_KERNEL_REGISTER(embedding_sparse_grad, ALL_LAYOUT, phi::EmbeddingSparseGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_kernel_register.cc index 4b93f8c37be..dd884849129 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_kernel_register.cc @@ -21,6 +21,6 @@ PD_CUSTOM_KERNEL_REGISTER(embedding, phi::EmbeddingKernel, float, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_with_scaled_gradient_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_with_scaled_gradient_grad_kernel_register.cu index d1bf841adaa..ab841c79506 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_with_scaled_gradient_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/embedding_with_scaled_gradient_grad_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(embedding_with_scaled_gradient_grad, phi::EmbeddingWithScaledGradientGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/empty_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/empty_kernel_register.cc index b8ea03f8785..1890487f49b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/empty_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/empty_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(empty, int, int64_t, bool, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(empty_like, @@ -41,8 +41,8 @@ PD_CUSTOM_KERNEL_REGISTER(empty_like, int, int64_t, bool, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) { kernel->InputAt(0).SetBackend(phi::Backend::ALL_BACKEND); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/erf_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/erf_grad_kernel_register.cu index 150f5b92561..0e1ffc512b8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/erf_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/erf_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(erf_grad, phi::ErfGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/erf_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/erf_kernel_register.cu index 8ea9c0e33fa..ae4c1277a65 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/erf_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/erf_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(erf, phi::ErfKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/erfinv_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/erfinv_grad_kernel_register.cu index 03e630b4966..0559de68172 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/erfinv_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/erfinv_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(erfinv_grad, phi::ErfinvGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/erfinv_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/erfinv_kernel_register.cu index b109c333307..ca34bc787f4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/erfinv_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/erfinv_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(erfinv, phi::ErfinvKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/expand_as_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/expand_as_grad_kernel_register.cu index b32916fd8f4..408920393e8 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/expand_as_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/expand_as_grad_kernel_register.cu @@ -22,4 +22,4 @@ PD_CUSTOM_KERNEL_REGISTER(expand_as_grad, double, int, int64_t, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/expand_as_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/expand_as_kernel_register.cu index f1226d76d58..801fd304575 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/expand_as_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/expand_as_kernel_register.cu @@ -23,4 +23,4 @@ PD_CUSTOM_KERNEL_REGISTER(expand_as, int, int64_t, bool, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/expand_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/expand_grad_kernel_register.cu index af75f0ba828..7d73084d4a5 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/expand_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/expand_grad_kernel_register.cu @@ -27,7 +27,7 @@ PD_CUSTOM_KERNEL_REGISTER(expand_grad, int16_t, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/expand_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/expand_kernel_register.cc index 8a94abcf0f1..3fba8380203 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/expand_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/expand_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(expand, int16_t, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/exponential_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/exponential_kernel_register.cu index f24eedc6d13..75cbc19fb00 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/exponential_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/exponential_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(exponential, phi::ExponentialKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/eye_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/eye_kernel_register.cu index bdf8b9df19d..40851055b27 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/eye_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/eye_kernel_register.cu @@ -25,7 +25,7 @@ PD_CUSTOM_KERNEL_REGISTER(eye, double, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fake_dequantize_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fake_dequantize_kernel_register.cu index 14e377bf248..555015d160c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fake_dequantize_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fake_dequantize_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(fake_dequantize_max_abs, phi::FakeDequantizeMaxAbsKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(fake_channel_wise_dequantize_max_abs, iluvatar_gpu, @@ -29,4 +29,4 @@ PD_CUSTOM_KERNEL_REGISTER(fake_channel_wise_dequantize_max_abs, phi::FakeChannelWiseDequantizeMaxAbsKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fake_quantize_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fake_quantize_kernel_register.cu index 518221c2a48..d34446a9260 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fake_quantize_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fake_quantize_kernel_register.cu @@ -20,28 +20,28 @@ PD_CUSTOM_KERNEL_REGISTER(fake_quantize_range_abs_max, ALL_LAYOUT, phi::FakeQuantizeRangeAbsMaxKernel, float, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(fake_quantize_abs_max, iluvatar_gpu, ALL_LAYOUT, phi::FakeQuantizeAbsMaxKernel, float, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(fake_quantize_moving_average_abs_max, iluvatar_gpu, ALL_LAYOUT, phi::FakeQuantOrWithDequantMovingAverageAbsMaxKernel, float, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(fake_channel_wise_quantize_abs_max, iluvatar_gpu, ALL_LAYOUT, phi::FakeChannelWiseQuantizeAbsMaxKernel, float, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(fake_channel_wise_quantize_dequantize_abs_max, iluvatar_gpu, @@ -54,11 +54,11 @@ PD_CUSTOM_KERNEL_REGISTER(fake_quantize_dequantize_moving_average_abs_max, ALL_LAYOUT, phi::FakeQuantizeDequantizeMovingAverageAbsMaxKernel, float, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(fake_quantize_dequantize_abs_max, iluvatar_gpu, ALL_LAYOUT, phi::FakeQuantizeDequantizeAbsMaxKernel, float, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fc_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/fc_kernel_register.cc index c66f4ed3cad..0685e4327a9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fc_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fc_kernel_register.cc @@ -16,9 +16,5 @@ #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/kernels/impl/fc_kernel_impl.h" -PD_CUSTOM_KERNEL_REGISTER(fc, - iluvatar_gpu, - ALL_LAYOUT, - phi::fusion::FCKernel, - float, - phi::dtype::float16) {} +PD_CUSTOM_KERNEL_REGISTER( + fc, iluvatar_gpu, ALL_LAYOUT, phi::fusion::FCKernel, float, phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fetch_barrier_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fetch_barrier_kernel_register.cu index ebe95879c79..eb381932706 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fetch_barrier_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fetch_barrier_kernel_register.cu @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(fetch_barrier, double, int, int64_t, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_grad_kernel_register.cc index dc6236eca8d..865655a89ae 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_grad_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(fill_diagonal_grad, float, int64_t, int, - phi::dtype::float16, + phi::float16, bool) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_kernel_register.cc index 64c9ae7a6d6..e0445e730ef 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(fill_diagonal, float, int64_t, int, - phi::dtype::float16, + phi::float16, bool) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_tensor_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_tensor_grad_kernel_register.cc index 93e527f1bee..4a08b0f01d5 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_tensor_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_tensor_grad_kernel_register.cc @@ -25,6 +25,6 @@ PD_CUSTOM_KERNEL_REGISTER(fill_diagonal_tensor_grad, int16_t, int8_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, bool) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_tensor_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_tensor_kernel_register.cc index 492ec8d8ab9..01b4874de8a 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_tensor_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_diagonal_tensor_kernel_register.cc @@ -25,6 +25,6 @@ PD_CUSTOM_KERNEL_REGISTER(fill_diagonal_tensor, int16_t, int8_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, bool) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_grad_kernel_register.cu index 5722468828c..6e2a02f1a8e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_grad_kernel_register.cu @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(fill_grad, double, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, bool) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_kernel_register.cc index 2ef70f2b971..2f4e7ed730e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fill_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fill_kernel_register.cc @@ -28,6 +28,6 @@ PD_CUSTOM_KERNEL_REGISTER(fill, int32_t, int64_t, float, - ::phi::dtype::float16, - ::phi::dtype::bfloat16, + ::phi::float16, + ::phi::bfloat16, ::phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/flash_attn_grad_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/flash_attn_grad_kernel.cu index 4a9b07e0fc3..7fbbec058ca 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/flash_attn_grad_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/flash_attn_grad_kernel.cu @@ -1415,8 +1415,8 @@ PD_REGISTER_PLUGIN_KERNEL(flash_attn_unpadded_grad, #ifdef PADDLE_WITH_COREX float, #endif - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(7).SetBackend(phi::Backend::CPU); // seed_offset } @@ -1427,8 +1427,8 @@ PD_REGISTER_PLUGIN_KERNEL(flash_attn_varlen_qkvpacked_grad, #ifdef PADDLE_WITH_COREX float, #endif - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(5).SetBackend(phi::Backend::CPU); // seed_offset } @@ -1439,8 +1439,8 @@ PD_REGISTER_PLUGIN_KERNEL(flash_attn_grad, #ifdef PADDLE_WITH_COREX float, #endif - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(5).SetBackend(phi::Backend::CPU); // seed_offset } @@ -1451,8 +1451,8 @@ PD_REGISTER_PLUGIN_KERNEL(flash_attn_qkvpacked_grad, #ifdef PADDLE_WITH_COREX float, #endif - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(3).SetBackend(phi::Backend::CPU); // seed_offset } @@ -1460,7 +1460,7 @@ PD_REGISTER_PLUGIN_KERNEL(flashmask_attention_grad, iluvatar_gpu, ALL_LAYOUT, phi::FlashMaskGradKernel, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(6).SetBackend(phi::Backend::CPU); // seed_offset } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/flash_attn_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/flash_attn_kernel.cu index fcc9929b77e..4134e635d4e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/flash_attn_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/flash_attn_kernel.cu @@ -1106,8 +1106,8 @@ PD_REGISTER_PLUGIN_KERNEL(flash_attn_unpadded, #ifdef PADDLE_WITH_COREX float, #endif - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(5).SetBackend( phi::Backend::ALL_BACKEND); // fixed_seed_offset } @@ -1119,8 +1119,8 @@ PD_REGISTER_PLUGIN_KERNEL(flash_attn_varlen_qkvpacked, #ifdef PADDLE_WITH_COREX float, #endif - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(3).SetBackend( phi::Backend::ALL_BACKEND); // fixed_seed_offset } @@ -1132,8 +1132,8 @@ PD_REGISTER_PLUGIN_KERNEL(flash_attn, #ifdef PADDLE_WITH_COREX float, #endif - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(3).SetBackend( phi::Backend::ALL_BACKEND); // fixed_seed_offset } @@ -1145,8 +1145,8 @@ PD_REGISTER_PLUGIN_KERNEL(flash_attn_qkvpacked, #ifdef PADDLE_WITH_COREX float, #endif - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend( phi::Backend::ALL_BACKEND); // fixed_seed_offset } @@ -1155,8 +1155,8 @@ PD_REGISTER_PLUGIN_KERNEL(flashmask_attention, iluvatar_gpu, ALL_LAYOUT, phi::FlashMaskKernel, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(4).SetBackend( phi::Backend::ALL_BACKEND); // fixed_seed_offset } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/flatten_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/flatten_grad_kernel_register.cc index bdae02c2a4f..d938b8ac615 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/flatten_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/flatten_grad_kernel_register.cc @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(flatten_grad, ALL_LAYOUT, phi::FlattenGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, uint8_t, int8_t, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/flatten_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/flatten_kernel_register.cc index 2787c8da489..3631c81fa5e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/flatten_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/flatten_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(flatten, ALL_LAYOUT, phi::FlattenKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, uint8_t, int8_t, int16_t, @@ -33,8 +33,8 @@ PD_CUSTOM_KERNEL_REGISTER(flatten_with_xshape, ALL_LAYOUT, phi::FlattenWithXShapeKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, uint8_t, int8_t, int16_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/flip_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/flip_kernel_register.cc index 4701e73ba75..f33ee9b66b9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/flip_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/flip_kernel_register.cc @@ -24,8 +24,8 @@ PD_CUSTOM_KERNEL_REGISTER(flip, ALL_LAYOUT, phi::FlipKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t, bool, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/frame_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/frame_grad_kernel_register.cu index b436cbaaa8e..366b437d34c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/frame_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/frame_grad_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(frame_grad, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/frame_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/frame_kernel_register.cu index d02afae5edb..c0840373f8c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/frame_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/frame_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(frame, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/full_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/full_kernel_register.cc index f4469164431..50dd738af2a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/full_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/full_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(full, int, int64_t, bool, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(full_like, @@ -40,8 +40,8 @@ PD_CUSTOM_KERNEL_REGISTER(full_like, int, int64_t, bool, - phi::dtype::bfloat16, - phi::dtype::float16, + phi::bfloat16, + phi::float16, phi::dtype::complex) { kernel->InputAt(0).SetBackend(phi::Backend::ALL_BACKEND); } @@ -57,8 +57,8 @@ PD_CUSTOM_KERNEL_REGISTER(full_with_tensor, int, int64_t, bool, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) { kernel->InputAt(0).SetBackend(phi::Backend::CPU); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_adam_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_adam_kernel_register.cu index 478730f383c..8a8c08c6ec2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_adam_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_adam_kernel_register.cu @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(fused_adam, iluvatar_gpu, ALL_LAYOUT, phi::FusedAdamKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double) { // Skip beta1_pow, beta2_pow, skip_update data transform diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_bias_residual_layernorm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_bias_residual_layernorm_kernel_register.cu index f6018d573d9..ed764856168 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_bias_residual_layernorm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_bias_residual_layernorm_kernel_register.cu @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(fused_bias_residual_layernorm, ALL_LAYOUT, phi::fusion::FusedLayerNormKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(3).SetDataType(phi::DataType::FLOAT32); kernel->InputAt(4).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_conv2d_add_act_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_conv2d_add_act_kernel_register.cu index 93052423202..e2dd2289903 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_conv2d_add_act_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_conv2d_add_act_kernel_register.cu @@ -21,4 +21,4 @@ PD_CUSTOM_KERNEL_REGISTER(fused_conv2d_add_act, // cuda_only phi::fusion::FusedConv2dAddActKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_rope_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_rope_grad_kernel_register.cu index 64d4083f0be..ef082f6e6e7 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_rope_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_rope_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(fused_rotary_position_embedding_grad, ALL_LAYOUT, phi::fusion::FusedRopeGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16){}; + phi::float16, + phi::bfloat16){}; diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_rope_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_rope_kernel_register.cu index 23ba04fff9c..9bb3c204963 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_rope_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_rope_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(fused_rotary_position_embedding, ALL_LAYOUT, phi::fusion::FusedRopeKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16){}; + phi::float16, + phi::bfloat16){}; diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_grad_kernel_register.cu index 800a8c3f23d..ee6a2d1b7de 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_grad_kernel_register.cu @@ -22,4 +22,4 @@ PD_CUSTOM_KERNEL_REGISTER(fused_softmax_mask_grad, ALL_LAYOUT, phi::fusion::FusedSoftmaxMaskGradKernel, float, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_kernel_register.cu index d41e948eae2..f0640a365af 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_kernel_register.cu @@ -21,4 +21,4 @@ PD_CUSTOM_KERNEL_REGISTER(fused_softmax_mask, ALL_LAYOUT, phi::fusion::FusedSoftmaxMaskKernel, float, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_upper_triangle_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_upper_triangle_kernel_register.cu index 1562bb77f92..b671a0e6ef9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_upper_triangle_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_upper_triangle_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(fused_softmax_mask_upper_triangle, ALL_LAYOUT, phi::fusion::FusedSoftmaxMaskFuseUpperTriangleKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_stack_transpose_quant_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_stack_transpose_quant_kernel_register.cu index 749eb2d482e..8579c482fd4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_stack_transpose_quant_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_stack_transpose_quant_kernel_register.cu @@ -20,7 +20,7 @@ PD_CUSTOM_KERNEL_REGISTER(fused_stack_transpose_quant, iluvatar_gpu, ALL_LAYOUT, phi::fusion::FusedStackTransposeQuantKernel, - phi::dtype::bfloat16) { + phi::bfloat16) { kernel->OutputAt(0).SetDataType(phi::DataType::FLOAT8_E4M3FN); kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_transpose_split_quant_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_transpose_split_quant_kernel_register.cu index 3e829e02d0b..d0126cedd9f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_transpose_split_quant_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_transpose_split_quant_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(fused_transpose_split_quant, double, int, int64_t, - phi::dtype::bfloat16) { + phi::bfloat16) { kernel->OutputAt(0).SetDataType(phi::DataType::FLOAT8_E4M3FN); kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_transpose_wlch_split_quant_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_transpose_wlch_split_quant_kernel_register.cu index 32144f2327e..3b3d99e0918 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_transpose_wlch_split_quant_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_transpose_wlch_split_quant_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(fused_transpose_wlch_split_quant, iluvatar_gpu, ALL_LAYOUT, phi::fusion::FusedTransposeWLCHSplitQuantKernel, - phi::dtype::bfloat16) { + phi::bfloat16) { kernel->OutputAt(0).SetDataType(phi::DataType::FLOAT8_E4M3FN); kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fusion_group_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fusion_group_kernel_register.cu index 309f8e0ce54..ebed5a88385 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fusion_group_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fusion_group_kernel_register.cu @@ -22,6 +22,6 @@ PD_CUSTOM_KERNEL_REGISTER(fusion_group, phi::fusion::FusionGroupKernel, float, double, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gammaln_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/gammaln_kernel_register.cu index ee5bcdfa7ae..2fa02e334ee 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gammaln_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gammaln_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(gammaln, phi::GammalnKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gather_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/gather_grad_kernel_register.cc index 33eae45ff60..8b47dd602fd 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gather_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gather_grad_kernel_register.cc @@ -22,6 +22,6 @@ PD_CUSTOM_KERNEL_REGISTER(gather_grad, float, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gather_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/gather_kernel_register.cc index a62c03028c5..3074887b754 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gather_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gather_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(gather, bool, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gather_nd_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/gather_nd_grad_kernel_register.cc index a424a53fa28..2d5e61628ff 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gather_nd_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gather_nd_grad_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(gather_nd_grad, int8_t, int16_t, bool, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gather_nd_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/gather_nd_kernel_register.cc index c9361062577..b04c1009c73 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gather_nd_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gather_nd_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(gather_nd, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gaussian_inplace_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/gaussian_inplace_grad_kernel_register.cu index 4a5373cb6e9..f764864dc3d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gaussian_inplace_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gaussian_inplace_grad_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(gaussian_inplace_grad, phi::GaussianInplaceGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gaussian_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/gaussian_kernel_register.cc index e37ffc33227..8b187472040 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gaussian_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gaussian_kernel_register.cc @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(gaussian, iluvatar_gpu, ALL_LAYOUT, phi::GaussianKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, phi::dtype::complex) {} @@ -28,7 +28,7 @@ PD_CUSTOM_KERNEL_REGISTER(gaussian_inplace, iluvatar_gpu, ALL_LAYOUT, phi::GaussianInplaceKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gelu_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/gelu_grad_kernel_register.cc index 2a26847e518..12b00ec1e37 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gelu_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gelu_grad_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(gelu_grad, ALL_LAYOUT, phi::GeluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gelu_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/gelu_kernel_register.cc index eabbf81a3ec..bb6088f547b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gelu_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gelu_kernel_register.cc @@ -24,5 +24,5 @@ PD_CUSTOM_KERNEL_REGISTER(gelu, ALL_LAYOUT, phi::GeluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/global_gather_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/global_gather_kernel_register.cu index bbeaa102739..321a9d817db 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/global_gather_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/global_gather_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(global_gather, double, int, int64_t, - phi::dtype::float16) { + phi::float16) { kernel->InputAt(1).SetDataType(phi::DataType::INT64); kernel->InputAt(2).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/global_scatter_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/global_scatter_kernel_register.cu index e2fe3370d21..aba9ddbd176 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/global_scatter_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/global_scatter_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(global_scatter, double, int, int64_t, - phi::dtype::float16) { + phi::float16) { kernel->InputAt(1).SetDataType(phi::DataType::INT64); kernel->InputAt(2).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/group_norm_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/group_norm_grad_kernel_register.cu index 8f1fd80a5f9..38dffe3d7df 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/group_norm_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/group_norm_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(group_norm_grad, phi::GroupNormGradKernel, float, double, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/group_norm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/group_norm_kernel_register.cu index eea404e6a63..10dbacbd079 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/group_norm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/group_norm_kernel_register.cu @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(group_norm, phi::GroupNormKernel, float, double, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { if (kernel_key.dtype() == phi::DataType::BFLOAT16 || kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); @@ -34,8 +34,8 @@ PD_CUSTOM_KERNEL_REGISTER(add_group_norm_silu, iluvatar_gpu, ALL_LAYOUT, phi::GroupNormNDHWCKernel, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(3).SetDataType(phi::DataType::FLOAT32); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gumbel_softmax_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/gumbel_softmax_grad_kernel_register.cu index 6f11551b27f..ccbcb764c79 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gumbel_softmax_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gumbel_softmax_grad_kernel_register.cu @@ -20,6 +20,6 @@ PD_CUSTOM_KERNEL_REGISTER(gumbel_softmax_grad, iluvatar_gpu, ALL_LAYOUT, phi::GumbelSoftmaxGradKernel, - phi::dtype::float16, + phi::float16, float, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/gumbel_softmax_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/gumbel_softmax_kernel_register.cu index 74e7995007b..979b13ad0f8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/gumbel_softmax_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/gumbel_softmax_kernel_register.cu @@ -19,6 +19,6 @@ PD_CUSTOM_KERNEL_REGISTER(gumbel_softmax, iluvatar_gpu, ALL_LAYOUT, phi::GumbelSoftmaxKernel, - phi::dtype::float16, + phi::float16, float, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/huber_loss_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/huber_loss_grad_kernel_register.cu index fa5808b6625..2314d53a935 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/huber_loss_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/huber_loss_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(huber_loss_grad, phi::HuberLossGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/huber_loss_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/huber_loss_kernel_register.cu index 6e1647bb21c..6c3b262a194 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/huber_loss_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/huber_loss_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(huber_loss, phi::HuberLossKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_add_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_add_grad_kernel_register.cu index 34fa0d3a34f..0709702478e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_add_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_add_grad_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(index_add_grad, phi::IndexAddGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_add_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_add_kernel_register.cu index 440d72a9532..90ab6eeded6 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_add_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_add_kernel_register.cu @@ -20,7 +20,7 @@ PD_CUSTOM_KERNEL_REGISTER(index_add, phi::IndexAddKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_elementwise_get_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_elementwise_get_grad_kernel_register.cu index c3f49df03b0..a27dd3921d3 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_elementwise_get_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_elementwise_get_grad_kernel_register.cu @@ -27,7 +27,7 @@ PD_CUSTOM_KERNEL_REGISTER(index_elementwise_get_grad, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_elementwise_get_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_elementwise_get_kernel_register.cu index 63b38a26e78..b35585e305d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_elementwise_get_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_elementwise_get_kernel_register.cu @@ -27,7 +27,7 @@ PD_CUSTOM_KERNEL_REGISTER(index_elementwise_get, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_put_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_put_grad_kernel_register.cu index d366eeabe97..65ec91c5840 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_put_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_put_grad_kernel_register.cu @@ -29,7 +29,7 @@ PD_CUSTOM_KERNEL_REGISTER(index_put_grad, int16_t, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_put_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/index_put_kernel_register.cc index 49d10cd52d7..5087ce08c46 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_put_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_put_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(index_put, int16_t, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_sample_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_sample_grad_kernel_register.cu index 0764a71e6f5..ea93ba512fa 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_sample_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_sample_grad_kernel_register.cu @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(index_sample_grad, iluvatar_gpu, ALL_LAYOUT, phi::IndexSampleGradKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_sample_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_sample_kernel_register.cu index b1368e8b23e..c0c862f03e2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_sample_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_sample_kernel_register.cu @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(index_sample, iluvatar_gpu, ALL_LAYOUT, phi::IndexSampleKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_select_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_select_grad_kernel_register.cu index 98ba688305e..cb767cda788 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_select_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_select_grad_kernel_register.cu @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(index_select_grad, phi::IndexSelectGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/index_select_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/index_select_kernel_register.cu index b48f63bd6e6..1da6f86d11e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/index_select_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/index_select_kernel_register.cu @@ -22,8 +22,8 @@ PD_CUSTOM_KERNEL_REGISTER(index_select, float, double, phi::dtype::float8_e4m3fn, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/interpolate_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/interpolate_grad_kernel_register.cu index 6309441310e..45877ea72c9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/interpolate_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/interpolate_grad_kernel_register.cu @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(bilinear_interp_grad, ALL_LAYOUT, phi::BilinearInterpGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend(phi::Backend::CPU); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(3).SetBackend(phi::Backend::ALL_BACKEND); @@ -31,8 +31,8 @@ PD_CUSTOM_KERNEL_REGISTER(legacy_bilinear_interp_grad, ALL_LAYOUT, phi::LegacyBilinearInterpGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend(phi::Backend::CPU); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(3).SetBackend(phi::Backend::ALL_BACKEND); @@ -42,8 +42,8 @@ PD_CUSTOM_KERNEL_REGISTER(nearest_interp_grad, ALL_LAYOUT, phi::NearestInterpGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend(phi::Backend::CPU); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(3).SetBackend(phi::Backend::ALL_BACKEND); @@ -53,8 +53,8 @@ PD_CUSTOM_KERNEL_REGISTER(legacy_nearest_interp_grad, ALL_LAYOUT, phi::LegacyNearestInterpGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend(phi::Backend::CPU); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(3).SetBackend(phi::Backend::ALL_BACKEND); @@ -64,8 +64,8 @@ PD_CUSTOM_KERNEL_REGISTER(trilinear_interp_grad, ALL_LAYOUT, phi::TrilinearInterpGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend(phi::Backend::CPU); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(3).SetBackend(phi::Backend::ALL_BACKEND); @@ -75,8 +75,8 @@ PD_CUSTOM_KERNEL_REGISTER(linear_interp_grad, ALL_LAYOUT, phi::LinearInterpGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend(phi::Backend::CPU); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(3).SetBackend(phi::Backend::ALL_BACKEND); @@ -86,8 +86,8 @@ PD_CUSTOM_KERNEL_REGISTER(bicubic_interp_grad, ALL_LAYOUT, phi::BicubicInterpGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetBackend(phi::Backend::CPU); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(3).SetBackend(phi::Backend::ALL_BACKEND); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/interpolate_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/interpolate_kernel_register.cc index cf8f2213b7a..7c3fa80b4ef 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/interpolate_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/interpolate_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(bilinear_interp, ALL_LAYOUT, phi::BilinearInterpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); @@ -32,8 +32,8 @@ PD_CUSTOM_KERNEL_REGISTER(legacy_bilinear_interp, ALL_LAYOUT, phi::LegacyBilinearInterpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); @@ -44,8 +44,8 @@ PD_CUSTOM_KERNEL_REGISTER(nearest_interp, ALL_LAYOUT, phi::NearestInterpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); @@ -57,8 +57,8 @@ PD_CUSTOM_KERNEL_REGISTER(legacy_nearest_interp, ALL_LAYOUT, phi::LegacyNearestInterpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); @@ -70,8 +70,8 @@ PD_CUSTOM_KERNEL_REGISTER(trilinear_interp, ALL_LAYOUT, phi::TrilinearInterpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); @@ -82,8 +82,8 @@ PD_CUSTOM_KERNEL_REGISTER(linear_interp, ALL_LAYOUT, phi::LinearInterpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); @@ -94,8 +94,8 @@ PD_CUSTOM_KERNEL_REGISTER(bicubic_interp, ALL_LAYOUT, phi::BicubicInterpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int) { kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/isclose_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/isclose_kernel_register.cu index 9897819bb07..f02382b97b1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/isclose_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/isclose_kernel_register.cu @@ -21,6 +21,6 @@ PD_CUSTOM_KERNEL_REGISTER(isclose, phi::IscloseKernel, float, double, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/isfinite_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/isfinite_kernel_register.cc index e4769d52092..b0511002425 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/isfinite_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/isfinite_kernel_register.cc @@ -22,6 +22,6 @@ PD_CUSTOM_KERNEL_REGISTER(isfinite_sr, phi::IsfiniteSR, float, double, - phi::dtype::float16, + phi::float16, int, int64_t) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/isfinite_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/isfinite_kernel_register.cu index 7239b7e30dd..4655cd43725 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/isfinite_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/isfinite_kernel_register.cu @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(isinf, phi::IsinfKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t, int16_t, @@ -39,8 +39,8 @@ PD_CUSTOM_KERNEL_REGISTER(isnan, phi::IsnanKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t, phi::dtype::complex, @@ -54,8 +54,8 @@ PD_CUSTOM_KERNEL_REGISTER(isfinite, phi::IsfiniteKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t, phi::dtype::complex, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/kron_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/kron_grad_kernel_register.cu index 8f0463f8ef0..6b2a9bd1582 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/kron_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/kron_grad_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(kron_grad, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/kron_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/kron_kernel_register.cu index 0657c9b9267..f4ab4d3ad0b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/kron_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/kron_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(kron, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/kthvalue_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/kthvalue_grad_kernel_register.cu index d75a7feddac..ac37ec59829 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/kthvalue_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/kthvalue_grad_kernel_register.cu @@ -26,5 +26,5 @@ PD_CUSTOM_KERNEL_REGISTER(kthvalue_grad, double, int, int64_t, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/kthvalue_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/kthvalue_kernel_register.cu index 0de40a327f1..ac427c434db 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/kthvalue_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/kthvalue_kernel_register.cu @@ -28,7 +28,7 @@ PD_CUSTOM_KERNEL_REGISTER(kthvalue, double, int, int64_t, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { kernel->OutputAt(1).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/label_smooth_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/label_smooth_grad_kernel_register.cu index c348464a929..112b44341af 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/label_smooth_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/label_smooth_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(label_smooth_grad, phi::LabelSmoothGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/label_smooth_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/label_smooth_kernel_register.cu index 42dbe02d28e..c327f59456e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/label_smooth_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/label_smooth_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(label_smooth, phi::LabelSmoothKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/lamb_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/lamb_kernel_register.cu index 46a690a2348..198f3fa2069 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/lamb_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/lamb_kernel_register.cu @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(lamb, iluvatar_gpu, ALL_LAYOUT, phi::LambKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double) { kernel->InputAt(5).SetBackend(phi::Backend::ALL_BACKEND); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/layer_norm_grad_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/layer_norm_grad_kernel.cu index 61b5c8e337f..719553c7bc2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/layer_norm_grad_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/layer_norm_grad_kernel.cu @@ -114,8 +114,8 @@ PD_REGISTER_PLUGIN_KERNEL(layer_norm_grad, ALL_LAYOUT, phi::LayerNormGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/layer_norm_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/layer_norm_kernel.cu index c74deade4d6..d719dbd965e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/layer_norm_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/layer_norm_kernel.cu @@ -674,8 +674,8 @@ PD_REGISTER_PLUGIN_KERNEL(layer_norm, ALL_LAYOUT, phi::LayerNormKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::DataType::UNDEFINED); kernel->OutputAt(2).SetDataType(phi::DataType::UNDEFINED); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/legacy_expand_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/legacy_expand_grad_kernel_register.cu index 289bd33f19f..e1cf5c9852b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/legacy_expand_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/legacy_expand_grad_kernel_register.cu @@ -23,4 +23,4 @@ PD_CUSTOM_KERNEL_REGISTER(legacy_expand_grad, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/lerp_grad_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/lerp_grad_kernel.cu index 0f50174c70b..391cac0082f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/lerp_grad_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/lerp_grad_kernel.cu @@ -19,7 +19,7 @@ PD_CUSTOM_KERNEL_REGISTER(lerp_grad, iluvatar_gpu, ALL_LAYOUT, phi::LerpGradKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/lerp_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/lerp_kernel.cu index 6fffa2517c5..edf14a60e5b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/lerp_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/lerp_kernel.cu @@ -19,7 +19,7 @@ PD_CUSTOM_KERNEL_REGISTER(lerp, iluvatar_gpu, ALL_LAYOUT, phi::LerpKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/lgamma_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/lgamma_grad_kernel_register.cu index 07c9e6fd875..1bde0510bef 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/lgamma_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/lgamma_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(lgamma_grad, phi::LgammaGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/lgamma_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/lgamma_kernel_register.cu index ea9acdcb416..06478dfd78c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/lgamma_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/lgamma_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(lgamma, phi::LgammaKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/linspace_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/linspace_kernel_register.cu index be062827548..e2dedb90121 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/linspace_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/linspace_kernel_register.cu @@ -23,8 +23,8 @@ PD_CUSTOM_KERNEL_REGISTER(linspace, int32_t, int64_t, double, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(0).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(1).SetBackend(phi::Backend::ALL_BACKEND); kernel->InputAt(2).SetBackend(phi::Backend::ALL_BACKEND); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/log_softmax_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/log_softmax_grad_kernel_register.cu index 440185fd334..84e7f24fa16 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/log_softmax_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/log_softmax_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(log_softmax_grad, ALL_LAYOUT, phi::LogSoftmaxGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/log_softmax_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/log_softmax_kernel_register.cu index bd0dd372fc3..35a64feb66d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/log_softmax_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/log_softmax_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(log_softmax, ALL_LAYOUT, phi::LogSoftmaxKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/logcumsumexp_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/logcumsumexp_grad_kernel_register.cu index b1fdc06775a..c018ca7e6fe 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/logcumsumexp_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/logcumsumexp_grad_kernel_register.cu @@ -28,8 +28,8 @@ PD_CUSTOM_KERNEL_REGISTER(logcumsumexp_grad, iluvatar_gpu, ALL_LAYOUT, phi::LogcumsumexpGradKernel, - phi::dtype::float16, + phi::float16, float, double, - phi::dtype::bfloat16) {} + phi::bfloat16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/logical_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/logical_kernel_register.cc index 335855e24d3..c17334451e4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/logical_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/logical_kernel_register.cc @@ -21,8 +21,8 @@ ALL_LAYOUT, \ phi::Logical##func_type##Kernel, \ float, \ - phi::dtype::float16, \ - phi::dtype::bfloat16, \ + phi::float16, \ + phi::bfloat16, \ bool, \ int64_t, \ int, \ diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/logspace_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/logspace_kernel_register.cu index 2f42490d7ff..e98d8cfd3a6 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/logspace_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/logspace_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(logspace, int32_t, int64_t, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/logsumexp_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/logsumexp_grad_kernel_register.cu index aa9d1c98683..b19ae0b1269 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/logsumexp_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/logsumexp_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(logsumexp_grad, phi::LogsumexpGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/logsumexp_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/logsumexp_kernel_register.cc index f1a64a84df4..380aae32e61 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/logsumexp_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/logsumexp_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(logsumexp, ALL_LAYOUT, phi::LogsumexpKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/lookup_table_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/lookup_table_grad_kernel_register.cu index 5535637b352..243b0985fe7 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/lookup_table_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/lookup_table_grad_kernel_register.cu @@ -20,7 +20,7 @@ PD_CUSTOM_KERNEL_REGISTER(lookup_table_grad, phi::LookupTableGradCUDAKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(lookup_table_sparse_grad, iluvatar_gpu, @@ -28,4 +28,4 @@ PD_CUSTOM_KERNEL_REGISTER(lookup_table_sparse_grad, phi::LookupTableSparseGradCUDAKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/lookup_table_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/lookup_table_kernel_register.cu index 30b58c16f63..916f0175063 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/lookup_table_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/lookup_table_kernel_register.cu @@ -21,6 +21,6 @@ PD_CUSTOM_KERNEL_REGISTER(lookup_table, phi::LookupTableCUDAKernel, float, double, - phi::dtype::float16, + phi::float16, int8_t, int16_t) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/margin_cross_entropy_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/margin_cross_entropy_grad_kernel_register.cu index b28610259b7..821400e7984 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/margin_cross_entropy_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/margin_cross_entropy_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(margin_cross_entropy_grad, phi::MarginCrossEntropyGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/margin_cross_entropy_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/margin_cross_entropy_kernel_register.cu index 1736784c15b..df1be727628 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/margin_cross_entropy_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/margin_cross_entropy_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(margin_cross_entropy, phi::MarginCrossEntropyKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/mask_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/mask_grad_kernel_register.cu index 419c0555ffb..2df46b749c8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/mask_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/mask_grad_kernel_register.cu @@ -22,7 +22,7 @@ PD_CUSTOM_KERNEL_REGISTER(mask_as_coo_grad, phi::sparse::MaskAsCooGradKernel, float, double, - phi::dtype::float16, + phi::float16, uint8_t, int8_t, int16_t, @@ -40,7 +40,7 @@ PD_CUSTOM_KERNEL_REGISTER(mask_as_csr_grad, phi::sparse::MaskAsCsrGradKernel, float, double, - phi::dtype::float16, + phi::float16, uint8_t, int8_t, int16_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/mask_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/mask_kernel_register.cu index 7f8687b52c0..ec8076bd9d8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/mask_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/mask_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(mask_helper_coo, phi::sparse::MaskHelperCooKernel, float, double, - phi::dtype::float16, + phi::float16, uint8_t, int16_t, int, @@ -37,7 +37,7 @@ PD_CUSTOM_KERNEL_REGISTER(mask_as_coo, phi::sparse::MaskAsCooKernel, float, double, - phi::dtype::float16, + phi::float16, uint8_t, int8_t, int16_t, @@ -55,7 +55,7 @@ PD_CUSTOM_KERNEL_REGISTER(mask_as_csr, phi::sparse::MaskAsCsrKernel, float, double, - phi::dtype::float16, + phi::float16, uint8_t, int8_t, int16_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_fill_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_fill_grad_kernel_register.cu index b8470dfd4b0..41891bb2e49 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_fill_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_fill_grad_kernel_register.cu @@ -28,8 +28,8 @@ PD_CUSTOM_KERNEL_REGISTER(masked_fill_grad, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) { kernel->InputAt(1).SetDataType(phi::DataType::BOOL); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_fill_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_fill_kernel_register.cu index a70ee851d35..ffc7f2f4b40 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_fill_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_fill_kernel_register.cu @@ -28,8 +28,8 @@ PD_CUSTOM_KERNEL_REGISTER(masked_fill, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) { kernel->InputAt(1).SetDataType(phi::DataType::BOOL); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_multihead_attention_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_multihead_attention_kernel_register.cu index e35b5416046..d32e3a54cc4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_multihead_attention_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_multihead_attention_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(masked_multihead_attention, ALL_LAYOUT, phi::fusion::MMHAKernel, float, - phi::dtype::float16, + phi::float16, int32_t) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_select_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_select_grad_kernel_register.cu index 1d5c520e3a1..ce7cd83f260 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_select_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_select_grad_kernel_register.cu @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(masked_select_grad, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_select_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_select_kernel.cu index 39716a19665..44872fa64c0 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/masked_select_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/masked_select_kernel.cu @@ -108,8 +108,8 @@ PD_REGISTER_PLUGIN_KERNEL(masked_select, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) { kernel->InputAt(1).SetDataType(phi::DataType::BOOL); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/matmul_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/matmul_grad_kernel_register.cc index cab6cb18206..0f6dca45d8e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/matmul_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/matmul_grad_kernel_register.cc @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(matmul_grad, ALL_LAYOUT, phi::MatmulGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(matmul_double_grad, @@ -30,7 +30,7 @@ PD_CUSTOM_KERNEL_REGISTER(matmul_double_grad, ALL_LAYOUT, phi::MatmulDoubleGradKernel, float, - phi::dtype::float16, + phi::float16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(matmul_triple_grad, @@ -38,7 +38,7 @@ PD_CUSTOM_KERNEL_REGISTER(matmul_triple_grad, ALL_LAYOUT, phi::MatmulTripleGradKernel, float, - phi::dtype::float16, + phi::float16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(matmul_with_flatten_grad, @@ -46,20 +46,20 @@ PD_CUSTOM_KERNEL_REGISTER(matmul_with_flatten_grad, ALL_LAYOUT, phi::MatmulWithFlattenGradKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(matmul_with_flatten_double_grad, iluvatar_gpu, ALL_LAYOUT, phi::MatmulWithFlattenDoubleGradKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(legacy_matmul_grad, iluvatar_gpu, ALL_LAYOUT, phi::LegacyMatmulGradKernel, float, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/matmul_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/matmul_kernel_register.cc index a80ca48b7c4..776c73f0780 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/matmul_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/matmul_kernel_register.cc @@ -23,8 +23,8 @@ PD_CUSTOM_KERNEL_REGISTER(matmul, float, int32_t, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, int8_t) { if (kernel_key.dtype() == phi::DataType::INT8) { @@ -41,8 +41,8 @@ PD_CUSTOM_KERNEL_REGISTER(matmul_with_flatten, phi::MatmulWithFlattenKernel, int8_t, float, - phi::dtype::bfloat16, - phi::dtype::float16) { + phi::bfloat16, + phi::float16) { if (kernel_key.dtype() == phi::DataType::INT8) { kernel->OutputAt(0).SetDataType(phi::DataType::INT32); } @@ -53,7 +53,7 @@ PD_REGISTER_PLUGIN_KERNEL(legacy_matmul, ALL_LAYOUT, phi::LegacyMatmulKernel, float, - phi::dtype::float16, + phi::float16, int8_t) { if (kernel_key.dtype() == phi::DataType::INT8) { kernel->OutputAt(0).SetDataType(phi::DataType::INT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/maxout_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/maxout_grad_kernel_register.cu index 579d75c2eb3..731ba5ec5bf 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/maxout_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/maxout_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(maxout_grad, ALL_LAYOUT, phi::MaxOutGradKernel, float, - phi::dtype::float16, + phi::float16, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/maxout_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/maxout_kernel_register.cu index c0351719327..afbc9a8176f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/maxout_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/maxout_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(maxout, ALL_LAYOUT, phi::MaxOutKernel, float, - phi::dtype::float16, + phi::float16, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/mean_all_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/mean_all_grad_kernel_register.cc index df7332cd4b4..caf0df4031e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/mean_all_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/mean_all_grad_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(mean_all_grad, ALL_LAYOUT, phi::MeanAllGradKernel, float, - phi::dtype::float16, + phi::float16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/mean_all_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/mean_all_kernel_register.cc index 7fd931d6354..0906ffeaa53 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/mean_all_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/mean_all_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(mean_all, ALL_LAYOUT, phi::MeanAllKernel, float, - phi::dtype::float16, + phi::float16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/merged_momentum_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/merged_momentum_kernel_register.cu index 67337b3429a..73ca326ccfc 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/merged_momentum_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/merged_momentum_kernel_register.cu @@ -20,7 +20,7 @@ PD_CUSTOM_KERNEL_REGISTER(merged_momentum, iluvatar_gpu, ALL_LAYOUT, phi::MergedMomentumKernel, - phi::dtype::float16, + phi::float16, float, double) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/meshgrid_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/meshgrid_grad_kernel_register.cc index a7a98e5b268..d2d34b80e69 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/meshgrid_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/meshgrid_grad_kernel_register.cc @@ -21,11 +21,11 @@ PD_CUSTOM_KERNEL_REGISTER(meshgrid_grad, iluvatar_gpu, ALL_LAYOUT, phi::MeshgridGradKernel, - phi::dtype::float16, + phi::float16, float, double, int, int64_t, - phi::dtype::bfloat16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/meshgrid_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/meshgrid_kernel_register.cc index 5c33dba422d..3ead5188983 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/meshgrid_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/meshgrid_kernel_register.cc @@ -21,11 +21,11 @@ PD_CUSTOM_KERNEL_REGISTER(meshgrid, iluvatar_gpu, ALL_LAYOUT, phi::MeshgridKernel, - phi::dtype::float16, + phi::float16, float, double, int, int64_t, - phi::dtype::bfloat16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/mode_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/mode_grad_kernel_register.cu index 7ff4069e1b5..d178cb1e0eb 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/mode_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/mode_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(mode_grad, double, int32_t, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/mode_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/mode_kernel_register.cu index a0281d3cf9f..d3a7d532223 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/mode_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/mode_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(mode, double, int32_t, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/moe_combine_no_weight_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/moe_combine_no_weight_kernel_register.cu index 9f8e8c73bed..8ceaf6586a7 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/moe_combine_no_weight_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/moe_combine_no_weight_kernel_register.cu @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(moe_combine_no_weight, phi::MoeCombineNoWeightKernel, float, double, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/moe_permute_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/moe_permute_kernel_register.cu index 91075eb75b2..80a8927bd3b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/moe_permute_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/moe_permute_kernel_register.cu @@ -18,4 +18,4 @@ PD_CUSTOM_KERNEL_REGISTER(moe_permute, iluvatar_gpu, ALL_LAYOUT, phi::MoePermuteKernel, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/moe_unpermute_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/moe_unpermute_kernel_register.cu index 2b2ead4fde1..826eb0ae2f9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/moe_unpermute_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/moe_unpermute_kernel_register.cu @@ -21,4 +21,4 @@ PD_CUSTOM_KERNEL_REGISTER(moe_unpermute, iluvatar_gpu, ALL_LAYOUT, phi::MoeUnpermuteKernel, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/momentum_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/momentum_kernel_register.cu index f6dc8225080..46d4066d309 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/momentum_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/momentum_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(momentum, phi::MomentumDenseKernel, float, double, - phi::dtype::float16) { + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT32); @@ -34,7 +34,7 @@ PD_CUSTOM_KERNEL_REGISTER(momentum_dense_param_sparse_grad, phi::MomentumSparseKernel, float, double, - phi::dtype::float16) { + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/moving_average_abs_max_scale_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/moving_average_abs_max_scale_kernel_register.cu index 36dd1ad3a3a..05c3cd0e7db 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/moving_average_abs_max_scale_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/moving_average_abs_max_scale_kernel_register.cu @@ -20,4 +20,4 @@ PD_CUSTOM_KERNEL_REGISTER(moving_average_abs_max_scale, ALL_LAYOUT, phi::MovingAverageAbsMaxScaleKernel, float, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/mp_allreduce_sum_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/mp_allreduce_sum_kernel_register.cu index 1e83e6c7609..fc081757c16 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/mp_allreduce_sum_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/mp_allreduce_sum_kernel_register.cu @@ -23,4 +23,4 @@ PD_CUSTOM_KERNEL_REGISTER(mp_allreduce_sum, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/multinomial_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/multinomial_kernel_register.cc index 2a1e2c7982a..42a61a161ba 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/multinomial_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/multinomial_kernel_register.cc @@ -19,8 +19,8 @@ PD_CUSTOM_KERNEL_REGISTER(multinomial, iluvatar_gpu, ALL_LAYOUT, phi::MultinomialKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float) { kernel->OutputAt(0).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/nadam_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/nadam_kernel_register.cu index 502b4b269db..3e5561b2451 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/nadam_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/nadam_kernel_register.cu @@ -20,4 +20,4 @@ PD_CUSTOM_KERNEL_REGISTER(nadam, phi::NAdamKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/nanmedian_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/nanmedian_grad_kernel_register.cu index efd19e901f9..f0fdc15f272 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/nanmedian_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/nanmedian_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(nanmedian_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/nanmedian_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/nanmedian_kernel_register.cu index bf02ea7337f..8bfc279a32d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/nanmedian_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/nanmedian_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(nanmedian, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/nonzero_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/nonzero_kernel_register.cc index f0b5bf2bc83..56827bd9093 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/nonzero_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/nonzero_kernel_register.cc @@ -22,8 +22,8 @@ PD_CUSTOM_KERNEL_REGISTER(nonzero, int64_t, int, int16_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, bool, float) { kernel->OutputAt(0).SetDataType(phi::DataType::INT64); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/nop_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/nop_kernel_register.cu index b0eb68ecf09..2d76dd7bcef 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/nop_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/nop_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(nop, ALL_LAYOUT, phi::NopKernel, float, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/norm_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/norm_grad_kernel_register.cu index dce2be811d0..0139e4de3b4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/norm_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/norm_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(norm_grad, phi::NormGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/norm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/norm_kernel_register.cu index 0cef6adc427..8f8cae6406f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/norm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/norm_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(norm, phi::NormKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/npu_identity_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/npu_identity_kernel_register.cc index 4ba3d1896be..0e6aaa11c5b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/npu_identity_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/npu_identity_kernel_register.cc @@ -44,4 +44,4 @@ PD_CUSTOM_KERNEL_REGISTER(npu_identity, int, int64_t, bool, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/numel_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/numel_kernel_register.cc index cb3755ed1f1..d0d1885b2bf 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/numel_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/numel_kernel_register.cc @@ -24,8 +24,8 @@ PD_CUSTOM_KERNEL_REGISTER(numel, int16_t, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, bool, phi::dtype::complex) { diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/overlap_add_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/overlap_add_grad_kernel_register.cu index 36efbd20932..fafd7debee8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/overlap_add_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/overlap_add_grad_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(overlap_add_grad, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/overlap_add_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/overlap_add_kernel_register.cu index 4460273d827..9bbfe1a128c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/overlap_add_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/overlap_add_kernel_register.cu @@ -22,7 +22,7 @@ PD_CUSTOM_KERNEL_REGISTER(overlap_add, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/p_norm_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/p_norm_grad_kernel_register.cc index c1fa9ba4d0f..1929fe4932e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/p_norm_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/p_norm_grad_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(p_norm_grad, ALL_LAYOUT, phi::PNormGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/p_norm_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/p_norm_kernel_register.cc index a561fc04da0..9f56a6f69b8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/p_norm_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/p_norm_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(p_norm, ALL_LAYOUT, phi::PNormKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/p_recv_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/p_recv_kernel_register.cu index caa405372b8..1ccd90603cc 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/p_recv_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/p_recv_kernel_register.cu @@ -26,4 +26,4 @@ PD_CUSTOM_KERNEL_REGISTER(p_recv_array, int8_t, uint8_t, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/p_send_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/p_send_kernel_register.cu index d226b33e669..b60ff3dd811 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/p_send_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/p_send_kernel_register.cu @@ -27,4 +27,4 @@ PD_CUSTOM_KERNEL_REGISTER(p_send, uint8_t, int16_t, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pad3d_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/pad3d_grad_kernel_register.cu index a5bc3e3ac6d..56b3b35a5d0 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pad3d_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pad3d_grad_kernel_register.cu @@ -26,7 +26,7 @@ PD_CUSTOM_KERNEL_REGISTER(pad3d_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pad3d_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/pad3d_kernel_register.cu index 7d78841acc0..03bba0e1a22 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pad3d_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pad3d_kernel_register.cu @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(pad3d, iluvatar_gpu, ALL_LAYOUT, phi::Pad3dKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pad_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/pad_grad_kernel_register.cc index e6a9b842e62..0031a21c0f8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pad_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pad_grad_kernel_register.cc @@ -20,6 +20,6 @@ PD_CUSTOM_KERNEL_REGISTER(pad_grad, ALL_LAYOUT, phi::PadGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/pad_kernel_register.cc index 26650099617..5c55ed021b9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pad_kernel_register.cc @@ -22,6 +22,6 @@ PD_CUSTOM_KERNEL_REGISTER(pad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_allgather_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_allgather_kernel_register.cu index c461d959df4..6b823955c12 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_allgather_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_allgather_kernel_register.cu @@ -23,10 +23,10 @@ PD_CUSTOM_KERNEL_REGISTER(partial_allgather, phi::PartialAllGatherOpCUDAKernel, float, double, - phi::dtype::bfloat16, + phi::bfloat16, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} #else PD_CUSTOM_KERNEL_REGISTER(partial_allgather, iluvatar_gpu, @@ -36,5 +36,5 @@ PD_CUSTOM_KERNEL_REGISTER(partial_allgather, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_grad_kernel_register.cu index 6652d8c58df..37717361cdf 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_grad_kernel_register.cu @@ -22,6 +22,6 @@ PD_CUSTOM_KERNEL_REGISTER(partial_concat_grad, double, int, int64_t, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_kernel_register.cu index f7198f79329..4f86738add2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_kernel_register.cu @@ -33,6 +33,6 @@ PD_CUSTOM_KERNEL_REGISTER(partial_concat, double, int, int64_t, - phi::dtype::float16, + phi::float16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_recv_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_recv_kernel_register.cu index f7af373bce7..3d6b6d1e9c5 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_recv_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_recv_kernel_register.cu @@ -22,10 +22,10 @@ PD_CUSTOM_KERNEL_REGISTER(partial_recv, phi::PartialRecvKernel, float, double, - phi::dtype::bfloat16, + phi::bfloat16, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} #else PD_CUSTOM_KERNEL_REGISTER(partial_recv, iluvatar_gpu, @@ -35,5 +35,5 @@ PD_CUSTOM_KERNEL_REGISTER(partial_recv, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_send_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_send_kernel_register.cu index 2c6bb9f6805..41596fa0bd4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/partial_send_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/partial_send_kernel_register.cu @@ -22,10 +22,10 @@ PD_CUSTOM_KERNEL_REGISTER(partial_send, phi::PartialSendKernel, float, double, - phi::dtype::bfloat16, + phi::bfloat16, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} #else PD_CUSTOM_KERNEL_REGISTER(partial_send, iluvatar_gpu, @@ -35,5 +35,5 @@ PD_CUSTOM_KERNEL_REGISTER(partial_send, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_shuffle_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_shuffle_grad_kernel_register.cu index 937bd0a374c..62316cf2477 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_shuffle_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_shuffle_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(pixel_shuffle_grad, phi::PixelShuffleGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_shuffle_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_shuffle_kernel_register.cu index a478e4c418d..798280eb9de 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_shuffle_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_shuffle_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(pixel_shuffle, phi::PixelShuffleKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_unshuffle_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_unshuffle_kernel_register.cu index 3c659a25ff5..3a7b37c4ce9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_unshuffle_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pixel_unshuffle_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(pixel_unshuffle, phi::PixelUnshuffleKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/poisson_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/poisson_grad_kernel_register.cu index c3db7fc5ae1..fb33e83a194 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/poisson_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/poisson_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(poisson_grad, phi::PoissonGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/poisson_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/poisson_kernel_register.cu index cf25bdcb02a..31e42b79c9a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/poisson_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/poisson_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(poisson, phi::PoissonKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pool_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/pool_grad_kernel_register.cc index 9a5bae77439..6383213b97c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pool_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pool_grad_kernel_register.cc @@ -23,15 +23,15 @@ PD_CUSTOM_KERNEL_REGISTER(pool2d_grad, ALL_LAYOUT, phi::Pool2dGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(lp_pool2d_grad, iluvatar_gpu, ALL_LAYOUT, phi::LPPool2dGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(pool2d_double_grad, iluvatar_gpu, ALL_LAYOUT, @@ -42,8 +42,8 @@ PD_CUSTOM_KERNEL_REGISTER(max_pool2d_with_index_grad, ALL_LAYOUT, phi::MaxPool2dWithIndexGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetDataType(phi::CppTypeToDataType::Type()); } @@ -52,15 +52,15 @@ PD_CUSTOM_KERNEL_REGISTER(pool3d_grad, ALL_LAYOUT, phi::Pool3dGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(max_pool3d_with_index_grad, iluvatar_gpu, ALL_LAYOUT, phi::MaxPool3dWithIndexGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetDataType(phi::CppTypeToDataType::Type()); } @@ -69,8 +69,8 @@ PD_CUSTOM_KERNEL_REGISTER(fractional_max_pool2d_grad, ALL_LAYOUT, phi::FractionalMaxPool2dGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetDataType(phi::CppTypeToDataType::Type()); } @@ -79,7 +79,7 @@ PD_CUSTOM_KERNEL_REGISTER(fractional_max_pool3d_grad, ALL_LAYOUT, phi::FractionalMaxPool3dGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(1).SetDataType(phi::CppTypeToDataType::Type()); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/pool_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/pool_kernel_register.cc index bc509c24760..021ee853093 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/pool_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/pool_kernel_register.cc @@ -23,22 +23,22 @@ PD_CUSTOM_KERNEL_REGISTER(pool2d, ALL_LAYOUT, phi::Pool2dKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(lp_pool2d, iluvatar_gpu, ALL_LAYOUT, phi::LPPool2dKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(max_pool2d_with_index, iluvatar_gpu, ALL_LAYOUT, phi::MaxPool2dWithIndexKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::CppTypeToDataType::Type()); } @@ -47,15 +47,15 @@ PD_CUSTOM_KERNEL_REGISTER(pool3d, ALL_LAYOUT, phi::Pool3dKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(max_pool3d_with_index, iluvatar_gpu, ALL_LAYOUT, phi::MaxPool3dWithIndexKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::CppTypeToDataType::Type()); } @@ -64,8 +64,8 @@ PD_CUSTOM_KERNEL_REGISTER(fractional_max_pool2d, ALL_LAYOUT, phi::FractionalMaxPool2dKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::CppTypeToDataType::Type()); } @@ -74,7 +74,7 @@ PD_CUSTOM_KERNEL_REGISTER(fractional_max_pool3d, ALL_LAYOUT, phi::FractionalMaxPool3dKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::CppTypeToDataType::Type()); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/prelu_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/prelu_grad_kernel_register.cu index 629c5aa5883..4708666d7ed 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/prelu_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/prelu_grad_kernel_register.cu @@ -20,6 +20,6 @@ PD_CUSTOM_KERNEL_REGISTER(prelu_grad, ALL_LAYOUT, phi::PReluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/prelu_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/prelu_kernel_register.cu index 7398525bdf6..69edb02f4d0 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/prelu_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/prelu_kernel_register.cu @@ -21,6 +21,6 @@ PD_CUSTOM_KERNEL_REGISTER(prelu, ALL_LAYOUT, phi::PReluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/prod_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/prod_grad_kernel_register.cu index c35270f782c..d03ebcd3da4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/prod_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/prod_grad_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(prod_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/prod_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/prod_kernel_register.cc index 84c8e0a326a..21101d8a331 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/prod_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/prod_kernel_register.cc @@ -24,5 +24,5 @@ PD_CUSTOM_KERNEL_REGISTER(prod_infer, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/put_along_axis_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/put_along_axis_grad_kernel_register.cu index 003740ed21a..1056f344579 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/put_along_axis_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/put_along_axis_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(put_along_axis_grad, double, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/put_along_axis_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/put_along_axis_kernel_register.cc index 921f642b998..d15456ae020 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/put_along_axis_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/put_along_axis_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(put_along_axis, float, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/qkv_unpack_mha_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/qkv_unpack_mha_kernel_register.cu index 6c0775a1aa6..a41338b1b3a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/qkv_unpack_mha_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/qkv_unpack_mha_kernel_register.cu @@ -21,4 +21,4 @@ PD_CUSTOM_KERNEL_REGISTER(qkv_unpack_mha, ALL_LAYOUT, phi::fusion::QKVMMHAKernel, float, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/quant_linear_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/quant_linear_kernel_register.cu index 2ba5a631199..45a8147ee70 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/quant_linear_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/quant_linear_kernel_register.cu @@ -23,4 +23,4 @@ PD_CUSTOM_KERNEL_REGISTER(quant_linear, phi::QuantLinearKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/quantize_linear_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/quantize_linear_kernel_register.cu index 040c0fe45a2..a956ff02bf6 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/quantize_linear_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/quantize_linear_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(dequantize_linear, float, int8_t, double, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); } @@ -33,7 +33,7 @@ PD_CUSTOM_KERNEL_REGISTER(quantize_linear, ALL_LAYOUT, phi::QuantizeLinearKernel, float, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); } @@ -44,7 +44,7 @@ PD_CUSTOM_KERNEL_REGISTER(dequantize_linear_deprecated, float, int8_t, double, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); } @@ -53,7 +53,7 @@ PD_CUSTOM_KERNEL_REGISTER(quantize_linear_deprecated_train, ALL_LAYOUT, phi::QuantizeLinearDeprecatedTrainKernel, float, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); } @@ -62,6 +62,6 @@ PD_CUSTOM_KERNEL_REGISTER(quantize_linear_deprecated_infer, ALL_LAYOUT, phi::QuantizeLinearDeprecatedInferKernel, float, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/radam_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/radam_kernel_register.cu index 4cc8a59d781..b78e1cc5bbb 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/radam_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/radam_kernel_register.cu @@ -20,4 +20,4 @@ PD_CUSTOM_KERNEL_REGISTER(radam, phi::RAdamKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/random_routing_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/random_routing_kernel_register.cu index c70c6c71379..d7cb852f4d0 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/random_routing_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/random_routing_kernel_register.cu @@ -21,4 +21,4 @@ PD_CUSTOM_KERNEL_REGISTER(random_routing, phi::RandomRoutingKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/randperm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/randperm_kernel_register.cu index 76a05f4d6fc..d46e2f0437f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/randperm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/randperm_kernel_register.cu @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(randperm, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_as_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_as_grad_kernel_register.cu index c8b6662e9f8..132dc08d1e8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_as_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_as_grad_kernel_register.cu @@ -22,8 +22,8 @@ PD_CUSTOM_KERNEL_REGISTER(reduce_as_grad, bool, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int16_t, int, int64_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_as_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_as_kernel_register.cu index bfd6e9ac473..3b7da5bff4c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_as_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_as_kernel_register.cu @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(reduce_as, bool, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int16_t, int, int64_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_kernel_kps_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_kernel_kps_register.cc index d2ef7f4b846..d5b863f6921 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_kernel_kps_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_kernel_kps_register.cc @@ -27,8 +27,8 @@ #include "paddle/phi/kernels/reduce_min_kernel.h" #include "paddle/phi/kernels/reduce_sum_kernel.h" -using float16 = phi::dtype::float16; -using bfloat16 = phi::dtype::bfloat16; +using float16 = phi::float16; +using bfloat16 = phi::bfloat16; using complex64 = ::phi::dtype::complex; using complex128 = ::phi::dtype::complex; @@ -79,8 +79,8 @@ PD_CUSTOM_KERNEL_REGISTER(max, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(mean_raw, iluvatar_gpu, @@ -88,7 +88,7 @@ PD_CUSTOM_KERNEL_REGISTER(mean_raw, phi::MeanRawKernel, float, bool, - phi::dtype::bfloat16, + phi::bfloat16, float16, int, int64_t, @@ -101,8 +101,8 @@ PD_CUSTOM_KERNEL_REGISTER(min_raw, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sum_raw, iluvatar_gpu, @@ -128,6 +128,6 @@ PD_CUSTOM_KERNEL_REGISTER(prod, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_kernel_register.cc index ef288438bca..2650157d5b9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_kernel_register.cc @@ -25,8 +25,8 @@ PD_CUSTOM_KERNEL_REGISTER(reduce, int8_t, uint8_t, int64_t, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(amax_grad, iluvatar_gpu, @@ -52,8 +52,8 @@ PD_CUSTOM_KERNEL_REGISTER(max_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(mean_grad, iluvatar_gpu, @@ -61,8 +61,8 @@ PD_CUSTOM_KERNEL_REGISTER(mean_grad, phi::ReduceMeanGradKernel, bool, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, int, int64_t) {} @@ -74,8 +74,8 @@ PD_CUSTOM_KERNEL_REGISTER(min_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(sum_grad, iluvatar_gpu, @@ -83,8 +83,8 @@ PD_CUSTOM_KERNEL_REGISTER(sum_grad, phi::ReduceSumGradKernel, bool, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int8_t, uint8_t, int16_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_max_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_max_kernel_register.cc index 5c75076a051..e41f406a0c1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_max_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_max_kernel_register.cc @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(max_raw, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_mean_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_mean_kernel_register.cc index 85fe7979697..68f2bc1b0ac 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_mean_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_mean_kernel_register.cc @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(mean, bool, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_min_kernel.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_min_kernel.cc index adbb0d6dee7..fd3d96a4feb 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_min_kernel.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_min_kernel.cc @@ -26,5 +26,5 @@ PD_CUSTOM_KERNEL_REGISTER(min, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_scatter_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_scatter_kernel_register.cu index d723fce724b..1260bbf59ee 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_scatter_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_scatter_kernel_register.cu @@ -28,8 +28,8 @@ PD_CUSTOM_KERNEL_REGISTER(reduce_scatter, uint8_t, int16_t, int64_t, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} #else PD_CUSTOM_KERNEL_REGISTER(reduce_scatter, iluvatar_gpu, @@ -43,5 +43,5 @@ PD_CUSTOM_KERNEL_REGISTER(reduce_scatter, uint8_t, int16_t, int64_t, - phi::dtype::float16) {} + phi::float16) {} #endif diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_sum_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_sum_kernel_register.cc index bb5f638f51e..893cc62e869 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_sum_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/reduce_sum_kernel_register.cc @@ -23,8 +23,8 @@ PD_CUSTOM_KERNEL_REGISTER(sum, phi::SumKernel, bool, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int16_t, int, int64_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/repeat_interleave_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/repeat_interleave_grad_kernel_register.cu index 1fd6ae7d52f..82b75795049 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/repeat_interleave_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/repeat_interleave_grad_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(repeat_interleave_with_tensor_index_grad, double, int, int64_t, - phi::dtype::bfloat16) {} + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(repeat_interleave_grad, iluvatar_gpu, ALL_LAYOUT, @@ -32,4 +32,4 @@ PD_CUSTOM_KERNEL_REGISTER(repeat_interleave_grad, double, int, int64_t, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/repeat_interleave_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/repeat_interleave_kernel_register.cu index e0d24211894..cecc74dd5af 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/repeat_interleave_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/repeat_interleave_kernel_register.cu @@ -23,7 +23,7 @@ PD_CUSTOM_KERNEL_REGISTER(repeat_interleave, double, int, int64_t, - phi::dtype::bfloat16) {} + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(repeat_interleave_with_tensor_index, iluvatar_gpu, @@ -33,4 +33,4 @@ PD_CUSTOM_KERNEL_REGISTER(repeat_interleave_with_tensor_index, double, int, int64_t, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/rms_norm_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/rms_norm_grad_kernel_register.cc index e669cc26e85..2889859ae44 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/rms_norm_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/rms_norm_grad_kernel_register.cc @@ -25,5 +25,5 @@ PD_CUSTOM_KERNEL_REGISTER(fused_rms_norm_quant_grad, ALL_LAYOUT, phi::RmsNormQuantGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/rms_norm_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/rms_norm_kernel_register.cc index 4dcc3449fb3..cc6049ad76b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/rms_norm_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/rms_norm_kernel_register.cc @@ -42,5 +42,5 @@ PD_CUSTOM_KERNEL_REGISTER(fused_rms_norm_quant, ALL_LAYOUT, phi::RmsNormQuantKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/rmsprop_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/rmsprop_kernel_register.cu index 80ecfecf748..d5ed3797238 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/rmsprop_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/rmsprop_kernel_register.cu @@ -21,7 +21,7 @@ PD_CUSTOM_KERNEL_REGISTER(rmsprop, phi::RmspropDenseKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(rmsprop_dense_param_sparse_grad, iluvatar_gpu, @@ -29,4 +29,4 @@ PD_CUSTOM_KERNEL_REGISTER(rmsprop_dense_param_sparse_grad, phi::RmspropSparseKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/roll_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/roll_grad_kernel_register.cu index 521e755efda..30ebac15b5c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/roll_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/roll_grad_kernel_register.cu @@ -23,8 +23,8 @@ PD_CUSTOM_KERNEL_REGISTER(roll_grad, iluvatar_gpu, ALL_LAYOUT, phi::RollGradKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/roll_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/roll_kernel_register.cu index 1cd668cc737..56776c6cec4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/roll_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/roll_kernel_register.cu @@ -24,8 +24,8 @@ PD_CUSTOM_KERNEL_REGISTER(roll, iluvatar_gpu, ALL_LAYOUT, phi::RollKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, bool, float, double, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/rprop_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/rprop_kernel_register.cu index 4fb7024ce9c..6a5957c2047 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/rprop_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/rprop_kernel_register.cu @@ -25,8 +25,8 @@ PD_CUSTOM_KERNEL_REGISTER(rprop, iluvatar_gpu, ALL_LAYOUT, phi::RpropKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double) { if (kernel_key.dtype() == phi::DataType::FLOAT16 || @@ -41,7 +41,7 @@ PD_CUSTOM_KERNEL_REGISTER(rprop, iluvatar_gpu, ALL_LAYOUT, phi::RpropKernel, - phi::dtype::float16, + phi::float16, float, double) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/rrelu_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/rrelu_grad_kernel_register.cu index 9fb8ed076e7..1eb8d0cb1c5 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/rrelu_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/rrelu_grad_kernel_register.cu @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(rrelu_grad, ALL_LAYOUT, phi::RReluGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/rrelu_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/rrelu_kernel_register.cu index fa7d3ca7f33..66e7e286895 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/rrelu_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/rrelu_kernel_register.cu @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(rrelu, ALL_LAYOUT, phi::RReluKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/scale_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/scale_kernel_register.cc index 5bf12a96d61..d9c5d281c66 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/scale_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/scale_kernel_register.cc @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(scale, phi::ScaleKernel, bool, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, uint8_t, int8_t, int16_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_grad_kernel_register.cc index 7879f263634..47a2b417e1c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_grad_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(scatter_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_kernel_register.cc index d32f24c8e02..2baf225a9e6 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(scatter, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_nd_add_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_nd_add_grad_kernel_register.cc index ef9ecd7a9bb..6dad1e79bb1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_nd_add_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_nd_add_grad_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(scatter_nd_add_grad, float, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_nd_add_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_nd_add_kernel_register.cc index c3a914db2a1..fec70a7caf0 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_nd_add_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/scatter_nd_add_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(scatter_nd_add, float, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/searchsorted_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/searchsorted_kernel_register.cu index 00380bf85d1..4eaa3e25b4f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/searchsorted_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/searchsorted_kernel_register.cu @@ -25,7 +25,7 @@ PD_CUSTOM_KERNEL_REGISTER(searchsorted, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(0).SetDataType(phi::DataType::UNDEFINED); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/segment_pool_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/segment_pool_grad_kernel_register.cu index fdf02fe9e73..23c25789541 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/segment_pool_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/segment_pool_grad_kernel_register.cu @@ -26,5 +26,5 @@ PD_CUSTOM_KERNEL_REGISTER(segment_pool_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/segment_pool_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/segment_pool_kernel_register.cu index 816992e389a..51ac3a3e090 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/segment_pool_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/segment_pool_kernel_register.cu @@ -26,5 +26,5 @@ PD_CUSTOM_KERNEL_REGISTER(segment_pool, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/selu_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/selu_grad_kernel_register.cu index ac06f9bd536..5af7ed2b939 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/selu_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/selu_grad_kernel_register.cu @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(selu_grad, phi::SeluGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/send_u_recv_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/send_u_recv_grad_kernel_register.cu index 17747e09db0..7fc8396a522 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/send_u_recv_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/send_u_recv_grad_kernel_register.cu @@ -24,4 +24,4 @@ PD_CUSTOM_KERNEL_REGISTER(send_u_recv_grad, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/send_u_recv_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/send_u_recv_kernel_register.cu index baeb33145ce..5892aa74c1d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/send_u_recv_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/send_u_recv_kernel_register.cu @@ -34,6 +34,6 @@ PD_CUSTOM_KERNEL_REGISTER(send_u_recv, double, int, int64_t, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(1).SetDataType(phi::DataType::INT32); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/send_ue_recv_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/send_ue_recv_grad_kernel_register.cu index 9587f5ecdb0..cc0a596604c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/send_ue_recv_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/send_ue_recv_grad_kernel_register.cu @@ -32,4 +32,4 @@ PD_CUSTOM_KERNEL_REGISTER(send_ue_recv_grad, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/send_ue_recv_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/send_ue_recv_kernel_register.cu index 6800cf976d3..7cb9d3066a3 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/send_ue_recv_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/send_ue_recv_kernel_register.cu @@ -37,6 +37,6 @@ PD_CUSTOM_KERNEL_REGISTER(send_ue_recv, double, int, int64_t, - phi::dtype::float16) { + phi::float16) { kernel->OutputAt(1).SetDataType(phi::DataType::INT32); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/send_uv_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/send_uv_grad_kernel_register.cu index 5a1d5f2d149..5c0a02c95c6 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/send_uv_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/send_uv_grad_kernel_register.cu @@ -32,4 +32,4 @@ PD_CUSTOM_KERNEL_REGISTER(send_uv_grad, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/send_uv_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/send_uv_kernel_register.cu index a93782e7840..5ba7735c6a5 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/send_uv_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/send_uv_kernel_register.cu @@ -26,4 +26,4 @@ PD_CUSTOM_KERNEL_REGISTER(send_uv, double, int, int64_t, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/set_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/set_kernel_register.cc index 338c1a9e092..b6a821298be 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/set_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/set_kernel_register.cc @@ -28,7 +28,7 @@ PD_CUSTOM_KERNEL_REGISTER(set, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/set_value_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/set_value_grad_kernel_register.cc index 828e9cc7dad..02e80a90d5b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/set_value_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/set_value_grad_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(set_value_grad, int16_t, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(set_value_with_scalar_grad, @@ -41,6 +41,6 @@ PD_CUSTOM_KERNEL_REGISTER(set_value_with_scalar_grad, int16_t, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/set_value_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/set_value_kernel_register.cc index 79b72334c74..a5cc3e42601 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/set_value_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/set_value_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(set_value, int16_t, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(set_value_with_tensor, iluvatar_gpu, @@ -40,6 +40,6 @@ PD_CUSTOM_KERNEL_REGISTER(set_value_with_tensor, int16_t, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sgd_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/sgd_kernel_register.cu index 791b0db0404..41b583e6b79 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sgd_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sgd_kernel_register.cu @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(sgd, iluvatar_gpu, ALL_LAYOUT, phi::SGDDenseKernel, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, float, double) { if (kernel_key.dtype() == phi::DataType::FLOAT16 || @@ -36,7 +36,7 @@ PD_CUSTOM_KERNEL_REGISTER(sgd, iluvatar_gpu, ALL_LAYOUT, phi::SGDDenseKernel, - phi::dtype::float16, + phi::float16, float, double) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { @@ -49,7 +49,7 @@ PD_CUSTOM_KERNEL_REGISTER(sgd_dense_param_sparse_grad, iluvatar_gpu, ALL_LAYOUT, phi::SGDDenseParamSparseGradKernel, - phi::dtype::float16, + phi::float16, float, double) {} @@ -57,6 +57,6 @@ PD_CUSTOM_KERNEL_REGISTER(sgd_sparse_param_sparse_grad, iluvatar_gpu, ALL_LAYOUT, phi::SGDSparseParamSparseGradKernel, - phi::dtype::float16, + phi::float16, float, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/shape_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/shape_kernel_register.cc index 4059678f1b1..33facd31e08 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/shape_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/shape_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(shape, int64_t, float, phi::dtype::complex, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(0).SetBackend(phi::Backend::ALL_BACKEND); kernel->OutputAt(0).SetBackend(phi::Backend::CPU); kernel->OutputAt(0).SetDataType(phi::DataType::INT32); @@ -44,8 +44,8 @@ PD_CUSTOM_KERNEL_REGISTER(shape64, int64_t, float, phi::dtype::complex, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->InputAt(0).SetBackend(phi::Backend::ALL_BACKEND); kernel->OutputAt(0).SetBackend(phi::Backend::CPU); kernel->OutputAt(0).SetDataType(phi::DataType::INT64); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/share_data_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/share_data_kernel_register.cu index db4b23b21ec..dc1e31271f2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/share_data_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/share_data_kernel_register.cu @@ -26,5 +26,5 @@ PD_CUSTOM_KERNEL_REGISTER(share_data, int64_t, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sigmoid_cross_entropy_with_logits_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/sigmoid_cross_entropy_with_logits_grad_kernel_register.cu index fe00f8cfb81..aba1b95db9d 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sigmoid_cross_entropy_with_logits_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sigmoid_cross_entropy_with_logits_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(sigmoid_cross_entropy_with_logits_grad, ALL_LAYOUT, phi::SigmoidCrossEntropyWithLogitsGradKernel, float, - phi::dtype::float16, + phi::float16, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sigmoid_cross_entropy_with_logits_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/sigmoid_cross_entropy_with_logits_kernel_register.cu index 5da295a7442..cadc85074d4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sigmoid_cross_entropy_with_logits_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sigmoid_cross_entropy_with_logits_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(sigmoid_cross_entropy_with_logits, ALL_LAYOUT, phi::SigmoidCrossEntropyWithLogitsKernel, float, - phi::dtype::float16, + phi::float16, double) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sign_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/sign_kernel_register.cc index 9b55390894e..7c12e829ddc 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sign_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sign_kernel_register.cc @@ -25,6 +25,6 @@ PD_CUSTOM_KERNEL_REGISTER(sign, int32_t, int64_t, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/slice_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/slice_grad_kernel_register.cc index f225890a957..03b3bcb2fb8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/slice_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/slice_grad_kernel_register.cc @@ -27,8 +27,8 @@ PD_CUSTOM_KERNEL_REGISTER(slice_grad, int16_t, int8_t, phi::dtype::complex, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(slice_array_grad, iluvatar_gpu, @@ -42,8 +42,8 @@ PD_CUSTOM_KERNEL_REGISTER(slice_array_grad, int16_t, int8_t, phi::dtype::complex, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(slice_array_dense_grad, iluvatar_gpu, @@ -57,5 +57,5 @@ PD_CUSTOM_KERNEL_REGISTER(slice_array_dense_grad, int16_t, int8_t, phi::dtype::complex, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/slice_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/slice_kernel_register.cc index 26013cb6514..fa4358f6f07 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/slice_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/slice_kernel_register.cc @@ -27,8 +27,8 @@ PD_CUSTOM_KERNEL_REGISTER(slice, int16_t, int8_t, phi::dtype::complex, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(slice_array, iluvatar_gpu, @@ -42,8 +42,8 @@ PD_CUSTOM_KERNEL_REGISTER(slice_array, int16_t, int8_t, phi::dtype::complex, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} PD_CUSTOM_KERNEL_REGISTER(slice_array_dense, iluvatar_gpu, @@ -57,5 +57,5 @@ PD_CUSTOM_KERNEL_REGISTER(slice_array_dense, int16_t, int8_t, phi::dtype::complex, - phi::dtype::bfloat16, - phi::dtype::float16) {} + phi::bfloat16, + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/soft_relu_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/soft_relu_grad_kernel_register.cu index 068990ce3f1..4d65e839006 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/soft_relu_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/soft_relu_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(soft_relu_grad, phi::SoftReluGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/soft_relu_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/soft_relu_kernel_register.cu index 7cd7355885c..3ba78ad6de5 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/soft_relu_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/soft_relu_kernel_register.cu @@ -58,8 +58,8 @@ PD_REGISTER_KERNEL(soft_relu, phi::SoftReluCudaKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_CUSTOM_KERNEL_REGISTER(soft_relu, iluvatar_gpu, @@ -67,5 +67,5 @@ PD_CUSTOM_KERNEL_REGISTER(soft_relu, phi::SoftReluCudaKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/softmax_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/softmax_grad_kernel_register.cu index 8c6991a1ad1..0dd80a9670c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/softmax_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/softmax_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(softmax_grad, ALL_LAYOUT, phi::SoftmaxGradGPUDNNKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/softmax_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/softmax_kernel_register.cu index 29fd6c65561..7e69642ffd8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/softmax_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/softmax_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(softmax, ALL_LAYOUT, phi::SoftmaxGPUDNNKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sparse_momentum_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/sparse_momentum_kernel_register.cu index 9128de2a5b2..8b9b5a6473a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sparse_momentum_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sparse_momentum_kernel_register.cu @@ -21,4 +21,4 @@ PD_CUSTOM_KERNEL_REGISTER(sparse_momentum, phi::SparseMomentumOpKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sparse_utils_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/sparse_utils_kernel_register.cu index 2fcb815c8c6..c165009da24 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sparse_utils_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sparse_utils_kernel_register.cu @@ -20,7 +20,7 @@ PD_CUSTOM_KERNEL_REGISTER(sparse_coo_tensor, ALL_LAYOUT, phi::sparse::SparseCooTensorKernel, float, - phi::dtype::float16, + phi::float16, uint8_t, int16_t, int, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/split_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/split_kernel_register.cc index 2340164cbce..2340ca38d30 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/split_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/split_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(split, uint8_t, int8_t, int16_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::complex64) {} PD_CUSTOM_KERNEL_REGISTER(split_with_num, @@ -40,5 +40,5 @@ PD_CUSTOM_KERNEL_REGISTER(split_with_num, bool, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/squared_l2_norm_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/squared_l2_norm_grad_kernel_register.cu index f4a4c72985e..38e2c45b1e6 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/squared_l2_norm_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/squared_l2_norm_grad_kernel_register.cu @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(squared_l2_norm_grad, phi::SquaredL2NormGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/squared_l2_norm_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/squared_l2_norm_kernel_register.cc index 09391d69dfe..1618a3867fb 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/squared_l2_norm_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/squared_l2_norm_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(squared_l2_norm, ALL_LAYOUT, phi::SquaredL2NormKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/squeeze_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/squeeze_grad_kernel_register.cc index 5fb5a2fdd8c..3f897d9c93c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/squeeze_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/squeeze_grad_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(squeeze_grad, ALL_LAYOUT, phi::SqueezeGradKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, bool, int, uint8_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/squeeze_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/squeeze_kernel_register.cc index a61a9c0f979..f8ae7a73170 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/squeeze_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/squeeze_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(squeeze, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(squeeze_with_xshape, @@ -41,6 +41,6 @@ PD_CUSTOM_KERNEL_REGISTER(squeeze_with_xshape, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/stack_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/stack_grad_kernel_register.cu index 6a39776e11a..a4f6612f330 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/stack_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/stack_grad_kernel_register.cu @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(stack_grad, int64_t, uint8_t, int16_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::float8_e4m3fn, phi::dtype::float8_e5m2, phi::dtype::complex, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/stack_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/stack_kernel_register.cc index d348e921237..0cb5902c0e1 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/stack_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/stack_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(stack, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/straight_through_estimator_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/straight_through_estimator_grad_kernel_register.cu index 13f224158f0..750bc11b552 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/straight_through_estimator_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/straight_through_estimator_grad_kernel_register.cu @@ -19,4 +19,4 @@ PD_CUSTOM_KERNEL_REGISTER(straight_through_estimator_grad, ALL_LAYOUT, phi::StraightThroughEstimatorGradKernel, float, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/strided_copy_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/strided_copy_kernel_register.cc index 37dcc2348d8..77b82d5b706 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/strided_copy_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/strided_copy_kernel_register.cc @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(strided_copy, int32_t, int64_t, float, - ::phi::dtype::float16, - ::phi::dtype::bfloat16, + ::phi::float16, + ::phi::bfloat16, ::phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/strided_slice_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/strided_slice_grad_kernel_register.cc index 6314e4f1ec6..d931e85eb11 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/strided_slice_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/strided_slice_grad_kernel_register.cc @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(strided_slice_grad, int, int64_t, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/strided_slice_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/strided_slice_kernel_register.cc index 6e7da3bc677..25c2725d557 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/strided_slice_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/strided_slice_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(strided_slice, int, uint8_t, int8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/swiglu_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/swiglu_grad_kernel_register.cc index 9b748a859f9..4eecbca3b08 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/swiglu_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/swiglu_grad_kernel_register.cc @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(swiglu_grad, phi::SwiGLUGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/swiglu_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/swiglu_kernel_register.cc index 115a1c9cd50..5761584ea9b 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/swiglu_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/swiglu_kernel_register.cc @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(swiglu, ALL_LAYOUT, phi::SwiGLUKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sync_batch_norm_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/sync_batch_norm_grad_kernel_register.cu index 319cdbe33a5..f67ceef3a87 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sync_batch_norm_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sync_batch_norm_grad_kernel_register.cu @@ -23,4 +23,4 @@ PD_CUSTOM_KERNEL_REGISTER(sync_batch_norm_grad, phi::SyncBatchNormGradKernel, float, double, - phi::dtype::float16) {} + phi::float16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sync_batch_norm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/sync_batch_norm_kernel_register.cu index c1ac1db3754..ac3c78188f2 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sync_batch_norm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sync_batch_norm_kernel_register.cu @@ -22,7 +22,7 @@ PD_CUSTOM_KERNEL_REGISTER(sync_batch_norm, ALL_LAYOUT, phi::SyncBatchNormKernel, float, - phi::dtype::float16) { + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->InputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->InputAt(2).SetDataType(phi::DataType::FLOAT32); @@ -42,8 +42,8 @@ PD_CUSTOM_KERNEL_REGISTER(sync_batch_norm, phi::SyncBatchNormKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { if (kernel_key.dtype() == phi::DataType::FLOAT16 || kernel_key.dtype() == phi::DataType::BFLOAT16) { kernel->InputAt(1).SetDataType(phi::DataType::FLOAT32); @@ -63,7 +63,7 @@ PD_CUSTOM_KERNEL_REGISTER(sync_batch_norm, phi::SyncBatchNormKernel, float, double, - phi::dtype::float16) { + phi::float16) { if (kernel_key.dtype() == phi::DataType::FLOAT16) { kernel->InputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->InputAt(2).SetDataType(phi::DataType::FLOAT32); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/sync_calc_stream_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/sync_calc_stream_kernel_register.cu index 39865cf70b9..81b7365968d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/sync_calc_stream_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/sync_calc_stream_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(sync_calc_stream, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/take_along_axis_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/take_along_axis_grad_kernel_register.cu index c7fe46680ce..fc7e34524ca 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/take_along_axis_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/take_along_axis_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(take_along_axis_grad, double, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/take_along_axis_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/take_along_axis_kernel_register.cc index 507d4024f5f..e70d3df9379 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/take_along_axis_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/take_along_axis_kernel_register.cc @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(take_along_axis, float, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/temporal_shift_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/temporal_shift_grad_kernel_register.cu index b5ebb018d62..fc38b9048cb 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/temporal_shift_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/temporal_shift_grad_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(temporal_shift_grad, phi::TemporalShiftGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/temporal_shift_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/temporal_shift_kernel_register.cu index 67cb222d043..ad84d58273c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/temporal_shift_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/temporal_shift_kernel_register.cu @@ -21,5 +21,5 @@ PD_CUSTOM_KERNEL_REGISTER(temporal_shift, phi::TemporalShiftKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/tile_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/tile_grad_kernel_register.cc index ec5911ab23e..93cf0f52c0f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/tile_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/tile_grad_kernel_register.cc @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(tile_grad, float, int, int64_t, - phi::dtype::float16, + phi::float16, phi::dtype::complex, - phi::dtype::bfloat16) {} + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/tile_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/tile_kernel_register.cc index 620123b71fd..3785319ec4d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/tile_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/tile_kernel_register.cc @@ -23,6 +23,6 @@ PD_CUSTOM_KERNEL_REGISTER(tile, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/top_k_grad_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/top_k_grad_kernel.cu index 3f8d4b4eb34..b974c2de836 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/top_k_grad_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/top_k_grad_kernel.cu @@ -98,8 +98,8 @@ PD_REGISTER_PLUGIN_KERNEL(topk_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} PD_REGISTER_PLUGIN_KERNEL(topk_v1_grad, iluvatar_gpu, @@ -108,5 +108,5 @@ PD_REGISTER_PLUGIN_KERNEL(topk_v1_grad, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/top_k_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/top_k_kernel.cu index be4648b233f..9b26a5dedb7 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/top_k_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/top_k_kernel.cu @@ -377,8 +377,8 @@ PD_REGISTER_PLUGIN_KERNEL(topk, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::DataType::INT64); } @@ -389,7 +389,7 @@ PD_REGISTER_PLUGIN_KERNEL(topk_v1, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) { + phi::float16, + phi::bfloat16) { kernel->OutputAt(1).SetDataType(phi::DataType::INT64); } diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/trace_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/trace_grad_kernel_register.cu index 496dfaeb220..4fa1dbf5021 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/trace_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/trace_grad_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(trace_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/trace_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/trace_kernel_register.cu index eac030974ad..b2509e7048c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/trace_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/trace_kernel_register.cu @@ -26,7 +26,7 @@ PD_CUSTOM_KERNEL_REGISTER(trace, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/transpose_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/transpose_grad_kernel_register.cc index 8a29b96a5cb..d3b306ca662 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/transpose_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/transpose_grad_kernel_register.cc @@ -26,8 +26,8 @@ PD_CUSTOM_KERNEL_REGISTER(transpose_grad, int16_t, int32_t, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(trans_layout_grad, @@ -38,6 +38,6 @@ PD_CUSTOM_KERNEL_REGISTER(trans_layout_grad, float, int32_t, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/transpose_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/transpose_kernel_register.cc index c24582e11a3..d99b7201c06 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/transpose_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/transpose_kernel_register.cc @@ -26,6 +26,6 @@ PD_CUSTOM_KERNEL_REGISTER(transpose, int32_t, int64_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/tril_triu_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/tril_triu_grad_kernel_register.cu index 45858e5146b..239ea37eb47 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/tril_triu_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/tril_triu_grad_kernel_register.cu @@ -23,8 +23,8 @@ PD_CUSTOM_KERNEL_REGISTER(tril_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} @@ -37,8 +37,8 @@ PD_CUSTOM_KERNEL_REGISTER(triu_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} @@ -51,7 +51,7 @@ PD_CUSTOM_KERNEL_REGISTER(tril_triu_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/tril_triu_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/tril_triu_kernel_register.cc index 7425712316b..d37095288c7 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/tril_triu_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/tril_triu_kernel_register.cc @@ -23,8 +23,8 @@ PD_CUSTOM_KERNEL_REGISTER(tril_triu, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(triu, @@ -35,8 +35,8 @@ PD_CUSTOM_KERNEL_REGISTER(triu, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} PD_CUSTOM_KERNEL_REGISTER(tril, @@ -47,6 +47,6 @@ PD_CUSTOM_KERNEL_REGISTER(tril, float, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/trunc_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/trunc_grad_kernel_register.cu index 57ab7c2f8ce..89e4466f743 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/trunc_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/trunc_grad_kernel_register.cu @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(trunc_grad, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/trunc_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/trunc_kernel_register.cu index 53c6d3ea5e4..c84ae587191 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/trunc_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/trunc_kernel_register.cu @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(trunc, double, int, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unary_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/unary_grad_kernel_register.cu index 7c9956724a2..baeebd2c8f9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unary_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unary_grad_kernel_register.cu @@ -22,7 +22,7 @@ iluvatar_gpu, \ ALL_LAYOUT, \ phi::sparse::prefix##CooGradKernel, \ - phi::dtype::float16, \ + phi::float16, \ float, \ double) { \ kernel->InputAt(0).SetDataLayout(phi::DataLayout::SPARSE_COO); \ @@ -32,7 +32,7 @@ iluvatar_gpu, \ ALL_LAYOUT, \ phi::sparse::prefix##CsrGradKernel, \ - phi::dtype::float16, \ + phi::float16, \ float, \ double) { \ kernel->InputAt(0).SetDataLayout(phi::DataLayout::SPARSE_CSR); \ @@ -43,7 +43,7 @@ iluvatar_gpu, \ ALL_LAYOUT, \ phi::sparse::prefix##CooGradKernel, \ - phi::dtype::float16, \ + phi::float16, \ float, \ double, \ phi::dtype::complex, \ @@ -55,7 +55,7 @@ iluvatar_gpu, \ ALL_LAYOUT, \ phi::sparse::prefix##CsrGradKernel, \ - phi::dtype::float16, \ + phi::float16, \ float, \ double, \ phi::dtype::complex, \ @@ -67,7 +67,7 @@ PD_CUSTOM_KERNEL_REGISTER(cast_coo_grad, iluvatar_gpu, ALL_LAYOUT, phi::sparse::CastCooGradKernel, - phi::dtype::float16, + phi::float16, float, double, int8_t, @@ -81,7 +81,7 @@ PD_CUSTOM_KERNEL_REGISTER(cast_csr_grad, iluvatar_gpu, ALL_LAYOUT, phi::sparse::CastCsrGradKernel, - phi::dtype::float16, + phi::float16, float, double, int8_t, diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unary_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/unary_kernel_register.cu index 2a47dfab696..9161fd38292 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unary_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unary_kernel_register.cu @@ -21,7 +21,7 @@ iluvatar_gpu, \ ALL_LAYOUT, \ phi::sparse::prefix##CooKernel, \ - phi::dtype::float16, \ + phi::float16, \ float, \ double) { \ kernel->InputAt(0).SetDataLayout(phi::DataLayout::SPARSE_COO); \ @@ -31,7 +31,7 @@ iluvatar_gpu, \ ALL_LAYOUT, \ phi::sparse::prefix##CsrKernel, \ - phi::dtype::float16, \ + phi::float16, \ float, \ double) { \ kernel->InputAt(0).SetDataLayout(phi::DataLayout::SPARSE_CSR); \ @@ -42,7 +42,7 @@ iluvatar_gpu, \ ALL_LAYOUT, \ phi::sparse::prefix##CooKernel, \ - phi::dtype::float16, \ + phi::float16, \ float, \ double, \ phi::dtype::complex, \ @@ -54,7 +54,7 @@ iluvatar_gpu, \ ALL_LAYOUT, \ phi::sparse::prefix##CsrKernel, \ - phi::dtype::float16, \ + phi::float16, \ float, \ double, \ phi::dtype::complex, \ @@ -84,7 +84,7 @@ PD_CUSTOM_KERNEL_REGISTER(cast_coo, iluvatar_gpu, ALL_LAYOUT, phi::sparse::CastCooKernel, - phi::dtype::float16, + phi::float16, float, double, int8_t, @@ -98,7 +98,7 @@ PD_CUSTOM_KERNEL_REGISTER(cast_csr, iluvatar_gpu, ALL_LAYOUT, phi::sparse::CastCsrKernel, - phi::dtype::float16, + phi::float16, float, double, int8_t, @@ -114,7 +114,7 @@ PD_CUSTOM_KERNEL_REGISTER(isnan_coo, phi::sparse::IsnanCooKernel, float, double, - phi::dtype::float16, + phi::float16, int, int64_t) { kernel->InputAt(0).SetDataLayout(phi::DataLayout::SPARSE_COO); @@ -126,7 +126,7 @@ PD_CUSTOM_KERNEL_REGISTER(isnan_csr, phi::sparse::IsnanCsrKernel, float, double, - phi::dtype::float16, + phi::float16, int, int64_t) { kernel->InputAt(0).SetDataLayout(phi::DataLayout::SPARSE_CSR); diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unbind_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/unbind_kernel_register.cc index 772eee99c0c..50494b3cfa4 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unbind_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unbind_kernel_register.cc @@ -21,8 +21,8 @@ PD_CUSTOM_KERNEL_REGISTER(unbind, phi::UnbindKernel, bool, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, int, int64_t, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unfold_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/unfold_grad_kernel_register.cu index 5089214399b..952fd5d56aa 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unfold_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unfold_grad_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(unfold_grad, phi::UnfoldGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unfold_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/unfold_kernel_register.cu index 4ca265b641d..3988f3b407e 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unfold_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unfold_kernel_register.cu @@ -22,5 +22,5 @@ PD_CUSTOM_KERNEL_REGISTER(unfold, phi::UnfoldKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_inplace_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_inplace_grad_kernel_register.cu index cf4d54e03ec..d2daffa3cfa 100755 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_inplace_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_inplace_grad_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(uniform_inplace_grad, phi::UniformInplaceGradKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_inplace_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_inplace_kernel_register.cu index f2b327de849..daaa75822f3 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_inplace_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_inplace_kernel_register.cu @@ -20,5 +20,5 @@ PD_CUSTOM_KERNEL_REGISTER(uniform_inplace, phi::UniformInplaceKernel, float, double, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_kernel_register.cc index 760f11e21e2..3d38ab2cf0a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/uniform_kernel_register.cc @@ -20,6 +20,6 @@ PD_CUSTOM_KERNEL_REGISTER(uniform, ALL_LAYOUT, phi::UniformKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unsqueeze_grad_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/unsqueeze_grad_kernel_register.cc index 36fc01aa8ee..124c7a3fb50 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unsqueeze_grad_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unsqueeze_grad_kernel_register.cc @@ -27,6 +27,6 @@ PD_CUSTOM_KERNEL_REGISTER(unsqueeze_grad, uint8_t, int8_t, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unsqueeze_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/unsqueeze_kernel_register.cc index 180a9745718..f69ab594ed8 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unsqueeze_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unsqueeze_kernel_register.cc @@ -20,8 +20,8 @@ PD_CUSTOM_KERNEL_REGISTER(unsqueeze, ALL_LAYOUT, phi::UnsqueezeKernel, float, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, bool, int, int16_t, @@ -41,6 +41,6 @@ PD_CUSTOM_KERNEL_REGISTER(unsqueeze_with_xshape, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unstack_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/unstack_grad_kernel_register.cu index 19edfa002d4..ed0178b598f 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unstack_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unstack_grad_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(unstack_grad, double, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/unstack_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/unstack_kernel_register.cu index 017ea8ddbe1..6e877bfe08c 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/unstack_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/unstack_kernel_register.cu @@ -24,7 +24,7 @@ PD_CUSTOM_KERNEL_REGISTER(unstack, double, int64_t, int, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/weight_only_linear_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/weight_only_linear_kernel.cu index 8f624c27559..39cdb70aea0 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/weight_only_linear_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/weight_only_linear_kernel.cu @@ -67,9 +67,9 @@ void WeightOnlyLinearKernel(const Context& dev_ctx, PADDLE_THROW(common::errors::Unimplemented("Unsupported weight dtype %s.", weight_dtype)); } - if (std::is_same::value) { + if (std::is_same::value) { bc_type = CUDA_R_16F; - } else if (std::is_same::value) { + } else if (std::is_same::value) { bc_type = CUDA_R_16BF; } else { PADDLE_THROW(common::errors::Unimplemented("Unsupported input dtype.")); @@ -178,5 +178,5 @@ PD_REGISTER_PLUGIN_KERNEL(weight_only_linear, iluvatar_gpu, ALL_LAYOUT, phi::WeightOnlyLinearKernel, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/weight_quantize_kernel.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/weight_quantize_kernel.cu index e121bf49da8..8955dd41a12 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/weight_quantize_kernel.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/weight_quantize_kernel.cu @@ -58,5 +58,5 @@ PD_REGISTER_PLUGIN_KERNEL(weight_quantize, iluvatar_gpu, ALL_LAYOUT, phi::WeightQuantizeKernel, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/where_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/where_grad_kernel_register.cu index 3896b8694b7..24b8fdefa36 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/where_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/where_grad_kernel_register.cu @@ -26,7 +26,7 @@ PD_CUSTOM_KERNEL_REGISTER(where_grad, int64_t, int16_t, uint8_t, - phi::dtype::float16, - phi::dtype::bfloat16, + phi::float16, + phi::bfloat16, phi::dtype::complex, phi::dtype::complex) {} diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/where_kernel_register.cc b/backends/iluvatar_gpu/kernels/cuda_kernels/where_kernel_register.cc index 1db5f746724..a75aa526180 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/where_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/where_kernel_register.cc @@ -23,5 +23,5 @@ PD_CUSTOM_KERNEL_REGISTER(where, int, bool, int64_t, - phi::dtype::float16, - phi::dtype::bfloat16) {} + phi::float16, + phi::bfloat16) {} From 9da922669c54e513c0d49a57073b98f9650903da Mon Sep 17 00:00:00 2001 From: co63oc <4617245+co63oc@users.noreply.github.com> Date: Wed, 22 Apr 2026 15:36:03 +0800 Subject: [PATCH 2/2] ci