Searched defs:sum_dy (Results 1 – 2 of 2) sorted by relevance
/aosp_15_r20/external/pytorch/aten/src/ATen/native/cuda/ |
H A D | Normalization.cuh | 478 GenericPackedTensorAccessor<stat_accscalar_t, 1, DefaultPtrTraits, index_t> sum_dy, in batch_norm_backward_reduce_kernel() 514 const GenericPackedTensorAccessor<stat_accscalar_t, 1, DefaultPtrTraits, index_t> sum_dy, in batch_norm_backward_elemt_kernel_impl() 552 const GenericPackedTensorAccessor<stat_accscalar_t, 1, DefaultPtrTraits, index_t> sum_dy, in batch_norm_backward_elemt_kernel() 574 const GenericPackedTensorAccessor<stat_accscalar_t, 1, DefaultPtrTraits, index_t> sum_dy, in batch_norm_backward_elemt_kernel() 814 auto sum_dy = packed_accessor_or_dummy< in batch_norm_backward_reduce_cuda_template() local 860 auto sum_dy = packed_accessor_or_dummy< in batch_norm_backward_elemt_cuda_template() local 911 auto sum_dy = packed_accessor_or_dummy< in batch_norm_backward_elemt_cuda_template() local 1137 __device__ __forceinline__ void merge_block_vertical_backward(T& sum_dy, in merge_block_vertical_backward() 1182 accscalar_t sum_dy[PARALLEL_LOADS]; in batch_norm_backward_reduce_channels_last_kernel() local 1330 const accscalar_t* __restrict__ sum_dy, in batch_norm_backward_elemt_channels_last_kernel_impl() [all …]
|
H A D | Normalization.cu | 182 const Tensor& weight, const Tensor& sum_dy, const Tensor& sum_dy_xmu) { in batch_norm_elementwise_backward_train() 626 Tensor sum_dy, sum_dy_xmu, grad_weight, grad_bias; in batch_norm_backward_cuda() local 762 …n, const Tensor& invstd, const std::optional<Tensor>& weight_opt, const Tensor& sum_dy, const Tens… in batch_norm_backward_elemt_cuda()
|