xref: /aosp_15_r20/external/pytorch/c10/util/Unroll.h (revision da0073e96a02ea20f0ac840b70461e3646d07c45)
1*da0073e9SAndroid Build Coastguard Worker #pragma once
2*da0073e9SAndroid Build Coastguard Worker #include <c10/macros/Macros.h>
3*da0073e9SAndroid Build Coastguard Worker #include <type_traits>
4*da0073e9SAndroid Build Coastguard Worker 
5*da0073e9SAndroid Build Coastguard Worker // Utility to guarantee complete unrolling of a loop where the bounds are known
6*da0073e9SAndroid Build Coastguard Worker // at compile time. Various pragmas achieve similar effects, but are not as
7*da0073e9SAndroid Build Coastguard Worker // portable across compilers.
8*da0073e9SAndroid Build Coastguard Worker 
9*da0073e9SAndroid Build Coastguard Worker // Example: c10::ForcedUnroll<4>{}(f); is equivalent to f(0); f(1); f(2); f(3);
10*da0073e9SAndroid Build Coastguard Worker 
11*da0073e9SAndroid Build Coastguard Worker namespace c10 {
12*da0073e9SAndroid Build Coastguard Worker 
13*da0073e9SAndroid Build Coastguard Worker template <int n>
14*da0073e9SAndroid Build Coastguard Worker struct ForcedUnroll {
15*da0073e9SAndroid Build Coastguard Worker   template <typename Func, typename... Args>
operatorForcedUnroll16*da0073e9SAndroid Build Coastguard Worker   C10_ALWAYS_INLINE void operator()(const Func& f, Args... args) const {
17*da0073e9SAndroid Build Coastguard Worker     ForcedUnroll<n - 1>{}(f, args...);
18*da0073e9SAndroid Build Coastguard Worker     f(std::integral_constant<int, n - 1>{}, args...);
19*da0073e9SAndroid Build Coastguard Worker   }
20*da0073e9SAndroid Build Coastguard Worker };
21*da0073e9SAndroid Build Coastguard Worker 
22*da0073e9SAndroid Build Coastguard Worker template <>
23*da0073e9SAndroid Build Coastguard Worker struct ForcedUnroll<1> {
24*da0073e9SAndroid Build Coastguard Worker   template <typename Func, typename... Args>
25*da0073e9SAndroid Build Coastguard Worker   C10_ALWAYS_INLINE void operator()(const Func& f, Args... args) const {
26*da0073e9SAndroid Build Coastguard Worker     f(std::integral_constant<int, 0>{}, args...);
27*da0073e9SAndroid Build Coastguard Worker   }
28*da0073e9SAndroid Build Coastguard Worker };
29*da0073e9SAndroid Build Coastguard Worker 
30*da0073e9SAndroid Build Coastguard Worker } // namespace c10
31