/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/selectors/ |
H A D | simple_selectors.cc | 58 const GpuInfo& gpu_info) { in SelectLSTM() 68 const GpuInfo& gpu_info, in SelectPReLU() 74 const GpuInfo& gpu_info, in SelectPooling() 80 const MaxUnpooling2DAttributes& attr, const GpuInfo& gpu_info, in SelectMaxUnpooling() 105 const GpuInfo& gpu_info) { in SelectResampler() 120 const OperationDef& op_def, const GpuInfo& gpu_info, in SelectConcat() 142 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionDynamicWeights() 174 void SelectSplit(const SplitAttributes& attr, const GpuInfo& gpu_info, in SelectSplit() 197 const GpuInfo& gpu_info) { in SelectReduce() 226 const GpuInfo& gpu_info, const Padding2D& padding, in SelectWinograd4x4To36() [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/task/ |
H A D | tensor_desc.cc | 84 std::string GetConversionForImage(const GpuInfo& gpu_info, DataType src_type, in GetConversionForImage() 98 std::string GetConversion(const GpuInfo& gpu_info, in GetConversion() 384 absl::Status TensorDescriptor::PerformConstExpr(const GpuInfo& gpu_info, in PerformConstExpr() 402 const GpuInfo& gpu_info, const std::string& selector, in PerformSelector() 463 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformReadSelector() 511 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformReadNearestSelector() 544 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformReadBilinearSelector() 617 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformReadPerChannelSelector() 695 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformWriteSelector() 714 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformWriteLinearSelector() [all …]
|
H A D | util.cc | 28 std::string GetGlslConversion(const GpuInfo& gpu_info, DataType src_type, in GetGlslConversion() 136 int GetRecommendedBlockSizeForConv(const GpuInfo& gpu_info, in GetRecommendedBlockSizeForConv() 218 std::string GetTypeDeclaration(const GpuInfo& gpu_info, DataType data_type, in GetTypeDeclaration() 232 std::string GetZeroValue(const GpuInfo& gpu_info, DataType data_type, in GetZeroValue() 247 std::string GetOneValue(const GpuInfo& gpu_info, DataType data_type, in GetOneValue() 262 std::string GetTypeConversion(const GpuInfo& gpu_info, DataType src_type, in GetTypeConversion()
|
H A D | gpu_operation.cc | 196 const GpuInfo& gpu_info, GPUOperation* operation) { in FuseSimpleElemWithSimpleElem() 228 const GpuInfo& gpu_info, GPUOperation* operation) { in Fuse2InputElemWithSimpleElemAsFirstInput() 263 const GpuInfo& gpu_info, GPUOperation* operation) { in Fuse2InputElemWithSimpleElemAsSecondInput() 287 absl::Status GPUOperation::AddOperation(const GpuInfo& gpu_info, in AddOperation() 402 absl::Status GPUOperation::AssembleCode(const GpuInfo& gpu_info) { in AssembleCode() 438 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleDispatches() 455 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups() 545 absl::Status Fuse2InputElemWith2SimpleElem(const GpuInfo& gpu_info, in Fuse2InputElemWith2SimpleElem()
|
H A D | work_group_picking.cc | 37 const GpuInfo& gpu_info, WorkGroupSizeAlignment z_alignment) { in GenerateWorkGroupSizesXYMultipleOf() 67 const GpuInfo& gpu_info, WorkGroupSizeAlignment z_alignment) { in GenerateWorkGroupSizesXMultipleOf() 92 void GetWorkGroupsAlignedToGrid(const GpuInfo& gpu_info, in GetWorkGroupsAlignedToGrid() 237 void GetPossibleWorkGroupsXYMultipleOf(int multiplier, const GpuInfo& gpu_info, in GetPossibleWorkGroupsXYMultipleOf() 246 void GetPossibleWorkGroupsXMultipleOf(int multiplier, const GpuInfo& gpu_info, in GetPossibleWorkGroupsXMultipleOf() 271 void GetPossibleWorkGroups(TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleWorkGroups() 293 void GetPossibleWorkGroupsConv(TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleWorkGroupsConv()
|
H A D | arguments.cc | 186 absl::Status BufferToKernelLanguage(const GpuInfo& gpu_info, in BufferToKernelLanguage() 430 const GpuInfo& gpu_info, in Compile() 440 absl::Status Arguments::ResolveConstExprPass(const GpuInfo& gpu_info, in ResolveConstExprPass() 472 absl::Status Arguments::ResolveConstExpr(const GpuInfo& gpu_info, in ResolveConstExpr() 483 const GpuInfo& gpu_info, in ResolveSelectorsPass() 533 const GpuInfo& gpu_info, in ResolveSelector() 596 absl::Status Arguments::AddObjectsScalarArgs(const GpuInfo& gpu_info) { in AddObjectsScalarArgs() 632 absl::Status Arguments::ResolveKernelGlobalSpaceBuffers(const GpuInfo& gpu_info, in ResolveKernelGlobalSpaceBuffers()
|
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/tasks/ |
H A D | depthwise_conv.cc | 85 std::string GetSrcXYCheck(const GpuInfo& gpu_info, in GetSrcXYCheck() 103 bool UseBuffersForWeights(const GpuInfo& gpu_info) { in UseBuffersForWeights() 131 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups() 141 std::string DepthwiseConv::GenerateSrcUpload(const GpuInfo& gpu_info) { in GenerateSrcUpload() 181 std::string DepthwiseConv::GenerateWeightsUpload(const GpuInfo& gpu_info) { in GenerateWeightsUpload() 218 std::string DepthwiseConv::GenerateCode(const GpuInfo& gpu_info) { in GenerateCode() 388 const GpuInfo& gpu_info, const OperationDef& definition, in CreateDepthwiseConvolution2D() 432 const GpuInfo& gpu_info, const OperationDef& definition, in CreateDepthwiseConvolution2DDynamicWeights() 454 const GpuInfo& gpu_info, const OperationDef& definition, in CreateDepthwiseConvolution3D()
|
H A D | conv_generic.cc | 175 const GpuInfo& gpu_info, const BHWC* dst_shape) in ConvGeneric() 201 const BHWC& weights_shape, const GpuInfo& gpu_info, in ConvGeneric() 213 const GpuInfo& gpu_info, const BHWC* dst_shape) in ConvGeneric() 238 const GpuInfo& gpu_info, const BHWDC* dst_shape) in ConvGeneric() 260 void ConvGeneric::GenerateCode(const GpuInfo& gpu_info) { in GenerateCode() 362 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups() 376 std::string ConvGeneric::GenerateConv(const GpuInfo& gpu_info, in GenerateConv() 1457 const GpuInfo& gpu_info, const OperationDef& definition, int src_depth, in GuessBestParamsApple() 1470 const GpuInfo& gpu_info, const OperationDef& definition, int src_depth, in GuessBestParams() 1823 const GpuInfo& gpu_info, const OperationDef& definition, in GuessBestParams() [all …]
|
H A D | winograd.cc | 52 std::string GetKernelWinograd4x4To36(const GpuInfo& gpu_info, in GetKernelWinograd4x4To36() 251 const GpuInfo& gpu_info) { in CreateWinograd4x4To36() 275 const GpuInfo& gpu_info) in Winograd4x4To36TileX6() 289 const OperationDef& op_def, const GpuInfo& gpu_info) { in GetWinograd4x4To36TileX6Code() 514 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups() 533 const GpuInfo& gpu_info, const OperationDef& definition, in CreateWinograd4x4To36TileX6() 570 const GpuInfo& gpu_info) in Winograd36To4x4Tile4x1() 581 const OperationDef& op_def, const GpuInfo& gpu_info) { in GetWinograd36To4x4Tile4x1Code() 732 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups() 751 const GpuInfo& gpu_info, const OperationDef& definition, in CreateWinograd36To4x4Tile4x1()
|
H A D | elementwise.cc | 30 std::string GetOneInputCode(const GpuInfo& gpu_info, in GetOneInputCode() 249 const GpuInfo& gpu_info, const OperationDef& definition, in CreateElementwiseTwoInput() 275 const GpuInfo& gpu_info, const OperationDef& definition, in CreateElementwiseTwoInput() 305 ElementwiseDescriptor CreateElementwiseDesc(const GpuInfo& gpu_info, in CreateElementwiseDesc() 332 GPUOperation CreateElementwiseOneInput(const GpuInfo& gpu_info, in CreateElementwiseOneInput() 341 GPUOperation CreateElementwise(const GpuInfo& gpu_info, in CreateElementwise() 403 const GpuInfo& gpu_info, const OperationDef& definition, in CreateElementwiseOneInputWithBroadcast() 421 GPUOperation CreateElementwiseWithBroadcast(const GpuInfo& gpu_info, in CreateElementwiseWithBroadcast()
|
H A D | convolution_transposed.cc | 32 bool UseBufferForWeights(const GpuInfo& gpu_info) { in UseBufferForWeights() 39 const GpuInfo& gpu_info) in ConvolutionTransposed() 84 const ConvolutionTransposed3DAttributes& attr, const GpuInfo& gpu_info) in ConvolutionTransposed() 132 const OperationDef& op_def, const GpuInfo& gpu_info, in GenerateConvolutionTransposedCode() 602 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups() 609 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposed() 622 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposed3D() 635 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposedDynamicWeights()
|
H A D | depthwise_conv_3x3.cc | 31 const GpuInfo& gpu_info) in DepthwiseConv3x3() 56 const GpuInfo& gpu_info, const OperationDef& op_def, in GenerateDepthwiseConvCode() 306 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups() 316 bool IsDepthwiseConv3x3Supported(const GpuInfo& gpu_info, in IsDepthwiseConv3x3Supported() 335 const GpuInfo& gpu_info, const OperationDef& definition, in CreateDepthwiseConv3x3()
|
H A D | fully_connected.cc | 33 bool UseBufferForWeights(const GpuInfo& gpu_info) { in UseBufferForWeights() 70 const GpuInfo& gpu_info) in FullyConnected() 105 const OperationDef& op_def, const GpuInfo& gpu_info, in GetFullyConnectedKernelCode() 220 FullyConnected CreateFullyConnected(const GpuInfo& gpu_info, in CreateFullyConnected() 236 FullyConnected CreateFullyConnected(const GpuInfo& gpu_info, in CreateFullyConnected()
|
H A D | convolution_transposed_4x4.cc | 30 const GpuInfo& gpu_info) { in GetBestWeightsUploadType() 59 const OperationDef& definition, const GpuInfo& gpu_info) in ConvolutionTransposed4x4() 81 const GpuInfo& gpu_info, const OperationDef& op_def, in GenerateConvolutionTransposedCode() 403 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposed4x4() 416 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposed4x4DynamicWeights()
|
H A D | reduce.cc | 32 int GetMaximumWGTotalSize(const GpuInfo& gpu_info) { in GetMaximumWGTotalSize() 129 const OperationDef& definition, const GpuInfo& gpu_info) in Reduce() 177 const GpuInfo& gpu_info, in GetReduceKernelCode() 514 const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups() 527 const GpuInfo& gpu_info) { in CreateReduce() 534 const OperationDef& definition, const GpuInfo& gpu_info) { in CreateReduce()
|
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/selectors/default/ |
H A D | convolution_selector.cc | 37 const GpuInfo& gpu_info, const OperationDef& op_def, in SelectConvolutionAdreno() 50 const GpuInfo& gpu_info, const OperationDef& op_def) { in SelectConvolutionNVidia() 62 const GpuInfo& gpu_info, const OperationDef& op_def) { in SelectConvolutionApple() 80 const GpuInfo& gpu_info, const OperationDef& op_def, in SelectConvolution() 99 const GpuInfo& gpu_info, const OperationDef& op_def, in SelectConvolutionForWinograd() 108 const BHWC& dst_shape, const GpuInfo& gpu_info, in SelectConvolutionWithDynamicWeights() 118 const OHWI& weights_shape, const BHWC& dst_shape, const GpuInfo& gpu_info, in SelectConvolutionBatchedMatMul()
|
H A D | dw_convolution_selector.cc | 29 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionAdreno() 41 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionPowerVR() 53 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionMali() 71 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionApple() 87 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolution()
|
H A D | convolution_transposed_selector.cc | 32 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposedAdreno() 50 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposedPowerVR() 76 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposedMali() 85 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposed() 104 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposedWithDynamicWeights()
|
/aosp_15_r20/external/mesa3d/src/gallium/drivers/freedreno/ |
H A D | gmemtool.c | 65 struct gpu_info { struct 78 static const struct gpu_info gpu_infos[] = { argument 130 const struct gpu_info *gpu_info = NULL; in main() local
|
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/tasks/special/ |
H A D | depthwise_conv_plus_1x1_conv.cc | 37 std::string MultiplyAccumulate(const GpuInfo& gpu_info, in MultiplyAccumulate() 163 void ThinPointwiseFuser::CreateConstantsGpuBuffer(const GpuInfo& gpu_info) { in CreateConstantsGpuBuffer() 216 bool ThinPointwiseFuser::IsNodeSupported(const GpuInfo& gpu_info, in IsNodeSupported() 316 bool ThinPointwiseFuser::ReserveNode(const GpuInfo& gpu_info, Node* node) { in ReserveNode() 353 void ThinPointwiseFuser::AddNode(const GpuInfo& gpu_info, Node* node) { in AddNode() 391 const GpuInfo& gpu_info, const DepthwiseConvolution2DAttributes& attr) { in AddDepthwiseConvNode() 500 void ThinPointwiseFuser::AddConvNode(const GpuInfo& gpu_info, in AddConvNode() 545 const GpuInfo& gpu_info, const GraphFloat32& graph, in Finalize() 617 const GpuInfo& gpu_info, CalculationsPrecision precision, in TryDepthwiseConvPlus1x1Conv()
|
H A D | fc_fc_add.cc | 32 bool UseBufferForWeights(const GpuInfo& gpu_info) { in UseBufferForWeights() 66 FCFCAdd::FCFCAdd(const OperationDef& definition, const GpuInfo& gpu_info) in FCFCAdd() 103 const GpuInfo& gpu_info, in GetFCFCAddKernelCode() 252 FCFCAdd CreateFCFCAdd(const GpuInfo& gpu_info, const OperationDef& definition, in CreateFCFCAdd() 275 FCFCAdd CreateFCFCAdd(const GpuInfo& gpu_info, const OperationDef& definition, in CreateFCFCAdd() 301 const GpuInfo& gpu_info, CalculationsPrecision precision, in TryFCFCAdd()
|
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/cl/ |
H A D | environment.cc | 52 bool IsGpuSupportsStorageType(const GpuInfo& gpu_info, in IsGpuSupportsStorageType() 74 bool IsGpuSupportsPrecision(const GpuInfo& gpu_info, in IsGpuSupportsPrecision() 188 TensorStorageType GetFastestStorageType(const GpuInfo& gpu_info) { in GetFastestStorageType() 213 const GpuInfo& gpu_info) { in GetStorageTypeWithMinimalMemoryConsumption() 251 bool CanUseSubBufferForImage2d(const GpuInfo& gpu_info) { in CanUseSubBufferForImage2d()
|
H A D | inference_context.cc | 67 bool IsBufferBased(const GpuInfo& gpu_info, const TensorStorageType& type) { in IsBufferBased() 88 const GpuInfo& gpu_info, ValueId id) { in GetTensorType() 141 const GpuInfo& gpu_info, in GetBufferAsignment() 221 void InferenceContext::ExecutionHints::Init(const GpuInfo& gpu_info) { in Init() 437 const GpuModel& gpu_model, const GpuInfo& gpu_info, in AllocateMemory() 481 const GpuModel& gpu_model, const GpuInfo& gpu_info, in AllocateBufferBasedTensors() 603 const GpuModel& gpu_model, const GpuInfo& gpu_info, in AllocateStrongShapesTensors() 683 const GpuInfo& gpu_info, in Tune() 996 const GpuInfo& gpu_info, in GetTotalBufferSizeForTensors()
|
/aosp_15_r20/external/tensorflow/tensorflow/core/kernels/ |
H A D | nccl_ops.cc | 109 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local 140 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local 176 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local 210 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local 246 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local
|
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/gl/ |
H A D | compiler.cc | 64 bool ExceedsMaxSize(const Object& object, const GpuInfo& gpu_info) { in ExceedsMaxSize() 72 ObjectType ChooseFastestObjectType(const GpuInfo& gpu_info) { in ChooseFastestObjectType() 76 ObjectType ChooseFastestRefObjectType(const GpuInfo& gpu_info, in ChooseFastestRefObjectType() 98 CompilerImpl(const NodeShader* node_shader, const GpuInfo* gpu_info, in CompilerImpl() 303 const GpuInfo* gpu_info, in NewCompiler()
|