Home
last modified time | relevance | path

Searched defs:gpu_info (Results 1 – 25 of 114) sorted by relevance

12345

/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/selectors/
H A Dsimple_selectors.cc58 const GpuInfo& gpu_info) { in SelectLSTM()
68 const GpuInfo& gpu_info, in SelectPReLU()
74 const GpuInfo& gpu_info, in SelectPooling()
80 const MaxUnpooling2DAttributes& attr, const GpuInfo& gpu_info, in SelectMaxUnpooling()
105 const GpuInfo& gpu_info) { in SelectResampler()
120 const OperationDef& op_def, const GpuInfo& gpu_info, in SelectConcat()
142 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionDynamicWeights()
174 void SelectSplit(const SplitAttributes& attr, const GpuInfo& gpu_info, in SelectSplit()
197 const GpuInfo& gpu_info) { in SelectReduce()
226 const GpuInfo& gpu_info, const Padding2D& padding, in SelectWinograd4x4To36()
[all …]
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/task/
H A Dtensor_desc.cc84 std::string GetConversionForImage(const GpuInfo& gpu_info, DataType src_type, in GetConversionForImage()
98 std::string GetConversion(const GpuInfo& gpu_info, in GetConversion()
384 absl::Status TensorDescriptor::PerformConstExpr(const GpuInfo& gpu_info, in PerformConstExpr()
402 const GpuInfo& gpu_info, const std::string& selector, in PerformSelector()
463 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformReadSelector()
511 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformReadNearestSelector()
544 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformReadBilinearSelector()
617 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformReadPerChannelSelector()
695 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformWriteSelector()
714 const GpuInfo& gpu_info, const std::vector<std::string>& args, in PerformWriteLinearSelector()
[all …]
H A Dutil.cc28 std::string GetGlslConversion(const GpuInfo& gpu_info, DataType src_type, in GetGlslConversion()
136 int GetRecommendedBlockSizeForConv(const GpuInfo& gpu_info, in GetRecommendedBlockSizeForConv()
218 std::string GetTypeDeclaration(const GpuInfo& gpu_info, DataType data_type, in GetTypeDeclaration()
232 std::string GetZeroValue(const GpuInfo& gpu_info, DataType data_type, in GetZeroValue()
247 std::string GetOneValue(const GpuInfo& gpu_info, DataType data_type, in GetOneValue()
262 std::string GetTypeConversion(const GpuInfo& gpu_info, DataType src_type, in GetTypeConversion()
H A Dgpu_operation.cc196 const GpuInfo& gpu_info, GPUOperation* operation) { in FuseSimpleElemWithSimpleElem()
228 const GpuInfo& gpu_info, GPUOperation* operation) { in Fuse2InputElemWithSimpleElemAsFirstInput()
263 const GpuInfo& gpu_info, GPUOperation* operation) { in Fuse2InputElemWithSimpleElemAsSecondInput()
287 absl::Status GPUOperation::AddOperation(const GpuInfo& gpu_info, in AddOperation()
402 absl::Status GPUOperation::AssembleCode(const GpuInfo& gpu_info) { in AssembleCode()
438 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleDispatches()
455 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups()
545 absl::Status Fuse2InputElemWith2SimpleElem(const GpuInfo& gpu_info, in Fuse2InputElemWith2SimpleElem()
H A Dwork_group_picking.cc37 const GpuInfo& gpu_info, WorkGroupSizeAlignment z_alignment) { in GenerateWorkGroupSizesXYMultipleOf()
67 const GpuInfo& gpu_info, WorkGroupSizeAlignment z_alignment) { in GenerateWorkGroupSizesXMultipleOf()
92 void GetWorkGroupsAlignedToGrid(const GpuInfo& gpu_info, in GetWorkGroupsAlignedToGrid()
237 void GetPossibleWorkGroupsXYMultipleOf(int multiplier, const GpuInfo& gpu_info, in GetPossibleWorkGroupsXYMultipleOf()
246 void GetPossibleWorkGroupsXMultipleOf(int multiplier, const GpuInfo& gpu_info, in GetPossibleWorkGroupsXMultipleOf()
271 void GetPossibleWorkGroups(TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleWorkGroups()
293 void GetPossibleWorkGroupsConv(TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleWorkGroupsConv()
H A Darguments.cc186 absl::Status BufferToKernelLanguage(const GpuInfo& gpu_info, in BufferToKernelLanguage()
430 const GpuInfo& gpu_info, in Compile()
440 absl::Status Arguments::ResolveConstExprPass(const GpuInfo& gpu_info, in ResolveConstExprPass()
472 absl::Status Arguments::ResolveConstExpr(const GpuInfo& gpu_info, in ResolveConstExpr()
483 const GpuInfo& gpu_info, in ResolveSelectorsPass()
533 const GpuInfo& gpu_info, in ResolveSelector()
596 absl::Status Arguments::AddObjectsScalarArgs(const GpuInfo& gpu_info) { in AddObjectsScalarArgs()
632 absl::Status Arguments::ResolveKernelGlobalSpaceBuffers(const GpuInfo& gpu_info, in ResolveKernelGlobalSpaceBuffers()
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/tasks/
H A Ddepthwise_conv.cc85 std::string GetSrcXYCheck(const GpuInfo& gpu_info, in GetSrcXYCheck()
103 bool UseBuffersForWeights(const GpuInfo& gpu_info) { in UseBuffersForWeights()
131 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups()
141 std::string DepthwiseConv::GenerateSrcUpload(const GpuInfo& gpu_info) { in GenerateSrcUpload()
181 std::string DepthwiseConv::GenerateWeightsUpload(const GpuInfo& gpu_info) { in GenerateWeightsUpload()
218 std::string DepthwiseConv::GenerateCode(const GpuInfo& gpu_info) { in GenerateCode()
388 const GpuInfo& gpu_info, const OperationDef& definition, in CreateDepthwiseConvolution2D()
432 const GpuInfo& gpu_info, const OperationDef& definition, in CreateDepthwiseConvolution2DDynamicWeights()
454 const GpuInfo& gpu_info, const OperationDef& definition, in CreateDepthwiseConvolution3D()
H A Dconv_generic.cc175 const GpuInfo& gpu_info, const BHWC* dst_shape) in ConvGeneric()
201 const BHWC& weights_shape, const GpuInfo& gpu_info, in ConvGeneric()
213 const GpuInfo& gpu_info, const BHWC* dst_shape) in ConvGeneric()
238 const GpuInfo& gpu_info, const BHWDC* dst_shape) in ConvGeneric()
260 void ConvGeneric::GenerateCode(const GpuInfo& gpu_info) { in GenerateCode()
362 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups()
376 std::string ConvGeneric::GenerateConv(const GpuInfo& gpu_info, in GenerateConv()
1457 const GpuInfo& gpu_info, const OperationDef& definition, int src_depth, in GuessBestParamsApple()
1470 const GpuInfo& gpu_info, const OperationDef& definition, int src_depth, in GuessBestParams()
1823 const GpuInfo& gpu_info, const OperationDef& definition, in GuessBestParams()
[all …]
H A Dwinograd.cc52 std::string GetKernelWinograd4x4To36(const GpuInfo& gpu_info, in GetKernelWinograd4x4To36()
251 const GpuInfo& gpu_info) { in CreateWinograd4x4To36()
275 const GpuInfo& gpu_info) in Winograd4x4To36TileX6()
289 const OperationDef& op_def, const GpuInfo& gpu_info) { in GetWinograd4x4To36TileX6Code()
514 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups()
533 const GpuInfo& gpu_info, const OperationDef& definition, in CreateWinograd4x4To36TileX6()
570 const GpuInfo& gpu_info) in Winograd36To4x4Tile4x1()
581 const OperationDef& op_def, const GpuInfo& gpu_info) { in GetWinograd36To4x4Tile4x1Code()
732 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups()
751 const GpuInfo& gpu_info, const OperationDef& definition, in CreateWinograd36To4x4Tile4x1()
H A Delementwise.cc30 std::string GetOneInputCode(const GpuInfo& gpu_info, in GetOneInputCode()
249 const GpuInfo& gpu_info, const OperationDef& definition, in CreateElementwiseTwoInput()
275 const GpuInfo& gpu_info, const OperationDef& definition, in CreateElementwiseTwoInput()
305 ElementwiseDescriptor CreateElementwiseDesc(const GpuInfo& gpu_info, in CreateElementwiseDesc()
332 GPUOperation CreateElementwiseOneInput(const GpuInfo& gpu_info, in CreateElementwiseOneInput()
341 GPUOperation CreateElementwise(const GpuInfo& gpu_info, in CreateElementwise()
403 const GpuInfo& gpu_info, const OperationDef& definition, in CreateElementwiseOneInputWithBroadcast()
421 GPUOperation CreateElementwiseWithBroadcast(const GpuInfo& gpu_info, in CreateElementwiseWithBroadcast()
H A Dconvolution_transposed.cc32 bool UseBufferForWeights(const GpuInfo& gpu_info) { in UseBufferForWeights()
39 const GpuInfo& gpu_info) in ConvolutionTransposed()
84 const ConvolutionTransposed3DAttributes& attr, const GpuInfo& gpu_info) in ConvolutionTransposed()
132 const OperationDef& op_def, const GpuInfo& gpu_info, in GenerateConvolutionTransposedCode()
602 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups()
609 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposed()
622 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposed3D()
635 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposedDynamicWeights()
H A Ddepthwise_conv_3x3.cc31 const GpuInfo& gpu_info) in DepthwiseConv3x3()
56 const GpuInfo& gpu_info, const OperationDef& op_def, in GenerateDepthwiseConvCode()
306 TuningType tuning_type, const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups()
316 bool IsDepthwiseConv3x3Supported(const GpuInfo& gpu_info, in IsDepthwiseConv3x3Supported()
335 const GpuInfo& gpu_info, const OperationDef& definition, in CreateDepthwiseConv3x3()
H A Dfully_connected.cc33 bool UseBufferForWeights(const GpuInfo& gpu_info) { in UseBufferForWeights()
70 const GpuInfo& gpu_info) in FullyConnected()
105 const OperationDef& op_def, const GpuInfo& gpu_info, in GetFullyConnectedKernelCode()
220 FullyConnected CreateFullyConnected(const GpuInfo& gpu_info, in CreateFullyConnected()
236 FullyConnected CreateFullyConnected(const GpuInfo& gpu_info, in CreateFullyConnected()
H A Dconvolution_transposed_4x4.cc30 const GpuInfo& gpu_info) { in GetBestWeightsUploadType()
59 const OperationDef& definition, const GpuInfo& gpu_info) in ConvolutionTransposed4x4()
81 const GpuInfo& gpu_info, const OperationDef& op_def, in GenerateConvolutionTransposedCode()
403 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposed4x4()
416 const GpuInfo& gpu_info, const OperationDef& definition, in CreateConvolutionTransposed4x4DynamicWeights()
H A Dreduce.cc32 int GetMaximumWGTotalSize(const GpuInfo& gpu_info) { in GetMaximumWGTotalSize()
129 const OperationDef& definition, const GpuInfo& gpu_info) in Reduce()
177 const GpuInfo& gpu_info, in GetReduceKernelCode()
514 const GpuInfo& gpu_info, in GetPossibleKernelWorkGroups()
527 const GpuInfo& gpu_info) { in CreateReduce()
534 const OperationDef& definition, const GpuInfo& gpu_info) { in CreateReduce()
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/selectors/default/
H A Dconvolution_selector.cc37 const GpuInfo& gpu_info, const OperationDef& op_def, in SelectConvolutionAdreno()
50 const GpuInfo& gpu_info, const OperationDef& op_def) { in SelectConvolutionNVidia()
62 const GpuInfo& gpu_info, const OperationDef& op_def) { in SelectConvolutionApple()
80 const GpuInfo& gpu_info, const OperationDef& op_def, in SelectConvolution()
99 const GpuInfo& gpu_info, const OperationDef& op_def, in SelectConvolutionForWinograd()
108 const BHWC& dst_shape, const GpuInfo& gpu_info, in SelectConvolutionWithDynamicWeights()
118 const OHWI& weights_shape, const BHWC& dst_shape, const GpuInfo& gpu_info, in SelectConvolutionBatchedMatMul()
H A Ddw_convolution_selector.cc29 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionAdreno()
41 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionPowerVR()
53 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionMali()
71 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolutionApple()
87 const DepthwiseConvolution2DAttributes& attr, const GpuInfo& gpu_info, in SelectDWConvolution()
H A Dconvolution_transposed_selector.cc32 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposedAdreno()
50 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposedPowerVR()
76 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposedMali()
85 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposed()
104 const ConvolutionTransposedAttributes& attr, const GpuInfo& gpu_info, in SelectConvolutionTransposedWithDynamicWeights()
/aosp_15_r20/external/mesa3d/src/gallium/drivers/freedreno/
H A Dgmemtool.c65 struct gpu_info { struct
78 static const struct gpu_info gpu_infos[] = { argument
130 const struct gpu_info *gpu_info = NULL; in main() local
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/common/tasks/special/
H A Ddepthwise_conv_plus_1x1_conv.cc37 std::string MultiplyAccumulate(const GpuInfo& gpu_info, in MultiplyAccumulate()
163 void ThinPointwiseFuser::CreateConstantsGpuBuffer(const GpuInfo& gpu_info) { in CreateConstantsGpuBuffer()
216 bool ThinPointwiseFuser::IsNodeSupported(const GpuInfo& gpu_info, in IsNodeSupported()
316 bool ThinPointwiseFuser::ReserveNode(const GpuInfo& gpu_info, Node* node) { in ReserveNode()
353 void ThinPointwiseFuser::AddNode(const GpuInfo& gpu_info, Node* node) { in AddNode()
391 const GpuInfo& gpu_info, const DepthwiseConvolution2DAttributes& attr) { in AddDepthwiseConvNode()
500 void ThinPointwiseFuser::AddConvNode(const GpuInfo& gpu_info, in AddConvNode()
545 const GpuInfo& gpu_info, const GraphFloat32& graph, in Finalize()
617 const GpuInfo& gpu_info, CalculationsPrecision precision, in TryDepthwiseConvPlus1x1Conv()
H A Dfc_fc_add.cc32 bool UseBufferForWeights(const GpuInfo& gpu_info) { in UseBufferForWeights()
66 FCFCAdd::FCFCAdd(const OperationDef& definition, const GpuInfo& gpu_info) in FCFCAdd()
103 const GpuInfo& gpu_info, in GetFCFCAddKernelCode()
252 FCFCAdd CreateFCFCAdd(const GpuInfo& gpu_info, const OperationDef& definition, in CreateFCFCAdd()
275 FCFCAdd CreateFCFCAdd(const GpuInfo& gpu_info, const OperationDef& definition, in CreateFCFCAdd()
301 const GpuInfo& gpu_info, CalculationsPrecision precision, in TryFCFCAdd()
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/cl/
H A Denvironment.cc52 bool IsGpuSupportsStorageType(const GpuInfo& gpu_info, in IsGpuSupportsStorageType()
74 bool IsGpuSupportsPrecision(const GpuInfo& gpu_info, in IsGpuSupportsPrecision()
188 TensorStorageType GetFastestStorageType(const GpuInfo& gpu_info) { in GetFastestStorageType()
213 const GpuInfo& gpu_info) { in GetStorageTypeWithMinimalMemoryConsumption()
251 bool CanUseSubBufferForImage2d(const GpuInfo& gpu_info) { in CanUseSubBufferForImage2d()
H A Dinference_context.cc67 bool IsBufferBased(const GpuInfo& gpu_info, const TensorStorageType& type) { in IsBufferBased()
88 const GpuInfo& gpu_info, ValueId id) { in GetTensorType()
141 const GpuInfo& gpu_info, in GetBufferAsignment()
221 void InferenceContext::ExecutionHints::Init(const GpuInfo& gpu_info) { in Init()
437 const GpuModel& gpu_model, const GpuInfo& gpu_info, in AllocateMemory()
481 const GpuModel& gpu_model, const GpuInfo& gpu_info, in AllocateBufferBasedTensors()
603 const GpuModel& gpu_model, const GpuInfo& gpu_info, in AllocateStrongShapesTensors()
683 const GpuInfo& gpu_info, in Tune()
996 const GpuInfo& gpu_info, in GetTotalBufferSizeForTensors()
/aosp_15_r20/external/tensorflow/tensorflow/core/kernels/
H A Dnccl_ops.cc109 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local
140 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local
176 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local
210 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local
246 auto* gpu_info = c->device()->tensorflow_accelerator_device_info(); in ComputeAsync() local
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/gl/
H A Dcompiler.cc64 bool ExceedsMaxSize(const Object& object, const GpuInfo& gpu_info) { in ExceedsMaxSize()
72 ObjectType ChooseFastestObjectType(const GpuInfo& gpu_info) { in ChooseFastestObjectType()
76 ObjectType ChooseFastestRefObjectType(const GpuInfo& gpu_info, in ChooseFastestRefObjectType()
98 CompilerImpl(const NodeShader* node_shader, const GpuInfo* gpu_info, in CompilerImpl()
303 const GpuInfo* gpu_info, in NewCompiler()

12345