1 /* Copyright 2020 The TensorFlow Authors. All Rights Reserved.
2 
3 Licensed under the Apache License, Version 2.0 (the "License");
4 you may not use this file except in compliance with the License.
5 You may obtain a copy of the License at
6 
7     http://www.apache.org/licenses/LICENSE-2.0
8 
9 Unless required by applicable law or agreed to in writing, software
10 distributed under the License is distributed on an "AS IS" BASIS,
11 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 See the License for the specific language governing permissions and
13 limitations under the License.
14 ==============================================================================*/
15 
16 #ifndef TENSORFLOW_LITE_DELEGATES_GPU_COMMON_TASKS_CONVOLUTION_TRANSPOSED_3X3_H_
17 #define TENSORFLOW_LITE_DELEGATES_GPU_COMMON_TASKS_CONVOLUTION_TRANSPOSED_3X3_H_
18 
19 #include <vector>
20 
21 #include "tensorflow/lite/delegates/gpu/common/data_type.h"
22 #include "tensorflow/lite/delegates/gpu/common/operations.h"
23 #include "tensorflow/lite/delegates/gpu/common/shape.h"
24 #include "tensorflow/lite/delegates/gpu/common/status.h"
25 #include "tensorflow/lite/delegates/gpu/common/task/buffer_desc.h"
26 #include "tensorflow/lite/delegates/gpu/common/task/gpu_operation.h"
27 #include "tensorflow/lite/delegates/gpu/common/task/tensor_desc.h"
28 #include "tensorflow/lite/delegates/gpu/common/task/tensor_linear_desc.h"
29 #include "tensorflow/lite/delegates/gpu/common/task/weights_conversion.h"
30 #include "tensorflow/lite/delegates/gpu/common/task/weights_layout.h"
31 #include "tensorflow/lite/delegates/gpu/common/tensor.h"
32 #include "tensorflow/lite/delegates/gpu/common/types.h"
33 
34 namespace tflite {
35 namespace gpu {
36 
37 class ConvolutionTransposed3x3 : public GPUOperation {
38  public:
39   ConvolutionTransposed3x3() = default;
40   void GetPossibleKernelWorkGroups(
41       TuningType tuning_type, const GpuInfo& gpu_info,
42       const KernelInfo& kernel_info,
43       std::vector<int3>* work_groups) const override;
44   absl::Status BindArguments(ArgumentsBinder* args) override;
45   int3 GetGridSize() const override;
46 
47   // Move only
48   ConvolutionTransposed3x3(ConvolutionTransposed3x3&& operation) = default;
49   ConvolutionTransposed3x3& operator=(ConvolutionTransposed3x3&& operation) =
50       default;
51   ConvolutionTransposed3x3(const ConvolutionTransposed3x3&) = delete;
52   ConvolutionTransposed3x3& operator=(const ConvolutionTransposed3x3&) = delete;
53 
GetWeightsDescription()54   WeightsDescription GetWeightsDescription() const {
55     WeightsDescription desc;
56     desc.layout = weights_layout_;
57     desc.spatial_remap = GetSpatialWeightsRemap();
58     return desc;
59   }
60 
61   enum class WeightsUploadType {
62     LOCAL_MEM_ASYNC,
63     LOCAL_MEM_BY_THREADS,
64     GLOBAL_MEM,
65     CONSTANT_MEM,
66   };
67 
68  private:
69   ConvolutionTransposed3x3(const OperationDef& definition,
70                            const GpuInfo& gpu_info, int2 padding);
71   friend ConvolutionTransposed3x3 CreateConvolutionTransposed3x3(
72       const GpuInfo& gpu_info, const OperationDef& definition,
73       const ConvolutionTransposedAttributes& attr);
74   friend ConvolutionTransposed3x3 CreateConvolutionTransposed3x3DynamicWeights(
75       const GpuInfo& gpu_info, const OperationDef& definition,
76       const ConvolutionTransposedAttributes& attr);
77 
78   void UploadWeights(
79       const tflite::gpu::Tensor<OHWI, DataType::FLOAT32>& weights);
80 
81   std::vector<int> GetSpatialWeightsRemap() const;
82 
83   std::string GenerateConvolutionTransposedCode(
84       const GpuInfo& gpu_info, const OperationDef& op_def,
85       ConvolutionTransposed3x3::WeightsUploadType weights_upload_type,
86       int2 padding, int3 work_group_launch_order);
87 
88   int2 padding_;
89   WeightsUploadType weights_upload_type_;
90   WeightsLayout weights_layout_;
91 };
92 
// Predicate over an operation definition and transposed-convolution
// attributes. Judging by the name, it reports whether ConvolutionTransposed3x3
// can handle that combination.
// NOTE(review): the actual acceptance criteria live in the implementation
// file and are not visible from this header -- confirm there before relying on
// any particular condition.
93 bool IsConvolutionTransposed3x3Supported(
94     const OperationDef& definition,
95     const ConvolutionTransposedAttributes& attr);
96 
// Factory that returns a ConvolutionTransposed3x3 by value for the given GPU,
// operation definition and attributes. It is declared a friend of the class,
// which gives it access to the private constructor.
// NOTE(review): presumably callers should first check
// IsConvolutionTransposed3x3Supported(); that precondition is not expressed in
// this header -- confirm against the implementation.
97 ConvolutionTransposed3x3 CreateConvolutionTransposed3x3(
98     const GpuInfo& gpu_info, const OperationDef& definition,
99     const ConvolutionTransposedAttributes& attr);
100 
// Factory with the same parameters and return type as
// CreateConvolutionTransposed3x3, also declared a friend of the class.
// NOTE(review): the "DynamicWeights" suffix suggests the weights are supplied
// at run time rather than taken from `attr`; this header does not show how the
// two factories differ -- confirm against the implementation.
101 ConvolutionTransposed3x3 CreateConvolutionTransposed3x3DynamicWeights(
102     const GpuInfo& gpu_info, const OperationDef& definition,
103     const ConvolutionTransposedAttributes& attr);
104 
105 }  // namespace gpu
106 }  // namespace tflite
107 
108 #endif  // TENSORFLOW_LITE_DELEGATES_GPU_COMMON_TASKS_CONVOLUTION_TRANSPOSED_3X3_H_
109