Lines Matching refs:std

30 const std::int32_t kMaxCacheFriendlySize = 24 * 1024;
33 void CacheFriendlyMatrixMatrix(std::uint8_t* scratch, const IN_TYPE* lhs, in CacheFriendlyMatrixMatrix()
34 const IN_TYPE* rhs, std::int32_t m, in CacheFriendlyMatrixMatrix()
35 std::int32_t n, std::int32_t k, OUT_TYPE* result, in CacheFriendlyMatrixMatrix()
36 std::int32_t result_stride, const F& operation) { in CacheFriendlyMatrixMatrix()
37 const std::int32_t rhs_size = n * k * sizeof(IN_TYPE); in CacheFriendlyMatrixMatrix()
39 const std::int32_t optimal_n = in CacheFriendlyMatrixMatrix()
40 std::max(1, 3 * (kMaxCacheFriendlySize / (k * 3))); in CacheFriendlyMatrixMatrix()
41 const std::int32_t chunks_count_less_one = n / optimal_n - 1; in CacheFriendlyMatrixMatrix()
42 const std::int32_t chunk_size = optimal_n * k; in CacheFriendlyMatrixMatrix()
48 const std::int32_t n_left = n - chunks_count_less_one * optimal_n; in CacheFriendlyMatrixMatrix()
60 GemmQuantized8BitOperation(std::int32_t lhs_offset, std::int32_t rhs_offset, in GemmQuantized8BitOperation()
61 std::int32_t sum_offset, std::int32_t multiplier, in GemmQuantized8BitOperation()
62 std::int32_t shift) in GemmQuantized8BitOperation()
69 void ExecuteMatrixMatrix(std::uint8_t* scratch, const std::uint8_t* lhs, in ExecuteMatrixMatrix()
70 const std::uint8_t* rhs, std::int32_t m, in ExecuteMatrixMatrix()
71 std::int32_t n, std::int32_t k, std::uint8_t* result, in ExecuteMatrixMatrix()
72 std::int32_t result_stride) const { in ExecuteMatrixMatrix()
77 void ExecuteCacheFriendlyMatrixMatrix(std::uint8_t* scratch, in ExecuteCacheFriendlyMatrixMatrix()
78 const std::uint8_t* lhs, in ExecuteCacheFriendlyMatrixMatrix()
79 const std::uint8_t* rhs, std::int32_t m, in ExecuteCacheFriendlyMatrixMatrix()
80 std::int32_t n, std::int32_t k, in ExecuteCacheFriendlyMatrixMatrix()
81 std::uint8_t* result, in ExecuteCacheFriendlyMatrixMatrix()
82 std::int32_t result_stride) const { in ExecuteCacheFriendlyMatrixMatrix()
87 static std::int32_t ScratchPerThread(std::int32_t m, std::int32_t n, in ScratchPerThread()
88 std::int32_t k) { in ScratchPerThread()
93 std::int32_t lhs_offset;
94 std::int32_t rhs_offset;
95 std::int32_t sum_offset;
96 std::int32_t multiplier;
97 std::int32_t shift;
102 GemmFloatOperation(std::int32_t lhs_offset, std::int32_t rhs_offset, in GemmFloatOperation()
108 void ExecuteMatrixMatrix(std::uint8_t* scratch, const std::uint8_t* lhs, in ExecuteMatrixMatrix()
109 const std::uint8_t* rhs, std::int32_t m, in ExecuteMatrixMatrix()
110 std::int32_t n, std::int32_t k, float* result, in ExecuteMatrixMatrix()
111 std::int32_t result_stride) const { in ExecuteMatrixMatrix()
116 void ExecuteCacheFriendlyMatrixMatrix(std::uint8_t* scratch, in ExecuteCacheFriendlyMatrixMatrix()
117 const std::uint8_t* lhs, in ExecuteCacheFriendlyMatrixMatrix()
118 const std::uint8_t* rhs, std::int32_t m, in ExecuteCacheFriendlyMatrixMatrix()
119 std::int32_t n, std::int32_t k, in ExecuteCacheFriendlyMatrixMatrix()
121 std::int32_t result_stride) const { in ExecuteCacheFriendlyMatrixMatrix()
126 static std::int32_t ScratchPerThread(std::int32_t m, std::int32_t n, in ScratchPerThread()
127 std::int32_t k) { in ScratchPerThread()
132 std::int32_t lhs_offset;
133 std::int32_t rhs_offset;
139 GemmInt32Operation(std::int32_t lhs_offset, std::int32_t rhs_offset) in GemmInt32Operation()
142 void ExecuteMatrixMatrix(std::uint8_t* scratch, const std::uint8_t* lhs, in ExecuteMatrixMatrix()
143 const std::uint8_t* rhs, std::int32_t m, in ExecuteMatrixMatrix()
144 std::int32_t n, std::int32_t k, std::int32_t* result, in ExecuteMatrixMatrix()
145 std::int32_t result_stride) const { in ExecuteMatrixMatrix()
150 void ExecuteCacheFriendlyMatrixMatrix(std::uint8_t* scratch, in ExecuteCacheFriendlyMatrixMatrix()
151 const std::uint8_t* lhs, in ExecuteCacheFriendlyMatrixMatrix()
152 const std::uint8_t* rhs, std::int32_t m, in ExecuteCacheFriendlyMatrixMatrix()
153 std::int32_t n, std::int32_t k, in ExecuteCacheFriendlyMatrixMatrix()
154 std::int32_t* result, in ExecuteCacheFriendlyMatrixMatrix()
155 std::int32_t result_stride) const { in ExecuteCacheFriendlyMatrixMatrix()
160 static std::int32_t ScratchPerThread(std::int32_t m, std::int32_t n, in ScratchPerThread()
161 std::int32_t k) { in ScratchPerThread()
166 std::int32_t lhs_offset;
167 std::int32_t rhs_offset;
172 std::int32_t gemm_q8_scratch(std::int32_t m, std::int32_t n, std::int32_t k, in gemm_q8_scratch()
173 std::int32_t max_threads) { in gemm_q8_scratch()
178 void multi_thread_gemm_q8(gemmlowp::WorkersPool* pool, std::int32_t max_threads, in multi_thread_gemm_q8()
179 std::uint8_t* scratch, const std::uint8_t* lhs, in multi_thread_gemm_q8()
180 const std::uint8_t* rhs, std::int32_t m, in multi_thread_gemm_q8()
181 std::int32_t n, std::int32_t k, in multi_thread_gemm_q8()
182 std::int32_t lhs_offset, std::int32_t rhs_offset, in multi_thread_gemm_q8()
183 std::int32_t sum_offset, std::int32_t multiplier, in multi_thread_gemm_q8()
184 std::int32_t shift, std::uint8_t* result) { in multi_thread_gemm_q8()
191 std::int32_t gemm_f_scratch(std::int32_t m, std::int32_t n, std::int32_t k, in gemm_f_scratch()
192 std::int32_t max_threads) { in gemm_f_scratch()
197 void multi_thread_gemm_f(gemmlowp::WorkersPool* pool, std::int32_t max_threads, in multi_thread_gemm_f()
198 std::uint8_t* scratch, const std::uint8_t* lhs, in multi_thread_gemm_f()
199 const std::uint8_t* rhs, std::int32_t m, in multi_thread_gemm_f()
200 std::int32_t n, std::int32_t k, in multi_thread_gemm_f()
201 std::int32_t lhs_offset, std::int32_t rhs_offset, in multi_thread_gemm_f()
208 std::int32_t gemm_i32_scratch(std::int32_t m, std::int32_t n, std::int32_t k, in gemm_i32_scratch()
209 std::int32_t max_threads) { in gemm_i32_scratch()
215 std::int32_t max_threads, std::uint8_t* scratch, in multi_thread_gemm_i32()
216 const std::uint8_t* lhs, const std::uint8_t* rhs, in multi_thread_gemm_i32()
217 std::int32_t m, std::int32_t n, std::int32_t k, in multi_thread_gemm_i32()
218 std::int32_t lhs_offset, std::int32_t rhs_offset, in multi_thread_gemm_i32()
219 std::int32_t* result) { in multi_thread_gemm_i32()