Lines Matching refs:aligned
76 def ZipName(rows, leftovers, aligned): argument
77 return zip_Nx8_neon.BuildName(rows, leftovers, aligned)
80 def GenerateZipRhs(emitter, aligned, cols, leftovers): argument
84 ZipName(3, leftovers, aligned),
92 ZipName(cols, leftovers, aligned),
109 def GenerateMulRows(emitter, result, result_type, lhs_add, rhs_add, aligned, argument
113 ZipName(rows, leftovers, aligned),
134 def GenerateQuantized8BitMul(emitter, aligned, rows, cols, leftovers): argument
137 GenerateMulRows(emitter, 'temp_result', 'int32', False, True, aligned, 3,
140 qnt_Nx8_neon.BuildMultiQuantizeName(aligned, 3),
150 GenerateMulRows(emitter, 'temp_result', 'int32', False, True, aligned, rows,
153 qnt_Nx8_neon.BuildMultiQuantizeName(aligned, rows),
159 def GenerateFullMul(emitter, result_type, aligned, rows, cols, leftovers): argument
161 GenerateMulRows(emitter, 'result_chunk', result_type, True, True, aligned, 3,
169 GenerateMulRows(emitter, 'result_chunk', result_type, True, True, aligned,
173 def BuildName(output_type, aligned, rows, cols, leftover): argument
175 if aligned:
209 def GenerateGemm(emitter, output_type, aligned, rows, cols, leftovers): argument
212 BuildName(output_type, aligned, rows, cols, leftovers),
221 GenerateZipRhs(emitter, aligned, cols, leftovers)
222 GenerateQuantized8BitMul(emitter, aligned, rows, cols, leftovers)
225 GenerateZipRhs(emitter, aligned, cols, leftovers)
226 GenerateFullMul(emitter, 'int32', aligned, rows, cols, leftovers)
229 GenerateZipRhs(emitter, aligned, cols, leftovers)
230 GenerateFullMul(emitter, 'float', aligned, rows, cols, leftovers)
237 def GenerateGemmCall(emitter, output_type, aligned, m_mod, n_mod, leftovers): argument
240 BuildName(output_type, aligned, m_mod, n_mod, leftovers)),
244 def GenerateGemmSwitch3(emitter, output_type, aligned, m_mod, n_mod): argument
251 GenerateGemmCall(emitter, output_type, aligned, m_mod, n_mod, leftovers)
258 def GenerateGemmSwitch2(emitter, output_type, aligned, m_mod): argument
265 GenerateGemmSwitch3(emitter, output_type, aligned, m_mod, n_mod)
272 def GenerateGemmSwitch1(emitter, output_type, aligned): argument
279 GenerateGemmSwitch2(emitter, output_type, aligned, m_mod)
345 for aligned in [True, False]:
349 GenerateGemm(emitter, output_type, aligned, rows, cols, leftover)