Searched refs:aggregators (Results 1 – 5 of 5) sorted by relevance
/external/gemmlowp/meta/generators/ |
D | mul_1x8_Mx8_neon.py | 14 def GenerateLoadMultiplyAggregate(emitter, registers, lanes_count, aggregators, argument 43 emitter.EmitVPadal('u16', aggregators[i], multiply_results[i]) 49 emitter.EmitVPadal('u16', aggregators[i + 4], multiply_results[i]) 87 def GenerateAggregatorReduceStore(emitter, registers, lanes_count, aggregators, argument 111 for aggregator in aggregators: 115 temp = aggregators[0] 116 emitter.EmitVPadd('u32', registers.Low(temp), registers.Low(aggregators[0]), 117 registers.Low(aggregators[1])) 118 emitter.EmitVPadd('u32', registers.High(temp), registers.Low(aggregators[2]), 119 registers.Low(aggregators[3])) [all …]
|
D | quantized_mul_kernels_common.py | 234 aggregators = [registers.QuadRegister() for unused_i in range(count)] 237 emitter.EmitVMov('i32', aggregators[i], emitter.ImmediateConstant(0)) 239 emitter.EmitVMov('i32', aggregators[i], aggregators[i - 3]) 240 return aggregators 243 def _Generate3x3LoadMultiplyAggregate(emitter, registers, aggregators, lhs, rhs, argument 270 emitter.EmitVPadal('u16', aggregators[0], temp[0]) 271 emitter.EmitVPadal('u16', aggregators[1], temp[1]) 272 emitter.EmitVPadal('u16', aggregators[2], temp[2]) 273 emitter.EmitVPadal('u16', aggregators[3], temp[3]) 291 emitter.EmitVPadal('u16', aggregators[4], temp[0]) [all …]
|
D | streams_common.py | 58 aggregators, inputs, output): argument 72 for (aggregator, row) in zip(aggregators, block): 88 aggregators, output_address): argument 92 emitter, registers, aggregators, output_address, 100 aggregators, output_address): argument 104 emitter, registers, aggregators, output_address, 111 def _GenerateAggregatorReduction(emitter, registers, aggregators, argument 122 for aggregator in aggregators: 125 reduced_count = (len(aggregators) + 3) / 4 126 reduced = aggregators[:reduced_count] [all …]
|
D | mul_Nx8_Mx8_neon.py | 51 aggregators = [] 54 aggregators.append(aggregator) 58 emitter.EmitVMov('i32', aggregator, aggregators[i - 3]) 60 return aggregators 64 right_lanes, aggregators, count): argument 97 emitter.EmitVPadal('u16', aggregators[i], multiply_results[i]) 109 right_lanes, aggregators, count, argument 138 emitter.EmitVPadal('u16', aggregators[0], temp[0]) 139 emitter.EmitVPadal('u16', aggregators[1], temp[1]) 140 emitter.EmitVPadal('u16', aggregators[2], temp[2]) [all …]
|
/external/gemmlowp/meta/ |
D | README | 18 specialized 8bit multiplication, aggregating to vector aggregators and then
|