HomeSort by relevance Sort by last modified time
    Searched refs:input_address (Results 1 - 10 of 10) sorted by null

  /external/gemmlowp/meta/generators/
zip_Nx8_neon.py 21 def __init__(self, input_address, load, aggregator):
22 self.input_address = input_address
27 def GenerateZipLanes(emitter, registers, zip_lanes, input_address, stride):
34 input_address: register that contains the input address for the first lane.
41 last_address_register = input_address
44 lanes.append(ZipLane(input_address, registers.DoubleRegister(),
77 emitter.DereferenceIncrement(lane.input_address, alignment))
102 emitter.Dereference(lane.input_address, None))
107 emitter.Dereference(lane.input_address, None)
    [all...]
mul_Nx8_Mx8_neon.py 20 def __init__(self, input_address):
21 self.input_address = input_address
74 emitter.DereferenceIncrement(left_lanes.input_address, 64))
77 emitter.DereferenceIncrement(right_lanes.input_address, 64))
79 emitter.EmitPldOffset(left_lanes.input_address, emitter.ImmediateConstant(64))
80 emitter.EmitPldOffset(right_lanes.input_address,
120 emitter.DereferenceIncrement(left_lanes.input_address, 64))
123 emitter.DereferenceIncrement(right_lanes.input_address, 64))
125 emitter.EmitPldOffset(left_lanes.input_address, emitter.ImmediateConstant(64)
    [all...]
streams_common.py 37 def _GenerateInputs(emitter, registers, lanes_count, input_address, stride):
40 last_address_register = input_address
43 inputs.append(input_address)
69 for (row, input_address) in zip(block, inputs):
70 emitter.EmitVLoadE(8, elements_count, row, input_address, None)
206 elements_count, aggregators, input_address,
219 block, input_address, stride)
250 input_address = registers.MapOutputParameter('in')
272 aggregators, input_address, stride,
282 leftovers, aggregators, input_address,
    [all...]
transform_kernels_common.py 57 def Transform(self, emitter, registers, input_address, elements,
64 emitter.EmitVLoadAE(8, elements, load, input_address, None)
65 emitter.EmitPldOffset(input_address, emitter.ImmediateConstant(16))
103 def Transform(self, emitter, registers, input_address, elements,
110 emitter.EmitVLoadAE(8, elements, load, input_address, None)
111 emitter.EmitPldOffset(input_address, emitter.ImmediateConstant(32))
172 def Transform(self, emitter, registers, input_address, elements,
179 emitter.EmitVLoadAE(32, elements, load, input_address, None)
180 emitter.EmitPldOffset(input_address, emitter.ImmediateConstant(64))
253 def Transform(self, emitter, registers, input_address, elements
    [all...]
neon_emitter.py 717 input_address, stride):
722 input_deref = self.Dereference(input_address, None)
723 input_deref_increment = self.DereferenceIncrement(input_address, None)
729 self.EmitPld(input_address)
735 self.EmitPld(input_address)
746 self.EmitPld(input_address)
758 self.EmitPld(input_address)
771 self.EmitPld(input_address)
785 self.EmitPld(input_address)
793 self.EmitPld(input_address)
    [all...]
neon_emitter_64.py     [all...]
quantized_mul_kernels_common.py 19 def _ReadParams(emitter, registers, input_address, elements, min_register):
25 emitter.EmitVLoadAE(registers_count * 4, 32, registers, input_address, 64)
  /external/tensorflow/tensorflow/compiler/xla/service/gpu/
ir_emitter_unnested.cc     [all...]
ir_emitter.cc 672 llvm::Value* input_address = local
676 *function, {accumulator_addr, input_address}, accumulator_addr));
    [all...]
  /external/tensorflow/tensorflow/compiler/xla/service/cpu/
ir_emitter.cc     [all...]

Completed in 562 milliseconds