Source code for devices.xylo.syns61201.power_cycles_model

"""
Cycle count model for XyloAudio 2 SYNS61201
"""

from rockpool.typehints import FloatVector
from typing import Tuple
import samna
import numpy as np

XyloA2Config = samna.xyloCore2.configuration.XyloConfiguration

__all__ = ["cycles_model", "est_clock_freq"]


[docs]def cycles_model( config: XyloA2Config, input_sp: FloatVector = 1.0, hidden_sp: FloatVector = 1.0, output_sp: FloatVector = 1.0, ) -> Tuple[float, float]: """ Calculate the average number of cycles required for a given network architecture This function contains a model which estimates the number of master clock cycles required for the Xylo SNN SYNS61202 inference core to compute one time-step for a given chip configuration in ``config``. Use :py:func:`.devices.xylo.syns61201.config_from_specification` to obtain a chip configuration, along with :py:meth:`.Module.as_graph` and :py:func:`.devices.xylo.syns61201.mapper`, as described in the deployment tutorials for Xylo. By default the model provides a "worst-case" estimation, assuming that every neuron and every input channel fire on each time-step. If desired, real input rasters and real hidden and output spike rasters can be provided for analysis. Alternative spiking probabilities can also be provided as floats ``0..1``. Note that when estimating spiking probablility, only boolean values are relevant --- either a spike or no spike per time step per channel. Multiple events per bin cost the same as a single event. Args: config (XyloA2Config): A XyloAudio 2 configuration for which to calculate the cycle requirements input_sp (FloatVector): Either a floating-point number 0..1, specifying the average input firing rate, or an actual input spike raster to use in evaluation. Default: `1.0`; estimate a worst-case scenario hidden_sp (FloatVector): Either a floating-point number 0..1, specifying the average hidden neuron firing rate, or an actual hidden spike raster to use in evaluation. Default: `1.0`; estimate a worst-case scenario output_sp (FloatVector): Either a floating-point number 0..1, specifying the average output neuron firing rate, or an actual output spike raster to use in evaluation. Default: `1.0`; estimate a worst-case scenario Returns: Tuple[float, float]: (clk_cyles_reqd, additional_isyn2_ops) clk_cyles_reqd (float): The average number of master clock cycles required for this configuration, for the Xylo SNN core to compute one network `dt` additional_isyn2_ops (float): The average additional number of operations required when Isyn2 is enabled. Will be zero if Isyn2 is disabled. Note: These operations occur in parallel to Isyn1, and do not require additional master clock cycles. """ # - Cycle count magic numbers input_loop_cycles = 3.5 hidden_update_cycles = 7 output_isyn_update_cycles = 8 fixed_hidden_neuron_cycles = 19 fixed_output_neuron_spk_cycles = 12 # - Spiking probabilities if np.size(input_sp) > 1: input_spk_prob = np.count_nonzero(input_sp) / np.size(input_sp) else: input_spk_prob = input_sp if np.size(hidden_sp) > 1: hidden_spk_prob = np.count_nonzero(hidden_sp) / np.size(hidden_sp) else: hidden_spk_prob = hidden_sp if np.size(output_sp) > 1: output_spk_prob = np.count_nonzero(output_sp) / np.size(output_sp) else: output_spk_prob = output_sp # - Extract network shapes Nin, _ = np.array(config.input.weights).shape Nhid = len(config.reservoir.neurons) Nien = Nhid _, Nout = np.array(config.readout.weights).shape Noen = Nhid # - Is synapse 2 enabled? is_isyn2_enabled = config.synapse2_enable # - Average fanout for the network Nhid_fanout_avg = np.mean( np.sum(np.abs(np.sign(np.array(config.reservoir.weights))), axis=1) ) # - Number of alias sources and targets alias_target_count = np.zeros(Nhid) alias_source_count = np.zeros(Nhid) for id, n in enumerate(config.reservoir.neurons): if n.alias_target is not None: alias_target_count[n.alias_target] += 1 alias_source_count[id] += 1 is_alias_target_prob = np.mean(alias_target_count) is_alias_source_prob = np.mean(alias_source_count) additional_isyn2_ops = 0 # - Input spike processing single_input_neuron_cycles = input_spk_prob * Nien * input_loop_cycles input_spike_processing_cycles = Nin * (single_input_neuron_cycles + 1) additional_isyn2_ops += is_isyn2_enabled * (0.5 + 1) * input_spk_prob * Nin * Nien # - Hidden neuron Isyn single_hidden_neuron_isyn_cycles = ( Nhid_fanout_avg * hidden_update_cycles * hidden_spk_prob + 3 ) hidden_isyn_processing_cycles = single_hidden_neuron_isyn_cycles * Nhid additional_isyn2_ops += ( is_isyn2_enabled * (4 + 1) * Nhid_fanout_avg * hidden_spk_prob * Nhid ) # - Output neuron Isyn single_output_neuron_isyn_cycles = hidden_spk_prob * ( 1 + Nout * output_isyn_update_cycles ) output_isyn_processing_cycles = single_output_neuron_isyn_cycles * Noen # - Hidden neuron spiking var_hidden_neuron_cycles = ( max(hidden_spk_prob, is_alias_target_prob * is_alias_source_prob) * 2 + max( hidden_spk_prob * is_alias_target_prob, is_alias_target_prob * is_alias_source_prob, ) * 3 + hidden_spk_prob * 1 + max(hidden_spk_prob, is_alias_target_prob) * is_alias_source_prob * 1 ) total_single_hidden_neuron_spk_cycles = ( fixed_hidden_neuron_cycles + var_hidden_neuron_cycles ) hidden_spk_processing_cycles = total_single_hidden_neuron_spk_cycles * Nhid additional_isyn2_ops += is_isyn2_enabled * 1 * Nhid # - Output neuron spiking var_output_neuron_spk_cycles = 0 * output_spk_prob total_output_neuron_spk_cycles = ( fixed_output_neuron_spk_cycles + var_output_neuron_spk_cycles ) output_spk_processing_cycles = total_output_neuron_spk_cycles * Nout # - Total processing cycles est_processing_cycles = ( input_spike_processing_cycles + hidden_isyn_processing_cycles + output_isyn_processing_cycles + hidden_spk_processing_cycles + output_spk_processing_cycles ) return est_processing_cycles, additional_isyn2_ops
[docs]def est_clock_freq(config: XyloA2Config, dt: float, margin: float = 0.2): """ Estimate the required master clock frequency, to run a network in real-time This function will perform a worst-case analysis, assuming that every input channel, every hidden neuron and every output neuron fire an event on each `dt`. An additional margin is included (Default: 20%), to guarantee that the model will run in real time at the suggested master clock frequency. Args: config (XyloA2Config): A XyloAudio 2 configuration for which to estimate the required clock frequency dt (float): The required network `dt`, in seconds margin (float): The additional overhead safety margin to add to the estimation, as a fraction. Default: `0.2` (20%) """ cycles, _ = cycles_model(config) return cycles * (1 + margin) / dt