# Source code for spaic.Backend.Backend

# -*- coding: utf-8 -*-
"""
Created on 2020/8/6
@project: SPAIC
@filename: Backend
@author: Hong Chaofei
@contact: hongchf@gmail.com
@description:
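Defines the backends used for network simulation, such as PyTorch, TensorFlow, CUDA and the Darwin chip, together with the corresponding differential-equation solvers such as Euler and second-order Runge-Kutta.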
"""
import sys
from abc import abstractmethod, ABC
from collections import OrderedDict
from typing import Dict
# from ..Network.BaseModule import BaseModule, VariableAgent, Op
import numpy as np
from ..Network.Operator import Op

# Module-level registry of backends; created empty here.
backends = {}


[docs]class Backend(ABC):
    '''
    Basic backend class. All specific backends should subclass it.
    The backend is a parameter for the build function and becomes an attribute of all objects defined
    in the frontend backend network in building process. These objects build their initial data
    and specified operations into the attributes of backend, according to _variables
    and _operations respectively. The data will update in each step according the computation graph.
    Args:
        dt (float, optional): the length of a backend timestep, in millisecond.
    Attributes:
        device (str): the desired device of returned tensor. Its value can be 'cpu' or 'cuda'. If None, uses
            the current device for the default tensor type.
        builded (bool): whether the object defined in the frontend backend network has been builded.
        time (float): current backend time, in millisecond.
        n_time_step (int): the num of current time step.

        _variables (OrderedDict): records all variables from the build function of frontend objects.
        _parameters_dict (OrderedDict): records the variables to be trained.
        _InitVariables_dict (OrderedDict): reserves a copy of the initialization variables for initialization.
        _graph_var_dicts (dict): has following format: {'variables_dict': self._variables, 'temp_dict': dict(), 'update_dict': dict(), 'reduce_dict': dict()},
            recording the intermediate value of variables in computation progress.

        basic_operate (dict): dictionary of basic operators, mapping from the operator names used in the frontend to
            the function objects implemented in the backend.
        _operations (list): records all basic operations from the build function of frontend objects, each of
            which has following format: [ret_var_name: str, operation_name, input_var_name1: str, input_var_name2 :str, ...].
        _graph_operations (list): redefine each basic operation, that is, add the corresponding keyword in the _graph_var_dicts to each variable,
            which has following format: [(dict_type, ret_var_name), operation_name, [(dict_type1, input_var_name1),(dict_type2, input_var_name2),...]].
        _standalone_operations (list): records all standalone operations from the build function of frontend objects,
            each of which has following format: (ret_var_name: str, function, input_var_names: list).
        _initial_operations (list): records all initial operations from the build function of frontend objects, each of
            which has following format: (ret_var_name: str, function, input_var_names: list).

        _monitors (list): records all monitors defined in the frontend network through the build function of the Monitor object.

    Methods:
        build_graph: build a computation graph before performing the calculation.
        graph_update_step: update value of _graph_var_dicts.
        initial_step: initialize network variables.
        update_step: update the return variables of standalone operations and basic operations and current backend time.
        r_update_step: update the return variables of basic operations without using graph_update_step().
        add_variable: add variables from front objects to _variables of Backend.
        add_backend_variable: add variables according to the specified backend.
        add_operation: add basic operations from front objects to _operations of Backend.
        register_standalone: add standalone operations from front objects to _standalone_operations of Backend.
        register_initial: add initial operations from front objects to _initial_operations of Backend.
    '''
    # Registries mapping an operator / initializer name to its callable.
    # They are declared on the class, so every instance that does not rebind
    # them shares the same two dictionaries.
    basic_operate = {}
    param_init_operate = {}

    # Name of the backend; the base class uses the literal string 'None'.
    backend_name = 'None'

    def __init__(self, dt=0.1):
        super(Backend, self).__init__()
        self.device = None
        self.runtime = None
        self.builded = False
        self.partition = None
        self.dt = dt  # the length of a backend timestep
        self.time = 0.0  # current backend time
        self.n_time_step = 0  # the num of current time step
        self._batch_size = 1

        self._variables = dict()  # build from orderedDict to Tuple
        self._update_dict = dict()
        self._reduce_dict = dict()
        self._temp_dict = dict()
        self._parameters_dict = dict()
        self._clamp_parameter_dict = dict()
        self._delay_dict = dict()  # store conduction delays
        self._SparseVariables_dict = dict()
        self._InitVariables_dict = dict()
        # self._variable_agent_dict: Dict[VariableAgent] = dict()
        # self._temp_agent_dict: Dict[VariableAgent] = dict()
        self._variable_agent_dict = dict()
        self._temp_agent_dict = dict()

        self._operations = list()
        self._standalone_operations = list()
        self._initial_operations = list()

        self._monitors = list()  # TODO: need to add to update
        self._stored_states = dict()  # TODO: store network self._variables in the dict
        self.full_enable_grad = False
        self.forward_build = False  # 标识连接间有没有一步delay

        self.basic_operate['threshold'] = self.threshold
        self.basic_operate['reset'] = self.reset
        self.basic_operate['var_linear'] = self.var_linear
        self.basic_operate['mat_linear'] = self.mat_linear
        self.basic_operate['mat_mult_weight'] = self.mat_mult_weight
        self.basic_operate['mat_mult_weight_complex'] = self.mat_mult_weight_complex
        self.basic_operate['mat_mult_weight_2complex'] = self.mat_mult_weight_2complex
        self.basic_operate['mat_mult_pre'] = self.mat_mult_pre
        self.basic_operate['mat_mult'] = self.mat_mult
        self.basic_operate['bmm'] = self.bmm
        self.basic_operate['ger'] = self.ger
        self.basic_operate['sparse_mat_mult_weight'] = self.sparse_mat_mult_weight
        self.basic_operate['var_mult'] = self.var_mult
        self.basic_operate['add'] = self.add
        self.basic_operate['minus'] = self.minus
        self.basic_operate['div'] = self.div
        self.basic_operate['cat'] = self.cat
        self.basic_operate['stack'] = self.stack
        self.basic_operate['permute'] = self.permute
        self.basic_operate['view'] = self.view
        self.basic_operate['assign'] = self.assign
        self.basic_operate['unsqueeze'] = self.unsqueeze

        self.basic_operate['reduce_sum'] = self.reduce_sum
        self.basic_operate['conv_2d'] = self.conv_2d
        self.basic_operate['conv_2d_complex'] = self.conv_2d_complex
        self.basic_operate['relu'] = self.relu

        self.basic_operate['sin'] = self.sin
        self.basic_operate['cos'] = self.cos
        self.basic_operate['tan'] = self.tan
        self.basic_operate['log'] = self.log
        self.basic_operate['log2'] = self.log2
        self.basic_operate['log10'] = self.log10

        self.basic_operate['upsample'] = self.upsample
        self.basic_operate['conv_max_pool2d'] = self.conv_max_pool2d
        self.basic_operate['conv_avg_pool2d'] = self.conv_avg_pool2d
        self.basic_operate['conv_add_bias'] = self.conv_add_bias
        self.basic_operate['max_pool2d'] = self.max_pool2d
        self.basic_operate['post_max_pool2d_complex'] = self.post_max_pool2d_complex
        self.basic_operate['avg_pool2d'] = self.avg_pool2d
        self.basic_operate['batchnorm2d'] = self.batchnorm2d
        self.basic_operate['dropout'] = self.dropout
        self.basic_operate['reshape_mat_mult'] = self.reshape_mat_mult
        self.basic_operate['exp'] = self.exp
        self.basic_operate['mult_sum_weight'] = self.mult_sum_weight
        self.basic_operate['im2col_indices'] = self.im2col_indices
        self.basic_operate['conv2d_flatten'] = self.conv2d_flatten
        self.basic_operate['feature_map_flatten'] = self.feature_map_flatten
        self.basic_operate['weight_norm'] = self.weight_norm
        self.basic_operate['to'] = self.to

        self.param_init_operate['uniform'] = self.uniform
        self.param_init_operate['normal'] = self.normal
        self.param_init_operate['xavier_uniform'] = self.xavier_uniform
        self.param_init_operate['xavier_noraml'] = self.xavier_normal
        self.param_init_operate['kaiming_uniform'] = self.kaiming_uniform
        self.param_init_operate['kaiming_normal'] = self.kaiming_normal
        self.param_init_operate['constant'] = self.constant
        self.param_init_operate['sparse'] = self.sparse

        # self._graph_var_dicts = {'variables_dict': self._variables, 'temp_dict': dict(), 'update_dict': dict(),
        #                          'reduce_dict': dict()}

        self._graph_operations = list()
        self._push_operations = list()
        self._fetch_operations = list()

[docs]    def set_batch_size(self, batch_size):
        self._batch_size = batch_size

[docs]    def get_batch_size(self):
        return self._batch_size

[docs]    def set_runtime(self, runtime):
        self.runtime = runtime

[docs]    def register_basic_op(self, name, op_function):
        """
        register the function as basic operation to backend's _basic_operation dict
        Args:
            name:
            op_function:

        Returns:

        """
        name = name.lower()
        assert callable(op_function)
        if name in self.basic_operate:
            raise ValueError(('A model with the name "%s" has already been registered') % name)

        self.basic_operate[name] = op_function

[docs]    def build_graph(self):
        '''
        Build a computation graph before performing the calculation.

        The method first runs initial_step(), then splits self._operations into
        three groups: push operations (no input), fetch operations (no output)
        and graph operations (both input and output). Every operation is executed
        once during the build so that its results are available to the operations
        that follow, its variable names are replaced by VariableAgent objects
        labeled with the dict they refer to ('variables_dict', 'update_dict',
        'reduce_dict' or 'temp_dict'), and it is appended to _push_operations,
        _graph_operations or _fetch_operations respectively.

        A state variable written by more than one operation is relabeled to
        'reduce_dict' and a reduce_sum_update operation is added to the graph to
        combine the collected values.

        Finally _graph_operations is converted to a tuple, set_func_grad() is
        called, and get_dependency() / get_place() are run.

        Raises:
            ValueError: if an operation has neither input nor output, if an input
                name is unknown, if a push operation writes to a name that is not
                in _variables, or if a variable read with the [updated] tag
                receives further writes after it has been reduced.
        '''
        from ..Network.BaseModule import VariableAgent

        # NOTE: variables_index and operation_type are not used further in this method.
        variables_index = {k: i for i, k in enumerate(self._variables.keys())}

        self.initial_step()

        operation_type = 'update_dict or temp_dict or reduce_dict'
        # traverse basic operations

        fetch_operations = []
        push_operations = []
        graph_operations = []
        # self._graph_operations = list()
        # self._push_operations = list()
        # self._fetch_operations = list()

        # Classify each operation by whether it has inputs and/or outputs.
        for op in self._operations:
            if len(op.output) == 0 and len(op.input) == 0:
                # functions with no input and output will not push into the computation graph
                raise ValueError(" Operation lacks both input and output can't be build")
            elif len(op.output) == 0:
                fetch_operations.append(op)
            elif len(op.input) == 0:
                push_operations.append(op)
            else:
                graph_operations.append(op)

        ################################
        ##  for push_operation build  ##
        ################################
        # update_dict: var_name -> single value written during this build.
        # reduce_dict: var_name -> list of values written by several operations.
        update_dict = dict()
        reduce_dict = dict()

        for ind, op in enumerate(push_operations):
            outputs = []
            agent_outputs = []
            # if the operation return one variable, then it is appended into a list, to accordant with multi-variable returns
            if len(op.output) == 1:
                outputs.append(op.func())
            else:
                outputs = op.func()
            # return variable is a list
            for ind, var_name in enumerate(op.output):
                if var_name in self._variables:
                    # when the same ret_var_name occurs more than once, op.output is added to the reduce_dict of _graph_var_dicts
                    if var_name in update_dict:
                        reduce_dict[var_name] = [update_dict[var_name], outputs[ind]]
                        agent_outputs.append(self._variable_agent_dict[var_name].new_labeled_agent('reduce_dict'))
                        # # add op.output into graph: reduce_dict
                        # self._graph_var_dicts['reduce_dict'][op.output] = []
                        # revise the first reduce operation
                        for gop in self._push_operations:
                            for var in gop.output:
                                assert isinstance(var, VariableAgent)
                                if var.var_name == var_name:
                                    var.dict_label = 'reduce_dict'
                                    break
                        del update_dict[var_name]
                    elif var_name in reduce_dict:
                        reduce_dict[var_name].append(outputs[ind])
                        agent_outputs.append(self._variable_agent_dict[var_name].new_labeled_agent('reduce_dict'))
                    else:
                        # In the push_operation, new data is directly pushed to update_dict, as
                        # there is no need to remain the last step variable value
                        update_dict[var_name] = outputs[ind]
                        agent_outputs.append(self._variable_agent_dict[var_name].new_labeled_agent('update_dict'))
                else:
                    raise ValueError("No state variable to get the input ")

            # add the operation to built graph
            op.output = agent_outputs
            for agent in agent_outputs:
                agent.set_funcs.append(op)
            self._push_operations.append(op)

        # for var_name in reduce_dict:
        #     # add the reduce_sum operation into the graph
        #     self._graph_operations.append(
        #         [[('update_dict', var_name)], self.reduce_sum_update, [('reduce_dict', var_name)]])

        #################################
        ##  for graph_operation build  ##
        #################################
        # temp_dict: values of outputs whose names are not state variables.
        temp_dict = dict()
        self.owners = set()
        # (var_name, number of reduce entries) recorded when a reduce variable is summed for an [updated] read.
        temp_reduce_sum_ops = []
        self._temp_agent_dict = dict()
        for ind, op in enumerate(graph_operations):
            inputs = []
            agent_inputs = []
            # Resolve every input name to its current value and to a labeled agent.
            for var_name in op.input:
                # try:
                #     var_name in self._variables
                # except:
                #     a = 1

                if '[updated]' in var_name:
                    # The [updated] tag asks for the value written during this step, when one exists.
                    var_name = var_name.replace("[updated]", "")

                    if var_name in update_dict:
                        inputs.append(update_dict[var_name])
                        agent_inputs.append(self._variable_agent_dict[var_name].new_labeled_agent('update_dict'))
                    elif var_name in reduce_dict:
                        # if the reduce_dict[var_name] is frozen: do reduce_sum operation before this op, and put the value to update_dict
                        # if not use the old variables dict

                        # The variable counts as frozen when no later graph operation lists it as an output.
                        frozen = True
                        op_len = len(graph_operations)
                        for search_id in range(ind + 1, op_len):
                            if var_name in graph_operations[search_id].output:
                                frozen = False
                        if frozen:  # all reduce_dict append ops have been done before this call
                            value = self.reduce_sum(self.stack(reduce_dict[var_name]))
                            inputs.append(value)
                            agent_inputs.append(self._variable_agent_dict[var_name].new_labeled_agent('update_dict'))
                            temp_reduce_sum_ops.append((var_name, len(reduce_dict[var_name])))
                            # add the reduce_sum operation into the graph
                            self._graph_operations.append(
                                Op([self._variable_agent_dict[var_name].new_labeled_agent('update_dict')],
                                   self.reduce_sum_update,
                                   [self._variable_agent_dict[var_name].new_labeled_agent('reduce_dict')],
                                   func=self.reduce_sum_update, owner=self, requires_grad=True))
                        else:
                            assert var_name in self._variables
                            inputs.append(self._variables[var_name])
                            agent_inputs.append(self._variable_agent_dict[var_name].new_labeled_agent('variables_dict'))
                    elif var_name in self._variables:
                        inputs.append(self._variables[var_name])
                        agent_inputs.append(self._variable_agent_dict[var_name].new_labeled_agent('variables_dict'))

                    else:
                        raise ValueError(" No State Variable [%s] in the update_dict" % var_name)
                elif var_name in self._variables:
                    inputs.append(self._variables[var_name])
                    # Create the agent on first use when none has been registered for this variable.
                    if var_name not in self._variable_agent_dict:
                        self._variable_agent_dict[var_name] = VariableAgent(self, var_name)
                    agent_inputs.append(self._variable_agent_dict[var_name].new_labeled_agent('variables_dict'))


                elif var_name in temp_dict:
                    inputs.append(temp_dict[var_name])
                    if var_name in self._temp_agent_dict:
                        agent_inputs.append(self._temp_agent_dict[var_name])
                    else:
                        raise ValueError("asking a temp variable that has not been declared")
                else:
                    raise ValueError(" No State Variable [%s] in the variable dict" % var_name)

            outputs = []
            agent_outputs = []
            # NOTE: graph_operations only holds operations with at least one output, so the first branch is not expected to run.
            if len(op.output) == 0:
                self.var_check(op.func, inputs)
                op.func(*inputs)
            else:
                self.var_check(op.func, inputs)
                self.remove_tensor(inputs)
                if len(op.output) == 1:
                    outputs.append(op.func(*inputs))

                else:
                    outputs = op.func(*inputs)
                # NOTE: this loop reuses the name `ind` of the enclosing loop; the outer value is only read
                # earlier in the iteration (frozen check above) and is rebound by enumerate on the next pass.
                for ind, var_name in enumerate(op.output):
                    if var_name in self._variables:
                        # when the same ret_var_name occurs more than once, op.output is added to the reduce_dict of _graph_var_dicts
                        if var_name in update_dict:
                            reduce_dict[var_name] = [update_dict[var_name], outputs[ind]]
                            agent_outputs.append(self._variable_agent_dict[var_name].new_labeled_agent('reduce_dict'))
                            # # add op.output into graph: reduce_dict
                            # revise the first reduce operation
                            # InGop stays True when the earlier writer is not found among the push operations.
                            InGop = True
                            for pop in self._push_operations:
                                tmp_label_outputs = pop.output
                                for var in pop.output:
                                    if var.var_name == var_name:
                                        var.dict_label = 'reduce_dict'
                                        InGop = False
                                        break
                                else:
                                    continue
                                break
                            # NOTE(review): the `if InGop` block below sits inside this loop and reuses the name
                            # `gop` for its own loop, so the output relabeling pass is repeated for every graph
                            # operation - confirm whether it was meant to run only once.
                            for gop in self._graph_operations:
                                # for all operations need the updated reduce_dict variable as input before reduce_sum are converted to use old variables_dict variables
                                for tmp_input in gop.input:
                                    if tmp_input.dict_label == 'update_dict' and tmp_input.var_name == var_name:
                                        tmp_input.dict_label = 'variables_dict'
                                if InGop:
                                    for gop in self._graph_operations:
                                        for output in gop.output:
                                            if output.var_name == var_name:
                                                output.dict_label = 'reduce_dict'
                                                break
                            del update_dict[var_name]
                        elif var_name in reduce_dict:
                            reduce_dict[var_name].append(outputs[ind])
                            agent_outputs.append(self._variable_agent_dict[var_name].new_labeled_agent('reduce_dict'))
                        else:
                            update_dict[var_name] = outputs[ind]
                            agent_outputs.append(self._variable_agent_dict[var_name].new_labeled_agent('update_dict'))
                    else:
                        # Output name is not a state variable: keep it as a temporary value.
                        temp_dict[var_name] = outputs[ind]
                        ### Whether allow duplication of name, choose allow recently.
                        agent_outputs.append(VariableAgent(self, var_name, dict_label='temp_dict'))
                        self._temp_agent_dict[var_name] = agent_outputs[-1]

                        ### If not allow duplication of name, use code bellow:
                        # if var_name in self._temp_agent_dict:
                        #     # raise ValueError("setting value to temp variable multiple times")
                        #     pass
                        #
                        # else:
                        #     agent_outputs.append(VariableAgent(self, var_name, dict_label='temp_dict'))
                        #     self._temp_agent_dict[var_name] = agent_outputs[-1]

            # add the operation to built graph
            op.input = agent_inputs
            op.output = agent_outputs
            for agent in agent_inputs:
                agent.get_funcs.append(op)
            for agent in agent_outputs:
                agent.set_funcs.append(op)
            self._graph_operations.append(op)

        # A variable summed for an [updated] read must not have received further writes afterwards.
        for reduce_op in temp_reduce_sum_ops:
            reduce_len = len(reduce_dict[reduce_op[0]])
            if reduce_len != reduce_op[1]:
                raise ValueError(
                    "Can't use [updated] tag for variable: %s, as it is a reduce_dict variable which is have updating conflict" %
                    reduce_op[0])
            else:
                del reduce_dict[reduce_op[0]]
        # for reduced variables that not used within [update]
        for var_name in reduce_dict:
            # add the reduce_sum operation into the graph
            self._graph_operations.append(
                Op([self._variable_agent_dict[var_name].new_labeled_agent('update_dict')],
                   self.reduce_sum_update, [self._variable_agent_dict[var_name].new_labeled_agent('reduce_dict')],
                   func=self.reduce_sum_update, owner=self, requires_grad=True))

        #################################
        ##  for fetch_operation build  ##
        #################################
        for ind, op in enumerate(fetch_operations):
            inputs = []
            agent_inputs = []
            for var_name in op.input:
                if '[updated]' in var_name:
                    # there is no need to have updated tag, as all variables computed in graph_operation have benn updated
                    var_name = var_name.replace("[updated]", "")
                if var_name in self._variables:
                    inputs.append(self._variables[var_name])
                    agent_inputs.append(self._variable_agent_dict[var_name].new_labeled_agent('variables_dict'))
                # elif var_name in temp_dict:
                #     inputs.append(temp_dict[var_name])
                #     label_inputs.append(('temp_dict', var_name))
                else:
                    raise ValueError(" No State Variable [%s] in the update_dict" % var_name)

            self.var_check(op.func, inputs)
            op.func(*inputs)

            op.input = agent_inputs
            # add the operation to built graph
            self._fetch_operations.append(op)

        # self._variables.update(update_dict)
        # for ii in range(len(self._graph_operations)):
        #     self._graph_operations[ii] = tuple(self._graph_operations[ii])
        # Freeze the graph; after this point _graph_operations no longer supports append.
        self._graph_operations = tuple(self._graph_operations)

        self.set_func_grad()

        self.groups, self.isolate = self.get_dependency()
        self.get_place()

[docs]    def get_dependency(self):
        import matplotlib.pyplot as plt
        import networkx as nx
        if self.partition:
            g = nx.DiGraph()
            for ind, op in enumerate(self._graph_operations):
                op.set_identifier(ind)
            g.add_nodes_from([op._identifier for op in self._graph_operations])
            for ind, op in enumerate(self._graph_operations):
                for output in op.output:
                    for get_op in output.get_funcs:
                        if op._identifier < get_op._identifier:
                            g.add_edge(op._identifier, get_op._identifier)

            plt.figure(figsize=(100, 100))
            nx.draw_networkx(g)
            # plt.savefig('test.jpg')

            isolate = []
            leaf = []
            for i in range(len(self._graph_operations)):
                if g.degree(i) == 0:
                    isolate.append(i)
                else:
                    if g.out_degree(i) == 0:
                        leaf.append(i)

            g = g.to_undirected()
            groups = set()
            for i in leaf:
                group = frozenset(nx.dfs_tree(g, i))
                groups.add(group)
        else:
            groups = [self._graph_operations]
            isolate = []
        return groups, isolate

[docs]    def set_func_grad(self):
        if self.full_enable_grad:
            for op in self._operations:
                op.requires_grad = True
            for op in self._initial_operations:
                op.requires_grad = True

        for op in self._operations:
            if op.requires_grad:
                op.func = self.to_grad_func(op.func)
            else:
                op.func = self.to_nograd_func(op.func)

        for op in self._initial_operations:
            if op.requires_grad:
                op.func = self.to_grad_func(op.func)
            else:
                op.func = self.to_nograd_func(op.func)

[docs]    def var_check(self, op, *args):
        '''
        For specified operation, check the type or the shape of input variables.
        '''
        if op == 'mat_mult':
            if args[0][0].shape[1] != args[0][1].shape[0]:
                raise ValueError("%s and %s do not match" % (args[0].shape, args[1].shape))
        pass

[docs]    def graph_update_step_r(self):

        for op in self._graph_operations:
            inputs = []
            for var in op.input:
                inputs.append(self._graph_var_dicts[var[0]][var[1]])

            if op.output[0] is None:
                op.func(*inputs)
            elif op.output[0] == 'reduce_dict':
                self._graph_var_dicts['reduce_dict'][op.output[1]].append(op.func(*inputs))
            else:
                self._graph_var_dicts[op.output[0]][op.output[1]] = op.func(*inputs)

            # if '[updated]' in op.output[1]:
            #     op_name = op.output[1].strip('[updated]')
            #     if op_name in self._graph_var_dicts['update_dict'] and op_name in self._graph_var_dicts['variables_dict']:
            #         self._graph_var_dicts['update_dict'][op_name] = self._graph_var_dicts['temp_dict'][op.output[1]]  # 更新返回名中带[updated]的变量的值

        return  # tuple(self._graph_var_dicts['variables_dict'].values())

[docs]    def get_place(self):
        if self.partition:
            for ind, g in enumerate(self.groups):
                c = []
                g = [self._graph_operations[x] for x in g]
                for op in g:
                    for input in op.input:
                        if input._var_name.split(':')[-1] == '{weight}':
                            c.append(self._variables[input._var_name].device)
                place = max(set(c), key=c.count)
                for op in g:
                    op.place = place
            g = [self._graph_operations[x] for x in self.isolate]
            for ind, op in enumerate(g):
                for input in op.input:
                    if input._var_name.split(':')[-1] == '{weight}':
                        op.place = self._variables[input._var_name].device
                        break
                    else:
                        op.place = self.device[ind % self.device_count]
        else:
            for ind, op in enumerate(self._graph_operations):
                for input in op.input:
                    if input._var_name.split(':')[-1] == '{weight}':
                        op.place = self._variables[input._var_name].device
                        break
                    else:
                        op.place = self.device[ind % self.device_count]

[docs]    def graph_update_step(self):
        for op in self._graph_operations:
            # for inputs
            inputs = []
            for var in op.input:
                inputs.append(var.value)
            # compute the operation
            result = op.func(*inputs)
            if len(op.output) == 1: result = [result]
            # assign the result variables
            for ind, var in enumerate(op.output):
                var.value = result[ind]

[docs]    def push_update_step(self):
        for op in self._push_operations:
            result = op.func()
            if len(op.output) == 1: result = [result]
            for ind, var in enumerate(op.output):
                var.value = result[ind]

[docs]    def fetch_update_step(self):
        for op in self._fetch_operations:
            # for inputs
            inputs = []
            for var in op.input:
                inputs.append(var.value)
            op.func(*inputs)

[docs]    def initial_step(self):
        '''
        Initialize network variables.
        '''

        # Initialize the current backend time and the num of time step
        self.last_time = 0.0
        self.time = 0.0  # current backend time
        self.n_time_step = 0
        for key, value in self._variables.items():
            if '[stay]' in key:
                self._InitVariables_dict[key] = self._variables[key].detach()

        # Initialize untrainable variables
        self._variables.clear()

        # Initialize system spacial variables such as backend dt
        self._variables['[dt]'] = self.dt
        self._variables['[batch_size]'] = self._batch_size

        for key, value in self._InitVariables_dict.items():
            self._variables[key] = value

        # Initialize the trainable parameters
        for key, clamp_code in self._clamp_parameter_dict.items():
            clamp_code[0](*clamp_code[1])

        for key, value in self._parameters_dict.items():
            self._variables[key] = value

        for key, value in self._SparseVariables_dict.items():
            index_name = key + '_sparse_index'
            value_name = key + '_sparse_value'
            shape_name = key + '_sparse_shape'
            if index_name in self._variables.keys() and value_name in self._variables.keys():
                self._variables[key] = self.sparse_to_dense(index_name, value_name, shape_name)

        # Initialize the record of Monitor
        for monitor in self._monitors:
            monitor.init_record()

        # Traverse initial operations
        for op in self._initial_operations:
            inputs = []
            for var_name in op.input:
                if var_name in self._variables:
                    inputs.append(self._variables[var_name])
                else:
                    raise ValueError(" No State Variable [%s] in the variable dict" % var_name)
            if op.output is None:
                op.func(*inputs)
            else:
                result = op.func(*inputs)
                if len(op.output) == 1: result = [result]
                for ind, output in enumerate(op.output):
                    self._variables[output] = result[ind]

        # Change intial variable's batch_size
        for key in self._variables.keys():
            if hasattr(self._variables[key], 'shape'):
                shape = self._variables[key].shape
                if self._variables[key].ndim > 1 and shape[0] == 1 and (key not in self._parameters_dict):
                    expand_shape = -np.ones_like(shape, dtype=int)
                    expand_shape[0] = self._batch_size
                    self._variables[key] = self._variables[key].expand(tuple(expand_shape))

            # if '{O}' in key:
            #     o_shape = self._variables[key].shape
            #
            #     shape = []
            #     for s in o_shape:
            #         if s != 1:
            #             shape.append(s)
            #         else:
            #             shape.append(self._batch_size)
            #     self._variables[key] = torch.zeros(shape, dtype=torch.float32, device=self.device)

[docs]    def clear_step(self):
        '''

        Returns:

        '''

        self._operations = list()
        self._graph_operations = list()
        self._push_operations = list()
        self._fetch_operations = list()

[docs]    def initial_continue_step(self):
        '''
        Initialize network for continuous run.
        '''

        self.last_time = self.time

[docs]    def update_step(self):
        '''
        Update the return variables of standalone operations and basic operations and current backend time.
        Returns:
            tuple(self._variables.values())
        '''

        # push input data
        self.push_update_step()

        # static graph compuation
        if self.device_count > 1:
            self.graph_update_step_multigpu()
        else:
            self.graph_update_step()

        # Update time and state variables
        self.n_time_step += 1
        self.time = round(self.n_time_step * self.dt, 2)
        self._variables.update(self._update_dict)

        # fetch output data
        self.fetch_update_step()

        # Record Variables
        for monitor in self._monitors:
            monitor.update_step(self._variables)

        self._reduce_dict = dict()
        self._temp_dict = dict()
        self._update_dict = dict()

        return tuple(self._variables.values())

[docs]    def update_time_steps(self):
        while (self.runtime > self.time - self.last_time):
            self.update_step()

[docs]    def r_update_step(self):
        '''
        Update the return variables of basic operations without using graph_update_step().
        Returns:
            tuple(self._variables.values())
        '''

        reduce_dict = dict()
        self._graph_var_dicts['update_dict'].clear()
        self._graph_var_dicts['temp_dict'].clear()
        self._graph_var_dicts['reduce_dict'].clear()

        # Traverse standalone operations
        for op in self._standalone_operations:
            inputs = []
            for var_name in op.input:
                if 'pytorch' in backends:
                    inputs.append(self._variables[var_name])
                else:
                    inputs.append(self.to_numpy(self._variables[var_name]))

            if op.output is None:
                op.func(*inputs)
            else:
                if 'pytorch' in backends:
                    self._variables[op.output] = op.func(*inputs)
                else:
                    self._variables[op.output] = self.to_tensor(op.func(*inputs))

        # update one time_step
        for op in self._operations:
            if op.output in self._graph_var_dicts['variables_dict']:
                inputs = []
                for var_name in op.input:
                    if '[updated]' in var_name:
                        var_name = var_name.replace("[updated]", "")
                        if var_name in self._graph_var_dicts['update_dict']:
                            inputs.append(self._graph_var_dicts['update_dict'][var_name])
                        else:
                            raise ValueError(" No State Variable [%s] in the update_dict" % var_name)
                    elif var_name in self._graph_var_dicts['variables_dict']:
                        inputs.append(self._graph_var_dicts['variables_dict'][var_name])
                    elif var_name in self._graph_var_dicts['temp_dict']:
                        inputs.append(self._graph_var_dicts['temp_dict'][var_name])
                    else:
                        raise ValueError(" No State Variable [%s] in the variable dict" % var_name)

                if op.output in self._graph_var_dicts['update_dict']:
                    if op.output in self._graph_var_dicts['reduce_dict']:
                        self._graph_var_dicts['reduce_dict'][op.output].append(op.func(*inputs))
                    else:
                        self._graph_var_dicts['reduce_dict'][op.output] = [
                            self._graph_var_dicts['update_dict'][op.output],
                            op.func(*inputs)]
                else:
                    self._graph_var_dicts['update_dict'][op.output] = op.func(*inputs)
                    pass

            else:
                inputs = []
                for var_name in op.input:
                    if '[updated]' in var_name:
                        var_name = var_name.replace("[updated]", "")
                        if var_name in self._graph_var_dicts['update_dict']:
                            inputs.append(self._graph_var_dicts['update_dict'][var_name])
                        else:
                            raise ValueError(" No State Variable [%s] in the update_dict" % var_name)
                    elif var_name in self._graph_var_dicts['variables_dict']:
                        inputs.append(self._graph_var_dicts['variables_dict'][var_name])
                    elif var_name in self._graph_var_dicts['temp_dict']:
                        inputs.append(self._graph_var_dicts['temp_dict'][var_name])
                    else:
                        raise ValueError(" No State Variable [%s] in the variable dict" % var_name)
                self._graph_var_dicts['temp_dict'][op.output] = op.func(*inputs)

                if '[updated]' in op.output:
                    op_name = op.output.replace("[updated]", "")
                    if op_name in self._graph_var_dicts['update_dict']:
                        self._graph_var_dicts['update_dict'][op_name] = self._graph_var_dicts['temp_dict'][
                            op.output]  # update the variable in update_dict
                    else:
                        raise ValueError(" No State Variable [%s] in the update_dict" % var_name)

        # Update reduce_dict into update_dict
        for key, value in reduce_dict.items():
            value = self.stack(value)
            self._graph_var_dicts['update_dict'][key] = self.reduce_sum(value)
            self._graph_var_dicts['update_dict'][key] = []

        # update time
        self.n_time_step += 1
        self.time = round(self.n_time_step * self.dt, 2)

        self._graph_var_dicts['variables_dict'].update(self._graph_var_dicts['update_dict'])

        # Record Variables
        for monitor in self._monitors:
            monitor.update_step(self._graph_var_dicts)

        return tuple(self._variables.values())

[docs]    def reduce_sum_update(self, value):
        reduced = self.reduce_sum(self.stack(value))
        return reduced

[docs]    def get_varialble(self, name):

        if name in self._parameters_dict:
            return self._parameters_dict[name]
        elif name in self._variables:
            return self._variables[name]
        else:
            raise ValueError("not found variable:%s in the backend" % name)

[docs]    def set_variable_value(self, name, value, is_parameter):
        '''
        Set the backend value, in specific Backend
        Args:
            name:
            value:
            is_parameter:

        Returns:

        '''
        NotImplementedError()

[docs]    def add_variable(self, module, name: str, shape, value=None, is_parameter=False, is_sparse=False,
                     init=None, init_param=None,
                     min=None, max=None, is_constant=False, prefer_device=None):
        '''
        Add variables from front objects to _variables of Backend and get copies to assign to _parameters_dict and _InitVariables_dict.
        Args:
            module (spaic.BaseModule) : the parent Module object the variable is belongs to
            name (str): the name of the added variable
            shape (list, int): the shape of the variable
            value (optional): the value of the variable
            is_parameter (bool, optional): whether the variable is trainable
            init (optional):
        '''
        from ..IO.Initializer import BaseInitializer
        from ..Network.BaseModule import VariableAgent
        if is_parameter:
            if isinstance(value, BaseInitializer):
                self._parameters_dict[name] = self.add_backend_variable(module, name, shape, None, grad=True,
                                                                        is_sparse=is_sparse,
                                                                        init=value.__class__.__name__,
                                                                        init_param=value.__dict__,
                                                                        prefer_device=prefer_device)
            else:
                self._parameters_dict[name] = self.add_backend_variable(module, name, shape, value, grad=True,
                                                                        is_sparse=is_sparse,
                                                                        init=init, init_param=init_param,
                                                                        prefer_device=prefer_device)
            # store clamp operations
            if min is not None and max is not None:
                self._clamp_parameter_dict[name] = (self.clamp_, [self._parameters_dict[name], min, max])
            elif min is not None:
                self._clamp_parameter_dict[name] = (self.clamp_min_, [self._parameters_dict[name], min])
            elif max is not None:
                self._clamp_parameter_dict[name] = (self.clamp_max_, [self._parameters_dict[name], max])


        # 稀疏矩阵weight非叶子节点，反传的时候更新的是weight中的value,但前向计算的时候用的是weight,所以对于稀疏矩阵要单独用个dict记录以便初始化
        elif is_sparse:
            self._SparseVariables_dict[name] = self.add_backend_variable(module, name, shape, value, grad=True,
                                                                         is_sparse=is_sparse, init=init,
                                                                         init_param=init_param,
                                                                         prefer_device=prefer_device)
        elif is_constant:
            self._InitVariables_dict[name] = value
        elif isinstance(value, BaseInitializer):
            self._InitVariables_dict[name] = self.add_backend_variable(module, name, shape, None, grad=False,
                                                                       is_sparse=is_sparse,
                                                                       init=value.__class__.__name__,
                                                                       init_param=value.__dict__,
                                                                       prefer_device=prefer_device)
        else:
            self._InitVariables_dict[name] = self.add_backend_variable(module, name, shape, value, grad=False,
                                                                       is_sparse=is_sparse, init=init,
                                                                       init_param=init_param,
                                                                       prefer_device=prefer_device)

        var_agent = VariableAgent(self, name, is_parameter)
        self._variable_agent_dict[name] = var_agent
        return var_agent

[docs]    def has_variable(self, name: str):
        if name.endswith('[updated]'):
            name = name.replace("[updated]", "")
        elif name.endswith('[stay]'):
            name = name.replace("[stay]", "")

        if name in self._variables:
            return True
        elif name in self._InitVariables_dict:
            return True
        elif name in self._parameters_dict:
            return True
        elif name in self._SparseVariables_dict:
            return True
        else:
            return False

[docs]    def add_delay(self, var_name, max_delay):
        from ..Network.DelayQueue import DelayQueue
        max_len = int(max_delay / self.dt)
        if var_name in self._delay_dict:
            if self._delay_dict[var_name].max_len < max_len:
                self._delay_dict[var_name].max_len = max_len
        else:
            self._delay_dict[var_name] = DelayQueue(var_name, max_len, self)
            self.register_initial(Op(None, self._delay_dict[var_name].initial, [var_name, '[batch_size]'], owner=self,
                                     requires_grad=True))
            self.register_standalone(
                Op(None, self._delay_dict[var_name].push, [var_name, ], owner=self, requires_grad=True))
        return self._delay_dict[var_name]

[docs]    @abstractmethod
    def add_backend_variable(self, module, name, shape, value=None, grad=False, is_sparse=False, init=None,
                             init_param=None):
        '''
        This method will be overwritten by different subclasses to add variables to _variables of specified backend.
        Args:
            module (spaic.BaseModule) : the parent Module object the variable is belongs to
            name (str): the name of the added variable
            shape (list, int): the shape of the variable
            value (optional): the value of the variable
            is_parameter (bool, optional): whether the variable is trainable
            init (optinal):
            grad (bool, optional): whether to use grad
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def sparse_to_dense(self, index_name, value_name, shape_name):
        '''
        This method will be sparse matrix to dense matrix.
        Args:
            index_name (str)
            value_name (str)
            shape_name (str)
        '''
        NotImplementedError()

[docs]    def add_operation(self, op):
        '''
        Add basic operations from front objects to _operations of Backend.
        '''
        # op = Op()
        from ..Network.BaseModule import BaseModule
        assert isinstance(op, Op)
        if isinstance(op.output, str):
            op.output = [op.output]
        elif op.output is None:
            op.output = []
        if isinstance(op.input, str):
            op.input = [op.input]
        elif op.input is None:
            op.input = []

        if op.func_name in self.basic_operate:
            op.func = self.basic_operate[op.func_name]
            if not isinstance(op.owner, Backend):
                assert isinstance(op.owner, BaseModule)
                op.owner._ops.append(op)
            op.operation_type = "_operations"
            self._operations.append(op)
        elif callable(op.func_name):
            self.register_standalone(op)
        else:
            raise ValueError("No operation %s in basic_operate" % op.func)

[docs]    def register_standalone(self, op):
        '''
        Add standalone operations from front objects to _standalone_operations of Backend.
        '''
        from ..Network.BaseModule import BaseModule
        assert isinstance(op, Op)
        if isinstance(op.output, str):
            op.output = [op.output]
        elif op.output is None:
            op.output = []
        if isinstance(op.input, str):
            op.input = [op.input]
        elif op.input is None:
            op.input = []
        if not isinstance(op.owner, Backend):
            assert isinstance(op.owner, BaseModule)
            op.owner._ops.append(op)

        assert callable(op.func_name)
        op.func = op.func_name
        op.operation_type = "_operations"
        self._operations.append(op)

[docs]    def register_initial(self, op):
        '''
        Add initial operations from front objects to _initial_operations of Backend..
        op  = {output, func, input, owner, place, requires_grad}
        '''
        from ..Network.BaseModule import BaseModule
        assert isinstance(op, Op)
        if isinstance(op.func, str):
            if op.func_name in self.basic_operate:
                op.func = self.basic_operate[op.func_name]
            else:
                raise ValueError("No operation %s in basic_operate" % op.func)
        else:
            assert callable(op.func_name)
            op.func = op.func_name
        if isinstance(op.input, str):
            op.input = [op.input]
        elif op.input is None:
            op.input = []
        if isinstance(op.output, str):
            op.output = [op.output]
        elif op.output is None:
            op.output = []

        if not isinstance(op.owner, Backend):
            assert isinstance(op.owner, BaseModule)
            op.owner._ops.append(op)
        op.operation_type = "_initial_operations"
        self._initial_operations.append(op)

[docs]    def store(self, name='default'):
        '''
        Store backend_name and _variables into _stored_states dictionary.
        Args:
            name (str, optional): the name of network state.
        '''
        self._stored_states[name] = (self.backend_name, self._variables)

[docs]    def restore(self, name='default'):
        '''
        Restore network state from _stored_states dictionary.
        Args:
            name (str): the name of network state.
        '''
        if name not in self._stored_states:
            raise ValueError("No network state named: %s is stored" % name)
        else:
            stored_backend = self._stored_states[name][0]
            if stored_backend != self.backend_name:
                raise ValueError(
                    "The stored network is run by %s not %s" % (stored_backend, self.backend_name))
            else:
                self._variables = self._stored_states[name]

[docs]    def check_key(self, ckey, target_dict):
        cnetname = ckey[:ckey.find('<net>')]
        for key, value in target_dict.items():
            netname = key[:key.find('<net>')]
            break
        ckey = ckey.replace(cnetname, netname)
        if ckey in target_dict.keys():
            return ckey

        import warnings
        warnings.warn('Key error occurs, please check keys.')

        # result = [key for key in target_dict.keys() if key.endswith(variables[variables.find('<net>'):])]
        # if result:
        #     if len(result) > 1:
        #         import warnings
        #         warnings.warn('Given key matchs two variables in the backend dict, choose the first one as default')
        #     result = result[0]
        # return result

[docs]    @abstractmethod
    def to_nograd_func(self, func):
        '''
        Define the function as with no_grad
        Args:
            func:

        Returns:

        '''

[docs]    @abstractmethod
    def to_grad_func(self, func):
        '''
        Define the function as with enable_grad
        Args:
            func:

        Returns:

        '''

    # -------- basic backends operations -----
[docs]    @abstractmethod
    def threshold(self, v, v_th):
        '''
        Args:
            v: membrane voltage
            v_th: threshold
        Returns:
            v> v_th
        '''

[docs]    @abstractmethod
    def reset(self, v, o):
        '''

        Args:
            v: membrane voltage
            o: output spike

        Returns:
            if o>0, return 0
            else reutn v
        '''

[docs]    @abstractmethod
    def cat(self, x, dim=1):
        '''
        Joining data together along a dimension.
        Note that the total dimension of the data remains the same after cat.
        Args:
            x (list):
            dim (int): the dimension to cat.
        Returns:
            concat(x, dim)
        '''

[docs]    @abstractmethod
    def stack(self, x, dim=1):
        '''
        Add new dimension when stack data.
        Args:
            x (list):
            dim (int): the dimension to stack.
        Returns:
            stack(x, dim)
        '''

[docs]    @abstractmethod
    def permute(self, x, permute_dim):
        '''
        Parameters
        ----------
        x---> input
        permute_dim---> the dimension index of permute operation
        Returns
        -------
        '''

[docs]    @abstractmethod
    def view(self, x, view_dim):
        '''
        Parameters
        ----------
        x---> input
        view_dim---> the shape of view operation
        Returns
        -------
        '''

[docs]    def assign(self, x):
        '''
        Parameters
        ----------
        y---> target
        x---> input
        y = x
        Returns
        -------
        '''
        return x

[docs]    @abstractmethod
    def unsqueeze(self, x, dim):
        '''
        Parameters
        ----------
        x---> input
        dim---> the dim of unsqueeze operation
        Returns
        -------
        '''

[docs]    @abstractmethod
    def reduce_sum(self, x, *dim):
        '''
        Reduce the dimensions of the data
        Args:
            x (list):
            dim (tuple(int)): the dimension to reduce.
        Returns:
            sum(x, dim)
        '''

[docs]    @abstractmethod
    def index_select(self, x, indices, dim=1):
        '''
        Parameters
        ----------
        x
        indices
        Returns
        -------
        '''

[docs]    @abstractmethod
    def scatter(self, x, indices):
        '''
        Parameters
        ----------
        x
        indices
        Returns
        -------
        '''

[docs]    @abstractmethod
    def conv1d(self, x, kernel):
        '''
        Parameters
        ----------
        x
        kernel
        Returns
        -------
        '''

[docs]    @abstractmethod
    def conv_2d_complex(self, x, kernel, stride, padding, dilation, groups, beta, delay=None):
        '''

        Args:
            x:
            kernel:
            stride:
            padding:
            dilation:
            groups:
            beta:

        Returns:

        '''

[docs]    @abstractmethod
    def conv_trans2d(self, x, kernel, stride, padding, dilation, groups):
        '''
            transposed conv 2d
            Parameters
            ----------
            x
            kernel
            Returns
            -------
            '''

[docs]    @abstractmethod
    def conv_trans1d(self, x, kernel):
        '''
        transposed conv 1d
        Parameters
        ----------
        x
        kernel
        Returns
        -------
        '''

[docs]    @abstractmethod
    def im2col_indices(self, x, kh, kw, padding, stride):
        '''
        Parameters
        ----------
        x: 4D array  N, FH, FW, C_{in}
        kh: kernel_height
        kw: kernel_width
        stride:
        padding:
        Returns
        ----------
        '''

[docs]    @abstractmethod
    def conv2d_flatten(self, x):
        '''
        Parameters
        ----------
        x: 4D array (batch_size, out_channels, height, width)
        Returns
        3D array (batch_size, out_channels, height * width)
        ----------
        '''

[docs]    @abstractmethod
    def feature_map_flatten(self, x):
        '''
        For RSTDP and STDP learning rules which is  follwed with conv pre_layer
        Parameters
        ----------
        x: 4D array (batch_size, out_channels, height, width)
        Returns
        2D array (batch_size, out_channels * height * width)
        ----------
        '''

[docs]    @abstractmethod
    def add(self, x, y):
        '''
        Add the tensor y to the input x and returns a new result.
        Args:
            x (Tensor): input
            y (Tensor or Number): the second input
        Returns:
            x + y
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def minus(self, x, y):
        '''
        The first input minus the second input
        Args:
            x (Tensor): input
            y (Tensor or Number): the second input
        Returns:
            x - y
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def div(self, x, y):
        '''
        The first input div the second input
        Args:
            x (Tensor): input
            y (Tensor or Number): the second input

        Returns:
            x/y

        '''
        NotImplementedError()

[docs]    @abstractmethod
    def relu(self, x):
        '''
        Rectified Linear
        Args:
            x:

        Returns:
            x = x if x>0. else x = 0
        '''

[docs]    @abstractmethod
    def mat_mult_weight(self, A, X):
        '''
        Matrix product.
        Args:
            A (Tensor): the first input to be multiplied
            X (Tensor): the second input to be multiplied
        Returns:
            mat_mult_weight(A,X)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def mat_mult_weight_complex(self, A, X, beta, delay=None):
        NotImplementedError()

[docs]    @abstractmethod
    def mat_mult_weight_2complex(self, A, X, beta):
        NotImplementedError()

[docs]    @abstractmethod
    def mat_mult_pre(self, A, X):
        '''
        Matrix product.
        Args:
            A (Tensor): the first input to be multiplied
            X (Tensor): the second input to be multiplied
        Returns:
            mat_mult_pre(A,X)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def sigmoid(self, x):
        '''

        Args:
            x:

        Returns:

        '''

[docs]    @abstractmethod
    def upsample(self, x, scale):
        NotImplementedError()

[docs]    @abstractmethod
    def mat_mult(self, A, X):
        '''
        Matrix product.
        Args:
            A (Tensor): the first input to be multiplied
            X (Tensor): the second input to be multiplied
        Returns:
            mat_mult(A,X)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def reshape_mat_mult(self, A, X):
        '''
        Matrix product.
        Args:
            A (Tensor): the first input to be multiplied
            X (Tensor): the second input to be multiplied
        Returns:
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def bmm(self, A, X):
        '''
        Performs a batch matrix-matrix product.
        Args:
            A (Tensor): the first input to be multiplied  [batch_size, n, m]
            X (Tensor): the second input to be multiplied  [batch_size, m, p]
        Returns:
            bmm(A,X)   [batch_size, n, p]
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def sparse_mat_mult_weight(self, A, X):
        '''
        Sparse matrix product.
        Args:
            A (Tensor): the first input to be multiplied
            X (Tensor): the second input to be multiplied
        Returns:
            sparse_mat_mult_weight(A,X)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def var_mult(self, A, X):
        '''
        Args:
            A, X
        Returns:
            A * X
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def mult_sum_weight(self, A, X):
        '''
         sum(A*X, dim=-2)
        Args:
            A:
            X:

        Returns:

        '''
        NotImplementedError()

[docs]    @abstractmethod
    def mat_linear(self, A, X, b):
        '''
        Args:
            A
            X
            b
        Returns:
            mat_mul(A,X)+b
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def ger(self, A, X):
        '''
        Args:
            A
            X
        Returns:
            ger(A,X)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def var_linear(self, A, X, b):
        '''
        If A is matrix, then A and X should have the same shape, A*X is elemen-wise multiplication
        else  A should be a scalar value.
        Returns:
            A*X +b
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def to_numpy(self, data):
        '''
        Args：
            data
        Returns:
            data.numpy()
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def to_tensor(self, data):
        '''
        Args:
            data
        Returns:
            torch.tensor(data)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def clamp_(self, data, min, max):
        '''
            in-place clamp the data
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def clamp_max_(self, data, max):
        '''
            in-place clamp the max of the data
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def clamp_min_(self, data, min):
        '''
            in-place clamp the min of the data
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def uniform(self, data, a=0.0, b=1.0):
        '''
        Args:
            data(tensor): an n-dimensional torch.Tensor
            a(float): the lower bound of the uniform distribution
            b(float): the upper bound of the uniform distribution
        Returns:
            torch.nn.init.uniform_(data, a=0.0, b=1.0)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def normal(self, data, mean=0.0, std=1.0):
        '''
        Args:
            data(tensor): an n-dimensional torch.Tensor
            mean(float): the mean of the normal distribution
            std(float): the standard deviation of the normal distribution
        Returns:
            torch.nn.init.normal_(data, mean=0.0, std=1.0)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def xavier_normal(self, data, gain=1.0):
        '''
        Args:
            data(tensor): an n-dimensional torch.Tensor
            gain: an optional scaling factor
        Returns:
            torch.nn.init.xavier_normal_(data, gain=1.0)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def xavier_uniform(self, data, gain=1.0):
        '''
        Args:
            data(tensor): an n-dimensional torch.Tensor
            gain: an optional scaling factor
        Returns:
            torch.nn.init.xavier_uniform_(data, gain=1.0)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def kaiming_normal(self, data, a=0, mode='fan_in', nonlinearity='leaky_relu'):
        '''
        Args:
            data(tensor): an n-dimensional torch.Tensor
            a: the negative slope of the rectifier used after this layer (only used with 'leaky_relu')
            mode: either 'fan_in' (default) or 'fan_out'. Choosing 'fan_in' preserves the magnitude of the variance of the weights in the forward pass. Choosing 'fan_out' preserves the magnitudes in the backwards pass.
            nonlinearity: the non-linear function (nn.functional name), recommended to use only with 'relu' or 'leaky_relu' (default).
        Returns:
            torch.nn.init.kaiming_normal_(data, a=0, mode='fan_in', nonlinearity='leaky_relu')
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def kaiming_uniform(self, data, a=0, mode='fan_in', nonlinearity='leaky_relu'):
        '''
        Args:
            data(tensor): an n-dimensional torch.Tensor
            a: the negative slope of the rectifier used after this layer (only used with 'leaky_relu')
            mode: either 'fan_in' (default) or 'fan_out'. Choosing 'fan_in' preserves the magnitude of the variance of the weights in the forward pass. Choosing 'fan_out' preserves the magnitudes in the backwards pass.
            nonlinearity: the non-linear function (nn.functional name), recommended to use only with 'relu' or 'leaky_relu' (default).
        Returns:
            torch.nn.init.kaiming_uniform_(data, a=0, mode='fan_in', nonlinearity='leaky_relu')
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def constant(self, data, constant_value=0.0):
        '''
        Args:
            data(tensor): an n-dimensional torch.Tensor
            constant_value(float): the value to fill the tensor with
        Returns:
            torch.nn.init.constant_(data, constant_value)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def to(self, data, device):
        '''
        Args:
            data(tensor): an n-dimensional torch.Tensor
            constant_value(float): the value to fill the tensor with
        Returns:
            torch.nn.init.constant_(data, constant_value)
        '''
        NotImplementedError()

[docs]    @abstractmethod
    def weight_norm(self, weight, amp):
        '''

        w = g/||v|| * v
        Args:
            weight: v
            amp: g

        Returns: amp*weight/norm(weight)
        '''

    # @abstractmethod
    # def euler_update(self):
    #     pass
    #
    # @abstractmethod
    # def rk2_update(self):
    #     pass
    #
    # @abstractmethod
    # def reset(self, v, v_reset, u_reset, spike):
    #      '''
    #      voltage reset
    #
    #      Parameters
    #      ----------
    #      v
    #      v_reset
    #      u_reset
    #      spike
    #
    #      Returns
    #      -------
    #      v[spike] = v_reset
    #      v[spike] += u_reset
    #      '''
    #
    # @abstractmethod
    # def reset_u(self, u, u_reset, spike):
    #      '''
    #      recovery reset
    #
    #      Parameters
    #      ----------
    #      u
    #      _reset
    #      spike
    #
    #      Returns
    #      -------
    #      u[spike] = u+u_reset
    #      '''
    #      NotImplementedError()
    #
    # @abstractmethod
    # def next_stage(self, x):
    #     '''
    #
    #    Parameters
    #    ----------
    #    x: list
    #
    #    Returns
    #    -------
    #    x[index]
    #    '''
    #
    # @abstractmethod
    # def izh_v(self, v, u, psp):
    #     '''
    #
    #     Parameters
    #     ----------
    #     v: list
    #     u: list
    #     psp: list
    #
    #     Returns
    #     -------
    #     V=V+dt*(0.04*V^2+5*V+140-U+PSP)
    #     '''
    #     NotImplementedError()
    #
    # @abstractmethod
    # def izh_u(self, a, b, v, u):
    #     '''
    #
    #     Parameters
    #     ----------
    #     a: list
    #     b: list
    #     u: list
    #     v: list
    #
    #     Returns
    #     -------
    #     U=U+a*(b*V-U)
    #     '''
    #     NotImplementedError()

[docs]    def exp(self, x):
        '''
        Args:
            x(tensor): an n-dimensional torch.Tensor
        Returns:
           return exp(x)
        '''
        NotImplementedError()

[docs]    def sin(self, x):
        '''
        Args:
            x(tensor): an n-dimensional torch.Tensor
        Returns:
           return exp(x)
        '''
        NotImplementedError()

[docs]    def cos(self, x):
        '''
        Args:
            x(tensor): an n-dimensional torch.Tensor
        Returns:
           return exp(x)
        '''
        NotImplementedError()

[docs]    def tan(self, x):
        '''
        Args:
            x(tensor): an n-dimensional torch.Tensor
        Returns:
           return exp(x)
        '''
        NotImplementedError()

[docs]    def log(self, x):
        '''
        Args:
            x(tensor): an n-dimensional torch.Tensor
        Returns:
           return exp(x)
        '''
        NotImplementedError()

[docs]    def log2(self, x):
        '''
        Args:
            x(tensor): an n-dimensional torch.Tensor
        Returns:
           return exp(x)
        '''
        NotImplementedError()

[docs]    def log10(self, x):
        '''
        Args:
            x(tensor): an n-dimensional torch.Tensor
        Returns:
           return exp(x)
        '''
        NotImplementedError()

# class Darwin_Backend(Backend):
#
#     def __init__(self):
#         super(Darwin_Backend, self).__init__()
#         pass