pytorch-dnc/dnc/sdnc.py

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
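"""Sparse Differentiable Neural Computer (SDNC).

A DNC whose layers are backed by SparseTemporalMemory: reads touch only a
sparse subset of memory cells and temporal links are kept sparsely, in the
spirit of Rae et al., "Scaling Memory-Augmented Neural Networks with Sparse
Reads and Writes" (2016).
"""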
import torch.nn as nn
import torch as T
from torch.autograd import Variable as var
import numpy as np
from torch.nn.utils.rnn import pad_packed_sequence as pad
from torch.nn.utils.rnn import pack_padded_sequence as pack
from torch.nn.utils.rnn import PackedSequence
from torch.nn.init import orthogonal_, xavier_uniform_

from .util import *
from .sparse_temporal_memory import SparseTemporalMemory
from .dnc import DNC


class SDNC(DNC):
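  """DNC variant that swaps the dense memory for SparseTemporalMemory.

  Construction mirrors the DNC base class; the extra `sparse_reads` and
  `temporal_reads` arguments are forwarded to each layer's memory. The
  attributes used below (`self.output_size`, `self.nr_cells`, and `self.w`,
  the cell size) are set by DNC.__init__.
  """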
  def __init__(
      self,
      input_size,
      hidden_size,
      rnn_type='lstm',
      num_layers=1,
      num_hidden_layers=2,
      bias=True,
      batch_first=True,
      dropout=0,
      bidirectional=False,
      nr_cells=5000,
      sparse_reads=4,
      temporal_reads=4,
      read_heads=4,
      cell_size=10,
      nonlinearity='tanh',
      gpu_id=-1,
      independent_linears=False,
      share_memory=True,
      debug=False,
      clip=20
  ):
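    # sparse_reads / temporal_reads are the two knobs SDNC adds on top of the
    # DNC signature: roughly, how many approximate-nearest-neighbour cells
    # each read retrieves, and how many extra cells are followed through the
    # sparse temporal links (an inference from SparseTemporalMemory's
    # parameters; everything else is forwarded to DNC unchanged).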
    super(SDNC, self).__init__(
        input_size=input_size,
        hidden_size=hidden_size,
        rnn_type=rnn_type,
        num_layers=num_layers,
        num_hidden_layers=num_hidden_layers,
        bias=bias,
        batch_first=batch_first,
        dropout=dropout,
        bidirectional=bidirectional,
        nr_cells=nr_cells,
        read_heads=read_heads,
        cell_size=cell_size,
        nonlinearity=nonlinearity,
        gpu_id=gpu_id,
        independent_linears=independent_linears,
        share_memory=share_memory,
        debug=debug,
        clip=clip
    )

    self.sparse_reads = sparse_reads
    self.temporal_reads = temporal_reads

    self.memories = []

    for layer in range(self.num_layers):
      # memories for each layer
      if not self.share_memory:
        self.memories.append(
            SparseTemporalMemory(
                input_size=self.output_size,
                mem_size=self.nr_cells,
                cell_size=self.w,
                sparse_reads=self.sparse_reads,
                read_heads=self.read_heads,
                temporal_reads=self.temporal_reads,
                gpu_id=self.gpu_id,
                mem_gpu_id=self.gpu_id,
                independent_linears=self.independent_linears
            )
        )
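        # setattr registers each memory as a child module, so nn.Module
        # tracks its parameters (the plain list in self.memories does not)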
        setattr(self, 'rnn_layer_memory_' + str(layer), self.memories[layer])

    # only one memory shared by all layers
    if self.share_memory:
      self.memories.append(
          SparseTemporalMemory(
              input_size=self.output_size,
              mem_size=self.nr_cells,
              cell_size=self.w,
              sparse_reads=self.sparse_reads,
              read_heads=self.read_heads,
              temporal_reads=self.temporal_reads,
              gpu_id=self.gpu_id,
              mem_gpu_id=self.gpu_id,
              independent_linears=self.independent_linears
          )
      )
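      # register the single shared memory once, under a fixed attribute name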
      setattr(self, 'rnn_layer_memory_shared', self.memories[0])

  def _debug(self, mhx, debug_obj):
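    """Append numpy snapshots of the sparse memory state to `debug_obj`.

    Records the first batch element of each field in the memory hidden
    state `mhx`, creating the dict of empty lists on the first call.
    """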
    if not debug_obj:
      debug_obj = {
          'memory': [],
          'visible_memory': [],
          'link_matrix': [],
          'rev_link_matrix': [],
          'precedence': [],
          'read_weights': [],
          'write_weights': [],
          'read_vectors': [],
          'least_used_mem': [],
          'usage': [],
          'read_positions': []
      }

    debug_obj['memory'].append(mhx['memory'][0].data.cpu().numpy())
    debug_obj['visible_memory'].append(mhx['visible_memory'][0].data.cpu().numpy())
    debug_obj['link_matrix'].append(mhx['link_matrix'][0].data.cpu().numpy())
    debug_obj['rev_link_matrix'].append(mhx['rev_link_matrix'][0].data.cpu().numpy())
    debug_obj['precedence'].append(mhx['precedence'][0].unsqueeze(0).data.cpu().numpy())
    debug_obj['read_weights'].append(mhx['read_weights'][0].unsqueeze(0).data.cpu().numpy())
    debug_obj['write_weights'].append(mhx['write_weights'][0].unsqueeze(0).data.cpu().numpy())
    debug_obj['read_vectors'].append(mhx['read_vectors'][0].data.cpu().numpy())
    debug_obj['least_used_mem'].append(mhx['least_used_mem'][0].unsqueeze(0).data.cpu().numpy())
    debug_obj['usage'].append(mhx['usage'][0].unsqueeze(0).data.cpu().numpy())
    debug_obj['read_positions'].append(mhx['read_positions'][0].unsqueeze(0).data.cpu().numpy())

    return debug_obj
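

# Minimal usage sketch, assuming the package-level export `from dnc import
# SDNC` and the forward signature this repo's README shows, i.e.
# `output, (chx, mhx, rv) = rnn(x, (chx, mhx, rv), reset_experience=True)`,
# where x is (batch, seq_len, input_size) when batch_first=True:
#
#   from dnc import SDNC
#   import torch
#
#   rnn = SDNC(input_size=64, hidden_size=128, rnn_type='lstm',
#              nr_cells=100, cell_size=16, read_heads=4,
#              sparse_reads=4, temporal_reads=2, gpu_id=-1)
#   x = torch.randn(8, 20, 64)
#   chx, mhx, rv = None, None, None
#   output, (chx, mhx, rv) = rnn(x, (chx, mhx, rv), reset_experience=True)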