In [2]:
import os, sys, inspect
currentdir = os.path.dirname(os.path.abspath(inspect.getfile(inspect.currentframe())))
parentdir = os.path.dirname(currentdir)
sys.path.insert(0, parentdir)
from importlib import reload

import numpy as np
import tensorflow as tf
import torch
from torch.nn import CrossEntropyLoss, NLLLoss
import fasttext
from ptb import lang_util
In [3]:
import rsm_samplers
import rsm
from ptb import lang_util
import rsm_experiment
reload(rsm_samplers)
reload(rsm)
reload(lang_util)
reload(rsm_experiment)
CONFIG = {
    'debug': False,
    'path': "/Users/jgordon/nta/results",
    'data_dir': "/Users/jgordon/nta/datasets",
    'dataset': 'ptb',
    'predictor_hidden_size': 1200,
    'predictor_output_size': 10000,
    'batch_size': 300,
    'batches_in_epoch': 2000,
    'batches_in_first_epoch': 2,
    'batch_log_interval': 2000,
    'vocab_size': 10000,
    'eval_interval': 5,
    'eval_batch_size': 100,
    'eval_batches_in_epoch': 824,  # 8243,
    'learning_rate': 0.0005,
    'm_groups': 1500,
    'n_cells_per_group': 1,
    'k_winners': 80,
    'k_winner_cells': 1,
    'pred_l2_reg': 0.000001,
    'dec_l2_reg': 0.000001,
    'input_bias': True,
    'eps': 0.5,
    'gamma': 0.0,
    'forget_mu': 0.025,
    'weight_sparsity': None,
    'mult_integration': False,
    'fpartition': None,
    'boost_strength': 0.5,
    'boost_strength_factor': 0.85,
    'boost_strat': 'col_boosting',
    'do_inhibition': False,
    'x_b_norm': True,
    'balance_part_winners': True,
    'decode_activation_fn': None,
    'decode_bias': False,
    'embed_dim': 100,
    'input_size': (1, 100),
    'output_size': 100,
    'embedding_kind': 'ptb_fasttext_e5',
    'max_decay': 0.95,
    'mem_floor': 0.0005,
    'trainable_decay': True,
    'word_cache_decay': 0.99
}
In [4]:
import math

def max_entropy(n, k):
    """The maximum entropy we could get with n units and k winners."""
    s = float(k) / n
    if 0.0 < s < 1.0:
        entropy = -s * math.log(s, 2) - (1 - s) * math.log(1 - s, 2)
    else:
        entropy = 0
    return n * entropy
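
# Sanity check (added; not part of the original run): with the CONFIG above,
# n = m_groups * n_cells_per_group = 1500 units and k = k_winners = 80, the
# ceiling is ~450.6 bits, matching the MAX_ENT constant used in the charts below.
assert abs(max_entropy(CONFIG['m_groups'] * CONFIG['n_cells_per_group'],
                       CONFIG['k_winners']) - 450.6) < 0.1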
def binary_entropy(x):
    """Calculate entropy for a list of binary random variables.

    :param x: (torch tensor) the probability of the variable to be 1.
    :return: entropy: (torch tensor) entropy, sum(entropy)
    """
    entropy = -x * x.log2() - (1 - x) * (1 - x).log2()
    entropy[x * (1 - x) == 0] = 0  # define 0*log(0) = 0 to avoid NaNs
    return entropy, entropy.sum()
def update_duty_cycle(duty_cycle, learning_iterations, x):
    """Update the moving average of each unit's activation frequency in place.

    Returns the new iteration count; the caller must reassign it, since ints
    are immutable in Python.
    """
    batch_size = x.shape[0]
    learning_iterations += batch_size
    period = min(1000, learning_iterations)
    duty_cycle.mul_(period - batch_size)
    duty_cycle.add_(x.gt(0).sum(dim=0, dtype=torch.float))
    duty_cycle.div_(period)
    return learning_iterations
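
# Illustration (added; uses hypothetical uniformly random winners, not the
# model's actual k-winner dynamics): if winners were chosen uniformly at
# random, each unit's duty cycle would settle near k/n, so the summed binary
# entropy should come out close to the max_entropy ceiling.
_n, _k, _bsz = 1500, 80, 300
_duty = torch.zeros(_n)
_iters = 0
for _ in range(50):
    _winners = torch.zeros(_bsz, _n)
    _winners.scatter_(1, torch.rand(_bsz, _n).topk(_k, dim=1).indices, 1.0)
    _iters = update_duty_cycle(_duty, _iters, _winners)
print(binary_entropy(_duty)[1].item(), max_entropy(_n, _k))  # both near 450.6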
def forward_and_get_entropy(exp, loader, bsz):
    exp.model.train()
    tc = exp.m_groups * exp.n_cells_per_group
    k = exp.k_winners
    duty_cycle = torch.zeros(tc)
    learning_iterations = 0
    with torch.no_grad():
        hidden = exp._init_hidden(bsz)
        for _b_idx, (inputs, targets, pred_targets, input_labels) in enumerate(loader):
            inputs = inputs.to(exp.device)
            targets = targets.to(exp.device)
            pred_targets = pred_targets.to(exp.device)
            input_labels = input_labels.to(exp.device)
            output, hidden = exp.model(inputs, hidden)
            # Track how often each column wins; the updated iteration count
            # must be reassigned since ints are immutable.
            learning_iterations = update_duty_cycle(
                duty_cycle, learning_iterations,
                exp.model.RSM_1.col_winners.squeeze())
    _, ent = binary_entropy(duty_cycle)
    max_ent = max_entropy(tc, k)
    # e = exp.model.RSM_1.kwinners_col.entropy()
    # max_e = exp.model.RSM_1.kwinners_col.max_entropy()
    print("Adj RSM: entropy / max entropy: %.3f/%.3f" % (ent, max_ent))
    return ent
In [5]:
# Load bRSM
exp = rsm_experiment.RSMExperiment(config=CONFIG)
exp.model_setup(CONFIG, restore_path="/Users/jgordon/Desktop/rsm_highlights/PTB/RSMTune_0_2019-09-20_21-15-18mchjovgl/checkpoint_112")
print("Train...")
e_boost_train = forward_and_get_entropy(exp, exp.train_loader, 300)
print("Test...")
e_boost_test = forward_and_get_entropy(exp, exp.val_loader, 100)
In [ ]:
# Load inhibited RSM
exp = rsm_experiment.RSMExperiment(config=CONFIG)
exp.model_setup(CONFIG, restore_path="/Users/jgordon/Desktop/rsm_highlights/PTB/Ablation/Flat_PTB_Abl_Inh/RSMTune_0_2019-09-22_22-35-225sg3eimn/checkpoint_102")
print("Train...")
e_inh_train = forward_and_get_entropy(exp, exp.train_loader, 300)
print("Test...")
e_inh_test = forward_and_get_entropy(exp, exp.val_loader, 100)
In [7]:
import matplotlib.pyplot as plt
MAX_ENT = 450.6
labels = ['Inhibition', 'Boosting']
train_entropies = [e_inh_train.item(), e_boost_train.item()]
test_entropies = [e_inh_test.item(), e_boost_test.item()]
x = np.arange(len(labels))  # the label locations
width = 0.35  # the width of the bars
fig, ax = plt.subplots()
rects1 = ax.bar(x - width/2, train_entropies, width, label='Train')
rects2 = ax.bar(x + width/2, test_entropies, width, label='Test')
# Add some text for labels, title and custom x-axis tick labels, etc.
ax.set_ylabel('Entropy (bits)')
ax.set_title('Layer entropy comparison: inhibition vs boosting')
ax.set_xticks(x)
ax.set_xticklabels(labels)
ax.plot([0, 2], [MAX_ENT, MAX_ENT], c='gray', label="Max entropy")
ax.legend()
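# Optional (added; requires matplotlib >= 3.4): annotate each bar with its
# exact entropy value.
ax.bar_label(rects1, fmt='%.1f')
ax.bar_label(rects2, fmt='%.1f')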
In [14]:
import matplotlib.pyplot as plt

def get_event_filename(log_dir):
    # Return the first TensorBoard events file found in log_dir.
    for path in os.listdir(log_dir):
        if 'events' in path:
            return os.path.join(log_dir, path)
    print("No events file found for %s" % log_dir)
def get_entropy_curves(filename):
    # Pull the train/test entropy scalars out of a TensorBoard events file.
    # Assumes train_entropy and test_entropy are logged together at each step,
    # so the three lists stay aligned.
    xaxis = []
    train_ents = []
    test_ents = []
    for event in tf.compat.v1.train.summary_iterator(filename):
        for value in event.summary.value:
            if 'entropy' in value.tag:
                if not xaxis or xaxis[-1] != event.step:
                    xaxis.append(event.step)
                if 'train_entropy' in value.tag:
                    train_ents.append(value.simple_value)
                elif 'test_entropy' in value.tag:
                    test_ents.append(value.simple_value)
    return xaxis, train_ents, test_ents
fig, axs = plt.subplots(1, 2, dpi=144, figsize=(10, 6))
axs[0].set_title("Train")
axs[1].set_title("Test")
axs[0].set_xlabel("Mini-batches (1000s)")
axs[1].set_xlabel("Mini-batches (1000s)")
axs[0].set_ylabel("Binary Entropy (bits)")
axs[1].set_ylabel("Binary Entropy (bits)")
labels = [
    "No boosting or inhibition",
    "Inhibition",
    "Boosting",
]
fn = get_event_filename("/Users/jgordon/Desktop/rsm_highlights/PTB/Entropy/RSMTune_0_boost_strength_0_2019-10-10_20-58-14_5pr4jhk")
xaxis, train_ents, test_ents = get_entropy_curves(fn)
l_none = axs[0].plot(xaxis, train_ents, label="No boosting or inhibition", c='red')
axs[1].plot(xaxis, test_ents, label="No boosting or inhibition", c='red')
fn = get_event_filename("/Users/jgordon/Desktop/rsm_highlights/PTB/Entropy/RSMTune_1_boost_strat_rsm_inhibition_2019-10-01_03-23-26anv1eoa5")
xaxis, train_ents, test_ents = get_entropy_curves(fn)
l_in = axs[0].plot(xaxis, train_ents, label="Inhibition", c='green', dashes=[1,1])
axs[1].plot(xaxis, test_ents, label="Inhibition", c='green', dashes=[1, 1])
fn = get_event_filename("/Users/jgordon/Desktop/rsm_highlights/PTB/Entropy/RSMTune_0_2019-10-01_03-24-58ogm7b9bn")
xaxis, train_ents, test_ents = get_entropy_curves(fn)
l_ns = axs[0].plot(xaxis, train_ents, label="Boosting", c='blue', dashes=[4, 1])
axs[1].plot(xaxis, test_ents, label="Boosting", c='blue', dashes=[4, 1])
plt.figlegend(l_none + l_in + l_ns, labels, loc='lower center', ncol=3, labelspacing=0.3)
plt.suptitle("Layer Entropy: Boosting vs Inhibition")
for ax in axs:
    ax.spines['right'].set_visible(False)
    ax.spines['top'].set_visible(False)
    ax.set_ylim((250, 460))
    ax.plot([0, 62], [MAX_ENT, MAX_ENT], c='#DDDDDD', label="Max entropy", dashes=[4, 2])
plt.savefig('Charts/entropy.png')
plt.show()