From 72d08bc8411509e80ab4aa40294e41311a605ab7 Mon Sep 17 00:00:00 2001
From: JonathanAMichaels <Jonathan.asher.michaels@gmail.com>
Date: Wed, 10 Jan 2018 16:43:29 -0800
Subject: [PATCH] final clean up

---
 examples/geneticRNN_Example_CO.m   |   6 +-
 examples/geneticRNN_Example_DNMS.m |  11 +-
 geneticRNN_learn_model.m           | 247 +++++++++-----------
 geneticRNN_learn_model_2.m         | 343 ----------------------------
 geneticRNN_learn_model_2.m~        | 349 -----------------------------
 geneticRNN_rollout_model.m         |   2 +-
 6 files changed, 111 insertions(+), 847 deletions(-)
 delete mode 100644 geneticRNN_learn_model_2.m
 delete mode 100644 geneticRNN_learn_model_2.m~

diff --git a/examples/geneticRNN_Example_CO.m b/examples/geneticRNN_Example_CO.m
index d9b13bb..32e6421 100644
--- a/examples/geneticRNN_Example_CO.m
+++ b/examples/geneticRNN_Example_CO.m
@@ -58,10 +58,10 @@
 evalOpts = [2 1]; % Plotting level and frequency of evaluation
 
 %% Train network
-% This step should take about 5 minutes, depending on your processor.
-% Should stopped at the desired time by pressing the STOP button and waiting for 1 iteration
+% This step should take less than 5 minutes on a 16 core machine.
+% Should be stopped at the desired time by pressing the STOP button and waiting for 1 iteration.
 % Look inside to see information about the many optional parameters.
-[net, learnStats] = geneticRNN_learn_model_2(inp, mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, ...
+[net, learnStats] = geneticRNN_learn_model(inp, mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, ...
     'evalOpts', evalOpts, ...
     'policyInitInputsOptional', policyInitInputsOptional, ...
     'targetFun', targetFun, 'targetFunPassthrough', targetFunPassthrough);
diff --git a/examples/geneticRNN_Example_DNMS.m b/examples/geneticRNN_Example_DNMS.m
index ec6a1fb..a11545f 100644
--- a/examples/geneticRNN_Example_DNMS.m
+++ b/examples/geneticRNN_Example_DNMS.m
@@ -53,7 +53,7 @@
 B = size(targ{1},1); % Outputs
 I = size(inp{1},1); % Inputs
 p = 1; % Sparsity
-g = 1.2; % Spectral scaling
+g = 1.1; % Spectral scaling
 dt = 10; % Time step
 tau = 50; % Time constant
 
@@ -70,14 +70,13 @@
 evalOpts = [2 1]; % Plotting level and frequency of evaluation
 
 %% Train network
-% This step should take about 5 minutes, depending on your processor.
-% Should stopped at the desired time by pressing the STOP button and waiting for 1 iteration
+% This step should take less than 5 minutes on a 16 core machine.
+% Should be stopped at the desired time by pressing the STOP button and waiting for 1 iteration.
 % Look inside to see information about the many optional parameters.
-[net, learnStats] = geneticRNN_learn_model_2(mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, ...
+[net, learnStats] = geneticRNN_learn_model(inp, mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, ...
     'input', inp, ...
     'evalOpts', evalOpts, ...
     'policyInitInputsOptional', policyInitInputsOptional);
 
 %% Run network
-[Z0, Z1, R, X, kin] = geneticRNN_run_model(net, 'input', inp);
-
+[Z0, Z1, R, X, kin] = geneticRNN_run_model(net, inp);
\ No newline at end of file
diff --git a/geneticRNN_learn_model.m b/geneticRNN_learn_model.m
index 2a93637..b5029b5 100644
--- a/geneticRNN_learn_model.m
+++ b/geneticRNN_learn_model.m
@@ -1,107 +1,75 @@
-function [winner, varargout] = geneticRNN_learn_model(mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, varargin)
+function [winner, varargout] = geneticRNN_learn_model(inp, mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, varargin)
 
-% net = hebbRNN_learn_model(x0, net, F, perturbProb, eta, varargin)
-%
-% This function trains a recurrent neural network using reward-modulated
-% Hebbian learning to produce desired outputs. During each trial the
-% activations of random neurons are randomly perturbed. All fluctuations in
-% the activation of each neuron are accumulated (supra-linearly) as an
-% elegibility trace. At the end of each trial the error of the output is
-% compared against the expected error and the difference is used to
-% reinforce connectivity changes (net.J) that produce the desired output.
-%
-% The details of training the network are based on those
-% presented in the following work:
-% "Flexible decision-making in recurrent neural networks trained with a
-% biologically plausible rule. Thomas Miconi (2016)"
-% Published on BioRxiv. The current version can be found under the following URL:
-% http://biorxiv.org/content/early/2016/07/26/057729
+% net = geneticRNN_learn_model(inp, mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, varargin)
 %
+% This function trains a recurrent neural network using a simple genetic algorithm
+% to complete the desired goal.
 %
 % INPUTS:
 %
-% x0 -- the initial activation (t == 0) of all neurons
-% Must be of size: net.N x 1
+% inp -- Inputs to the network. Must be present, but can be empty.
+%
+% mutationPower -- Standard deviation of normally distributed noise to add in each generation
 %
-% net -- the network structure created by hebbRNN_create_model
+% populationSize -- Number of individuals in each generation
 %
-% F -- the desired output
-% Must be a cell of size: 1 x conditions
-% Each cell must be of size: net.B x time points
+% truncationSize -- Number of individuals to save for next generation
 %
-% perturbProb -- the probability of perturbing the activation of each neuron
-% per second
+% fitnessFunInputs -- Target information for calculating the fitness
 %
-% eta -- the learning rate
+% policyInitInputs -- Inputs for the policy initialization function
 %
 %
 % OPTIONAL INPUTS:
+% 
+% mutationPowerDecay -- Natural decay rate of mutation power
 %
-% input -- the input to the network
-% Must be a cell of size: 1 x conditions
-% Each cell must be of size: net.I x time points
-% Default: []
+% mutationPowerDrop -- Decay rate of mutation power when we don't learn anything on a given generation
 %
-% targettimes -- the time points used to generate the error signal
-% Default: entire trial
+% weightCompression -- Whether or not to compress policy (logical)
 %
-% beta -- the variance of the neural perturbation
-% Default: 0.5. Don't change this unless you know what you're doing
+% weightDecay -- Whether or not to decay policy (logical)
 %
-% maxdJ -- the absolute connectivity values above this level will be
-% clipped
-% Default: 1e-4. Don't change this unless you know what you're doing
+% fitnessFun -- function handle for assessing fitness
+% Default: @defaultFitnessFunction
 %
-% alphaX -- the weight given to previous time points of the activation
-% trace
-% Default: 0. Don't change this unless you know what you're doing
+% policyInitFun -- function handle for initializing the policy
+% Default: @geneticRNN_create_model
 %
-% alphaR -- the weight given to previous time points of the error
-% prediction trace
-% Default: 0.33. Don't change this unless you know what you're doing
+% policyInitInputsOptional -- Optional inputs for the policy initialization function
 %
-% targetFun -- the handle of a function that uses the firing rates of the
+% targetFun -- The handle of a function that uses the firing rates of the
 % output units to produce some desired output. Function must follow
 % conventions of supplied default function.
 % Default: @defaultTargetFunction
 %
-% targetFunPassthrough -- a user-defined structure that is automatically
+% targetFunPassthrough -- A user-defined structure that is automatically
 % passed through to the targetFun, permitting custom variables to be passed
 % Default: []
 %
-% tolerance -- at what error level below which the training will terminate
-% Default: 0 (will train forever).
-%
-% batchType -- conditions are train either in random order each pass
-% (pseudorand), or always in order (linear)
-% Default: 'pseudorand'
-%
-% plotFun -- the handle of a function that plots information about the
+% plotFun -- The handle of a function that plots information about the
 % network during the learning process. Function must follow conventions
 % of supplied default function.
 % Default: @defaultPlottingFunction
 %
-% evalOpts -- a vector of size 2, specifying how much information should be
+% evalOpts -- A vector of size 2, specifying how much information should be
 % displayed during training (0 - nothing, 1 - text only, 2 - text +
 % figures), and how often the network should be evaluated. This vector is
 % passed to the plotting function.
-% Default: [0 50]
+% Default: [1 1]
 %
 %
 % OUTPUTS:
 %
-% net -- the network structure
+% winner -- the network structure
 %
 % errStats -- the structure containing error information from learning
 % (optional)
 %
 %
-% Copyright (c) Jonathan A Michaels 2016
+% Copyright (c) Jonathan A Michaels 2018
 % German Primate Center
 % jonathanamichaels AT gmail DOT com
-%
-% If used in published work please see repository README.md for citation
-% and license information: https://github.com/JonathanAMichaels/hebbRNN
 
 
 % Start counting
@@ -113,9 +81,10 @@
 % Variable input considerations
 optargin = size(varargin,2);
 
-inp = []; % Default inputs
 mutationPowerDecay = 0.99;
 mutationPowerDrop = 0.7;
+weightCompression = true; % By default we will compress
+weightDecay = false; % By default we won't use decay
 targetFun = @defaultTargetFunction; % Default output function (native)
 plotFun = @defaultPlottingFunction; % Default plotting function (native)
 fitnessFun = @defaultFitnessFunction; % Default fitness function (native)
@@ -125,16 +94,17 @@
 evalOpts = [1 1]; % Default evaluation values [plottingOptions evaluateEveryXIterations]
 
 for iVar = 1:2:optargin
-    switch varargin{iVar}
-        
-        case 'input'
-            inp = varargin{iVar+1};
-            
+    switch varargin{iVar}            
         case 'mutationPowerDecay'
             mutationPowerDecay = varargin{iVar+1};
         case 'mutationPowerDrop'
             mutationPowerDrop = varargin{iVar+1};
             
+        case 'weightCompression'
+            weightCompression = varargin{iVar+1};
+        case 'weightDecay'
+            weightDecay = varargin{iVar+1};
+            
         case 'fitnessFun'
             fitnessFun = varargin{iVar+1};
         case 'policyInitFun'
@@ -155,120 +125,107 @@
     end
 end
 
-%% Checks
-% The input can be either empty, or specified at each time point by the user.
-
 errStats.fitness = []; errStats.generation = []; % Initialize error statistics
-g = 1;
-previousGen = [];
-decay = 1;
+g = 1; % Initialize generation
+allDecay1 = []; allDecay2 = []; allMutationPower = []; % Initialize decay history
 
 %% Main Program %%
 % Runs until tolerated error is met or stop button is pressed
 figure(97)
-set(gcf, 'Position', [0 0 100 50], 'MenuBar', 'none', 'ToolBar', 'none', 'Name', 'Stop', 'NumberTitle', 'off')
+set(gcf, 'Position', [0 50 100 50], 'MenuBar', 'none', 'ToolBar', 'none', 'Name', 'Stop', 'NumberTitle', 'off')
 UIButton = uicontrol('Style', 'togglebutton', 'String', 'STOP', 'Position', [0 0 100 50], 'FontSize', 25);
 while UIButton.Value == 0
-    tic
-    fitness = zeros(length(inp),populationSize);
-    bigR = cell(1,populationSize);
-    bigZ1 = cell(1,populationSize);
-    net = repmat(struct('I',0,'B',0,'N',0,'p',0,'g',0,'J',0,'netNoiseSigma',0,'dt',0,'tau',0,'wIn',0,'wFb',0,'wOut',0,'bJ',0,'bOut',0,'x0',0,'actFun',0,'actFunDeriv',0,'energyCost',0), ...
-    1, populationSize);
-
+    %% Initialize parameters
+    if weightCompression
+        decay1 = 1 - mutationPower;
+    else
+        decay1 = 1;
+    end
     decay2 = mutationPower * 1e-1;
+    allDecay1 = cat(2, allDecay1, decay1);
+    allDecay2 = cat(2, allDecay2, decay2);
+    allMutationPower = cat(2, allMutationPower, mutationPower);
+    fitness = zeros(length(inp),populationSize);
+    
+    %% Generate random seeds
+    theseSeeds = randsample(1e8, populationSize);
+    if g > 1
+        previousSeeds = masterSeeds(randsample(size(masterSeeds,1), populationSize, true), :);
+        previousSeeds(1,:) = masterSeeds(1,:); % Save the elite!
+        theseSeeds(1) = nan; % Save the elite!
+        sendSeeds = [previousSeeds, theseSeeds];
+    else
+        sendSeeds = theseSeeds;
+    end
+    
+    %% Heavy lifting
     parfor i = 1:populationSize
-        if g == 1
-            % Generate new networks
-            net(i) = policyInitFun(policyInitInputs, policyInitInputsOptional);
-        else
-            if i == 1
-                net(i) = previousGen(1);
-            else
-                k = randsample(truncationSize, 1);
-                net(i) = previousGen(k);
-                
-                net(i).wIn = (net(i).wIn + (randn(size(net(i).wIn)) * mutationPower .* (net(i).wIn ~= 0))) .* (decay * ones(size(net(i).wIn)));
-                net(i).wFb = (net(i).wFb + (randn(size(net(i).wFb)) * mutationPower .* (net(i).wFb ~= 0))) .* (decay * ones(size(net(i).wFb)));
-                net(i).wOut = (net(i).wOut + (randn(size(net(i).wOut)) * mutationPower .* (net(i).wOut ~= 0))) .* (decay * ones(size(net(i).wOut)));
-                net(i).J = (net(i).J + (randn(size(net(i).J)) * mutationPower .* (net(i).J ~= 0))) .* (decay * ones(size(net(i).J)));
-                net(i).bJ = (net(i).bJ + (randn(size(net(i).bJ)) * mutationPower .* (net(i).bJ ~= 0))) .* (decay * ones(size(net(i).bJ)));
-                net(i).bOut = (net(i).bOut + (randn(size(net(i).bOut)) * mutationPower .* (net(i).bOut ~= 0))) .* (decay * ones(size(net(i).bOut)));
-                net(i).x0 = (net(i).x0 + (randn(size(net(i).x0)) * mutationPower .* (net(i).x0 ~= 0))) .* (decay * ones(size(net(i).x0)));
-%                 
-                net(i).wIn = net(i).wIn - decay2*(net(i).wIn-decay2 > 0) + decay2*(net(i).wIn+decay2 < 0);
-                net(i).wFb = net(i).wFb - decay2*(net(i).wFb-decay2 > 0) + decay2*(net(i).wFb+decay2 < 0);
-                net(i).wOut = net(i).wOut - decay2*(net(i).wOut-decay2 > 0) + decay2*(net(i).wOut+decay2 < 0);
-                net(i).J = net(i).J - decay2*(net(i).J-decay2 > 0) + decay2*(net(i).J+decay2 < 0);
-                net(i).bJ = net(i).bJ - decay2*(net(i).bJ-decay2 > 0) + decay2*(net(i).bJ+decay2 < 0);
-                net(i).bOut = net(i).bOut - decay2*(net(i).bOut-decay2 > 0) + decay2*(net(i).bOut+decay2 < 0);
-                net(i).x0 = net(i).x0 - decay2*(net(i).x0-decay2 > 0) + decay2*(net(i).x0+decay2 < 0);
-                
-%                 net(i).wIn(abs(net(i).wIn) <= decay2) = 0;
-%                 net(i).wFb(abs(net(i).wFb) <= decay2) = 0;
-%                 net(i).wOut(abs(net(i).wOut) <= decay2) = 0;
-%                 net(i).J(abs(net(i).J) <= decay2) = 0;
-%                 net(i).bJ(abs(net(i).bJ) <= decay2) = 0;
-%                 net(i).bOut(abs(net(i).bOut) <= decay2) = 0;
-%                 net(i).x0(abs(net(i).x0) <= decay2) = 0;
-            end
-        end
-        
+        % Hack the random number generator
+        stream = RandStream('mrg32k3a');
+        RandStream.setGlobalStream(stream);
+        stream.Substream = i;
+        % Rollout the model based on the random seeds
+        net = geneticRNN_rollout_model(policyInitFun, policyInitInputs, policyInitInputsOptional, allMutationPower, allDecay1, allDecay2, weightDecay, sendSeeds(i,:));
         % Run model
-        [Z0, Z1, R, dR, ~] = geneticRNN_run_model(net(i), 'input', inp, 'targetFun', targetFun, 'targetFunPassthrough', targetFunPassthrough);
+        [~, Z1, ~, ~] = geneticRNN_run_model(net, inp, 'targetFun', targetFun, 'targetFunPassthrough', targetFunPassthrough);
         % Assess fitness
-        fitness(:,i) = fitnessFun(net(i).J, Z0, Z1, dR, fitnessFunInputs);
-        
-        bigZ1{i} = Z1;
-        bigR{i} = R;
+        fitness(:,i) = fitnessFun(Z1, fitnessFunInputs);
     end
+    
+    %% Sort and save best policies
     [~, sortInd] = sort(mean(fitness,1), 'descend');
-    net = net(sortInd);
     fitness = fitness(:,sortInd(1:truncationSize));
-    bigZ1 = bigZ1{sortInd(1)};
-    bigR = bigR{sortInd(1)};
+    masterSeeds = sendSeeds(sortInd(1:truncationSize),:);
     
-    if sortInd(1) == 1
-        mutationPower = mutationPower * mutationPowerDrop;
-    end
+    %% Recalculate best network for plotting or output
+    % Hack the random number generator
+    stream = RandStream('mrg32k3a');
+    RandStream.setGlobalStream(stream);
+    stream.Substream = sortInd(1);
+    % Rollout the model based on the random seeds
+    net = geneticRNN_rollout_model(policyInitFun, policyInitInputs, policyInitInputsOptional, allMutationPower, allDecay1, allDecay2, weightDecay, masterSeeds(1,:));
+    % Run model
+    [~, Z1, R, ~] = geneticRNN_run_model(net, inp, 'targetFun', targetFun, 'targetFunPassthrough', targetFunPassthrough);
     
     %% Save stats
     errStats.fitness(:,end+1) = fitness(:,1);
     errStats.generation(end+1) = g;
     
-    
     %% Populate statistics for plotting function
     plotStats.fitness = fitness;
     plotStats.mutationPower = mutationPower;
     plotStats.generation = g;
-    plotStats.bigZ1 = bigZ1;
-    plotStats.bigR = bigR;
+    plotStats.bigZ1 = Z1;
+    plotStats.bigR = R;
     plotStats.targ = fitnessFunInputs;
     
     %% Run supplied plotting function
     if mod(g,evalOpts(2)) == 0
         plotFun(plotStats, errStats, evalOpts)
     end
-
-    previousGen = net(1:truncationSize);
-    mutationPower = mutationPower * mutationPowerDecay;
+    
+    %% Decay mutation power
+    if sortInd(1) == 1
+        mutationPower = mutationPower * mutationPowerDrop; % Big drop if we didn't learn anything
+    else
+        mutationPower = mutationPower * mutationPowerDecay; % Small drop if we learned something
+    end
+    
     g = g + 1;
-    toc
 end
 
-
 %% Output error statistics if required
 if ( nout >= 1 )
     varargout{1} = errStats;
 end
 
 %% Save hard-earned elite network
-winner = previousGen(1);
+winner = net;
 
 disp('Training time required:')
 toc
 
-%% Default plotting function
+    %% Default plotting function
     function defaultPlottingFunction(plotStats, errStats, evalOptions)
         if evalOptions(1) >= 0
             disp(['Generation: ' num2str(plotStats.generation) '  Fitness: ' num2str(mean(plotStats.fitness(:,1))) '  Mutation Power: ' num2str(plotStats.mutationPower)])
@@ -315,21 +272,21 @@ function defaultPlottingFunction(plotStats, errStats, evalOptions)
         drawnow
     end
 
-    function fitness = defaultFitnessFunction(J, Z0, Z1, dR, targ)
+    %% Default fitness function
+    function fitness = defaultFitnessFunction(Z1, targ)
         fitness = zeros(1,length(Z1));
         for cond = 1:length(Z1)
             ind = ~isnan(targ{cond});
-            
-            useZ0 = Z0{cond};
             useZ1 = Z1{cond}(ind);
-            usedR = dR{cond};
             useF = targ{cond}(ind);
             
-            err(1) = sum(abs(useZ1(:)-useF(:)));
-            %temp = J*usedR;
-            err(2) = 0;%sum(temp(:).^2) / size(usedR,2);%0.0*sum(abs(useZ0(:)));
-            
+            err(1) = sum(abs(useZ1(:)-useF(:)));       
             fitness(cond) = -sum(err);
         end
     end
+
+    %% Default output function
+    function [z, targetFeedforward] = defaultTargetFunction(~, r, ~, targetFeedforward)
+        z = r; % Just passes firing rate
+    end
 end
\ No newline at end of file
diff --git a/geneticRNN_learn_model_2.m b/geneticRNN_learn_model_2.m
deleted file mode 100644
index 90a0d1a..0000000
--- a/geneticRNN_learn_model_2.m
+++ /dev/null
@@ -1,343 +0,0 @@
-function [winner, varargout] = geneticRNN_learn_model(inp, mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, varargin)
-
-% net = hebbRNN_learn_model(x0, net, F, perturbProb, eta, varargin)
-%
-% This function trains a recurrent neural network using reward-modulated
-% Hebbian learning to produce desired outputs. During each trial the
-% activations of random neurons are randomly perturbed. All fluctuations in
-% the activation of each neuron are accumulated (supra-linearly) as an
-% elegibility trace. At the end of each trial the error of the output is
-% compared against the expected error and the difference is used to
-% reinforce connectivity changes (net.J) that produce the desired output.
-%
-% The details of training the network are based on those
-% presented in the following work:
-% "Flexible decision-making in recurrent neural networks trained with a
-% biologically plausible rule. Thomas Miconi (2016)"
-% Published on BioRxiv. The current version can be found under the following URL:
-% http://biorxiv.org/content/early/2016/07/26/057729
-%
-%
-% INPUTS:
-%
-% x0 -- the initial activation (t == 0) of all neurons
-% Must be of size: net.N x 1
-%
-% net -- the network structure created by hebbRNN_create_model
-%
-% F -- the desired output
-% Must be a cell of size: 1 x conditions
-% Each cell must be of size: net.B x time points
-%
-% perturbProb -- the probability of perturbing the activation of each neuron
-% per second
-%
-% eta -- the learning rate
-%
-%
-% OPTIONAL INPUTS:
-%
-% input -- the input to the network
-% Must be a cell of size: 1 x conditions
-% Each cell must be of size: net.I x time points
-% Default: []
-%
-% targettimes -- the time points used to generate the error signal
-% Default: entire trial
-%
-% beta -- the variance of the neural perturbation
-% Default: 0.5. Don't change this unless you know what you're doing
-%
-% maxdJ -- the absolute connectivity values above this level will be
-% clipped
-% Default: 1e-4. Don't change this unless you know what you're doing
-%
-% alphaX -- the weight given to previous time points of the activation
-% trace
-% Default: 0. Don't change this unless you know what you're doing
-%
-% alphaR -- the weight given to previous time points of the error
-% prediction trace
-% Default: 0.33. Don't change this unless you know what you're doing
-%
-% targetFun -- the handle of a function that uses the firing rates of the
-% output units to produce some desired output. Function must follow
-% conventions of supplied default function.
-% Default: @defaultTargetFunction
-%
-% targetFunPassthrough -- a user-defined structure that is automatically
-% passed through to the targetFun, permitting custom variables to be passed
-% Default: []
-%
-% tolerance -- at what error level below which the training will terminate
-% Default: 0 (will train forever).
-%
-% batchType -- conditions are train either in random order each pass
-% (pseudorand), or always in order (linear)
-% Default: 'pseudorand'
-%
-% plotFun -- the handle of a function that plots information about the
-% network during the learning process. Function must follow conventions
-% of supplied default function.
-% Default: @defaultPlottingFunction
-%
-% evalOpts -- a vector of size 2, specifying how much information should be
-% displayed during training (0 - nothing, 1 - text only, 2 - text +
-% figures), and how often the network should be evaluated. This vector is
-% passed to the plotting function.
-% Default: [0 50]
-%
-%
-% OUTPUTS:
-%
-% net -- the network structure
-%
-% errStats -- the structure containing error information from learning
-% (optional)
-%
-%
-% Copyright (c) Jonathan A Michaels 2016
-% German Primate Center
-% jonathanamichaels AT gmail DOT com
-%
-% If used in published work please see repository README.md for citation
-% and license information: https://github.com/JonathanAMichaels/hebbRNN
-
-
-% Start counting
-tic
-
-% Variable output considerations
-nout = max(nargout,1)-1;
-
-% Variable input considerations
-optargin = size(varargin,2);
-
-mutationPowerDecay = 0.99;
-mutationPowerDrop = 0.7;
-weightCompression = true;
-weightDecay = false;
-targetFun = @defaultTargetFunction; % Default output function (native)
-plotFun = @defaultPlottingFunction; % Default plotting function (native)
-fitnessFun = @defaultFitnessFunction; % Default fitness function (native)
-policyInitFun = @geneticRNN_create_model;
-policyInitInputsOptional = [];
-targetFunPassthrough = []; % Default passthrough to output function
-evalOpts = [1 1]; % Default evaluation values [plottingOptions evaluateEveryXIterations]
-
-for iVar = 1:2:optargin
-    switch varargin{iVar}            
-        case 'mutationPowerDecay'
-            mutationPowerDecay = varargin{iVar+1};
-        case 'mutationPowerDrop'
-            mutationPowerDrop = varargin{iVar+1};
-            
-        case 'weightCompression'
-            weightCompression = varargin{iVar+1};
-        case 'weightDecay'
-            weightDecay = varargin{iVar+1};
-            
-        case 'fitnessFun'
-            fitnessFun = varargin{iVar+1};
-        case 'policyInitFun'
-            policyInitFun = varargin{iVar+1};
-        case 'policyInitInputsOptional'
-            policyInitInputsOptional = varargin{iVar+1};
-            
-        case 'targetFun'
-            targetFun = varargin{iVar+1};
-        case 'targetFunPassthrough'
-            targetFunPassthrough = varargin{iVar+1};
-            
-            
-        case 'plotFun'
-            plotFun = varargin{iVar+1};
-        case 'evalOpts'
-            evalOpts = varargin{iVar+1};
-    end
-end
-
-%% Save options to network structure for posterity
-%
-
-%% Checks
-% The input can be either empty, or specified at each time point by the user.
-
-errStats.fitness = []; errStats.generation = []; % Initialize error statistics
-g = 1;
-allDecay1 = [];
-allDecay2 = [];
-allMutationPower = [];
-
-%% Main Program %%
-% Runs until tolerated error is met or stop button is pressed
-figure(97)
-set(gcf, 'Position', [0 50 100 50], 'MenuBar', 'none', 'ToolBar', 'none', 'Name', 'Stop', 'NumberTitle', 'off')
-UIButton = uicontrol('Style', 'togglebutton', 'String', 'STOP', 'Position', [0 0 100 50], 'FontSize', 25);
-while UIButton.Value == 0
-    tic
-    %% Initialize parameters
-    if weightCompression
-        decay1 = 1 - mutationPower;
-    else
-        decay1 = 1;
-    end
-    decay2 = mutationPower * 1e-1;
-    allDecay1 = cat(2, allDecay1, decay1);
-    allDecay2 = cat(2, allDecay2, decay2);
-    allMutationPower = cat(2, allMutationPower, mutationPower);
-    fitness = zeros(length(inp),populationSize);
-    
-    %% Generate random seeds
-    theseSeeds = randsample(1e8, populationSize);
-    if g > 1
-        previousSeeds = masterSeeds(randsample(size(masterSeeds,1), populationSize, true), :);
-        previousSeeds(1,:) = masterSeeds(1,:); % Save the elite!
-        theseSeeds(1) = nan; % Save the elite!
-        sendSeeds = [previousSeeds, theseSeeds];
-    else
-        sendSeeds = theseSeeds;
-    end
-    
-    %% Heavy lifting
-    parfor i = 1:populationSize
-        % Hack the random number generator
-        stream = RandStream('mrg32k3a');
-        RandStream.setGlobalStream(stream);
-        stream.Substream = i;
-        % Rollout the model based on the random seeds
-        net = geneticRNN_rollout_model(policyInitFun, policyInitInputs, policyInitInputsOptional, allMutationPower, allDecay1, allDecay2, weightDecay, sendSeeds(i,:));
-        % Run model
-        [~, Z1, ~, ~] = geneticRNN_run_model(net, inp, 'targetFun', targetFun, 'targetFunPassthrough', targetFunPassthrough);
-        % Assess fitness
-        fitness(:,i) = fitnessFun(Z1, fitnessFunInputs);
-    end
-    
-    %% Sort and save best policies
-    [~, sortInd] = sort(mean(fitness,1), 'descend');
-    fitness = fitness(:,sortInd(1:truncationSize));
-    masterSeeds = sendSeeds(sortInd(1:truncationSize),:);
-    
-
-    %% Recalculate best network for plotting or output
-    % Hack the random number generator
-    stream = RandStream('mrg32k3a');
-    RandStream.setGlobalStream(stream);
-    stream.Substream = sortInd(1);
-    % Rollout the model based on the random seeds
-    net = geneticRNN_rollout_model(policyInitFun, policyInitInputs, policyInitInputsOptional, allMutationPower, allDecay1, allDecay2, weightDecay, masterSeeds(1,:));
-    % Run model
-    [~, Z1, R, ~] = geneticRNN_run_model(net, inp, 'targetFun', targetFun, 'targetFunPassthrough', targetFunPassthrough);
-    % Assess fitness
-    check = fitnessFun(Z1, fitnessFunInputs);
-    
-    
-    disp(mean(check))
-    disp(mean(fitness(:,1)))
-    
-    %% Save stats
-    errStats.fitness(:,end+1) = fitness(:,1);
-    errStats.generation(end+1) = g;
-    
-    %% Populate statistics for plotting function
-    plotStats.fitness = fitness;
-    plotStats.mutationPower = mutationPower;
-    plotStats.generation = g;
-    plotStats.bigZ1 = Z1;
-    plotStats.bigR = R;
-    plotStats.targ = fitnessFunInputs;
-    
-    %% Run supplied plotting function
-    if mod(g,evalOpts(2)) == 0
-        plotFun(plotStats, errStats, evalOpts)
-    end
-    
-    %% Decay mutation power
-    if sortInd(1) == 1
-        mutationPower = mutationPower * mutationPowerDrop; % Big drop if we didn't learn anything
-    else
-        mutationPower = mutationPower * mutationPowerDecay; % Small drop if we learned something
-    end
-    
-    g = g + 1;
-    toc
-end
-
-
-%% Output error statistics if required
-if ( nout >= 1 )
-    varargout{1} = errStats;
-end
-
-%% Save hard-earned elite network
-winner = net;
-
-disp('Training time required:')
-toc
-
-
-%% Default plotting function
-    function defaultPlottingFunction(plotStats, errStats, evalOptions)
-        if evalOptions(1) >= 0
-            disp(['Generation: ' num2str(plotStats.generation) '  Fitness: ' num2str(mean(plotStats.fitness(:,1))) '  Mutation Power: ' num2str(plotStats.mutationPower)])
-        end
-        if evalOptions(1) >= 1
-            figure(98)
-            set(gcf, 'Name', 'Error', 'NumberTitle', 'off')
-            c = lines(size(plotStats.fitness,1));
-            for type = 1:size(plotStats.fitness,1)
-                h1(type) = plot(plotStats.generation, plotStats.fitness(type,1), '.', 'MarkerSize', 20, 'Color', c(type,:));
-                hold on
-            end
-            plot(plotStats.generation, mean(plotStats.fitness(:,1),1), '.', 'MarkerSize', 40, 'Color', [0 0 0]);
-            set(gca, 'XLim', [1 plotStats.generation+0.1])
-            xlabel('Generation')
-            ylabel('Fitness')
-        end
-        if evalOptions(1) >= 2
-            figure(99)
-            set(gcf, 'Name', 'Output and Neural Activity', 'NumberTitle', 'off')
-            clf
-            subplot(4,1,1)
-            hold on
-            c = lines(length(plotStats.bigZ1));
-            for condCount = 1:length(plotStats.bigZ1)
-                h2(condCount,:) = plot(plotStats.bigZ1{condCount}', 'Color', c(condCount,:));
-                h3(condCount,:) = plot(plotStats.targ{condCount}', '.', 'MarkerSize', 8, 'Color', c(condCount,:));
-            end
-            legend([h2(1,1) h3(1,1)], 'Network Output', 'Target Output', 'Location', 'SouthWest')
-            xlabel('Time Steps')
-            ylabel('Output')
-            set(gca, 'XLim', [1 size(plotStats.bigZ1{1},2)])
-            for n = 1:3
-                subplot(4,1,n+1)
-                hold on
-                for condCount = 1:length(plotStats.bigR)
-                    plot(plotStats.bigR{condCount}(n,:)', 'Color', c(condCount,:))
-                end
-                xlabel('Time Steps')
-                ylabel(['Firing Rate (Neuron ' num2str(n) ')'])
-                set(gca, 'XLim', [1 size(plotStats.bigR{1},2)])
-            end
-        end
-        drawnow
-    end
-
-    function fitness = defaultFitnessFunction(Z1, targ)
-        fitness = zeros(1,length(Z1));
-        for cond = 1:length(Z1)
-            ind = ~isnan(targ{cond});
-            useZ1 = Z1{cond}(ind);
-            useF = targ{cond}(ind);
-            
-            err(1) = sum(abs(useZ1(:)-useF(:)));       
-            fitness(cond) = -sum(err);
-        end
-    end
-
-
-%% Default output function
-    function [z, targetFeedforward] = defaultTargetFunction(~, r, ~, targetFeedforward)
-        z = r; % Just passes firing rate
-    end
-end
\ No newline at end of file
diff --git a/geneticRNN_learn_model_2.m~ b/geneticRNN_learn_model_2.m~
deleted file mode 100644
index 6f5013c..0000000
--- a/geneticRNN_learn_model_2.m~
+++ /dev/null
@@ -1,349 +0,0 @@
-function [winner, varargout] = geneticRNN_learn_model(mutationPower, populationSize, truncationSize, fitnessFunInputs, policyInitInputs, varargin)
-
-% net = hebbRNN_learn_model(x0, net, F, perturbProb, eta, varargin)
-%
-% This function trains a recurrent neural network using reward-modulated
-% Hebbian learning to produce desired outputs. During each trial the
-% activations of random neurons are randomly perturbed. All fluctuations in
-% the activation of each neuron are accumulated (supra-linearly) as an
-% elegibility trace. At the end of each trial the error of the output is
-% compared against the expected error and the difference is used to
-% reinforce connectivity changes (net.J) that produce the desired output.
-%
-% The details of training the network are based on those
-% presented in the following work:
-% "Flexible decision-making in recurrent neural networks trained with a
-% biologically plausible rule. Thomas Miconi (2016)"
-% Published on BioRxiv. The current version can be found under the following URL:
-% http://biorxiv.org/content/early/2016/07/26/057729
-%
-%
-% INPUTS:
-%
-% x0 -- the initial activation (t == 0) of all neurons
-% Must be of size: net.N x 1
-%
-% net -- the network structure created by hebbRNN_create_model
-%
-% F -- the desired output
-% Must be a cell of size: 1 x conditions
-% Each cell must be of size: net.B x time points
-%
-% perturbProb -- the probability of perturbing the activation of each neuron
-% per second
-%
-% eta -- the learning rate
-%
-%
-% OPTIONAL INPUTS:
-%
-% input -- the input to the network
-% Must be a cell of size: 1 x conditions
-% Each cell must be of size: net.I x time points
-% Default: []
-%
-% targettimes -- the time points used to generate the error signal
-% Default: entire trial
-%
-% beta -- the variance of the neural perturbation
-% Default: 0.5. Don't change this unless you know what you're doing
-%
-% maxdJ -- the absolute connectivity values above this level will be
-% clipped
-% Default: 1e-4. Don't change this unless you know what you're doing
-%
-% alphaX -- the weight given to previous time points of the activation
-% trace
-% Default: 0. Don't change this unless you know what you're doing
-%
-% alphaR -- the weight given to previous time points of the error
-% prediction trace
-% Default: 0.33. Don't change this unless you know what you're doing
-%
-% targetFun -- the handle of a function that uses the firing rates of the
-% output units to produce some desired output. Function must follow
-% conventions of supplied default function.
-% Default: @defaultTargetFunction
-%
-% targetFunPassthrough -- a user-defined structure that is automatically
-% passed through to the targetFun, permitting custom variables to be passed
-% Default: []
-%
-% tolerance -- at what error level below which the training will terminate
-% Default: 0 (will train forever).
-%
-% batchType -- conditions are train either in random order each pass
-% (pseudorand), or always in order (linear)
-% Default: 'pseudorand'
-%
-% plotFun -- the handle of a function that plots information about the
-% network during the learning process. Function must follow conventions
-% of supplied default function.
-% Default: @defaultPlottingFunction
-%
-% evalOpts -- a vector of size 2, specifying how much information should be
-% displayed during training (0 - nothing, 1 - text only, 2 - text +
-% figures), and how often the network should be evaluated. This vector is
-% passed to the plotting function.
-% Default: [0 50]
-%
-%
-% OUTPUTS:
-%
-% net -- the network structure
-%
-% errStats -- the structure containing error information from learning
-% (optional)
-%
-%
-% Copyright (c) Jonathan A Michaels 2016
-% German Primate Center
-% jonathanamichaels AT gmail DOT com
-%
-% If used in published work please see repository README.md for citation
-% and license information: https://github.com/JonathanAMichaels/hebbRNN
-
-
-% Start counting
-tic
-
-% Variable output considerations
-nout = max(nargout,1)-1;
-
-% Variable input considerations
-optargin = size(varargin,2);
-
-inp = []; % Default inputs
-mutationPowerDecay = 0.99;
-mutationPowerDrop = 0.7;
-weightCompression = true;
-weightDecay = false;
-targetFun = @defaultTargetFunction; % Default output function (native)
-plotFun = @defaultPlottingFunction; % Default plotting function (native)
-fitnessFun = @defaultFitnessFunction; % Default fitness function (native)
-policyInitFun = @geneticRNN_create_model;
-policyInitInputsOptional = [];
-targetFunPassthrough = []; % Default passthrough to output function
-evalOpts = [1 1]; % Default evaluation values [plottingOptions evaluateEveryXIterations]
-
-for iVar = 1:2:optargin
-    switch varargin{iVar}
-        
-        case 'input'
-            inp = varargin{iVar+1};
-            
-        case 'mutationPowerDecay'
-            mutationPowerDecay = varargin{iVar+1};
-        case 'mutationPowerDrop'
-            mutationPowerDrop = varargin{iVar+1};
-            
-        case 'weightCompression'
-            weightCompression = varargin{iVar+1};
-        case 'weightDecay'
-            weightDecay = varargin{iVar+1};
-            
-        case 'fitnessFun'
-            fitnessFun = varargin{iVar+1};
-        case 'policyInitFun'
-            policyInitFun = varargin{iVar+1};
-        case 'policyInitInputsOptional'
-            policyInitInputsOptional = varargin{iVar+1};
-            
-        case 'targetFun'
-            targetFun = varargin{iVar+1};
-        case 'targetFunPassthrough'
-            targetFunPassthrough = varargin{iVar+1};
-            
-            
-        case 'plotFun'
-            plotFun = varargin{iVar+1};
-        case 'evalOpts'
-            evalOpts = varargin{iVar+1};
-    end
-end
-
-%% Save options to network structure for posterity
-%
-
-%% Checks
-% The input can be either empty, or specified at each time point by the user.
-
-errStats.fitness = []; errStats.generation = []; % Initialize error statistics
-g = 1;
-allDecay1 = [];
-allDecay2 = [];
-allMutationPower = [];
-
-%% Main Program %%
-% Runs until tolerated error is met or stop button is pressed
-figure(97)
-set(gcf, 'Position', [0 0 100 50], 'MenuBar', 'none', 'ToolBar', 'none', 'Name', 'Stop', 'NumberTitle', 'off')
-UIButton = uicontrol('Style', 'togglebutton', 'String', 'STOP', 'Position', [0 0 100 50], 'FontSize', 25);
-while UIButton.Value == 0
-    
-    tic
-    fitness = zeros(length(inp),populationSize);
-    
-    if weightCompression
-        decay1 = 1 - mutationPower;
-    else
-        decay1 = 1;
-    end
-    decay2 = mutationPower * 1e-1;
-    
-    theseSeeds = randsample(1e8, populationSize);
-    if g > 1
-        previousSeeds = masterSeeds(randsample(size(masterSeeds,1), populationSize, true), :);
-        previousSeeds(1,:) = masterSeeds(1,:);
-        theseSeeds(1) = nan;
-        sendSeeds = [previousSeeds, theseSeeds];
-    else
-        sendSeeds = theseSeeds;
-    end
-    allDecay1 = cat(2, allDecay1, decay1);
-    allDecay2 = cat(2, allDecay2, decay2);
-    allMutationPower = cat(2, allMutationPower, mutationPower);
-    
-    parfor i = 1:populationSize
-        stream = RandStream('mrg32k3a');
-        RandStream.setGlobalStream(stream);
-        stream.Substream = i;
-        
-        net = geneticRNN_rollout_model(policyInitFun, policyInitInputs, policyInitInputsOptional, allMutationPower, allDecay1, allDecay2, weightDecay, sendSeeds(i,:));
-        % Run model
-        [Z0, Z1, ~, dR, ~] = geneticRNN_run_model(net, 'input', inp, 'targetFun', targetFun, 'targetFunPassthrough', targetFunPassthrough);
-        % Assess fitness
-        fitness(:,i) = fitnessFun(net.J, Z0, Z1, dR, fitnessFunInputs);
-    end
-    
-    [~, sortInd] = sort(mean(fitness,1), 'descend');
-    fitness = fitness(:,sortInd(1:truncationSize));
-    masterSeeds = sendSeeds(sortInd(1:truncationSize),:);
-    
-   sendSeeds = masterSeed(1,:)
-   useInd = sortInd(1);
-   parfor i = 1
-        stream = RandStream('mrg32k3a');
-        RandStream.setGlobalStream(stream);
-        stream.Substream = useInd;
-        
-        net = geneticRNN_rollout_model(policyInitFun, policyInitInputs, policyInitInputsOptional, allMutationPower, allDecay1, allDecay2, weightDecay, sendSeeds);
-        % Run model
-        [Z0, Z1{i}, R{i}, dR, ~] = geneticRNN_run_model(net, 'input', inp, 'targetFun', targetFun, 'targetFunPassthrough', targetFunPassthrough);
-        % Assess fitness
-        check{i} = fitnessFun(net.J, Z0, Z1, dR, fitnessFunInputs);
-    end
-    
-    disp(mean(check{1}))
-    disp(mean(fitness(:,1)))
-    
-    %% Save stats
-    errStats.fitness(:,end+1) = fitness(:,1);
-    errStats.generation(end+1) = g;
-    
-    %% Populate statistics for plotting function
-    plotStats.fitness = fitness;
-    plotStats.mutationPower = mutationPower;
-    plotStats.generation = g;
-    plotStats.bigZ1 = Z1;
-    plotStats.bigR = R;
-    plotStats.targ = fitnessFunInputs;
-    
-    %% Run supplied plotting function
-    if mod(g,evalOpts(2)) == 0
-        plotFun(plotStats, errStats, evalOpts)
-    end
-    
-    if sortInd(1) == 1
-        mutationPower = mutationPower * mutationPowerDrop;
-    else
-        mutationPower = mutationPower * mutationPowerDecay;
-    end
-    g = g + 1;
-    toc
-end
-
-
-%% Output error statistics if required
-if ( nout >= 1 )
-    varargout{1} = errStats;
-end
-
-%% Save hard-earned elite network
-winner = bestNet;
-
-disp('Training time required:')
-toc
-
-
-%% Default plotting function
-    function defaultPlottingFunction(plotStats, errStats, evalOptions)
-        if evalOptions(1) >= 0
-            disp(['Generation: ' num2str(plotStats.generation) '  Fitness: ' num2str(mean(plotStats.fitness(:,1))) '  Mutation Power: ' num2str(plotStats.mutationPower)])
-        end
-        if evalOptions(1) >= 1
-            figure(98)
-            set(gcf, 'Name', 'Error', 'NumberTitle', 'off')
-            c = lines(size(plotStats.fitness,1));
-            for type = 1:size(plotStats.fitness,1)
-                h1(type) = plot(plotStats.generation, plotStats.fitness(type,1), '.', 'MarkerSize', 20, 'Color', c(type,:));
-                hold on
-            end
-            plot(plotStats.generation, mean(plotStats.fitness(:,1),1), '.', 'MarkerSize', 40, 'Color', [0 0 0]);
-            set(gca, 'XLim', [1 plotStats.generation+0.1])
-            xlabel('Generation')
-            ylabel('Fitness')
-        end
-        if evalOptions(1) >= 2
-            figure(99)
-            set(gcf, 'Name', 'Output and Neural Activity', 'NumberTitle', 'off')
-            clf
-            subplot(4,1,1)
-            hold on
-            c = lines(length(plotStats.bigZ1));
-            for condCount = 1:length(plotStats.bigZ1)
-                h2(condCount,:) = plot(plotStats.bigZ1{condCount}', 'Color', c(condCount,:));
-                h3(condCount,:) = plot(plotStats.targ{condCount}', '.', 'MarkerSize', 8, 'Color', c(condCount,:));
-            end
-            legend([h2(1,1) h3(1,1)], 'Network Output', 'Target Output', 'Location', 'SouthWest')
-            xlabel('Time Steps')
-            ylabel('Output')
-            set(gca, 'XLim', [1 size(plotStats.bigZ1{1},2)])
-            for n = 1:3
-                subplot(4,1,n+1)
-                hold on
-                for condCount = 1:length(plotStats.bigR)
-                    plot(plotStats.bigR{condCount}(n,:)', 'Color', c(condCount,:))
-                end
-                xlabel('Time Steps')
-                ylabel(['Firing Rate (Neuron ' num2str(n) ')'])
-                set(gca, 'XLim', [1 size(plotStats.bigR{1},2)])
-            end
-        end
-        drawnow
-    end
-
-    function fitness = defaultFitnessFunction(J, Z0, Z1, dR, targ)
-        fitness = zeros(1,length(Z1));
-        for cond = 1:length(Z1)
-            ind = ~isnan(targ{cond});
-            
-            useZ0 = Z0{cond};
-            useZ1 = Z1{cond}(ind);
-            usedR = dR{cond};
-            useF = targ{cond}(ind);
-            
-            err(1) = sum(abs(useZ1(:)-useF(:)));
-            %temp = J*usedR;
-            err(2) = 0;%sum(temp(:).^2) / size(usedR,2);%0.0*sum(abs(useZ0(:)));
-            
-            fitness(cond) = -sum(err);
-        end
-    end
-
-
-%% Default output function
-    function [z, targetFeedforward] = defaultTargetFunction(~, r, ~, targetFeedforward)
-        z = r; % Just passes firing rate
-    end
-end
\ No newline at end of file
diff --git a/geneticRNN_rollout_model.m b/geneticRNN_rollout_model.m
index 222b9ef..73900f8 100644
--- a/geneticRNN_rollout_model.m
+++ b/geneticRNN_rollout_model.m
@@ -20,7 +20,7 @@
 %
 % weightDecay -- Whether or not to perform weight decay (logical)
 %
-% seeds - Vector of random generator seeds to rollout
+% seeds -- Vector of random generator seeds to rollout
 %
 %
 % OUTPUTS: