XCSF  1.4.7
XCSF learning classifier system
neural_layer_lstm.c
Go to the documentation of this file.
1 /*
2  * This program is free software: you can redistribute it and/or modify
3  * it under the terms of the GNU General Public License as published by
4  * the Free Software Foundation, either version 3 of the License, or
5  * (at your option) any later version.
6  *
7  * This program is distributed in the hope that it will be useful,
8  * but WITHOUT ANY WARRANTY; without even the implied warranty of
9  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10  * GNU General Public License for more details.
11  *
12  * You should have received a copy of the GNU General Public License
13  * along with this program. If not, see <http://www.gnu.org/licenses/>.
14  */
15 
26 #include "neural_layer_lstm.h"
27 #include "blas.h"
28 #include "neural_activations.h"
29 #include "neural_layer_connected.h"
30 #include "sam.h"
31 #include "utils.h"
32 
33 #define N_MU (6)
34 
38 static const int MU_TYPE[N_MU] = {
45 };
46 
51 static void
53 {
54  l->n_weights = l->uf->n_weights + l->ui->n_weights + l->ug->n_weights +
55  l->uo->n_weights + l->wf->n_weights + l->wi->n_weights +
56  l->wg->n_weights + l->wo->n_weights;
57 }
58 
63 static void
65 {
66  l->n_biases = l->uf->n_biases + l->ui->n_biases + l->ug->n_biases +
67  l->uo->n_biases + l->wf->n_biases + l->wi->n_biases + l->wg->n_biases +
68  l->wo->n_biases;
69 }
70 
75 static void
77 {
78  l->n_active = l->uf->n_active + l->ui->n_active + l->ug->n_active +
79  l->uo->n_active + l->wf->n_active + l->wi->n_active + l->wg->n_active +
80  l->wo->n_active;
81 }
82 
87 static void
89 {
91  l->delta = calloc(l->n_outputs, sizeof(double));
92  l->output = calloc(l->n_outputs, sizeof(double));
93  l->state = calloc(l->n_outputs, sizeof(double));
94  l->prev_state = calloc(l->n_outputs, sizeof(double));
95  l->prev_cell = calloc(l->n_outputs, sizeof(double));
96  l->cell = calloc(l->n_outputs, sizeof(double));
97  l->f = calloc(l->n_outputs, sizeof(double));
98  l->i = calloc(l->n_outputs, sizeof(double));
99  l->g = calloc(l->n_outputs, sizeof(double));
100  l->o = calloc(l->n_outputs, sizeof(double));
101  l->c = calloc(l->n_outputs, sizeof(double));
102  l->h = calloc(l->n_outputs, sizeof(double));
103  l->temp = calloc(l->n_outputs, sizeof(double));
104  l->temp2 = calloc(l->n_outputs, sizeof(double));
105  l->temp3 = calloc(l->n_outputs, sizeof(double));
106  l->dc = calloc(l->n_outputs, sizeof(double));
107 }
108 
113 static void
115 {
116  l->uf = malloc(sizeof(struct Layer));
117  l->ui = malloc(sizeof(struct Layer));
118  l->ug = malloc(sizeof(struct Layer));
119  l->uo = malloc(sizeof(struct Layer));
120  l->wf = malloc(sizeof(struct Layer));
121  l->wi = malloc(sizeof(struct Layer));
122  l->wg = malloc(sizeof(struct Layer));
123  l->wo = malloc(sizeof(struct Layer));
124 }
125 
130 static void
131 free_layer_arrays(const struct Layer *l)
132 {
133  free(l->delta);
134  free(l->output);
135  free(l->state);
136  free(l->prev_state);
137  free(l->prev_cell);
138  free(l->cell);
139  free(l->f);
140  free(l->i);
141  free(l->g);
142  free(l->o);
143  free(l->c);
144  free(l->h);
145  free(l->temp);
146  free(l->temp2);
147  free(l->temp3);
148  free(l->dc);
149 }
150 
155 static void
156 set_eta(struct Layer *l)
157 {
158  l->eta = l->uf->eta;
159  l->ui->eta = l->eta;
160  l->ug->eta = l->eta;
161  l->uo->eta = l->eta;
162  l->wf->eta = l->eta;
163  l->wi->eta = l->eta;
164  l->wg->eta = l->eta;
165  l->wo->eta = l->eta;
166 }
167 
172 static void
173 reset_layer_deltas(const struct Layer *l)
174 {
175  size_t size = l->n_outputs * sizeof(double);
176  memset(l->wf->delta, 0, size);
177  memset(l->wi->delta, 0, size);
178  memset(l->wg->delta, 0, size);
179  memset(l->wo->delta, 0, size);
180  memset(l->uf->delta, 0, size);
181  memset(l->ui->delta, 0, size);
182  memset(l->ug->delta, 0, size);
183  memset(l->uo->delta, 0, size);
184 }
185 
191 static bool
192 mutate_eta(struct Layer *l)
193 {
194  if (layer_mutate_eta(l->uf, l->mu[0])) {
195  set_eta(l);
196  return true;
197  }
198  return false;
199 }
200 
206 static bool
208 {
209  const int n = layer_mutate_neurons(l->uf, l->mu[1]);
210  if (n != 0) {
211  layer_add_neurons(l->uf, n);
212  layer_add_neurons(l->ui, n);
213  layer_add_neurons(l->ug, n);
214  layer_add_neurons(l->uo, n);
215  layer_add_neurons(l->wf, n);
216  layer_add_neurons(l->wi, n);
217  layer_add_neurons(l->wg, n);
218  layer_add_neurons(l->wo, n);
219  layer_resize(l->wf, l->uf);
220  layer_resize(l->wi, l->uf);
221  layer_resize(l->wg, l->uf);
222  layer_resize(l->wo, l->uf);
223  l->n_outputs = l->uf->n_outputs;
224  l->out_w = l->n_outputs;
225  l->out_c = 1;
226  l->out_h = 1;
232  return true;
233  }
234  return false;
235 }
236 
242 static bool
244 {
245  bool mod = false;
246  mod = layer_mutate_connectivity(l->uf, l->mu[2], l->mu[3]) ? true : mod;
247  mod = layer_mutate_connectivity(l->ui, l->mu[2], l->mu[3]) ? true : mod;
248  mod = layer_mutate_connectivity(l->ug, l->mu[2], l->mu[3]) ? true : mod;
249  mod = layer_mutate_connectivity(l->uo, l->mu[2], l->mu[3]) ? true : mod;
250  mod = layer_mutate_connectivity(l->wf, l->mu[2], l->mu[3]) ? true : mod;
251  mod = layer_mutate_connectivity(l->wi, l->mu[2], l->mu[3]) ? true : mod;
252  mod = layer_mutate_connectivity(l->wg, l->mu[2], l->mu[3]) ? true : mod;
253  mod = layer_mutate_connectivity(l->wo, l->mu[2], l->mu[3]) ? true : mod;
255  return mod;
256 }
257 
263 static bool
265 {
266  bool mod = false;
267  mod = layer_mutate_weights(l->uf, l->mu[4]) ? true : mod;
268  mod = layer_mutate_weights(l->ui, l->mu[4]) ? true : mod;
269  mod = layer_mutate_weights(l->ug, l->mu[4]) ? true : mod;
270  mod = layer_mutate_weights(l->uo, l->mu[4]) ? true : mod;
271  mod = layer_mutate_weights(l->wf, l->mu[4]) ? true : mod;
272  mod = layer_mutate_weights(l->wi, l->mu[4]) ? true : mod;
273  mod = layer_mutate_weights(l->wg, l->mu[4]) ? true : mod;
274  mod = layer_mutate_weights(l->wo, l->mu[4]) ? true : mod;
275  return mod;
276 }
277 
283 void
284 neural_layer_lstm_init(struct Layer *l, const struct ArgsLayer *args)
285 {
286  l->options = layer_args_opt(args);
287  l->function = args->function;
289  l->n_inputs = args->n_inputs;
290  l->n_outputs = args->n_init;
291  l->max_outputs = args->n_max;
292  l->out_w = l->n_outputs;
293  l->out_c = 1;
294  l->out_h = 1;
295  l->eta_max = args->eta;
296  l->momentum = args->momentum;
297  l->max_neuron_grow = args->max_neuron_grow;
298  l->decay = args->decay;
299  struct ArgsLayer *cargs = layer_args_copy(args);
300  cargs->type = CONNECTED; // lstm is composed of 8 connected layers
301  cargs->function = LINEAR;
302  l->uf = layer_init(cargs); // input layers
303  l->ui = layer_init(cargs);
304  l->ug = layer_init(cargs);
305  l->uo = layer_init(cargs);
306  cargs->n_inputs = cargs->n_init;
307  l->wf = layer_init(cargs); // self layers
308  l->wi = layer_init(cargs);
309  l->wg = layer_init(cargs);
310  l->wo = layer_init(cargs);
311  free(cargs);
315  set_eta(l);
317  l->mu = malloc(sizeof(double) * N_MU);
318  sam_init(l->mu, N_MU, MU_TYPE);
319 }
320 
326 struct Layer *
327 neural_layer_lstm_copy(const struct Layer *src)
328 {
329  if (src->type != LSTM) {
330  printf("neural_layer_lstm_copy(): incorrect source layer type\n");
331  exit(EXIT_FAILURE);
332  }
333  struct Layer *l = malloc(sizeof(struct Layer));
334  layer_defaults(l);
335  l->type = src->type;
336  l->layer_vptr = src->layer_vptr;
337  l->function = src->function;
339  l->options = src->options;
340  l->n_inputs = src->n_inputs;
341  l->n_outputs = src->n_outputs;
342  l->out_w = src->out_w;
343  l->out_h = src->out_h;
344  l->out_c = src->out_c;
345  l->n_weights = src->n_weights;
346  l->n_biases = src->n_biases;
347  l->n_active = src->n_active;
348  l->eta = src->eta;
349  l->eta_max = src->eta_max;
350  l->momentum = src->momentum;
351  l->decay = src->decay;
353  l->max_outputs = src->max_outputs;
354  l->uf = layer_copy(src->uf);
355  l->ui = layer_copy(src->ui);
356  l->ug = layer_copy(src->ug);
357  l->uo = layer_copy(src->uo);
358  l->wf = layer_copy(src->wf);
359  l->wi = layer_copy(src->wi);
360  l->wg = layer_copy(src->wg);
361  l->wo = layer_copy(src->wo);
363  l->mu = malloc(sizeof(double) * N_MU);
364  memcpy(l->mu, src->mu, sizeof(double) * N_MU);
365  return l;
366 }
367 
372 void
374 {
375  layer_free(l->uf);
376  layer_free(l->ui);
377  layer_free(l->ug);
378  layer_free(l->uo);
379  layer_free(l->wf);
380  layer_free(l->wi);
381  layer_free(l->wg);
382  layer_free(l->wo);
383  free(l->uf);
384  free(l->ui);
385  free(l->ug);
386  free(l->uo);
387  free(l->wf);
388  free(l->wi);
389  free(l->wg);
390  free(l->wo);
392  free(l->mu);
393 }
394 
399 void
401 {
402  layer_rand(l->uf);
403  layer_rand(l->ui);
404  layer_rand(l->ug);
405  layer_rand(l->uo);
406  layer_rand(l->wf);
407  layer_rand(l->wi);
408  layer_rand(l->wg);
409  layer_rand(l->wo);
410 }
411 
418 void
419 neural_layer_lstm_forward(const struct Layer *l, const struct Net *net,
420  const double *input)
421 {
422  layer_forward(l->uf, net, input);
423  layer_forward(l->ui, net, input);
424  layer_forward(l->ug, net, input);
425  layer_forward(l->uo, net, input);
426  layer_forward(l->wf, net, l->h);
427  layer_forward(l->wi, net, l->h);
428  layer_forward(l->wg, net, l->h);
429  layer_forward(l->wo, net, l->h);
430  memcpy(l->f, l->wf->output, sizeof(double) * l->n_outputs);
431  blas_axpy(l->n_outputs, 1, l->uf->output, 1, l->f, 1);
432  memcpy(l->i, l->wi->output, sizeof(double) * l->n_outputs);
433  blas_axpy(l->n_outputs, 1, l->ui->output, 1, l->i, 1);
434  memcpy(l->g, l->wg->output, sizeof(double) * l->n_outputs);
435  blas_axpy(l->n_outputs, 1, l->ug->output, 1, l->g, 1);
436  memcpy(l->o, l->wo->output, sizeof(double) * l->n_outputs);
437  blas_axpy(l->n_outputs, 1, l->uo->output, 1, l->o, 1);
440  neural_activate_array(l->g, l->g, l->n_outputs, l->function);
442  memcpy(l->temp, l->i, sizeof(double) * l->n_outputs);
443  blas_mul(l->n_outputs, l->g, 1, l->temp, 1);
444  blas_mul(l->n_outputs, l->f, 1, l->c, 1);
445  blas_axpy(l->n_outputs, 1, l->temp, 1, l->c, 1);
446  memcpy(l->h, l->c, sizeof(double) * l->n_outputs);
447  neural_activate_array(l->h, l->h, l->n_outputs, l->function);
448  blas_mul(l->n_outputs, l->o, 1, l->h, 1);
449  memcpy(l->cell, l->c, sizeof(double) * l->n_outputs);
450  memcpy(l->output, l->h, sizeof(double) * l->n_outputs);
451 }
452 
/**
 * @brief Backward propagates an LSTM layer.
 * @details Distributes the layer delta through the output, candidate, input
 * and forget gates, backward propagating each of the 8 sub-layers, and
 * accumulates the carried cell-state gradient in l->dc for the next step.
 * NOTE(review): this extract appears to have elided the activation-gradient
 * steps (neural_activate_array / neural_gradient_array calls) and the
 * initial reset_layer_deltas() call that normally interleave the products
 * below — confirm against the upstream source before relying on this body.
 * @param [in] l The layer to backward propagate.
 * @param [in] net Network containing the layer.
 * @param [in] input The input to the layer.
 * @param [out] delta The previous layer's error (set by the u* backward
 * passes; may be NULL/0 for the recurrent w* passes).
 */
void
neural_layer_lstm_backward(const struct Layer *l, const struct Net *net,
                           const double *input, double *delta)
{
    /* temp3 = incoming delta; temp = current cell state */
    memcpy(l->temp3, l->delta, sizeof(double) * l->n_outputs);
    memcpy(l->temp, l->c, sizeof(double) * l->n_outputs);
    /* cell-state gradient: temp2 = delta * o (+ carried dc) */
    memcpy(l->temp2, l->temp3, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->o, 1, l->temp2, 1);
    blas_axpy(l->n_outputs, 1, l->dc, 1, l->temp2, 1);
    /* output gate gradient: temp = delta * activate(c) */
    memcpy(l->temp, l->c, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->temp3, 1, l->temp, 1);
    /* propagate through recurrent and input projections of o */
    memcpy(l->wo->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->wo, net, l->prev_state, 0);
    memcpy(l->uo->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->uo, net, input, delta);
    /* candidate gate gradient: temp = temp2 * i */
    memcpy(l->temp, l->temp2, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->i, 1, l->temp, 1);
    memcpy(l->wg->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->wg, net, l->prev_state, 0);
    memcpy(l->ug->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->ug, net, input, delta);
    /* input gate gradient: temp = temp2 * g */
    memcpy(l->temp, l->temp2, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->g, 1, l->temp, 1);
    memcpy(l->wi->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->wi, net, l->prev_state, 0);
    memcpy(l->ui->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->ui, net, input, delta);
    /* forget gate gradient: temp = temp2 * prev_cell */
    memcpy(l->temp, l->temp2, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->prev_cell, 1, l->temp, 1);
    memcpy(l->wf->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->wf, net, l->prev_state, 0);
    memcpy(l->uf->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->uf, net, input, delta);
    /* carry the cell-state gradient to the next step: dc = temp2 * f */
    memcpy(l->temp, l->temp2, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->f, 1, l->temp, 1);
    memcpy(l->dc, l->temp, sizeof(double) * l->n_outputs);
}
505 
510 void
512 {
513  if (l->options & LAYER_SGD_WEIGHTS && l->eta > 0) {
514  layer_update(l->wf);
515  layer_update(l->wi);
516  layer_update(l->wg);
517  layer_update(l->wo);
518  layer_update(l->uf);
519  layer_update(l->ui);
520  layer_update(l->ug);
521  layer_update(l->uo);
522  }
523 }
524 
530 void
531 neural_layer_lstm_resize(struct Layer *l, const struct Layer *prev)
532 {
533  layer_resize(l->uf, prev);
534  layer_resize(l->ui, prev);
535  layer_resize(l->ug, prev);
536  layer_resize(l->uo, prev);
537  layer_resize(l->uf, prev);
538  l->n_inputs = prev->n_outputs;
542 }
543 
549 double *
551 {
552  return l->output;
553 }
554 
560 bool
562 {
563  sam_adapt(l->mu, N_MU, MU_TYPE);
564  bool mod = false;
565  if ((l->options & LAYER_EVOLVE_ETA) && mutate_eta(l)) {
566  mod = true;
567  }
568  if ((l->options & LAYER_EVOLVE_NEURONS) && mutate_neurons(l)) {
569  mod = true;
570  }
572  mod = true;
573  }
574  if ((l->options & LAYER_EVOLVE_WEIGHTS) && mutate_weights(l)) {
575  mod = true;
576  }
577  if ((l->options & LAYER_EVOLVE_FUNCTIONS) &&
578  layer_mutate_functions(l, l->mu[5])) {
579  mod = true;
580  }
581  return mod;
582 }
583 
/**
 * @brief Prints an LSTM layer as json to stdout.
 * @param [in] l The layer to print.
 * @param [in] print_weights Whether to include the layer weights.
 */
void
neural_layer_lstm_print(const struct Layer *l, const bool print_weights)
{
    char *str = neural_layer_lstm_json_export(l, print_weights);
    printf("%s\n", str);
    free(str); // json_export transfers ownership of the string
}
596 
604 char *
605 neural_layer_lstm_json_export(const struct Layer *l, const bool return_weights)
606 {
607  cJSON *json = cJSON_CreateObject();
608  cJSON_AddStringToObject(json, "type", "lstm");
609  cJSON_AddStringToObject(json, "activation",
611  cJSON_AddStringToObject(json, "recurrent_activation",
613  cJSON_AddNumberToObject(json, "n_inputs", l->n_inputs);
614  cJSON_AddNumberToObject(json, "n_outputs", l->n_outputs);
615  cJSON_AddNumberToObject(json, "eta", l->eta);
616  cJSON *mutation = cJSON_CreateDoubleArray(l->mu, N_MU);
617  cJSON_AddItemToObject(json, "mutation", mutation);
618  char *weights_str = layer_weight_json(l->uf, return_weights);
619  cJSON *uf = cJSON_Parse(weights_str);
620  free(weights_str);
621  cJSON_AddItemToObject(json, "uf_layer", uf);
622  weights_str = layer_weight_json(l->ui, return_weights);
623  cJSON *ui = cJSON_Parse(weights_str);
624  free(weights_str);
625  cJSON_AddItemToObject(json, "ui_layer", ui);
626  weights_str = layer_weight_json(l->ug, return_weights);
627  cJSON *ug = cJSON_Parse(weights_str);
628  free(weights_str);
629  cJSON_AddItemToObject(json, "ug_layer", ug);
630  weights_str = layer_weight_json(l->uo, return_weights);
631  cJSON *uo = cJSON_Parse(weights_str);
632  free(weights_str);
633  cJSON_AddItemToObject(json, "uo_layer", uo);
634  weights_str = layer_weight_json(l->wf, return_weights);
635  cJSON *wf = cJSON_Parse(weights_str);
636  free(weights_str);
637  cJSON_AddItemToObject(json, "wf_layer", wf);
638  weights_str = layer_weight_json(l->wi, return_weights);
639  cJSON *wi = cJSON_Parse(weights_str);
640  free(weights_str);
641  cJSON_AddItemToObject(json, "wi_layer", wi);
642  weights_str = layer_weight_json(l->wg, return_weights);
643  cJSON *wg = cJSON_Parse(weights_str);
644  free(weights_str);
645  cJSON_AddItemToObject(json, "wg_layer", wg);
646  weights_str = layer_weight_json(l->wo, return_weights);
647  cJSON *wo = cJSON_Parse(weights_str);
648  free(weights_str);
649  cJSON_AddItemToObject(json, "wo_layer", wo);
650  char *string = cJSON_Print(json);
651  cJSON_Delete(json);
652  return string;
653 }
654 
/**
 * @brief Writes an LSTM layer to a file.
 * @details The write order must exactly mirror neural_layer_lstm_load().
 * NOTE(review): prev_cell is not serialised (consistent with the visible
 * load), so a reloaded layer starts with a zeroed previous cell state —
 * confirm this is intentional upstream.
 * @param [in] l The layer to save.
 * @param [in] fp Pointer to the file to be written.
 * @return The number of elements written.
 */
size_t
neural_layer_lstm_save(const struct Layer *l, FILE *fp)
{
    size_t s = 0;
    /* scalar configuration */
    s += fwrite(&l->n_inputs, sizeof(int), 1, fp);
    s += fwrite(&l->n_outputs, sizeof(int), 1, fp);
    s += fwrite(&l->n_weights, sizeof(int), 1, fp);
    s += fwrite(&l->n_biases, sizeof(int), 1, fp);
    s += fwrite(&l->max_outputs, sizeof(int), 1, fp);
    s += fwrite(&l->n_active, sizeof(int), 1, fp);
    s += fwrite(&l->eta, sizeof(double), 1, fp);
    s += fwrite(&l->eta_max, sizeof(double), 1, fp);
    s += fwrite(&l->momentum, sizeof(double), 1, fp);
    s += fwrite(&l->decay, sizeof(double), 1, fp);
    s += fwrite(&l->max_neuron_grow, sizeof(int), 1, fp);
    s += fwrite(&l->options, sizeof(uint32_t), 1, fp);
    /* mutation rates and working arrays */
    s += fwrite(l->mu, sizeof(double), N_MU, fp);
    s += fwrite(l->state, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->prev_state, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->cell, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->f, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->i, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->g, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->o, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->c, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->h, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->temp, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->temp2, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->temp3, sizeof(double), l->n_outputs, fp);
    s += fwrite(l->dc, sizeof(double), l->n_outputs, fp);
    /* the 8 constituent connected layers */
    s += layer_save(l->uf, fp);
    s += layer_save(l->ui, fp);
    s += layer_save(l->ug, fp);
    s += layer_save(l->uo, fp);
    s += layer_save(l->wf, fp);
    s += layer_save(l->wi, fp);
    s += layer_save(l->wg, fp);
    s += layer_save(l->wo, fp);
    return s;
}
701 
708 size_t
709 neural_layer_lstm_load(struct Layer *l, FILE *fp)
710 {
711  size_t s = 0;
712  s += fread(&l->n_inputs, sizeof(int), 1, fp);
713  s += fread(&l->n_outputs, sizeof(int), 1, fp);
714  s += fread(&l->n_weights, sizeof(int), 1, fp);
715  s += fread(&l->n_biases, sizeof(int), 1, fp);
716  s += fread(&l->max_outputs, sizeof(int), 1, fp);
717  s += fread(&l->n_active, sizeof(int), 1, fp);
718  s += fread(&l->eta, sizeof(double), 1, fp);
719  s += fread(&l->eta_max, sizeof(double), 1, fp);
720  s += fread(&l->momentum, sizeof(double), 1, fp);
721  s += fread(&l->decay, sizeof(double), 1, fp);
722  s += fread(&l->max_neuron_grow, sizeof(int), 1, fp);
723  s += fread(&l->options, sizeof(uint32_t), 1, fp);
724  l->out_w = l->n_outputs;
725  l->out_c = 1;
726  l->out_h = 1;
728  l->mu = malloc(sizeof(double) * N_MU);
729  s += fread(l->mu, sizeof(double), N_MU, fp);
730  s += fread(l->state, sizeof(double), l->n_outputs, fp);
731  s += fread(l->prev_state, sizeof(double), l->n_outputs, fp);
732  s += fread(l->cell, sizeof(double), l->n_outputs, fp);
733  s += fread(l->f, sizeof(double), l->n_outputs, fp);
734  s += fread(l->i, sizeof(double), l->n_outputs, fp);
735  s += fread(l->g, sizeof(double), l->n_outputs, fp);
736  s += fread(l->o, sizeof(double), l->n_outputs, fp);
737  s += fread(l->c, sizeof(double), l->n_outputs, fp);
738  s += fread(l->h, sizeof(double), l->n_outputs, fp);
739  s += fread(l->temp, sizeof(double), l->n_outputs, fp);
740  s += fread(l->temp2, sizeof(double), l->n_outputs, fp);
741  s += fread(l->temp3, sizeof(double), l->n_outputs, fp);
742  s += fread(l->dc, sizeof(double), l->n_outputs, fp);
743  malloc_layers(l);
744  s += layer_load(l->uf, fp);
745  s += layer_load(l->ui, fp);
746  s += layer_load(l->ug, fp);
747  s += layer_load(l->uo, fp);
748  s += layer_load(l->wf, fp);
749  s += layer_load(l->wi, fp);
750  s += layer_load(l->wg, fp);
751  s += layer_load(l->wo, fp);
752  return s;
753 }
void blas_axpy(const int N, const double ALPHA, const double *X, const int INCX, double *Y, const int INCY)
Multiplies vector X by the scalar ALPHA and adds it to the vector Y.
Definition: blas.c:138
void blas_mul(const int N, const double *X, const int INCX, double *Y, const int INCY)
Multiplies vector X by the vector Y and stores the result in vector Y.
Definition: blas.c:217
Basic linear algebra functions.
const char * neural_activation_string(const int a)
Returns the name of a specified activation function.
void neural_gradient_array(const double *state, double *delta, const int n, const int a)
Applies a gradient function to a vector of neuron states.
void neural_activate_array(double *state, double *output, const int n, const int a)
Applies an activation function to a vector of neuron states.
Neural network activation functions.
#define LINEAR
Linear [-inf,inf].
bool layer_mutate_connectivity(struct Layer *l, const double mu_enable, const double mu_disable)
Mutates a layer's connectivity by zeroing weights.
Definition: neural_layer.c:176
void layer_defaults(struct Layer *l)
Initialises a layer to default values.
Definition: neural_layer.c:413
int layer_mutate_neurons(const struct Layer *l, const double mu)
Returns the number of neurons to add or remove from a layer.
Definition: neural_layer.c:106
bool layer_mutate_functions(struct Layer *l, const double mu)
Mutates a layer's activation function by random selection.
Definition: neural_layer.c:283
char * layer_weight_json(const struct Layer *l, const bool return_weights)
Returns a json formatted string representation of a layer's weights.
Definition: neural_layer.c:324
void layer_guard_outputs(const struct Layer *l)
Check number of outputs is within bounds.
Definition: neural_layer.c:595
void layer_add_neurons(struct Layer *l, const int N)
Adds N neurons to a layer. Negative N removes neurons.
Definition: neural_layer.c:130
bool layer_mutate_eta(struct Layer *l, const double mu)
Mutates the gradient descent rate of a neural layer.
Definition: neural_layer.c:88
bool layer_mutate_weights(struct Layer *l, const double mu)
Mutates a layer's weights and biases by adding random numbers from a Gaussian normal distribution wit...
Definition: neural_layer.c:252
static void layer_rand(struct Layer *l)
Randomises a layer.
Definition: neural_layer.h:259
static void layer_resize(struct Layer *l, const struct Layer *prev)
Resizes a layer using the previous layer's inputs.
Definition: neural_layer.h:228
#define LAYER_EVOLVE_ETA
Layer may evolve rate of gradient descent.
Definition: neural_layer.h:55
#define LAYER_EVOLVE_FUNCTIONS
Layer may evolve functions.
Definition: neural_layer.h:53
static size_t layer_save(const struct Layer *l, FILE *fp)
Writes the layer to a file.
Definition: neural_layer.h:373
static struct Layer * layer_init(const struct ArgsLayer *args)
Creates and initialises a new layer.
Definition: neural_layer.h:356
static struct Layer * layer_copy(const struct Layer *src)
Creates and returns a copy of a specified layer.
Definition: neural_layer.h:239
#define LAYER_EVOLVE_WEIGHTS
Layer may evolve weights.
Definition: neural_layer.h:51
static void layer_free(const struct Layer *l)
Frees the memory used by the layer.
Definition: neural_layer.h:249
static void layer_backward(const struct Layer *l, const struct Net *net, const double *input, double *delta)
Backward propagates the error through a layer.
Definition: neural_layer.h:194
static size_t layer_load(struct Layer *l, FILE *fp)
Reads the layer from a file.
Definition: neural_layer.h:387
#define LSTM
Layer type LSTM.
Definition: neural_layer.h:34
#define LAYER_EVOLVE_NEURONS
Layer may evolve neurons.
Definition: neural_layer.h:52
#define LAYER_EVOLVE_CONNECT
Layer may evolve connectivity.
Definition: neural_layer.h:56
static void layer_update(const struct Layer *l)
Updates the weights and biases of a layer.
Definition: neural_layer.h:205
static void layer_forward(const struct Layer *l, const struct Net *net, const double *input)
Forward propagates an input through the layer.
Definition: neural_layer.h:181
#define LAYER_SGD_WEIGHTS
Layer may perform gradient descent.
Definition: neural_layer.h:54
#define CONNECTED
Layer type connected.
Definition: neural_layer.h:29
uint32_t layer_args_opt(const struct ArgsLayer *args)
Returns a bitstring representing the permissions granted by a layer.
struct ArgsLayer * layer_args_copy(const struct ArgsLayer *src)
Creates and returns a copy of specified layer parameters.
An implementation of a fully-connected layer of perceptrons.
void neural_layer_lstm_backward(const struct Layer *l, const struct Net *net, const double *input, double *delta)
Backward propagates an LSTM layer.
void neural_layer_lstm_rand(struct Layer *l)
Randomises an LSTM layer weights.
bool neural_layer_lstm_mutate(struct Layer *l)
Mutates an LSTM layer.
static bool mutate_eta(struct Layer *l)
Mutates the gradient descent rate used to update an LSTM layer.
double * neural_layer_lstm_output(const struct Layer *l)
Returns the output from an LSTM layer.
void neural_layer_lstm_free(const struct Layer *l)
Free memory used by an LSTM layer.
static void free_layer_arrays(const struct Layer *l)
Free memory used by an LSTM layer.
static void malloc_layer_arrays(struct Layer *l)
Allocate memory used by an LSTM layer.
struct Layer * neural_layer_lstm_copy(const struct Layer *src)
Initialises and creates a copy of one LSTM layer from another.
size_t neural_layer_lstm_load(struct Layer *l, FILE *fp)
Reads an LSTM layer from a file.
static void set_layer_n_weights(struct Layer *l)
Sets the total number of weights in an LSTM layer.
void neural_layer_lstm_resize(struct Layer *l, const struct Layer *prev)
Resizes an LSTM layer if the previous layer has changed size.
#define N_MU
Number of mutation rates applied to an LSTM layer.
static bool mutate_neurons(struct Layer *l)
Mutates the number of neurons in an LSTM layer.
void neural_layer_lstm_print(const struct Layer *l, const bool print_weights)
Prints an LSTM layer.
static void set_layer_n_active(struct Layer *l)
Sets the number of active (non-zero) weights in an LSTM layer.
static const int MU_TYPE[(6)]
Self-adaptation method for mutating an LSTM layer.
size_t neural_layer_lstm_save(const struct Layer *l, FILE *fp)
Writes an LSTM layer to a file.
static bool mutate_weights(struct Layer *l)
Mutates the magnitude of weights and biases in an LSTM layer.
static void reset_layer_deltas(const struct Layer *l)
Zeros the deltas used to update an LSTM layer.
static void set_layer_n_biases(struct Layer *l)
Sets the total number of biases in an LSTM layer.
void neural_layer_lstm_update(const struct Layer *l)
Updates the weights and biases of an LSTM layer.
static void malloc_layers(struct Layer *l)
Allocate memory for the sub-layers.
char * neural_layer_lstm_json_export(const struct Layer *l, const bool return_weights)
Returns a json formatted string representation of an LSTM layer.
void neural_layer_lstm_init(struct Layer *l, const struct ArgsLayer *args)
Initialises a long short-term memory layer.
static bool mutate_connectivity(struct Layer *l)
Mutates the number of active weights in an LSTM layer.
static void set_eta(struct Layer *l)
Sets the gradient descent rate used to update an LSTM layer.
void neural_layer_lstm_forward(const struct Layer *l, const struct Net *net, const double *input)
Forward propagates an LSTM layer.
An implementation of a long short-term memory layer.
void sam_init(double *mu, const int N, const int *type)
Initialises self-adaptive mutation rates.
Definition: sam.c:43
void sam_adapt(double *mu, const int N, const int *type)
Self-adapts mutation rates.
Definition: sam.c:68
Self-adaptive mutation functions.
#define SAM_RATE_SELECT
Ten normally distributed rates.
Definition: sam.h:29
Parameters for initialising a neural network layer.
int n_init
Initial number of units / neurons / filters.
double decay
Weight decay for gradient descent.
double momentum
Momentum for gradient descent.
int function
Activation function.
int max_neuron_grow
Maximum number neurons to add per mutation event.
double eta
Gradient descent rate.
int n_max
Maximum number of units / neurons.
int n_inputs
Number of inputs.
int type
Layer type: CONNECTED, DROPOUT, etc.
int recurrent_function
Recurrent activation function.
Neural network layer data structure.
Definition: neural_layer.h:73
struct Layer * wf
LSTM.
Definition: neural_layer.h:110
double * output
Current neuron outputs (after activation function)
Definition: neural_layer.h:76
double decay
Weight decay for gradient descent.
Definition: neural_layer.h:89
struct Layer * wo
LSTM.
Definition: neural_layer.h:113
double * state
Current neuron states (before activation function)
Definition: neural_layer.h:75
struct Layer * uo
LSTM.
Definition: neural_layer.h:109
int recurrent_function
LSTM.
Definition: neural_layer.h:105
int max_neuron_grow
Maximum number neurons to add per mutation event.
Definition: neural_layer.h:93
struct Layer * ug
LSTM.
Definition: neural_layer.h:108
int n_inputs
Number of layer inputs.
Definition: neural_layer.h:90
double * g
LSTM.
Definition: neural_layer.h:118
int n_biases
Number of layer biases.
Definition: neural_layer.h:95
double * mu
Mutation rates.
Definition: neural_layer.h:84
int function
Layer activation function.
Definition: neural_layer.h:97
double * c
LSTM.
Definition: neural_layer.h:120
double * temp
LSTM.
Definition: neural_layer.h:122
struct Layer * wg
LSTM.
Definition: neural_layer.h:112
struct LayerVtbl const * layer_vptr
Functions acting on layers.
Definition: neural_layer.h:100
int max_outputs
Maximum number of neurons in the layer.
Definition: neural_layer.h:92
double * h
LSTM.
Definition: neural_layer.h:121
int n_weights
Number of layer weights.
Definition: neural_layer.h:94
double * dc
LSTM.
Definition: neural_layer.h:125
double * temp3
LSTM.
Definition: neural_layer.h:124
double eta_max
Maximum gradient descent rate.
Definition: neural_layer.h:86
struct Layer * uf
LSTM.
Definition: neural_layer.h:106
double * i
LSTM.
Definition: neural_layer.h:117
double * temp2
LSTM.
Definition: neural_layer.h:123
double * o
LSTM.
Definition: neural_layer.h:119
int n_outputs
Number of layer outputs.
Definition: neural_layer.h:91
int n_active
Number of active weights / connections.
Definition: neural_layer.h:96
struct Layer * ui
LSTM.
Definition: neural_layer.h:107
double * prev_state
Previous state for recursive layers.
Definition: neural_layer.h:101
int out_w
Pool, Conv, and Upsample.
Definition: neural_layer.h:130
int type
Layer type: CONNECTED, DROPOUT, etc.
Definition: neural_layer.h:74
double * cell
LSTM.
Definition: neural_layer.h:114
int out_c
Pool, Conv, and Upsample.
Definition: neural_layer.h:132
struct Layer * wi
LSTM.
Definition: neural_layer.h:111
double * delta
Delta for updating weights.
Definition: neural_layer.h:83
uint32_t options
Bitwise layer options permitting evolution, SGD, etc.
Definition: neural_layer.h:77
double * f
LSTM.
Definition: neural_layer.h:116
double * prev_cell
LSTM.
Definition: neural_layer.h:115
int out_h
Pool, Conv, and Upsample.
Definition: neural_layer.h:131
double eta
Gradient descent rate.
Definition: neural_layer.h:85
double momentum
Momentum for gradient descent.
Definition: neural_layer.h:88
Neural network data structure.
Definition: neural.h:48
Utility functions for random number handling, etc.