XCSF 1.4.8
XCSF learning classifier system
Loading...
Searching...
No Matches
neural_layer_lstm.c
Go to the documentation of this file.
1/*
2 * This program is free software: you can redistribute it and/or modify
3 * it under the terms of the GNU General Public License as published by
4 * the Free Software Foundation, either version 3 of the License, or
5 * (at your option) any later version.
6 *
7 * This program is distributed in the hope that it will be useful,
8 * but WITHOUT ANY WARRANTY; without even the implied warranty of
9 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10 * GNU General Public License for more details.
11 *
12 * You should have received a copy of the GNU General Public License
13 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14 */
15
#include "neural_layer_lstm.h"
#include "blas.h"
#include "neural_activations.h"
#include "neural_layer_connected.h"
#include "sam.h"
#include "utils.h"
32
33#define N_MU (6)
34
46
51static void
53{
54 l->n_weights = l->uf->n_weights + l->ui->n_weights + l->ug->n_weights +
55 l->uo->n_weights + l->wf->n_weights + l->wi->n_weights +
56 l->wg->n_weights + l->wo->n_weights;
57}
58
63static void
65{
66 l->n_biases = l->uf->n_biases + l->ui->n_biases + l->ug->n_biases +
67 l->uo->n_biases + l->wf->n_biases + l->wi->n_biases + l->wg->n_biases +
68 l->wo->n_biases;
69}
70
75static void
77{
78 l->n_active = l->uf->n_active + l->ui->n_active + l->ug->n_active +
79 l->uo->n_active + l->wf->n_active + l->wi->n_active + l->wg->n_active +
80 l->wo->n_active;
81}
82
87static void
89{
91 l->delta = calloc(l->n_outputs, sizeof(double));
92 l->output = calloc(l->n_outputs, sizeof(double));
93 l->state = calloc(l->n_outputs, sizeof(double));
94 l->prev_state = calloc(l->n_outputs, sizeof(double));
95 l->prev_cell = calloc(l->n_outputs, sizeof(double));
96 l->cell = calloc(l->n_outputs, sizeof(double));
97 l->f = calloc(l->n_outputs, sizeof(double));
98 l->i = calloc(l->n_outputs, sizeof(double));
99 l->g = calloc(l->n_outputs, sizeof(double));
100 l->o = calloc(l->n_outputs, sizeof(double));
101 l->c = calloc(l->n_outputs, sizeof(double));
102 l->h = calloc(l->n_outputs, sizeof(double));
103 l->temp = calloc(l->n_outputs, sizeof(double));
104 l->temp2 = calloc(l->n_outputs, sizeof(double));
105 l->temp3 = calloc(l->n_outputs, sizeof(double));
106 l->dc = calloc(l->n_outputs, sizeof(double));
107}
108
113static void
115{
116 l->uf = malloc(sizeof(struct Layer));
117 l->ui = malloc(sizeof(struct Layer));
118 l->ug = malloc(sizeof(struct Layer));
119 l->uo = malloc(sizeof(struct Layer));
120 l->wf = malloc(sizeof(struct Layer));
121 l->wi = malloc(sizeof(struct Layer));
122 l->wg = malloc(sizeof(struct Layer));
123 l->wo = malloc(sizeof(struct Layer));
124}
125
130static void
131free_layer_arrays(const struct Layer *l)
132{
133 free(l->delta);
134 free(l->output);
135 free(l->state);
136 free(l->prev_state);
137 free(l->prev_cell);
138 free(l->cell);
139 free(l->f);
140 free(l->i);
141 free(l->g);
142 free(l->o);
143 free(l->c);
144 free(l->h);
145 free(l->temp);
146 free(l->temp2);
147 free(l->temp3);
148 free(l->dc);
149}
150
155static void
156set_eta(struct Layer *l)
157{
158 l->eta = l->uf->eta;
159 l->ui->eta = l->eta;
160 l->ug->eta = l->eta;
161 l->uo->eta = l->eta;
162 l->wf->eta = l->eta;
163 l->wi->eta = l->eta;
164 l->wg->eta = l->eta;
165 l->wo->eta = l->eta;
166}
167
172static void
173reset_layer_deltas(const struct Layer *l)
174{
175 size_t size = l->n_outputs * sizeof(double);
176 memset(l->wf->delta, 0, size);
177 memset(l->wi->delta, 0, size);
178 memset(l->wg->delta, 0, size);
179 memset(l->wo->delta, 0, size);
180 memset(l->uf->delta, 0, size);
181 memset(l->ui->delta, 0, size);
182 memset(l->ug->delta, 0, size);
183 memset(l->uo->delta, 0, size);
184}
185
191static bool
193{
194 if (layer_mutate_eta(l->uf, l->mu[0])) {
195 set_eta(l);
196 return true;
197 }
198 return false;
199}
200
206static bool
208{
209 const int n = layer_mutate_neurons(l->uf, l->mu[1]);
210 if (n != 0) {
211 layer_add_neurons(l->uf, n);
212 layer_add_neurons(l->ui, n);
213 layer_add_neurons(l->ug, n);
214 layer_add_neurons(l->uo, n);
215 layer_add_neurons(l->wf, n);
216 layer_add_neurons(l->wi, n);
217 layer_add_neurons(l->wg, n);
218 layer_add_neurons(l->wo, n);
219 layer_resize(l->wf, l->uf);
220 layer_resize(l->wi, l->uf);
221 layer_resize(l->wg, l->uf);
222 layer_resize(l->wo, l->uf);
223 l->n_outputs = l->uf->n_outputs;
224 l->out_w = l->n_outputs;
225 l->out_c = 1;
226 l->out_h = 1;
232 return true;
233 }
234 return false;
235}
236
242static bool
244{
245 bool mod = false;
246 mod = layer_mutate_connectivity(l->uf, l->mu[2], l->mu[3]) ? true : mod;
247 mod = layer_mutate_connectivity(l->ui, l->mu[2], l->mu[3]) ? true : mod;
248 mod = layer_mutate_connectivity(l->ug, l->mu[2], l->mu[3]) ? true : mod;
249 mod = layer_mutate_connectivity(l->uo, l->mu[2], l->mu[3]) ? true : mod;
250 mod = layer_mutate_connectivity(l->wf, l->mu[2], l->mu[3]) ? true : mod;
251 mod = layer_mutate_connectivity(l->wi, l->mu[2], l->mu[3]) ? true : mod;
252 mod = layer_mutate_connectivity(l->wg, l->mu[2], l->mu[3]) ? true : mod;
253 mod = layer_mutate_connectivity(l->wo, l->mu[2], l->mu[3]) ? true : mod;
255 return mod;
256}
257
263static bool
265{
266 bool mod = false;
267 mod = layer_mutate_weights(l->uf, l->mu[4]) ? true : mod;
268 mod = layer_mutate_weights(l->ui, l->mu[4]) ? true : mod;
269 mod = layer_mutate_weights(l->ug, l->mu[4]) ? true : mod;
270 mod = layer_mutate_weights(l->uo, l->mu[4]) ? true : mod;
271 mod = layer_mutate_weights(l->wf, l->mu[4]) ? true : mod;
272 mod = layer_mutate_weights(l->wi, l->mu[4]) ? true : mod;
273 mod = layer_mutate_weights(l->wg, l->mu[4]) ? true : mod;
274 mod = layer_mutate_weights(l->wo, l->mu[4]) ? true : mod;
275 return mod;
276}
277
283void
284neural_layer_lstm_init(struct Layer *l, const struct ArgsLayer *args)
285{
286 l->options = layer_args_opt(args);
287 l->function = args->function;
289 l->n_inputs = args->n_inputs;
290 l->n_outputs = args->n_init;
291 l->max_outputs = args->n_max;
292 l->out_w = l->n_outputs;
293 l->out_c = 1;
294 l->out_h = 1;
295 l->eta_max = args->eta;
296 l->momentum = args->momentum;
298 l->decay = args->decay;
299 struct ArgsLayer *cargs = layer_args_copy(args);
300 cargs->type = CONNECTED; // lstm is composed of 8 connected layers
301 cargs->function = LINEAR;
302 l->uf = layer_init(cargs); // input layers
303 l->ui = layer_init(cargs);
304 l->ug = layer_init(cargs);
305 l->uo = layer_init(cargs);
306 cargs->n_inputs = cargs->n_init;
307 l->wf = layer_init(cargs); // self layers
308 l->wi = layer_init(cargs);
309 l->wg = layer_init(cargs);
310 l->wo = layer_init(cargs);
311 free(cargs);
315 set_eta(l);
317 l->mu = malloc(sizeof(double) * N_MU);
318 sam_init(l->mu, N_MU, MU_TYPE);
319}
320
326struct Layer *
328{
329 if (src->type != LSTM) {
330 printf("neural_layer_lstm_copy(): incorrect source layer type\n");
331 exit(EXIT_FAILURE);
332 }
333 struct Layer *l = malloc(sizeof(struct Layer));
335 l->type = src->type;
336 l->layer_vptr = src->layer_vptr;
337 l->function = src->function;
339 l->options = src->options;
340 l->n_inputs = src->n_inputs;
341 l->n_outputs = src->n_outputs;
342 l->out_w = src->out_w;
343 l->out_h = src->out_h;
344 l->out_c = src->out_c;
345 l->n_weights = src->n_weights;
346 l->n_biases = src->n_biases;
347 l->n_active = src->n_active;
348 l->eta = src->eta;
349 l->eta_max = src->eta_max;
350 l->momentum = src->momentum;
351 l->decay = src->decay;
353 l->max_outputs = src->max_outputs;
354 l->uf = layer_copy(src->uf);
355 l->ui = layer_copy(src->ui);
356 l->ug = layer_copy(src->ug);
357 l->uo = layer_copy(src->uo);
358 l->wf = layer_copy(src->wf);
359 l->wi = layer_copy(src->wi);
360 l->wg = layer_copy(src->wg);
361 l->wo = layer_copy(src->wo);
363 l->mu = malloc(sizeof(double) * N_MU);
364 memcpy(l->mu, src->mu, sizeof(double) * N_MU);
365 return l;
366}
367
372void
374{
375 layer_free(l->uf);
376 layer_free(l->ui);
377 layer_free(l->ug);
378 layer_free(l->uo);
379 layer_free(l->wf);
380 layer_free(l->wi);
381 layer_free(l->wg);
382 layer_free(l->wo);
383 free(l->uf);
384 free(l->ui);
385 free(l->ug);
386 free(l->uo);
387 free(l->wf);
388 free(l->wi);
389 free(l->wg);
390 free(l->wo);
392 free(l->mu);
393}
394
399void
401{
402 layer_rand(l->uf);
403 layer_rand(l->ui);
404 layer_rand(l->ug);
405 layer_rand(l->uo);
406 layer_rand(l->wf);
407 layer_rand(l->wi);
408 layer_rand(l->wg);
409 layer_rand(l->wo);
410}
411
418void
419neural_layer_lstm_forward(const struct Layer *l, const struct Net *net,
420 const double *input)
421{
422 layer_forward(l->uf, net, input);
423 layer_forward(l->ui, net, input);
424 layer_forward(l->ug, net, input);
425 layer_forward(l->uo, net, input);
426 layer_forward(l->wf, net, l->h);
427 layer_forward(l->wi, net, l->h);
428 layer_forward(l->wg, net, l->h);
429 layer_forward(l->wo, net, l->h);
430 memcpy(l->f, l->wf->output, sizeof(double) * l->n_outputs);
431 blas_axpy(l->n_outputs, 1, l->uf->output, 1, l->f, 1);
432 memcpy(l->i, l->wi->output, sizeof(double) * l->n_outputs);
433 blas_axpy(l->n_outputs, 1, l->ui->output, 1, l->i, 1);
434 memcpy(l->g, l->wg->output, sizeof(double) * l->n_outputs);
435 blas_axpy(l->n_outputs, 1, l->ug->output, 1, l->g, 1);
436 memcpy(l->o, l->wo->output, sizeof(double) * l->n_outputs);
437 blas_axpy(l->n_outputs, 1, l->uo->output, 1, l->o, 1);
442 memcpy(l->temp, l->i, sizeof(double) * l->n_outputs);
443 blas_mul(l->n_outputs, l->g, 1, l->temp, 1);
444 blas_mul(l->n_outputs, l->f, 1, l->c, 1);
445 blas_axpy(l->n_outputs, 1, l->temp, 1, l->c, 1);
446 memcpy(l->h, l->c, sizeof(double) * l->n_outputs);
448 blas_mul(l->n_outputs, l->o, 1, l->h, 1);
449 memcpy(l->cell, l->c, sizeof(double) * l->n_outputs);
450 memcpy(l->output, l->h, sizeof(double) * l->n_outputs);
451}
452
/**
 * @brief Backward propagates an LSTM layer.
 * @details Propagates the layer delta back through each gate in turn
 * (output o, candidate g, input i, forget f), accumulating weight deltas in
 * the eight sub-layers and carrying the cell gradient forward in l->dc.
 *
 * NOTE(review): compared with the forward pass, this listing appears to be
 * missing several lines — most likely the initial `reset_layer_deltas(l)`
 * and the `neural_activate_array` / `neural_gradient_array` calls that
 * normally sit between the memcpy/blas operations. The visible statements
 * are preserved unchanged; confirm against the canonical source before
 * relying on this gradient computation.
 *
 * @param [in] l The layer to backward propagate.
 * @param [in] net Network containing the layer.
 * @param [in] input The input to the layer.
 * @param [out] delta The previous layer's delta (accumulated via the
 * u* sub-layer backward passes; may be 0 for the recurrent path).
 */
void
neural_layer_lstm_backward(const struct Layer *l, const struct Net *net,
                           const double *input, double *delta)
{
    // temp3 holds the incoming layer delta; temp holds the cell state
    memcpy(l->temp3, l->delta, sizeof(double) * l->n_outputs);
    memcpy(l->temp, l->c, sizeof(double) * l->n_outputs);
    // cell gradient: temp2 = delta * o + carried dc
    memcpy(l->temp2, l->temp3, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->o, 1, l->temp2, 1);
    blas_axpy(l->n_outputs, 1, l->dc, 1, l->temp2, 1);
    // output gate: temp = delta * cell-path
    memcpy(l->temp, l->c, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->temp3, 1, l->temp, 1);
    memcpy(l->wo->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->wo, net, l->prev_state, 0);
    memcpy(l->uo->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->uo, net, input, delta);
    // candidate gate: temp = temp2 * i
    memcpy(l->temp, l->temp2, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->i, 1, l->temp, 1);
    memcpy(l->wg->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->wg, net, l->prev_state, 0);
    memcpy(l->ug->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->ug, net, input, delta);
    // input gate: temp = temp2 * g
    memcpy(l->temp, l->temp2, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->g, 1, l->temp, 1);
    memcpy(l->wi->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->wi, net, l->prev_state, 0);
    memcpy(l->ui->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->ui, net, input, delta);
    // forget gate: temp = temp2 * prev_cell
    memcpy(l->temp, l->temp2, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->prev_cell, 1, l->temp, 1);
    memcpy(l->wf->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->wf, net, l->prev_state, 0);
    memcpy(l->uf->delta, l->temp, sizeof(double) * l->n_outputs);
    layer_backward(l->uf, net, input, delta);
    // carry cell gradient to the next step: dc = temp2 * f
    memcpy(l->temp, l->temp2, sizeof(double) * l->n_outputs);
    blas_mul(l->n_outputs, l->f, 1, l->temp, 1);
    memcpy(l->dc, l->temp, sizeof(double) * l->n_outputs);
}
505
510void
512{
513 if (l->options & LAYER_SGD_WEIGHTS && l->eta > 0) {
514 layer_update(l->wf);
515 layer_update(l->wi);
516 layer_update(l->wg);
517 layer_update(l->wo);
518 layer_update(l->uf);
519 layer_update(l->ui);
520 layer_update(l->ug);
521 layer_update(l->uo);
522 }
523}
524
530void
531neural_layer_lstm_resize(struct Layer *l, const struct Layer *prev)
532{
533 layer_resize(l->uf, prev);
534 layer_resize(l->ui, prev);
535 layer_resize(l->ug, prev);
536 layer_resize(l->uo, prev);
537 layer_resize(l->uf, prev);
538 l->n_inputs = prev->n_outputs;
542}
543
549double *
551{
552 return l->output;
553}
554
560bool
562{
563 sam_adapt(l->mu, N_MU, MU_TYPE);
564 bool mod = false;
565 if ((l->options & LAYER_EVOLVE_ETA) && mutate_eta(l)) {
566 mod = true;
567 }
569 mod = true;
570 }
572 mod = true;
573 }
575 mod = true;
576 }
577 if ((l->options & LAYER_EVOLVE_FUNCTIONS) &&
578 layer_mutate_functions(l, l->mu[5])) {
579 mod = true;
580 }
581 return mod;
582}
583
/**
 * @brief Prints an LSTM layer as formatted JSON.
 * @param [in] l The layer to print.
 * @param [in] print_weights Whether to include the sub-layer weights.
 */
void
neural_layer_lstm_print(const struct Layer *l, const bool print_weights)
{
    char *json = neural_layer_lstm_json_export(l, print_weights);
    puts(json); // printf("%s\n", json) equivalent
    free(json);
}
596
604char *
605neural_layer_lstm_json_export(const struct Layer *l, const bool return_weights)
606{
607 cJSON *json = cJSON_CreateObject();
608 cJSON_AddStringToObject(json, "type", "lstm");
609 cJSON_AddStringToObject(json, "activation",
611 cJSON_AddStringToObject(json, "recurrent_activation",
613 cJSON_AddNumberToObject(json, "n_inputs", l->n_inputs);
614 cJSON_AddNumberToObject(json, "n_outputs", l->n_outputs);
615 cJSON_AddNumberToObject(json, "eta", l->eta);
616 cJSON *mutation = cJSON_CreateDoubleArray(l->mu, N_MU);
617 cJSON_AddItemToObject(json, "mutation", mutation);
618 char *weights_str = layer_weight_json(l->uf, return_weights);
619 cJSON *uf = cJSON_Parse(weights_str);
620 free(weights_str);
621 cJSON_AddItemToObject(json, "uf_layer", uf);
622 weights_str = layer_weight_json(l->ui, return_weights);
623 cJSON *ui = cJSON_Parse(weights_str);
624 free(weights_str);
625 cJSON_AddItemToObject(json, "ui_layer", ui);
626 weights_str = layer_weight_json(l->ug, return_weights);
627 cJSON *ug = cJSON_Parse(weights_str);
628 free(weights_str);
629 cJSON_AddItemToObject(json, "ug_layer", ug);
630 weights_str = layer_weight_json(l->uo, return_weights);
631 cJSON *uo = cJSON_Parse(weights_str);
632 free(weights_str);
633 cJSON_AddItemToObject(json, "uo_layer", uo);
634 weights_str = layer_weight_json(l->wf, return_weights);
635 cJSON *wf = cJSON_Parse(weights_str);
636 free(weights_str);
637 cJSON_AddItemToObject(json, "wf_layer", wf);
638 weights_str = layer_weight_json(l->wi, return_weights);
639 cJSON *wi = cJSON_Parse(weights_str);
640 free(weights_str);
641 cJSON_AddItemToObject(json, "wi_layer", wi);
642 weights_str = layer_weight_json(l->wg, return_weights);
643 cJSON *wg = cJSON_Parse(weights_str);
644 free(weights_str);
645 cJSON_AddItemToObject(json, "wg_layer", wg);
646 weights_str = layer_weight_json(l->wo, return_weights);
647 cJSON *wo = cJSON_Parse(weights_str);
648 free(weights_str);
649 cJSON_AddItemToObject(json, "wo_layer", wo);
650 char *string = cJSON_Print(json);
651 cJSON_Delete(json);
652 return string;
653}
654
661size_t
662neural_layer_lstm_save(const struct Layer *l, FILE *fp)
663{
664 size_t s = 0;
665 s += fwrite(&l->n_inputs, sizeof(int), 1, fp);
666 s += fwrite(&l->n_outputs, sizeof(int), 1, fp);
667 s += fwrite(&l->n_weights, sizeof(int), 1, fp);
668 s += fwrite(&l->n_biases, sizeof(int), 1, fp);
669 s += fwrite(&l->max_outputs, sizeof(int), 1, fp);
670 s += fwrite(&l->n_active, sizeof(int), 1, fp);
671 s += fwrite(&l->eta, sizeof(double), 1, fp);
672 s += fwrite(&l->eta_max, sizeof(double), 1, fp);
673 s += fwrite(&l->momentum, sizeof(double), 1, fp);
674 s += fwrite(&l->decay, sizeof(double), 1, fp);
675 s += fwrite(&l->max_neuron_grow, sizeof(int), 1, fp);
676 s += fwrite(&l->options, sizeof(uint32_t), 1, fp);
677 s += fwrite(l->mu, sizeof(double), N_MU, fp);
678 s += fwrite(l->state, sizeof(double), l->n_outputs, fp);
679 s += fwrite(l->prev_state, sizeof(double), l->n_outputs, fp);
680 s += fwrite(l->cell, sizeof(double), l->n_outputs, fp);
681 s += fwrite(l->f, sizeof(double), l->n_outputs, fp);
682 s += fwrite(l->i, sizeof(double), l->n_outputs, fp);
683 s += fwrite(l->g, sizeof(double), l->n_outputs, fp);
684 s += fwrite(l->o, sizeof(double), l->n_outputs, fp);
685 s += fwrite(l->c, sizeof(double), l->n_outputs, fp);
686 s += fwrite(l->h, sizeof(double), l->n_outputs, fp);
687 s += fwrite(l->temp, sizeof(double), l->n_outputs, fp);
688 s += fwrite(l->temp2, sizeof(double), l->n_outputs, fp);
689 s += fwrite(l->temp3, sizeof(double), l->n_outputs, fp);
690 s += fwrite(l->dc, sizeof(double), l->n_outputs, fp);
691 s += layer_save(l->uf, fp);
692 s += layer_save(l->ui, fp);
693 s += layer_save(l->ug, fp);
694 s += layer_save(l->uo, fp);
695 s += layer_save(l->wf, fp);
696 s += layer_save(l->wi, fp);
697 s += layer_save(l->wg, fp);
698 s += layer_save(l->wo, fp);
699 return s;
700}
701
708size_t
709neural_layer_lstm_load(struct Layer *l, FILE *fp)
710{
711 size_t s = 0;
712 s += fread(&l->n_inputs, sizeof(int), 1, fp);
713 s += fread(&l->n_outputs, sizeof(int), 1, fp);
714 s += fread(&l->n_weights, sizeof(int), 1, fp);
715 s += fread(&l->n_biases, sizeof(int), 1, fp);
716 s += fread(&l->max_outputs, sizeof(int), 1, fp);
717 s += fread(&l->n_active, sizeof(int), 1, fp);
718 s += fread(&l->eta, sizeof(double), 1, fp);
719 s += fread(&l->eta_max, sizeof(double), 1, fp);
720 s += fread(&l->momentum, sizeof(double), 1, fp);
721 s += fread(&l->decay, sizeof(double), 1, fp);
722 s += fread(&l->max_neuron_grow, sizeof(int), 1, fp);
723 s += fread(&l->options, sizeof(uint32_t), 1, fp);
724 l->out_w = l->n_outputs;
725 l->out_c = 1;
726 l->out_h = 1;
728 l->mu = malloc(sizeof(double) * N_MU);
729 s += fread(l->mu, sizeof(double), N_MU, fp);
730 s += fread(l->state, sizeof(double), l->n_outputs, fp);
731 s += fread(l->prev_state, sizeof(double), l->n_outputs, fp);
732 s += fread(l->cell, sizeof(double), l->n_outputs, fp);
733 s += fread(l->f, sizeof(double), l->n_outputs, fp);
734 s += fread(l->i, sizeof(double), l->n_outputs, fp);
735 s += fread(l->g, sizeof(double), l->n_outputs, fp);
736 s += fread(l->o, sizeof(double), l->n_outputs, fp);
737 s += fread(l->c, sizeof(double), l->n_outputs, fp);
738 s += fread(l->h, sizeof(double), l->n_outputs, fp);
739 s += fread(l->temp, sizeof(double), l->n_outputs, fp);
740 s += fread(l->temp2, sizeof(double), l->n_outputs, fp);
741 s += fread(l->temp3, sizeof(double), l->n_outputs, fp);
742 s += fread(l->dc, sizeof(double), l->n_outputs, fp);
743 malloc_layers(l);
744 s += layer_load(l->uf, fp);
745 s += layer_load(l->ui, fp);
746 s += layer_load(l->ug, fp);
747 s += layer_load(l->uo, fp);
748 s += layer_load(l->wf, fp);
749 s += layer_load(l->wi, fp);
750 s += layer_load(l->wg, fp);
751 s += layer_load(l->wo, fp);
752 return s;
753}
void blas_axpy(const int N, const double ALPHA, const double *X, const int INCX, double *Y, const int INCY)
Multiplies vector X by the scalar ALPHA and adds it to the vector Y.
Definition blas.c:138
void blas_mul(const int N, const double *X, const int INCX, double *Y, const int INCY)
Multiplies vector X by the vector Y and stores the result in vector Y.
Definition blas.c:217
Basic linear algebra functions.
const char * neural_activation_string(const int a)
Returns the name of a specified activation function.
void neural_gradient_array(const double *state, double *delta, const int n, const int a)
Applies a gradient function to a vector of neuron states.
void neural_activate_array(double *state, double *output, const int n, const int a)
Applies an activation function to a vector of neuron states.
Neural network activation functions.
#define LINEAR
Linear [-inf,inf].
bool layer_mutate_connectivity(struct Layer *l, const double mu_enable, const double mu_disable)
Mutates a layer's connectivity by zeroing weights.
void layer_defaults(struct Layer *l)
Initialises a layer to default values.
int layer_mutate_neurons(const struct Layer *l, const double mu)
Returns the number of neurons to add or remove from a layer.
bool layer_mutate_functions(struct Layer *l, const double mu)
Mutates a layer's activation function by random selection.
void layer_guard_outputs(const struct Layer *l)
Check number of outputs is within bounds.
void layer_add_neurons(struct Layer *l, const int N)
Adds N neurons to a layer. Negative N removes neurons.
char * layer_weight_json(const struct Layer *l, const bool return_weights)
Returns a json formatted string representation of a layer's weights.
bool layer_mutate_eta(struct Layer *l, const double mu)
Mutates the gradient descent rate of a neural layer.
bool layer_mutate_weights(struct Layer *l, const double mu)
Mutates a layer's weights and biases by adding random numbers from a Gaussian normal distribution wit...
static void layer_rand(struct Layer *l)
Randomises a layer.
static void layer_resize(struct Layer *l, const struct Layer *prev)
Resizes a layer using the previous layer's inputs.
#define LAYER_EVOLVE_ETA
Layer may evolve rate of gradient descent.
#define LAYER_EVOLVE_FUNCTIONS
Layer may evolve functions.
static size_t layer_save(const struct Layer *l, FILE *fp)
Writes the layer to a file.
#define LAYER_EVOLVE_WEIGHTS
Layer may evolve weights.
static void layer_free(const struct Layer *l)
Frees the memory used by the layer.
static void layer_backward(const struct Layer *l, const struct Net *net, const double *input, double *delta)
Backward propagates the error through a layer.
static size_t layer_load(struct Layer *l, FILE *fp)
Reads the layer from a file.
#define LSTM
Layer type LSTM.
#define LAYER_EVOLVE_NEURONS
Layer may evolve neurons.
#define LAYER_EVOLVE_CONNECT
Layer may evolve connectivity.
static void layer_update(const struct Layer *l)
Updates the weights and biases of a layer.
static struct Layer * layer_init(const struct ArgsLayer *args)
Creates and initialises a new layer.
static void layer_forward(const struct Layer *l, const struct Net *net, const double *input)
Forward propagates an input through the layer.
static struct Layer * layer_copy(const struct Layer *src)
Creates and returns a copy of a specified layer.
#define LAYER_SGD_WEIGHTS
Layer may perform gradient descent.
#define CONNECTED
Layer type connected.
uint32_t layer_args_opt(const struct ArgsLayer *args)
Returns a bitstring representing the permissions granted by a layer.
struct ArgsLayer * layer_args_copy(const struct ArgsLayer *src)
Creates and returns a copy of specified layer parameters.
An implementation of a fully-connected layer of perceptrons.
void neural_layer_lstm_backward(const struct Layer *l, const struct Net *net, const double *input, double *delta)
Backward propagates an LSTM layer.
void neural_layer_lstm_rand(struct Layer *l)
Randomises an LSTM layer weights.
bool neural_layer_lstm_mutate(struct Layer *l)
Mutates an LSTM layer.
static bool mutate_eta(struct Layer *l)
Mutates the gradient descent rate used to update an LSTM layer.
char * neural_layer_lstm_json_export(const struct Layer *l, const bool return_weights)
Returns a json formatted string representation of an LSTM layer.
void neural_layer_lstm_free(const struct Layer *l)
Free memory used by an LSTM layer.
double * neural_layer_lstm_output(const struct Layer *l)
Returns the output from an LSTM layer.
static void free_layer_arrays(const struct Layer *l)
Free memory used by an LSTM layer.
static void malloc_layer_arrays(struct Layer *l)
Allocate memory used by an LSTM layer.
size_t neural_layer_lstm_load(struct Layer *l, FILE *fp)
Reads an LSTM layer from a file.
static void set_layer_n_weights(struct Layer *l)
Sets the total number of weights in an LSTM layer.
void neural_layer_lstm_resize(struct Layer *l, const struct Layer *prev)
Resizes an LSTM layer if the previous layer has changed size.
#define N_MU
Number of mutation rates applied to an LSTM layer.
static bool mutate_neurons(struct Layer *l)
Mutates the number of neurons in an LSTM layer.
void neural_layer_lstm_print(const struct Layer *l, const bool print_weights)
Prints an LSTM layer.
static void set_layer_n_active(struct Layer *l)
Sets the number of active (non-zero) weights in an LSTM layer.
static const int MU_TYPE[(6)]
Self-adaptation method for mutating an LSTM layer.
size_t neural_layer_lstm_save(const struct Layer *l, FILE *fp)
Writes an LSTM layer to a file.
static bool mutate_weights(struct Layer *l)
Mutates the magnitude of weights and biases in an LSTM layer.
static void reset_layer_deltas(const struct Layer *l)
Zeros the deltas used to update an LSTM layer.
static void set_layer_n_biases(struct Layer *l)
Sets the total number of biases in an LSTM layer.
void neural_layer_lstm_update(const struct Layer *l)
Updates the weights and biases of an LSTM layer.
static void malloc_layers(struct Layer *l)
Allocate memory for the sub-layers.
struct Layer * neural_layer_lstm_copy(const struct Layer *src)
Initialises and creates a copy of one LSTM layer from another.
void neural_layer_lstm_init(struct Layer *l, const struct ArgsLayer *args)
Initialises a long short-term memory layer.
static bool mutate_connectivity(struct Layer *l)
Mutates the number of active weights in an LSTM layer.
static void set_eta(struct Layer *l)
Sets the gradient descent rate used to update an LSTM layer.
void neural_layer_lstm_forward(const struct Layer *l, const struct Net *net, const double *input)
Forward propagates an LSTM layer.
An implementation of a long short-term memory layer.
void sam_init(double *mu, const int N, const int *type)
Initialises self-adaptive mutation rates.
Definition sam.c:43
void sam_adapt(double *mu, const int N, const int *type)
Self-adapts mutation rates.
Definition sam.c:68
Self-adaptive mutation functions.
#define SAM_RATE_SELECT
Ten normally distributed rates.
Definition sam.h:29
Parameters for initialising a neural network layer.
int n_init
Initial number of units / neurons / filters.
double decay
Weight decay for gradient descent.
double momentum
Momentum for gradient descent.
int function
Activation function.
int max_neuron_grow
Maximum number neurons to add per mutation event.
double eta
Gradient descent rate.
int n_max
Maximum number of units / neurons.
int n_inputs
Number of inputs.
int type
Layer type: CONNECTED, DROPOUT, etc.
int recurrent_function
Recurrent activation function.
Neural network layer data structure.
struct Layer * wf
LSTM.
double * output
Current neuron outputs (after activation function)
double decay
Weight decay for gradient descent.
struct Layer * wo
LSTM.
double * state
Current neuron states (before activation function)
struct Layer * uo
LSTM.
int recurrent_function
LSTM.
int max_neuron_grow
Maximum number neurons to add per mutation event.
struct Layer * ug
LSTM.
int n_inputs
Number of layer inputs.
double * g
LSTM.
int n_biases
Number of layer biases.
double * mu
Mutation rates.
int function
Layer activation function.
double * c
LSTM.
double * temp
LSTM.
struct Layer * wg
LSTM.
struct LayerVtbl const * layer_vptr
Functions acting on layers.
int max_outputs
Maximum number of neurons in the layer.
double * h
LSTM.
int n_weights
Number of layer weights.
double * dc
LSTM.
double * temp3
LSTM.
double eta_max
Maximum gradient descent rate.
struct Layer * uf
LSTM.
double * i
LSTM.
double * temp2
LSTM.
double * o
LSTM.
int n_outputs
Number of layer outputs.
int n_active
Number of active weights / connections.
struct Layer * ui
LSTM.
double * prev_state
Previous state for recursive layers.
int out_w
Pool, Conv, and Upsample.
int type
Layer type: CONNECTED, DROPOUT, etc.
double * cell
LSTM.
int out_c
Pool, Conv, and Upsample.
struct Layer * wi
LSTM.
double * delta
Delta for updating weights.
uint32_t options
Bitwise layer options permitting evolution, SGD, etc.
double * f
LSTM.
double * prev_cell
LSTM.
int out_h
Pool, Conv, and Upsample.
double eta
Gradient descent rate.
double momentum
Momentum for gradient descent.
Neural network data structure.
Definition neural.h:48
Utility functions for random number handling, etc.