/*
 * neural_layer_convolutional.c
 * XCSF learning classifier system: an implementation of a 2D convolutional
 * neural network layer.
 */
/*
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15
#include "neural_layer_convolutional.h"

#include "blas.h"
#include "image.h"
#include "neural_activations.h"
#include "sam.h"
#include "utils.h"
30
31#define N_MU (6)
32
44
50static int
51get_out_height(const struct Layer *l)
52{
53 return (l->height + 2 * l->pad - l->size) / l->stride + 1;
54}
55
61static int
62get_out_width(const struct Layer *l)
63{
64 return (l->width + 2 * l->pad - l->size) / l->stride + 1;
65}
66
72static size_t
73get_workspace_size(const struct Layer *l)
74{
75 const size_t workspace_size = (size_t) l->out_h * l->out_w * l->size *
76 l->size * l->channels * sizeof(double);
77 if (workspace_size < 1) {
78 printf("neural_layer_convolutional: invalid workspace size\n");
79 layer_print(l, false);
80 exit(EXIT_FAILURE);
81 }
82 return workspace_size;
83}
84
/**
 * @brief Check memory allocation is within bounds.
 * NOTE(review): body restored — the extraction dropped these lines; the
 * documentation index lists layer_guard_outputs/biases/weights as the bounds
 * checks — verify against upstream.
 * @param [in] l The layer whose dimensions are to be checked.
 */
static void
guard_malloc(const struct Layer *l)
{
    layer_guard_outputs(l);
    layer_guard_biases(l);
    layer_guard_weights(l);
}
96
101static void
103{
104 guard_malloc(l);
105 l->delta = calloc(l->n_outputs, sizeof(double));
106 l->state = calloc(l->n_outputs, sizeof(double));
107 l->output = calloc(l->n_outputs, sizeof(double));
108 l->weights = malloc(sizeof(double) * l->n_weights);
109 l->weight_updates = calloc(l->n_weights, sizeof(double));
110 l->weight_active = malloc(sizeof(bool) * l->n_weights);
111 l->biases = malloc(sizeof(double) * l->n_biases);
112 l->bias_updates = calloc(l->n_biases, sizeof(double));
113 l->temp = malloc(get_workspace_size(l));
114 l->mu = malloc(sizeof(double) * N_MU);
115}
116
121static void
123{
124 guard_malloc(l);
125 l->delta = realloc(l->delta, sizeof(double) * l->n_outputs);
126 l->state = realloc(l->state, sizeof(double) * l->n_outputs);
127 l->output = realloc(l->output, sizeof(double) * l->n_outputs);
128 l->weights = realloc(l->weights, sizeof(double) * l->n_weights);
129 l->weight_updates =
130 realloc(l->weight_updates, sizeof(double) * l->n_weights);
131 l->weight_active = realloc(l->weight_active, sizeof(bool) * l->n_weights);
132 l->biases = realloc(l->biases, sizeof(double) * l->n_biases);
133 l->bias_updates = realloc(l->bias_updates, sizeof(double) * l->n_biases);
134 l->temp = realloc(l->temp, get_workspace_size(l));
135}
136
141void
143{
144 free(l->delta);
145 free(l->state);
146 free(l->output);
147 free(l->weights);
148 free(l->weight_updates);
149 free(l->weight_active);
150 free(l->biases);
151 free(l->bias_updates);
152 free(l->temp);
153 free(l->mu);
154}
155
161void
162neural_layer_convolutional_init(struct Layer *l, const struct ArgsLayer *args)
163{
164 l->options = layer_args_opt(args);
165 l->function = args->function;
166 l->height = args->height;
167 l->width = args->width;
168 l->channels = args->channels;
169 l->n_filters = args->n_init;
170 l->max_outputs = args->n_max;
171 l->stride = args->stride;
172 l->size = args->size;
173 l->pad = args->pad;
175 l->eta_max = args->eta;
176 l->eta_min = args->eta_min;
177 l->momentum = args->momentum;
178 l->decay = args->decay;
179 l->n_biases = l->n_filters;
180 l->n_weights = l->channels * l->n_filters * l->size * l->size;
181 l->n_active = l->n_weights;
182 l->out_h = get_out_height(l);
183 l->out_w = get_out_width(l);
184 l->out_c = l->n_filters;
185 l->n_inputs = l->width * l->height * l->channels;
186 l->n_outputs = l->out_h * l->out_w * l->out_c;
189 for (int i = 0; i < l->n_weights; ++i) {
191 l->weight_active[i] = true;
192 }
193 memset(l->biases, 0, sizeof(double) * l->n_biases);
194 sam_init(l->mu, N_MU, MU_TYPE);
195}
196
202struct Layer *
204{
205 if (src->type != CONVOLUTIONAL) {
206 printf("neural_layer_convolut_copy() incorrect source layer type\n");
207 exit(EXIT_FAILURE);
208 }
209 struct Layer *l = malloc(sizeof(struct Layer));
211 l->type = src->type;
212 l->layer_vptr = src->layer_vptr;
213 l->options = src->options;
214 l->function = src->function;
215 l->height = src->height;
216 l->width = src->width;
217 l->channels = src->channels;
218 l->n_filters = src->n_filters;
219 l->stride = src->stride;
220 l->size = src->size;
221 l->pad = src->pad;
222 l->n_weights = src->n_weights;
223 l->n_active = src->n_active;
224 l->out_h = src->out_h;
225 l->out_w = src->out_w;
226 l->out_c = src->out_c;
227 l->n_outputs = src->n_outputs;
228 l->n_inputs = src->n_inputs;
229 l->max_outputs = src->max_outputs;
231 l->n_biases = src->n_biases;
232 l->momentum = src->momentum;
233 l->decay = src->decay;
234 l->eta = src->eta;
235 l->eta_max = src->eta_max;
236 l->eta_min = src->eta_min;
238 memcpy(l->weights, src->weights, sizeof(double) * src->n_weights);
239 memcpy(l->weight_active, src->weight_active, sizeof(bool) * src->n_weights);
240 memcpy(l->biases, src->biases, sizeof(double) * src->n_biases);
241 memcpy(l->mu, src->mu, sizeof(double) * N_MU);
242 return l;
243}
244
/**
 * @brief Randomises the weights of a convolutional layer.
 * NOTE(review): the body of this function was dropped in extraction; restored
 * from the documentation index, which lists layer_weight_rand() ("Randomises a
 * layer's weights and biases") — verify against upstream.
 * @param [in] l The layer to randomise.
 */
void
neural_layer_convolutional_rand(struct Layer *l)
{
    layer_weight_rand(l);
}
261void
262neural_layer_convolutional_forward(const struct Layer *l, const struct Net *net,
263 const double *input)
264{
265 (void) net;
266 const int m = l->n_filters;
267 const int k = l->size * l->size * l->channels;
268 const int n = l->out_w * l->out_h;
269 const double *a = l->weights;
270 double *b = l->temp;
271 double *c = l->state;
272 memset(l->state, 0, sizeof(double) * l->n_outputs);
273 if (l->size == 1) {
274 blas_gemm(0, 0, m, n, k, 1, a, k, input, n, 1, c, n);
275 } else {
276 im2col(input, l->channels, l->height, l->width, l->size, l->stride,
277 l->pad, b);
278 blas_gemm(0, 0, m, n, k, 1, a, k, b, n, 1, c, n);
279 }
280 for (int i = 0; i < l->n_biases; ++i) {
281 for (int j = 0; j < n; ++j) {
282 l->state[i * n + j] += l->biases[i];
283 }
284 }
286}
287
295void
297 const struct Net *net, const double *input,
298 double *delta)
299{
300 (void) net;
301 const int m = l->n_filters;
302 const int n = l->size * l->size * l->channels;
303 const int k = l->out_w * l->out_h;
304 if (l->options & LAYER_SGD_WEIGHTS) {
306 for (int i = 0; i < l->n_biases; ++i) {
307 l->bias_updates[i] += blas_sum(l->delta + k * i, k);
308 }
309 const double *a = l->delta;
310 double *b = l->temp;
311 double *c = l->weight_updates;
312 if (l->size == 1) {
313 blas_gemm(0, 1, m, n, k, 1, a, k, input, k, 1, c, n);
314 } else {
315 im2col(input, l->channels, l->height, l->width, l->size, l->stride,
316 l->pad, b);
317 blas_gemm(0, 1, m, n, k, 1, a, k, b, k, 1, c, n);
318 }
319 }
320 if (delta) {
321 const double *a = l->weights;
322 const double *b = l->delta;
323 double *c = l->temp;
324 if (l->size == 1) {
325 c = delta;
326 }
327 blas_gemm(1, 0, n, k, m, 1, a, n, b, k, 0, c, k);
328 if (l->size != 1) {
329 col2im(l->temp, l->channels, l->height, l->width, l->size,
330 l->stride, l->pad, delta);
331 }
332 }
333}
334
339void
341{
342 if (l->options & LAYER_SGD_WEIGHTS && l->eta > 0) {
343 blas_axpy(l->n_biases, l->eta, l->bias_updates, 1, l->biases, 1);
345 if (l->decay > 0) {
346 blas_axpy(l->n_weights, -(l->decay), l->weights, 1,
347 l->weight_updates, 1);
348 }
349 blas_axpy(l->n_weights, l->eta, l->weight_updates, 1, l->weights, 1);
352 }
353}
354
360void
361neural_layer_convolutional_resize(struct Layer *l, const struct Layer *prev)
362{
363 const int old_n_outputs = l->n_outputs;
364 const int old_n_weights = l->n_weights;
365 l->width = prev->out_w;
366 l->height = prev->out_h;
367 l->channels = prev->out_c;
368 l->out_w = get_out_width(l);
369 l->out_h = get_out_height(l);
370 l->n_outputs = l->out_h * l->out_w * l->out_c;
371 l->n_inputs = l->width * l->height * l->channels;
372 l->n_weights = l->channels * l->n_filters * l->size * l->size;
374 for (int i = old_n_weights; i < l->n_weights; ++i) {
375 l->weights[i] = rand_normal(0, WEIGHT_SD);
376 l->weight_updates[i] = 0;
377 l->weight_active[i] = true;
378 }
379 for (int i = old_n_outputs; i < l->n_outputs; ++i) {
380 l->delta[i] = 0;
381 l->state[i] = 0;
382 l->output[i] = 0;
383 }
385}
386
393static int
395{
396 int n = 0;
397 if (rand_uniform(0, 0.1) < mu) { // 10x higher probability
398 while (n == 0) {
399 const double m = clamp(rand_normal(0, 0.5), -1, 1);
400 n = (int) round(m * l->max_neuron_grow);
401 }
402 if (l->n_filters + n < 1) {
403 n = -(l->n_filters - 1);
404 } else if (l->n_filters + n > l->max_outputs) {
405 n = l->max_outputs - l->n_filters;
406 }
407 }
408 return n;
409}
410
417static void
419{
420 const int old_n_biases = l->n_biases;
421 const int old_n_weights = l->n_weights;
422 const int old_n_outputs = l->n_outputs;
423 l->n_filters += N;
424 l->n_biases = l->n_filters;
425 l->out_c = l->n_filters;
426 l->n_weights = l->channels * l->n_filters * l->size * l->size;
427 l->n_outputs = l->out_h * l->out_w * l->out_c;
429 for (int i = old_n_weights; i < l->n_weights; ++i) {
430 l->weights[i] = rand_normal(0, WEIGHT_SD);
431 l->weight_active[i] = true;
432 l->weight_updates[i] = 0;
433 }
434 for (int i = old_n_biases; i < l->n_biases; ++i) {
435 l->biases[i] = 0;
436 l->bias_updates[i] = 0;
437 }
438 for (int i = old_n_outputs; i < l->n_outputs; ++i) {
439 l->output[i] = 0;
440 l->state[i] = 0;
441 l->delta[i] = 0;
442 }
444}
445
451bool
453{
454 sam_adapt(l->mu, N_MU, MU_TYPE);
455 bool mod = false;
456 if ((l->options & LAYER_EVOLVE_ETA) && layer_mutate_eta(l, l->mu[0])) {
457 mod = true;
458 }
459 if (l->options & LAYER_EVOLVE_NEURONS) {
460 const int n = neural_layer_convolutional_mutate_filter(l, l->mu[1]);
461 if (n != 0) {
463 mod = true;
464 }
465 }
466 if ((l->options & LAYER_EVOLVE_CONNECT) &&
467 layer_mutate_connectivity(l, l->mu[2], l->mu[3])) {
468 mod = true;
469 }
470 if ((l->options & LAYER_EVOLVE_WEIGHTS) &&
471 layer_mutate_weights(l, l->mu[4])) {
472 mod = true;
473 }
474 if ((l->options & LAYER_EVOLVE_FUNCTIONS) &&
475 layer_mutate_functions(l, l->mu[5])) {
476 mod = true;
477 }
478 return mod;
479}
480
486double *
488{
489 return l->output;
490}
491
/**
 * @brief Prints a convolutional layer.
 * @param [in] l The layer to print.
 * @param [in] print_weights Whether to print the weights.
 */
void
neural_layer_convolutional_print(const struct Layer *l,
                                 const bool print_weights)
{
    char *json_str = neural_layer_convolutional_json_export(l, print_weights);
    printf("%s\n", json_str);
    free(json_str);
}
505
513char *
515 const bool return_weights)
516{
517 cJSON *json = cJSON_CreateObject();
518 cJSON_AddStringToObject(json, "type", "convolutional");
519 cJSON_AddStringToObject(json, "activation",
521 cJSON_AddNumberToObject(json, "n_inputs", l->n_inputs);
522 cJSON_AddNumberToObject(json, "n_outputs", l->n_outputs);
523 cJSON_AddNumberToObject(json, "n_filters", l->n_filters);
524 cJSON_AddNumberToObject(json, "size", l->size);
525 cJSON_AddNumberToObject(json, "stride", l->stride);
526 cJSON_AddNumberToObject(json, "pad", l->pad);
527 cJSON_AddNumberToObject(json, "eta", l->eta);
528 cJSON *mutation = cJSON_CreateDoubleArray(l->mu, N_MU);
529 cJSON_AddItemToObject(json, "mutation", mutation);
530 char *weights_str = layer_weight_json(l, return_weights);
531 cJSON *weights = cJSON_Parse(weights_str);
532 free(weights_str);
533 cJSON_AddItemToObject(json, "weights", weights);
534 char *string = cJSON_Print(json);
535 cJSON_Delete(json);
536 return string;
537}
538
545size_t
546neural_layer_convolutional_save(const struct Layer *l, FILE *fp)
547{
548 size_t s = 0;
549 s += fwrite(&l->options, sizeof(uint32_t), 1, fp);
550 s += fwrite(&l->function, sizeof(int), 1, fp);
551 s += fwrite(&l->height, sizeof(int), 1, fp);
552 s += fwrite(&l->width, sizeof(int), 1, fp);
553 s += fwrite(&l->channels, sizeof(int), 1, fp);
554 s += fwrite(&l->n_filters, sizeof(int), 1, fp);
555 s += fwrite(&l->stride, sizeof(int), 1, fp);
556 s += fwrite(&l->size, sizeof(int), 1, fp);
557 s += fwrite(&l->pad, sizeof(int), 1, fp);
558 s += fwrite(&l->out_h, sizeof(int), 1, fp);
559 s += fwrite(&l->out_w, sizeof(int), 1, fp);
560 s += fwrite(&l->out_c, sizeof(int), 1, fp);
561 s += fwrite(&l->n_biases, sizeof(int), 1, fp);
562 s += fwrite(&l->n_outputs, sizeof(int), 1, fp);
563 s += fwrite(&l->n_inputs, sizeof(int), 1, fp);
564 s += fwrite(&l->max_outputs, sizeof(int), 1, fp);
565 s += fwrite(&l->n_weights, sizeof(int), 1, fp);
566 s += fwrite(&l->n_active, sizeof(int), 1, fp);
567 s += fwrite(&l->eta, sizeof(double), 1, fp);
568 s += fwrite(&l->eta_max, sizeof(double), 1, fp);
569 s += fwrite(&l->eta_min, sizeof(double), 1, fp);
570 s += fwrite(&l->momentum, sizeof(double), 1, fp);
571 s += fwrite(&l->decay, sizeof(double), 1, fp);
572 s += fwrite(&l->max_neuron_grow, sizeof(int), 1, fp);
573 s += fwrite(l->weights, sizeof(double), l->n_weights, fp);
574 s += fwrite(l->weight_updates, sizeof(double), l->n_weights, fp);
575 s += fwrite(l->weight_active, sizeof(bool), l->n_weights, fp);
576 s += fwrite(l->biases, sizeof(double), l->n_biases, fp);
577 s += fwrite(l->bias_updates, sizeof(double), l->n_filters, fp);
578 s += fwrite(l->mu, sizeof(double), N_MU, fp);
579 return s;
580}
581
588size_t
590{
591 size_t s = 0;
592 s += fread(&l->options, sizeof(uint32_t), 1, fp);
593 s += fread(&l->function, sizeof(int), 1, fp);
594 s += fread(&l->height, sizeof(int), 1, fp);
595 s += fread(&l->width, sizeof(int), 1, fp);
596 s += fread(&l->channels, sizeof(int), 1, fp);
597 s += fread(&l->n_filters, sizeof(int), 1, fp);
598 s += fread(&l->stride, sizeof(int), 1, fp);
599 s += fread(&l->size, sizeof(int), 1, fp);
600 s += fread(&l->pad, sizeof(int), 1, fp);
601 s += fread(&l->out_h, sizeof(int), 1, fp);
602 s += fread(&l->out_w, sizeof(int), 1, fp);
603 s += fread(&l->out_c, sizeof(int), 1, fp);
604 s += fread(&l->n_biases, sizeof(int), 1, fp);
605 s += fread(&l->n_outputs, sizeof(int), 1, fp);
606 s += fread(&l->n_inputs, sizeof(int), 1, fp);
607 s += fread(&l->max_outputs, sizeof(int), 1, fp);
608 s += fread(&l->n_weights, sizeof(int), 1, fp);
609 s += fread(&l->n_active, sizeof(int), 1, fp);
610 s += fread(&l->eta, sizeof(double), 1, fp);
611 s += fread(&l->eta_max, sizeof(double), 1, fp);
612 s += fread(&l->eta_min, sizeof(double), 1, fp);
613 s += fread(&l->momentum, sizeof(double), 1, fp);
614 s += fread(&l->decay, sizeof(double), 1, fp);
615 s += fread(&l->max_neuron_grow, sizeof(int), 1, fp);
617 s += fread(l->weights, sizeof(double), l->n_weights, fp);
618 s += fread(l->weight_updates, sizeof(double), l->n_weights, fp);
619 s += fread(l->weight_active, sizeof(bool), l->n_weights, fp);
620 s += fread(l->biases, sizeof(double), l->n_biases, fp);
621 s += fread(l->bias_updates, sizeof(double), l->n_biases, fp);
622 s += fread(l->mu, sizeof(double), N_MU, fp);
623 return s;
624}
void blas_scal(const int N, const double ALPHA, double *X, const int INCX)
Scales vector X by the scalar ALPHA and overwrites it with the result.
Definition blas.c:160
double blas_sum(const double *X, const int N)
Returns the sum of the vector X.
Definition blas.c:232
void blas_axpy(const int N, const double ALPHA, const double *X, const int INCX, double *Y, const int INCY)
Multiplies vector X by the scalar ALPHA and adds it to the vector Y.
Definition blas.c:138
void blas_gemm(const int TA, const int TB, const int M, const int N, const int K, const double ALPHA, const double *A, const int lda, const double *B, const int ldb, const double BETA, double *C, const int ldc)
Performs the matrix-matrix multiplication: .
Definition blas.c:108
Basic linear algebra functions.
void im2col(const double *data_im, const int channels, const int height, const int width, const int ksize, const int stride, const int pad, double *data_col)
Transforms an image vector to a column vector.
Definition image.c:100
void col2im(const double *data_col, const int channels, const int height, const int width, const int ksize, const int stride, const int pad, double *data_im)
Transforms a column vector to an image vector.
Definition image.c:63
Image handling functions.
const char * neural_activation_string(const int a)
Returns the name of a specified activation function.
void neural_gradient_array(const double *state, double *delta, const int n, const int a)
Applies a gradient function to a vector of neuron states.
void neural_activate_array(double *state, double *output, const int n, const int a)
Applies an activation function to a vector of neuron states.
Neural network activation functions.
void layer_guard_biases(const struct Layer *l)
Check number of biases is within bounds.
bool layer_mutate_connectivity(struct Layer *l, const double mu_enable, const double mu_disable)
Mutates a layer's connectivity by zeroing weights.
void layer_defaults(struct Layer *l)
Initialises a layer to default values.
bool layer_mutate_functions(struct Layer *l, const double mu)
Mutates a layer's activation function by random selection.
void layer_weight_clamp(const struct Layer *l)
Clamps a layer's weights and biases in range [WEIGHT_MIN, WEIGHT_MAX].
void layer_guard_outputs(const struct Layer *l)
Check number of outputs is within bounds.
void layer_weight_rand(struct Layer *l)
Randomises a layer's weights and biases.
char * layer_weight_json(const struct Layer *l, const bool return_weights)
Returns a json formatted string representation of a layer's weights.
void layer_calc_n_active(struct Layer *l)
Recalculates the number of active connections within a layer.
void layer_init_eta(struct Layer *l)
Initialises a layer's gradient descent rate.
bool layer_mutate_eta(struct Layer *l, const double mu)
Mutates the gradient descent rate of a neural layer.
bool layer_mutate_weights(struct Layer *l, const double mu)
Mutates a layer's weights and biases by adding random numbers from a Gaussian normal distribution wit...
void layer_guard_weights(const struct Layer *l)
Check number of weights is within bounds.
#define LAYER_EVOLVE_ETA
Layer may evolve rate of gradient descent.
#define LAYER_EVOLVE_FUNCTIONS
Layer may evolve functions.
#define WEIGHT_SD_INIT
Std dev of Gaussian for weight initialisation.
#define LAYER_EVOLVE_WEIGHTS
Layer may evolve weights.
#define LAYER_EVOLVE_NEURONS
Layer may evolve neurons.
#define LAYER_EVOLVE_CONNECT
Layer may evolve connectivity.
#define WEIGHT_SD
Std dev of Gaussian for weight resizing.
#define LAYER_SGD_WEIGHTS
Layer may perform gradient descent.
#define CONVOLUTIONAL
Layer type convolutional.
static void layer_print(const struct Layer *l, const bool print_weights)
Prints the layer.
uint32_t layer_args_opt(const struct ArgsLayer *args)
Returns a bitstring representing the permissions granted by a layer.
static int get_out_width(const struct Layer *l)
Returns the output width of a convolutional layer.
char * neural_layer_convolutional_json_export(const struct Layer *l, const bool return_weights)
Returns a json formatted string of a convolutional layer.
void neural_layer_convolutional_update(const struct Layer *l)
Updates the weights and biases of a convolutional layer.
void neural_layer_convolutional_forward(const struct Layer *l, const struct Net *net, const double *input)
Forward propagates a convolutional layer.
double * neural_layer_convolutional_output(const struct Layer *l)
Returns the output from a convolutional layer.
void neural_layer_convolutional_resize(struct Layer *l, const struct Layer *prev)
Resizes a convolutional layer if the previous layer has changed size.
static void malloc_layer_arrays(struct Layer *l)
Allocate memory used by a convolutional layer.
static void realloc_layer_arrays(struct Layer *l)
Resize memory used by a convolutional layer.
#define N_MU
Number of mutation rates applied to a convolutional layer.
void neural_layer_convolutional_print(const struct Layer *l, const bool print_weights)
Prints a convolutional layer.
static size_t get_workspace_size(const struct Layer *l)
Returns the memory workspace size for a convolutional layer.
bool neural_layer_convolutional_mutate(struct Layer *l)
Mutates a convolutional layer.
struct Layer * neural_layer_convolutional_copy(const struct Layer *src)
Initialises and copies one convolutional layer from another.
static const int MU_TYPE[(6)]
Self-adaptation method for mutating a convolutional layer.
void neural_layer_convolutional_free(const struct Layer *l)
Free memory used by a convolutional layer.
static int get_out_height(const struct Layer *l)
Returns the output height of a convolutional layer.
size_t neural_layer_convolutional_save(const struct Layer *l, FILE *fp)
Writes a convolutional layer to a file.
static void neural_layer_convolutional_add_filters(struct Layer *l, const int N)
Adds N filters to a layer. Negative N removes filters.
static int neural_layer_convolutional_mutate_filter(const struct Layer *l, const double mu)
Returns the number of kernel filters to add or remove from a layer.
size_t neural_layer_convolutional_load(struct Layer *l, FILE *fp)
Reads a convolutional layer from a file.
static void guard_malloc(const struct Layer *l)
Check memory allocation is within bounds.
void neural_layer_convolutional_rand(struct Layer *l)
Randomises the weights of a convolutional layer.
void neural_layer_convolutional_init(struct Layer *l, const struct ArgsLayer *args)
Initialises a 2D convolutional layer.
void neural_layer_convolutional_backward(const struct Layer *l, const struct Net *net, const double *input, double *delta)
Backward propagates a convolutional layer.
An implementation of a 2D convolutional layer.
void sam_init(double *mu, const int N, const int *type)
Initialises self-adaptive mutation rates.
Definition sam.c:43
void sam_adapt(double *mu, const int N, const int *type)
Self-adapts mutation rates.
Definition sam.c:68
Self-adaptive mutation functions.
#define SAM_RATE_SELECT
Ten normally distributed rates.
Definition sam.h:29
Parameters for initialising a neural network layer.
int n_init
Initial number of units / neurons / filters.
double decay
Weight decay for gradient descent.
double momentum
Momentum for gradient descent.
int function
Activation function.
int max_neuron_grow
Maximum number neurons to add per mutation event.
double eta
Gradient descent rate.
int pad
Pool and Conv.
double eta_min
Current gradient descent rate.
int channels
Pool, Conv, and Upsample.
int n_max
Maximum number of units / neurons.
int size
Pool and Conv.
int width
Pool, Conv, and Upsample.
int height
Pool, Conv, and Upsample.
int stride
Pool, Conv, and Upsample.
Neural network layer data structure.
double * output
Current neuron outputs (after activation function)
double decay
Weight decay for gradient descent.
int size
Pool and Conv.
double * state
Current neuron states (before activation function)
int pad
Pool and Conv.
int max_neuron_grow
Maximum number neurons to add per mutation event.
int stride
Pool, Conv, and Upsample.
int n_inputs
Number of layer inputs.
int n_biases
Number of layer biases.
bool * weight_active
Whether each connection is present in the layer.
double * weights
Weights for calculating neuron states.
double * weight_updates
Updates to weights.
int n_filters
Conv.
double * mu
Mutation rates.
int channels
Pool, Conv, and Upsample.
int function
Layer activation function.
double * c
LSTM.
int height
Pool, Conv, and Upsample.
double * temp
LSTM.
struct LayerVtbl const * layer_vptr
Functions acting on layers.
int max_outputs
Maximum number of neurons in the layer.
int width
Pool, Conv, and Upsample.
int n_weights
Number of layer weights.
double * bias_updates
Updates to biases.
double eta_max
Maximum gradient descent rate.
double * i
LSTM.
int n_outputs
Number of layer outputs.
double * biases
Biases for calculating neuron states.
int n_active
Number of active weights / connections.
int out_w
Pool, Conv, and Upsample.
int type
Layer type: CONNECTED, DROPOUT, etc.
int out_c
Pool, Conv, and Upsample.
double * delta
Delta for updating weights.
uint32_t options
Bitwise layer options permitting evolution, SGD, etc.
int out_h
Pool, Conv, and Upsample.
double eta_min
Minimum gradient descent rate.
double eta
Gradient descent rate.
double momentum
Momentum for gradient descent.
Neural network data structure.
Definition neural.h:48
double rand_normal(const double mu, const double sigma)
Returns a random Gaussian with specified mean and standard deviation.
Definition utils.c:87
double rand_uniform(const double min, const double max)
Returns a uniform random float [min,max].
Definition utils.c:62
Utility functions for random number handling, etc.
static double clamp(const double a, const double min, const double max)
Returns a float clamped within the specified range.
Definition utils.h:60