XCSF  1.4.7
XCSF learning classifier system
neural_layer_convolutional.c
/*
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

/**
 * @file neural_layer_convolutional.c
 * @brief An implementation of a 2D convolutional layer.
 */

#include "neural_layer_convolutional.h"
#include "blas.h"
#include "image.h"
#include "neural_activations.h"
#include "sam.h"
#include "utils.h"

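/**
 * @brief Number of mutation rates applied to a convolutional layer.
 */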
#define N_MU (6)

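/**
 * @brief Self-adaptation method for mutating a convolutional layer.
 */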
static const int MU_TYPE[N_MU] = {
    SAM_RATE_SELECT, /**< Gradient descent rate */
    SAM_RATE_SELECT, /**< Number of filters */
    SAM_RATE_SELECT, /**< Connectivity enabling */
    SAM_RATE_SELECT, /**< Connectivity disabling */
    SAM_RATE_SELECT, /**< Weights */
    SAM_RATE_SELECT  /**< Activation functions */
};

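/**
 * @brief Returns the output height of a convolutional layer.
 * @param [in] l The layer whose output height is to be returned.
 * @return The output height.
 */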
static int
get_out_height(const struct Layer *l)
{
    return (l->height + 2 * l->pad - l->size) / l->stride + 1;
}

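/**
 * @brief Returns the output width of a convolutional layer.
 * @param [in] l The layer whose output width is to be returned.
 * @return The output width.
 */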
static int
get_out_width(const struct Layer *l)
{
    return (l->width + 2 * l->pad - l->size) / l->stride + 1;
}

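/**
 * @brief Returns the memory workspace size for a convolutional layer.
 * @param [in] l The layer whose workspace size is to be returned.
 * @return The workspace size in bytes.
 */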
static size_t
get_workspace_size(const struct Layer *l)
{
    const size_t workspace_size = (size_t) l->out_h * l->out_w * l->size *
                                  l->size * l->channels * sizeof(double);
    if (workspace_size < 1) {
        printf("neural_layer_convolutional: invalid workspace size\n");
        layer_print(l, false);
        exit(EXIT_FAILURE);
    }
    return workspace_size;
}

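/**
 * @brief Check memory allocation is within bounds.
 * @param [in] l The layer to check.
 */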
static void
guard_malloc(const struct Layer *l)
{
    layer_guard_outputs(l);
    layer_guard_biases(l);
    layer_guard_weights(l);
}

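/**
 * @brief Allocate memory used by a convolutional layer.
 * @param [in] l The layer to be allocated memory.
 */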
static void
malloc_layer_arrays(struct Layer *l)
{
    guard_malloc(l);
    l->delta = calloc(l->n_outputs, sizeof(double));
    l->state = calloc(l->n_outputs, sizeof(double));
    l->output = calloc(l->n_outputs, sizeof(double));
    l->weights = malloc(sizeof(double) * l->n_weights);
    l->weight_updates = calloc(l->n_weights, sizeof(double));
    l->weight_active = malloc(sizeof(bool) * l->n_weights);
    l->biases = malloc(sizeof(double) * l->n_biases);
    l->bias_updates = calloc(l->n_biases, sizeof(double));
    l->temp = malloc(get_workspace_size(l));
    l->mu = malloc(sizeof(double) * N_MU);
}

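/**
 * @brief Resize memory used by a convolutional layer.
 * @param [in] l The layer to be reallocated memory.
 */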
static void
realloc_layer_arrays(struct Layer *l)
{
    guard_malloc(l);
    l->delta = realloc(l->delta, sizeof(double) * l->n_outputs);
    l->state = realloc(l->state, sizeof(double) * l->n_outputs);
    l->output = realloc(l->output, sizeof(double) * l->n_outputs);
    l->weights = realloc(l->weights, sizeof(double) * l->n_weights);
    l->weight_updates =
        realloc(l->weight_updates, sizeof(double) * l->n_weights);
    l->weight_active = realloc(l->weight_active, sizeof(bool) * l->n_weights);
    l->biases = realloc(l->biases, sizeof(double) * l->n_biases);
    l->bias_updates = realloc(l->bias_updates, sizeof(double) * l->n_biases);
    l->temp = realloc(l->temp, get_workspace_size(l));
}

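/**
 * @brief Free memory used by a convolutional layer.
 * @param [in] l The layer to be freed.
 */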
void
neural_layer_convolutional_free(const struct Layer *l)
{
    free(l->delta);
    free(l->state);
    free(l->output);
    free(l->weights);
    free(l->weight_updates);
    free(l->weight_active);
    free(l->biases);
    free(l->bias_updates);
    free(l->temp);
    free(l->mu);
}

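/**
 * @brief Initialises a 2D convolutional layer.
 * @param [in] l The layer to initialise.
 * @param [in] args Parameters for initialising the layer.
 */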
void
neural_layer_convolutional_init(struct Layer *l, const struct ArgsLayer *args)
{
    l->options = layer_args_opt(args);
    l->function = args->function;
    l->height = args->height;
    l->width = args->width;
    l->channels = args->channels;
    l->n_filters = args->n_init;
    l->max_outputs = args->n_max;
    l->stride = args->stride;
    l->size = args->size;
    l->pad = args->pad;
    l->max_neuron_grow = args->max_neuron_grow;
    l->eta_max = args->eta;
    l->eta_min = args->eta_min;
    l->momentum = args->momentum;
    l->decay = args->decay;
    l->n_biases = l->n_filters;
    l->n_weights = l->channels * l->n_filters * l->size * l->size;
    l->n_active = l->n_weights;
    l->out_h = get_out_height(l);
    l->out_w = get_out_width(l);
    l->out_c = l->n_filters;
    l->n_inputs = l->width * l->height * l->channels;
    l->n_outputs = l->out_h * l->out_w * l->out_c;
    layer_init_eta(l);
    malloc_layer_arrays(l);
    for (int i = 0; i < l->n_weights; ++i) {
        l->weights[i] = rand_normal(0, WEIGHT_SD_INIT);
        l->weight_active[i] = true;
    }
    memset(l->biases, 0, sizeof(double) * l->n_biases);
    sam_init(l->mu, N_MU, MU_TYPE);
}

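/**
 * @brief Initialises and copies one convolutional layer from another.
 * @param [in] src The source layer.
 * @return A pointer to the new layer.
 */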
struct Layer *
neural_layer_convolutional_copy(const struct Layer *src)
{
    if (src->type != CONVOLUTIONAL) {
        printf("neural_layer_convolutional_copy(): incorrect source layer type\n");
        exit(EXIT_FAILURE);
    }
    struct Layer *l = malloc(sizeof(struct Layer));
    layer_defaults(l);
    l->type = src->type;
    l->layer_vptr = src->layer_vptr;
    l->options = src->options;
    l->function = src->function;
    l->height = src->height;
    l->width = src->width;
    l->channels = src->channels;
    l->n_filters = src->n_filters;
    l->stride = src->stride;
    l->size = src->size;
    l->pad = src->pad;
    l->n_weights = src->n_weights;
    l->n_active = src->n_active;
    l->out_h = src->out_h;
    l->out_w = src->out_w;
    l->out_c = src->out_c;
    l->n_outputs = src->n_outputs;
    l->n_inputs = src->n_inputs;
    l->max_outputs = src->max_outputs;
    l->max_neuron_grow = src->max_neuron_grow;
    l->n_biases = src->n_biases;
    l->momentum = src->momentum;
    l->decay = src->decay;
    l->eta = src->eta;
    l->eta_max = src->eta_max;
    l->eta_min = src->eta_min;
    malloc_layer_arrays(l);
    memcpy(l->weights, src->weights, sizeof(double) * src->n_weights);
    memcpy(l->weight_active, src->weight_active, sizeof(bool) * src->n_weights);
    memcpy(l->biases, src->biases, sizeof(double) * src->n_biases);
    memcpy(l->mu, src->mu, sizeof(double) * N_MU);
    return l;
}

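/**
 * @brief Randomises the weights of a convolutional layer.
 * @param [in] l The layer to randomise.
 */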
void
neural_layer_convolutional_rand(struct Layer *l)
{
    layer_weight_rand(l);
}

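/**
 * @brief Forward propagates a convolutional layer.
 * @param [in] l The layer to forward propagate.
 * @param [in] net Network containing the layer.
 * @param [in] input The input to the layer.
 */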
void
neural_layer_convolutional_forward(const struct Layer *l, const struct Net *net,
                                   const double *input)
{
    (void) net;
    const int m = l->n_filters;
    const int k = l->size * l->size * l->channels;
    const int n = l->out_w * l->out_h;
    const double *a = l->weights;
    double *b = l->temp;
    double *c = l->state;
    memset(l->state, 0, sizeof(double) * l->n_outputs);
    if (l->size == 1) {
        blas_gemm(0, 0, m, n, k, 1, a, k, input, n, 1, c, n);
    } else {
        im2col(input, l->channels, l->height, l->width, l->size, l->stride,
               l->pad, b);
        blas_gemm(0, 0, m, n, k, 1, a, k, b, n, 1, c, n);
    }
    for (int i = 0; i < l->n_biases; ++i) {
        for (int j = 0; j < n; ++j) {
            l->state[i * n + j] += l->biases[i];
        }
    }
    neural_activate_array(l->state, l->output, l->n_outputs, l->function);
}

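/**
 * @brief Backward propagates a convolutional layer.
 * @param [in] l The layer to backward propagate.
 * @param [in] net Network containing the layer.
 * @param [in] input The input to the layer.
 * @param [out] delta The previous layer's error.
 */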
void
neural_layer_convolutional_backward(const struct Layer *l,
                                    const struct Net *net, const double *input,
                                    double *delta)
{
    (void) net;
    const int m = l->n_filters;
    const int n = l->size * l->size * l->channels;
    const int k = l->out_w * l->out_h;
    if (l->options & LAYER_SGD_WEIGHTS) {
        neural_gradient_array(l->state, l->delta, l->n_outputs, l->function);
        for (int i = 0; i < l->n_biases; ++i) {
            l->bias_updates[i] += blas_sum(l->delta + k * i, k);
        }
        const double *a = l->delta;
        double *b = l->temp;
        double *c = l->weight_updates;
        if (l->size == 1) {
            blas_gemm(0, 1, m, n, k, 1, a, k, input, k, 1, c, n);
        } else {
            im2col(input, l->channels, l->height, l->width, l->size, l->stride,
                   l->pad, b);
            blas_gemm(0, 1, m, n, k, 1, a, k, b, k, 1, c, n);
        }
    }
    if (delta) {
        const double *a = l->weights;
        const double *b = l->delta;
        double *c = l->temp;
        if (l->size == 1) {
            c = delta;
        }
        blas_gemm(1, 0, n, k, m, 1, a, n, b, k, 0, c, k);
        if (l->size != 1) {
            col2im(l->temp, l->channels, l->height, l->width, l->size,
                   l->stride, l->pad, delta);
        }
    }
}

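/**
 * @brief Updates the weights and biases of a convolutional layer.
 * @param [in] l The layer to update.
 */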
void
neural_layer_convolutional_update(const struct Layer *l)
{
    if (l->options & LAYER_SGD_WEIGHTS && l->eta > 0) {
        blas_axpy(l->n_biases, l->eta, l->bias_updates, 1, l->biases, 1);
        blas_scal(l->n_biases, l->momentum, l->bias_updates, 1);
        if (l->decay > 0) {
            blas_axpy(l->n_weights, -(l->decay), l->weights, 1,
                      l->weight_updates, 1);
        }
        blas_axpy(l->n_weights, l->eta, l->weight_updates, 1, l->weights, 1);
        blas_scal(l->n_weights, l->momentum, l->weight_updates, 1);
        layer_weight_clamp(l);
    }
}

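/**
 * @brief Resizes a convolutional layer if the previous layer has changed size.
 * @param [in] l The layer to resize.
 * @param [in] prev The layer previous to the one being resized.
 */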
void
neural_layer_convolutional_resize(struct Layer *l, const struct Layer *prev)
{
    const int old_n_outputs = l->n_outputs;
    const int old_n_weights = l->n_weights;
    l->width = prev->out_w;
    l->height = prev->out_h;
    l->channels = prev->out_c;
    l->out_w = get_out_width(l);
    l->out_h = get_out_height(l);
    l->n_outputs = l->out_h * l->out_w * l->out_c;
    l->n_inputs = l->width * l->height * l->channels;
    l->n_weights = l->channels * l->n_filters * l->size * l->size;
    realloc_layer_arrays(l);
    for (int i = old_n_weights; i < l->n_weights; ++i) {
        l->weights[i] = rand_normal(0, WEIGHT_SD);
        l->weight_updates[i] = 0;
        l->weight_active[i] = true;
    }
    for (int i = old_n_outputs; i < l->n_outputs; ++i) {
        l->delta[i] = 0;
        l->state[i] = 0;
        l->output[i] = 0;
    }
    layer_calc_n_active(l);
}

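/**
 * @brief Returns the number of kernel filters to add or remove from a layer.
 * @param [in] l The layer to mutate.
 * @param [in] mu The rate of mutation.
 * @return The number of filters to be added or removed.
 */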
static int
neural_layer_convolutional_mutate_filter(const struct Layer *l, const double mu)
{
    int n = 0;
    if (rand_uniform(0, 0.1) < mu) { // 10x higher probability
        while (n == 0) {
            const double m = clamp(rand_normal(0, 0.5), -1, 1);
            n = (int) round(m * l->max_neuron_grow);
        }
        if (l->n_filters + n < 1) {
            n = -(l->n_filters - 1);
        } else if (l->n_filters + n > l->max_outputs) {
            n = l->max_outputs - l->n_filters;
        }
    }
    return n;
}

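/**
 * @brief Adds N filters to a layer. Negative N removes filters.
 * @param [in] l The layer to mutate.
 * @param [in] N The number of filters to add or remove.
 */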
static void
neural_layer_convolutional_add_filters(struct Layer *l, const int N)
{
    const int old_n_biases = l->n_biases;
    const int old_n_weights = l->n_weights;
    const int old_n_outputs = l->n_outputs;
    l->n_filters += N;
    l->n_biases = l->n_filters;
    l->out_c = l->n_filters;
    l->n_weights = l->channels * l->n_filters * l->size * l->size;
    l->n_outputs = l->out_h * l->out_w * l->out_c;
    realloc_layer_arrays(l);
    for (int i = old_n_weights; i < l->n_weights; ++i) {
        l->weights[i] = rand_normal(0, WEIGHT_SD);
        l->weight_active[i] = true;
        l->weight_updates[i] = 0;
    }
    for (int i = old_n_biases; i < l->n_biases; ++i) {
        l->biases[i] = 0;
        l->bias_updates[i] = 0;
    }
    for (int i = old_n_outputs; i < l->n_outputs; ++i) {
        l->output[i] = 0;
        l->state[i] = 0;
        l->delta[i] = 0;
    }
    layer_calc_n_active(l);
}

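/**
 * @brief Mutates a convolutional layer.
 * @param [in] l The layer to mutate.
 * @return Whether any alterations were made.
 */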
bool
neural_layer_convolutional_mutate(struct Layer *l)
{
    sam_adapt(l->mu, N_MU, MU_TYPE);
    bool mod = false;
    if ((l->options & LAYER_EVOLVE_ETA) && layer_mutate_eta(l, l->mu[0])) {
        mod = true;
    }
    if (l->options & LAYER_EVOLVE_NEURONS) {
        const int n = neural_layer_convolutional_mutate_filter(l, l->mu[1]);
        if (n != 0) {
            neural_layer_convolutional_add_filters(l, n);
            mod = true;
        }
    }
    if ((l->options & LAYER_EVOLVE_CONNECT) &&
        layer_mutate_connectivity(l, l->mu[2], l->mu[3])) {
        mod = true;
    }
    if ((l->options & LAYER_EVOLVE_WEIGHTS) &&
        layer_mutate_weights(l, l->mu[4])) {
        mod = true;
    }
    if ((l->options & LAYER_EVOLVE_FUNCTIONS) &&
        layer_mutate_functions(l, l->mu[5])) {
        mod = true;
    }
    return mod;
}

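/**
 * @brief Returns the output from a convolutional layer.
 * @param [in] l The layer whose output is to be returned.
 * @return The layer output.
 */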
double *
neural_layer_convolutional_output(const struct Layer *l)
{
    return l->output;
}

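/**
 * @brief Prints a convolutional layer.
 * @param [in] l The layer to print.
 * @param [in] print_weights Whether to print the weights.
 */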
void
neural_layer_convolutional_print(const struct Layer *l,
                                 const bool print_weights)
{
    char *json_str = neural_layer_convolutional_json_export(l, print_weights);
    printf("%s\n", json_str);
    free(json_str);
}

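/**
 * @brief Returns a json formatted string of a convolutional layer.
 * @param [in] l The layer to return.
 * @param [in] return_weights Whether to return the weights.
 * @return A json formatted string.
 */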
char *
neural_layer_convolutional_json_export(const struct Layer *l,
                                       const bool return_weights)
{
    cJSON *json = cJSON_CreateObject();
    cJSON_AddStringToObject(json, "type", "convolutional");
    cJSON_AddStringToObject(json, "activation",
                            neural_activation_string(l->function));
    cJSON_AddNumberToObject(json, "n_inputs", l->n_inputs);
    cJSON_AddNumberToObject(json, "n_outputs", l->n_outputs);
    cJSON_AddNumberToObject(json, "n_filters", l->n_filters);
    cJSON_AddNumberToObject(json, "size", l->size);
    cJSON_AddNumberToObject(json, "stride", l->stride);
    cJSON_AddNumberToObject(json, "pad", l->pad);
    cJSON_AddNumberToObject(json, "eta", l->eta);
    cJSON *mutation = cJSON_CreateDoubleArray(l->mu, N_MU);
    cJSON_AddItemToObject(json, "mutation", mutation);
    char *weights_str = layer_weight_json(l, return_weights);
    cJSON *weights = cJSON_Parse(weights_str);
    free(weights_str);
    cJSON_AddItemToObject(json, "weights", weights);
    char *string = cJSON_Print(json);
    cJSON_Delete(json);
    return string;
}

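/**
 * @brief Writes a convolutional layer to a file.
 * @param [in] l The layer to save.
 * @param [in] fp Pointer to the file to be written.
 * @return The number of elements written.
 */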
size_t
neural_layer_convolutional_save(const struct Layer *l, FILE *fp)
{
    size_t s = 0;
    s += fwrite(&l->options, sizeof(uint32_t), 1, fp);
    s += fwrite(&l->function, sizeof(int), 1, fp);
    s += fwrite(&l->height, sizeof(int), 1, fp);
    s += fwrite(&l->width, sizeof(int), 1, fp);
    s += fwrite(&l->channels, sizeof(int), 1, fp);
    s += fwrite(&l->n_filters, sizeof(int), 1, fp);
    s += fwrite(&l->stride, sizeof(int), 1, fp);
    s += fwrite(&l->size, sizeof(int), 1, fp);
    s += fwrite(&l->pad, sizeof(int), 1, fp);
    s += fwrite(&l->out_h, sizeof(int), 1, fp);
    s += fwrite(&l->out_w, sizeof(int), 1, fp);
    s += fwrite(&l->out_c, sizeof(int), 1, fp);
    s += fwrite(&l->n_biases, sizeof(int), 1, fp);
    s += fwrite(&l->n_outputs, sizeof(int), 1, fp);
    s += fwrite(&l->n_inputs, sizeof(int), 1, fp);
    s += fwrite(&l->max_outputs, sizeof(int), 1, fp);
    s += fwrite(&l->n_weights, sizeof(int), 1, fp);
    s += fwrite(&l->n_active, sizeof(int), 1, fp);
    s += fwrite(&l->eta, sizeof(double), 1, fp);
    s += fwrite(&l->eta_max, sizeof(double), 1, fp);
    s += fwrite(&l->eta_min, sizeof(double), 1, fp);
    s += fwrite(&l->momentum, sizeof(double), 1, fp);
    s += fwrite(&l->decay, sizeof(double), 1, fp);
    s += fwrite(&l->max_neuron_grow, sizeof(int), 1, fp);
    s += fwrite(l->weights, sizeof(double), l->n_weights, fp);
    s += fwrite(l->weight_updates, sizeof(double), l->n_weights, fp);
    s += fwrite(l->weight_active, sizeof(bool), l->n_weights, fp);
    s += fwrite(l->biases, sizeof(double), l->n_biases, fp);
    s += fwrite(l->bias_updates, sizeof(double), l->n_biases, fp);
    s += fwrite(l->mu, sizeof(double), N_MU, fp);
    return s;
}

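/**
 * @brief Reads a convolutional layer from a file.
 * @param [in] l The layer to load.
 * @param [in] fp Pointer to the file to be read.
 * @return The number of elements read.
 */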
size_t
neural_layer_convolutional_load(struct Layer *l, FILE *fp)
{
    size_t s = 0;
    s += fread(&l->options, sizeof(uint32_t), 1, fp);
    s += fread(&l->function, sizeof(int), 1, fp);
    s += fread(&l->height, sizeof(int), 1, fp);
    s += fread(&l->width, sizeof(int), 1, fp);
    s += fread(&l->channels, sizeof(int), 1, fp);
    s += fread(&l->n_filters, sizeof(int), 1, fp);
    s += fread(&l->stride, sizeof(int), 1, fp);
    s += fread(&l->size, sizeof(int), 1, fp);
    s += fread(&l->pad, sizeof(int), 1, fp);
    s += fread(&l->out_h, sizeof(int), 1, fp);
    s += fread(&l->out_w, sizeof(int), 1, fp);
    s += fread(&l->out_c, sizeof(int), 1, fp);
    s += fread(&l->n_biases, sizeof(int), 1, fp);
    s += fread(&l->n_outputs, sizeof(int), 1, fp);
    s += fread(&l->n_inputs, sizeof(int), 1, fp);
    s += fread(&l->max_outputs, sizeof(int), 1, fp);
    s += fread(&l->n_weights, sizeof(int), 1, fp);
    s += fread(&l->n_active, sizeof(int), 1, fp);
    s += fread(&l->eta, sizeof(double), 1, fp);
    s += fread(&l->eta_max, sizeof(double), 1, fp);
    s += fread(&l->eta_min, sizeof(double), 1, fp);
    s += fread(&l->momentum, sizeof(double), 1, fp);
    s += fread(&l->decay, sizeof(double), 1, fp);
    s += fread(&l->max_neuron_grow, sizeof(int), 1, fp);
    malloc_layer_arrays(l);
    s += fread(l->weights, sizeof(double), l->n_weights, fp);
    s += fread(l->weight_updates, sizeof(double), l->n_weights, fp);
    s += fread(l->weight_active, sizeof(bool), l->n_weights, fp);
    s += fread(l->biases, sizeof(double), l->n_biases, fp);
    s += fread(l->bias_updates, sizeof(double), l->n_biases, fp);
    s += fread(l->mu, sizeof(double), N_MU, fp);
    return s;
}