xcsf/env__mux_8c_source.html

 /*

  * This program is free software: you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation, either version 3 of the License, or

  * (at your option) any later version.

  *

  * This program is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  * GNU General Public License for more details.

  *

  * You should have received a copy of the GNU General Public License

  * along with this program.  If not, see <http://www.gnu.org/licenses/>.

  */


 #include "env_mux.h"
 #include "param.h"
 #include "utils.h"
 #include <stdio.h>
 #include <stdlib.h>


 /** Payoff provided for making a correct classification. */
 #define MAX_PAYOFF (1.)


 /**
  * @brief Initialises a real multiplexer environment of specified length.
  *
  * Chooses the largest number of address (position) bits k such that
  * k + 2^k <= bits, allocates a state vector of k + 2^k doubles, stores the
  * environment in xcsf->env and calls param_init() with that input size,
  * one output and two actions. If bits is smaller than 3 the result is the
  * degenerate case k = 0 with a single input.
  *
  * Terminates the program with EXIT_FAILURE if memory cannot be allocated.
  *
  * @param [in,out] xcsf The XCSF data structure receiving the environment.
  * @param [in] bits The maximum problem length requested.
  */
 void
 env_mux_init(struct XCSF *xcsf, const int bits)
 {
     struct EnvMux *env = malloc(sizeof *env);
     if (env == NULL) {
         fprintf(stderr, "env_mux_init(): out of memory\n");
         exit(EXIT_FAILURE);
     }
     /* Largest k with k + 2^k <= bits. The power is computed in 64-bit
      * integer arithmetic: k + 1 never exceeds 31 for any int bits, so the
      * shift cannot overflow and no floating-point rounding is involved. */
     int pos_bits = 0;
     while ((pos_bits + 1) + (1LL << (pos_bits + 1)) <= bits) {
         ++pos_bits;
     }
     env->pos_bits = pos_bits;
     /* pos_bits <= 30 here, so the total length fits in an int. */
     const int n = pos_bits + (int) (1LL << pos_bits);
     env->state = malloc(sizeof *env->state * (size_t) n);
     if (env->state == NULL) {
         free(env);
         fprintf(stderr, "env_mux_init(): out of memory\n");
         exit(EXIT_FAILURE);
     }
     xcsf->env = env;
     param_init(xcsf, n, 1, 2);
 }


 /**
  * @brief Frees the multiplexer environment.
  *
  * Releases the state vector first and then the environment structure that
  * xcsf->env points to. The pointer stored in xcsf is left unchanged.
  *
  * @param [in] xcsf The XCSF data structure owning the environment.
  */
 void
 env_mux_free(const struct XCSF *xcsf)
 {
     struct EnvMux *mux = xcsf->env;
     double *inputs = mux->state;
     free(inputs);
     free(mux);
 }


 /**
  * @brief Returns a random multiplexer problem instance.
  *
  * Overwrites the first xcsf->x_dim entries of the environment's state
  * vector with values drawn from rand_uniform(0, 1).
  *
  * @param [in] xcsf The XCSF data structure.
  * @return Pointer to the environment's internal state vector.
  */
 const double *
 env_mux_get_state(const struct XCSF *xcsf)
 {
     const struct EnvMux *mux = xcsf->env;
     double *const inputs = mux->state;
     int idx = 0;
     while (idx < xcsf->x_dim) {
         inputs[idx] = rand_uniform(0, 1);
         ++idx;
     }
     return inputs;
 }


 /**
  * @brief Returns the reward for executing a multiplexer action.
  *
  * The first pos_bits state values are thresholded at 0.5 and read as a
  * binary address, most significant bit first. The addressed value among
  * the inputs that follow the address bits, again thresholded at 0.5, is
  * the correct answer.
  *
  * @param [in] xcsf The XCSF data structure.
  * @param [in] action The selected action.
  * @return MAX_PAYOFF if action equals the correct answer, otherwise 0.
  */
 double
 env_mux_execute(const struct XCSF *xcsf, const int action)
 {
     const struct EnvMux *mux = xcsf->env;
     const int n_addr = mux->pos_bits;
     /* Decode the address by shifting in one thresholded bit at a time. */
     int offset = 0;
     for (int bit = 0; bit < n_addr; ++bit) {
         offset *= 2;
         if (mux->state[bit] > 0.5) {
             offset += 1;
         }
     }
     /* Data inputs start right after the address bits. */
     const int selected = (mux->state[n_addr + offset] > 0.5) ? 1 : 0;
     if (action == selected) {
         return MAX_PAYOFF;
     }
     return 0;
 }


 /**
  * @brief Dummy method since no multiplexer reset is necessary.
  *
  * @param [in] xcsf The XCSF data structure (unused).
  */
 void
 env_mux_reset(const struct XCSF *xcsf)
 {
     (void) xcsf; /* intentionally unused */
 }


 /**
  * @brief Returns whether the multiplexer is in a terminal state.
  *
  * @param [in] xcsf The XCSF data structure (unused).
  * @return Always true.
  */
 bool
 env_mux_is_done(const struct XCSF *xcsf)
 {
     (void) xcsf; /* intentionally unused */
     return true;
 }


 /**
  * @brief Returns the maximum payoff value possible in the multiplexer.
  *
  * @param [in] xcsf The XCSF data structure (unused).
  * @return The value of MAX_PAYOFF.
  */
 double
 env_mux_maxpayoff(const struct XCSF *xcsf)
 {
     (void) xcsf; /* intentionally unused */
     return MAX_PAYOFF;
 }


 /**
  * @brief Returns whether the multiplexer is a multistep problem.
  *
  * @param [in] xcsf The XCSF data structure (unused).
  * @return Always false.
  */
 bool
 env_mux_multistep(const struct XCSF *xcsf)
 {
     (void) xcsf; /* intentionally unused */
     return false;
 }

env_mux_free
void env_mux_free(const struct XCSF *xcsf)
Frees the multiplexer environment.
Definition: env_mux.c:63

env_mux_get_state
const double * env_mux_get_state(const struct XCSF *xcsf)
Returns a random multiplexer problem instance.
Definition: env_mux.c:76

env_mux_execute
double env_mux_execute(const struct XCSF *xcsf, const int action)
Returns the reward for executing a multiplexer action.
Definition: env_mux.c:92

env_mux_reset
void env_mux_reset(const struct XCSF *xcsf)
Dummy method since no multiplexer reset is necessary.
Definition: env_mux.c:110

env_mux_is_done
bool env_mux_is_done(const struct XCSF *xcsf)
Returns whether the multiplexer is in a terminal state.
Definition: env_mux.c:121

env_mux_multistep
bool env_mux_multistep(const struct XCSF *xcsf)
Returns whether the multiplexer is a multistep problem.
Definition: env_mux.c:145

env_mux_maxpayoff
double env_mux_maxpayoff(const struct XCSF *xcsf)
Returns the maximum payoff value possible in the multiplexer.
Definition: env_mux.c:133

MAX_PAYOFF
#define MAX_PAYOFF
Payoff provided for making a correct classification.
Definition: env_mux.c:35

env_mux_init
void env_mux_init(struct XCSF *xcsf, const int bits)
Initialises a real multiplexer environment of specified length.
Definition: env_mux.c:44

env_mux.h
The real multiplexer problem environment.

xcsf
Definition: __init__.py:1

param_init
void param_init(struct XCSF *xcsf, const int x_dim, const int y_dim, const int n_actions)
Initialises default XCSF parameters.
Definition: param.c:45

param.h
Functions for setting and printing parameters.

EnvMux
Real multiplexer environment data structure.
Definition: env_mux.h:32

EnvMux::pos_bits
int pos_bits
Number of position bits.
Definition: env_mux.h:34

EnvMux::state
double * state
Current state.
Definition: env_mux.h:33

XCSF
XCSF data structure.
Definition: xcsf.h:85

rand_uniform
double rand_uniform(const double min, const double max)
Returns a uniform random float [min,max].
Definition: utils.c:62

utils.h
Utility functions for random number handling, etc.