rll/CCL_doc/ccl__learn__alpha_8h_source.html

 /*********************************************************************

 CCL:A library for Constraint Consistent learning

 Copyright (C) 2018 Matthew Howard

 Contact:matthew.j.howard@kcl.ac.uk

 This library is free software; you can redistribute it and/or

 modify it under the terms of the GNU Lesser General Public

 License as published by the Free Software Foundation; either

 version 2.1 of the License, or (at your option) any later version.


 This library is distributed in the hope that it will be useful,

 but WITHOUT ANY WARRANTY; without even the implied warranty of

 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

 Library General Public License for more details.


 You should have received a copy of the GNU Lesser General Public

 License along with this library; if not, write to the Free

 Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

 *********************************************************************/


 #ifndef __CCL_LEARN_ALPHA_H

 #define __CCL_LEARN_ALPHA_H


 #include <ccl_math.h>

 #include <gsl/gsl_linalg.h>

 #include <gsl/gsl_blas.h>

 #include <gsl/gsl_math.h>

 #include <gsl/gsl_sf.h>

 #include <stdio.h>

 #include <string.h>

 #include <stdlib.h>

 /* Number of entries in the LEARN_A_MODEL::w pointer array. */
 #define NUM_CONSTRAINT 3

 #ifdef __cplusplus

 extern "C" {

 #endif


 /*
  * LEARN_A_MODEL: a "learn alpha" model, used by the routines that learn a
  * model of the constraint matrix A. It carries the problem dimensions, fit
  * statistics and RBF parameters.
  */
 typedef struct{

     int dim_b;   /* The number of basis functions. */

     int dim_r;   /* The dimensionality of the task space. */

     int dim_x;   /* The dimensionality of the state space. */

     int dim_u;   /* The dimensionality of the action space. */

     int dim_t;   /* Number of parameters needed to represent a unit vector. */

     int dim_k;   /* The dimensionality of the constraints. */

     int dim_n;   /* The number of data points. */

     double var;  /* The variance of the Un. */

     double nmse; /* The normalised mean square error of the model. */

     double *w[NUM_CONSTRAINT]; /* One pointer per slot, NUM_CONSTRAINT slots; presumably the learned weights per constraint - TODO confirm. */

     double * c;  /* The mean of the RBF. */

     double  s2;  /* The variance of the RBF. */

 } LEARN_A_MODEL;


 /*
  * OPTION: settings for the optimizer; passed by value to ccl_solve_lm().
  * NOTE(review): the field meanings below are inferred from the names only;
  * confirm against the solver implementation.
  */
 typedef struct{

     int MaxIter;   /* Presumably the maximum number of solver iterations - TODO confirm. */

     double Tolfun; /* Presumably the tolerance on the objective function - TODO confirm. */

     double Tolx;   /* Presumably the tolerance on the model parameters - TODO confirm. */

     double Jacob;  /* NOTE(review): Jacobian-related setting; exact meaning not visible in this header - confirm. */

 } OPTION;


 /*
  * SOLVE_LM_WS: workspace variables for solving the non-linear LM
  * optimization. Set up with ccl_solve_lm_ws_alloc() and released with
  * ccl_solve_lm_ws_free().
  */
 typedef struct{

     int      dim_x; /* The dimensionality of the state variable. */

     int      dim_u; /* The dimensionality of the action space. */

     int      dim_n; /* The number of data points. */

     int      dim_b; /* The number of basis functions. */

     int      dim_k; /* The dimensionality of the constraints. */

     double * xc;    /* A copy of the initial model parameters. */

     double * x;     /* The flattened and updated model parameters. */

     double * xf;    /* The finalised model parameters. */

     double * epsx;  /* The tolerance of the model parameters. */

     double   epsf;  /* The tolerance of the objective function. */

     double * r;     /* The returned value of the residual error. */

     double * J;     /* The Jacobian at x. */

     double   S;     /* Documented upstream as "the square root if x is taken"; NOTE(review): by analogy with Sd, presumably the squared error at x - confirm. */

     double * A;     /* The dot product of J_T and J. */

     double * v;     /* The dot product of J_T and r. */

     double * D;     /* Automatic scaling. */

     double   Rlo;   /* The lower bound of R. */

     double   Rhi;   /* The upper bound of R. */

     double   l;     /* The adaptive learning rate. */

     double   lc;    /* Handles the situation when the learning rate happens to be 0. */

     double * d;     /* The parameter improvement gradient. */

     int      iter;  /* The iteration number. */

     int      r_ok;  /* Flag: the objective function is below the tolerance. */

     int      x_ok;  /* Flag: the model parameters are below the tolerance. */

     double * xd;    /* The next x. */

     double * rd;    /* The residual error at xd. */

     double   Sd;    /* The squared error if xd is taken. */

     double   dS;    /* The denominator of the squared error if xd is taken. */

     double   R;     /* The reduction if xd is taken. */

     double   nu;    /* The coefficient for changing the learning rate. */

     double*  d_T;   /* The matrix transpose of d. */

     double*  J_T;   /* The matrix transpose of J. */

     double* tmp;    /* Temporary (scratch) variable. */

     double* rd_T;   /* The matrix transpose of rd. */

     gsl_matrix* D_pinv;     /* The pseudo-inverse of D. */

     gsl_vector* A_d;        /* The A matrix at xd. */

     gsl_matrix* A_inv;      /* The pseudo-inverse of A. */

     gsl_vector* A_inv_diag; /* The vector of diagonal elements of the A matrix. NOTE(review): the name suggests the diagonal of A_inv - confirm. */

     gsl_vector* r_T;        /* The vector transpose of r. */

 } SOLVE_LM_WS;


 /*
  * Allocates the memory for the learn_alpha model.
  * NOTE(review): the meaning of the int return value is not visible in this
  * header - confirm against the implementation.
  */
 int ccl_learn_alpha_model_alloc(LEARN_A_MODEL *model);


 /*
  * Frees the memory for the learn_alpha model.
  * NOTE(review): the meaning of the int return value is not visible in this
  * header - confirm against the implementation.
  */
 int ccl_learn_alpha_model_free(LEARN_A_MODEL *model);


 /*
  * Allocates the workspace memory for the LM solver.
  * model is read-only here (const); lm_ws is the workspace to set up.
  * NOTE(review): the meaning of the int return value is not visible in this
  * header - confirm against the implementation.
  */
 int ccl_solve_lm_ws_alloc(const LEARN_A_MODEL *model,SOLVE_LM_WS * lm_ws);


 /*
  * Frees the memory for the LM solver workspace.
  * NOTE(review): the meaning of the int return value is not visible in this
  * header - confirm against the implementation.
  */
 int ccl_solve_lm_ws_free(SOLVE_LM_WS * lm_ws);


 /*
  * Main computation routine for learning the state-dependent constraint A.
  * Un and X are read-only input arrays; dim_b, dim_r, dim_n, dim_x and dim_u
  * carry the same-named dimensions found in LEARN_A_MODEL.
  * NOTE(review): optimal is passed by value and the function returns void, so
  * writes to its scalar members are not visible to the caller; only memory
  * reachable through its pointer members can carry results back - confirm
  * this is intended.
  */
 void ccl_learn_alpha(const double * Un,const double *X,const int dim_b,const int dim_r,const int dim_n,const int dim_x,const int dim_u,LEARN_A_MODEL optimal);


 /*
  * Main computation routine for learning a model of A.
  * BX and RnUn are read-only inputs; model is passed as a non-const pointer.
  */
 void search_learn_alpha(const double *BX,const double *RnUn, LEARN_A_MODEL* model);

 /*
  * Computation routine for learning the constraint by increasing the
  * dimensionality of k.
  * model, W, BX and RnUn are read-only; fun_out is the only non-const
  * argument and presumably receives the objective values - TODO confirm.
  */
 void obj_AUn (const LEARN_A_MODEL* model, const double* W, const double* BX,const double * RnUn,double* fun_out);


 /*
  * Computation routine for generating a unit vector for the row vector alpha
  * from the given theta angles.
  * theta is read-only; alpha is the only non-const argument and presumably
  * receives the result - TODO confirm.
  */
 void ccl_get_unit_vector_from_matrix(const double *theta, int dim_n, int dim_t, double *alpha);


 /*
  * Computation routine for optimizing non-linear objective functions using
  * the LM approach.
  * model, RnUn and BX are read-only; option is passed by value; lm_ws_param
  * is the solver workspace (see ccl_solve_lm_ws_alloc()); W is a non-const
  * array, presumably the parameters being optimized - TODO confirm.
  */
 void ccl_solve_lm(const LEARN_A_MODEL* model,const  double* RnUn,const  double* BX, const OPTION option,SOLVE_LM_WS * lm_ws_param, double* W);


 /*
  * Computation routine for numerical approximation of the objective Jacobian
  * matrix.
  * All pointer inputs except J are read-only; J is the only non-const
  * argument and presumably receives the Jacobian - TODO confirm.
  */
 void findjac(const LEARN_A_MODEL* model, const int dim_x,const double* BX, const double * RnUn,const double *y,const double*x,double epsx,double* J);


 /*
  * Computation routine for the rotation matrix after finding the k-th
  * constraint vector.
  * theta, currentRn and model are read-only; Rn is the only non-const
  * argument and presumably receives the result - TODO confirm.
  */
 void ccl_get_rotation_matrix(const double*theta,const double*currentRn,const LEARN_A_MODEL* model,const int alpha_id,double*Rn);


 /*
  * Computation routine for generating the rotation matrix of a plane rotation
  * of degree theta.
  * G is the only non-const argument and presumably receives the matrix;
  * i, j and dim presumably select the rotation plane and the matrix size -
  * TODO confirm.
  */
 void ccl_make_given_matrix(const double theta,int i,int j,int dim,double*G);


 /*
  * Computation routine for prediction of the A matrix.
  * NOTE(review): no parameter is const-qualified, so the header does not show
  * which arguments are inputs and which are outputs; A presumably receives
  * the prediction - confirm.
  */
 void predict_proj_alpha(double* x, LEARN_A_MODEL* model,double* centres,double variance,double* Iu, double*A);

 #ifdef __cplusplus

 }

 #endif

 #endif


LEARN_A_MODEL::dim_t
int dim_t
Number of parameters needed to represent a unit vector.
Definition: ccl_learn_alpha.h:130

SOLVE_LM_WS::Sd
double Sd
The squared error if xd is taken.
Definition: ccl_learn_alpha.h:186

SOLVE_LM_WS::R
double R
The reduction if xd is taken.
Definition: ccl_learn_alpha.h:188

SOLVE_LM_WS::dim_k
int dim_k
The dimensionality of the constraints.
Definition: ccl_learn_alpha.h:164

SOLVE_LM_WS::D_pinv
gsl_matrix * D_pinv
The pseudo-inverse of D.
Definition: ccl_learn_alpha.h:194

predict_proj_alpha
void predict_proj_alpha(double *x, LEARN_A_MODEL *model, double *centres, double variance, double *Iu, double *A)
Computation routine for prediction of the A matrix.

ccl_get_rotation_matrix
void ccl_get_rotation_matrix(const double *theta, const double *currentRn, const LEARN_A_MODEL *model, const int alpha_id, double *Rn)
Computation routine for rotation matrix after finding the k^th constraint vector. ...

SOLVE_LM_WS::J_T
double * J_T
The matrix transpose of J.
Definition: ccl_learn_alpha.h:191

SOLVE_LM_WS::iter
int iter
The iteration number.
Definition: ccl_learn_alpha.h:181

SOLVE_LM_WS::A_inv_diag
gsl_vector * A_inv_diag
The vector of diagonal elements of A matrix.
Definition: ccl_learn_alpha.h:197

SOLVE_LM_WS::dim_n
int dim_n
The number of data points.
Definition: ccl_learn_alpha.h:162

LEARN_A_MODEL::var
double var
The variance of the Un.
Definition: ccl_learn_alpha.h:133

SOLVE_LM_WS::epsf
double epsf
The tolerance of the objective functions.
Definition: ccl_learn_alpha.h:169

SOLVE_LM_WS::A_d
gsl_vector * A_d
The A matrix at xd.
Definition: ccl_learn_alpha.h:195

SOLVE_LM_WS::xd
double * xd
The next x.
Definition: ccl_learn_alpha.h:184

SOLVE_LM_WS::x
double * x
The flattened and updated model parameters.
Definition: ccl_learn_alpha.h:166

LEARN_A_MODEL::dim_k
int dim_k
The dimensionality of the constraints.
Definition: ccl_learn_alpha.h:131

SOLVE_LM_WS::r_T
gsl_vector * r_T
The vector transpose of r.
Definition: ccl_learn_alpha.h:198

SOLVE_LM_WS::A_inv
gsl_matrix * A_inv
The pseudo-inverse of A.
Definition: ccl_learn_alpha.h:196

SOLVE_LM_WS::rd
double * rd
The residual error at xd.
Definition: ccl_learn_alpha.h:185

LEARN_A_MODEL::dim_r
int dim_r
The dimensionality of the task space.
Definition: ccl_learn_alpha.h:127

NUM_CONSTRAINT
#define NUM_CONSTRAINT
Definition: ccl_learn_alpha.h:115

SOLVE_LM_WS::l
double l
The adaptive learning rate.
Definition: ccl_learn_alpha.h:178

SOLVE_LM_WS::dim_u
int dim_u
The dimensionality of the action space.
Definition: ccl_learn_alpha.h:161

SOLVE_LM_WS::Rhi
double Rhi
The upper bound of R.
Definition: ccl_learn_alpha.h:177

ccl_solve_lm_ws_alloc
int ccl_solve_lm_ws_alloc(const LEARN_A_MODEL *model, SOLVE_LM_WS *lm_ws)
Allocates the workspace memory for the LM solver.

SOLVE_LM_WS::d
double * d
The parameter improvement gradient.
Definition: ccl_learn_alpha.h:180

SOLVE_LM_WS::D
double * D
Automatic scaling.
Definition: ccl_learn_alpha.h:175

LEARN_A_MODEL::dim_x
int dim_x
The dimensionality of the state space.
Definition: ccl_learn_alpha.h:128

ccl_solve_lm_ws_free
int ccl_solve_lm_ws_free(SOLVE_LM_WS *lm_ws)
Free the memory for the LM solver.

SOLVE_LM_WS::dS
double dS
The denominator of the squared error if xd is taken.
Definition: ccl_learn_alpha.h:187

LEARN_A_MODEL::c
double * c
The mean of the rbf.
Definition: ccl_learn_alpha.h:136

SOLVE_LM_WS::Rlo
double Rlo
The lower bound of R.
Definition: ccl_learn_alpha.h:176

SOLVE_LM_WS::d_T
double * d_T
The matrix transpose of d.
Definition: ccl_learn_alpha.h:190

SOLVE_LM_WS::dim_b
int dim_b
The number of basis functions.
Definition: ccl_learn_alpha.h:163

SOLVE_LM_WS
This structure defines the workspace variables for solving the non-linear LM optimization.
Definition: ccl_learn_alpha.h:159

search_learn_alpha
void search_learn_alpha(const double *BX, const double *RnUn, LEARN_A_MODEL *model)
Main computation routine for learning a model of A.

SOLVE_LM_WS::x_ok
int x_ok
Check if the model parameters are below the tolerance.
Definition: ccl_learn_alpha.h:183

findjac
void findjac(const LEARN_A_MODEL *model, const int dim_x, const double *BX, const double *RnUn, const double *y, const double *x, double epsx, double *J)
Computation routine for numerical approximation of the objective Jacobian matrix. ...

ccl_learn_alpha_model_free
int ccl_learn_alpha_model_free(LEARN_A_MODEL *model)
Free the memory for the learn_alpha model.

SOLVE_LM_WS::A
double * A
The dot product of J_T and J.
Definition: ccl_learn_alpha.h:173

SOLVE_LM_WS::r
double * r
The returned value of the residual error.
Definition: ccl_learn_alpha.h:170

SOLVE_LM_WS::dim_x
int dim_x
The dimensionality of the state variable.
Definition: ccl_learn_alpha.h:160

ccl_math.h
CCL header file for math.

LEARN_A_MODEL::dim_n
int dim_n
The number of data points.
Definition: ccl_learn_alpha.h:132

SOLVE_LM_WS::S
double S
The square root if x is taken.
Definition: ccl_learn_alpha.h:172

ccl_make_given_matrix
void ccl_make_given_matrix(const double theta, int i, int j, int dim, double *G)
Computation routine for generating the rotation matrix of a plane rotation of degree theta in an arbitrary...

LEARN_A_MODEL::dim_u
int dim_u
The dimensionality of the action space.
Definition: ccl_learn_alpha.h:129

LEARN_A_MODEL::nmse
double nmse
The normalised mean square error of the model.
Definition: ccl_learn_alpha.h:134

LEARN_A_MODEL::s2
double s2
The variance of the rbf.
Definition: ccl_learn_alpha.h:137

ccl_learn_alpha_model_alloc
int ccl_learn_alpha_model_alloc(LEARN_A_MODEL *model)
Allocates the memory for the learn_alpha model.

ccl_get_unit_vector_from_matrix
void ccl_get_unit_vector_from_matrix(const double *theta, int dim_n, int dim_t, double *alpha)
Computation routine for generating a unit vector for row vector alpha from the given theta angles...

obj_AUn
void obj_AUn(const LEARN_A_MODEL *model, const double *W, const double *BX, const double *RnUn, double *fun_out)
Computation routine for learning constraint by increasing the dimensionality of k.

SOLVE_LM_WS::nu
double nu
The coefficient of changing learning rate.
Definition: ccl_learn_alpha.h:189

SOLVE_LM_WS::tmp
double * tmp
The temporary variable.
Definition: ccl_learn_alpha.h:192

SOLVE_LM_WS::xc
double * xc
A copy of the initial model parameters.
Definition: ccl_learn_alpha.h:165

ccl_solve_lm
void ccl_solve_lm(const LEARN_A_MODEL *model, const double *RnUn, const double *BX, const OPTION option, SOLVE_LM_WS *lm_ws_param, double *W)
Computation routine for optimizing non-linear objective functions using LM approach.

OPTION
This structure defines the OPTION for the optimizer.
Definition: ccl_learn_alpha.h:145

SOLVE_LM_WS::J
double * J
The jacobian at x.
Definition: ccl_learn_alpha.h:171

SOLVE_LM_WS::rd_T
double * rd_T
The matrix transpose of rd.
Definition: ccl_learn_alpha.h:193

SOLVE_LM_WS::lc
double lc
Handles the situation when the learning rate happens to be 0.
Definition: ccl_learn_alpha.h:179

SOLVE_LM_WS::xf
double * xf
The finalised model parameters.
Definition: ccl_learn_alpha.h:167

ccl_learn_alpha
void ccl_learn_alpha(const double *Un, const double *X, const int dim_b, const int dim_r, const int dim_n, const int dim_x, const int dim_u, LEARN_A_MODEL optimal)
Main computation routine for learning state dependent constraint A.

LEARN_A_MODEL
This structure describes a "LEARN_A_MODEL" (a learn alpha model). This structure contains the dimen...
Definition: ccl_learn_alpha.h:125

SOLVE_LM_WS::v
double * v
The dot product of J_T and r.
Definition: ccl_learn_alpha.h:174

SOLVE_LM_WS::r_ok
int r_ok
Check if the objective function is below the tolerance.
Definition: ccl_learn_alpha.h:182

LEARN_A_MODEL::dim_b
int dim_b
The number of basis functions.
Definition: ccl_learn_alpha.h:126

SOLVE_LM_WS::epsx
double * epsx
The tolerance of the model parameters.
Definition: ccl_learn_alpha.h:168