LuziaKn · LuziaKn · commit e9a74615365f · 2020-01-18T13:30:06.000+01:00
changing back to original disturbance
diff --git a/GP.m b/GP.m
@@ -503,6 +503,104 @@ function plot2d(obj, truthfun, varargin)
             colormap(gcf,parula);
         end
         
+         function plotNd(obj, truthfun, varargin)
+        %------------------------------------------------------------------
+        % Make analysis of the GP quality (only for the first output dimension).
+        % This function can only be called when the GP input is 2D (obj.n==2).
+        %
+        % args:
+        %   truthfun: anonymous function @(x) which returns the true function
+        %   varargin{1} = rangeX1:  (optional, both ranges must be given together)
+        %   varargin{2} = rangeX2:  <1,2> range of X1 and X2 where the data
+        %                           will be evaluated and plotted
+        %------------------------------------------------------------------
+            % output dimension to be analyzed
+            outdim = 1;     % not called 'pi', so the builtin constant is not shadowed
+
+            assert(obj.N>0, 'Dataset is empty. Aborting...')
+            % we can not plot more than in 3D
+            assert(obj.n==2, 'This function can only be used when dim(X)=2. Aborting...');
+
+            % Evaluation range: user supplied, or the data range widened by 30% per side
+            if numel(varargin) ~= 2
+                factor = 0.3;
+                rangeX1 = [ min(obj.X(1,:)) - factor*range(obj.X(1,:)), ...
+                            max(obj.X(1,:)) + factor*range(obj.X(1,:))  ];
+                rangeX2 = [ min(obj.X(2,:)) - factor*range(obj.X(2,:)), ...
+                            max(obj.X(2,:)) + factor*range(obj.X(2,:))  ];
+            else
+                rangeX1 = varargin{1};
+                rangeX2 = varargin{2};
+            end
+
+            % generate grid (100x100 points) and preallocate the result arrays
+            [X1,X2] = meshgrid(linspace(rangeX1(1),rangeX1(2),100),...
+                               linspace(rangeX2(1),rangeX2(2),100));
+            Ytrue = zeros(size(X1),'like',X1);  % zeros('like',X1) alone is a scalar
+            Ystd  = zeros(size(X1),'like',X1);
+            Ymean = zeros(size(X1),'like',X1);
+            for i=1:size(X1,1)
+                for j=1:size(X1,2)
+                    % evaluate true function
+                    mutrue = truthfun([X1(i,j);X2(i,j)]);
+                    Ytrue(i,j) = mutrue(outdim); % select desired output dim
+                    % evaluate GP model (sigma2 instead of 'var': do not shadow builtin)
+                    [mu,sigma2] = obj.eval([X1(i,j);X2(i,j)],true);
+                    if sigma2 < 0
+                        error('GP obtained a negative variance... aborting');
+                    end
+                    Ystd(i,j)  = sqrt(sigma2);
+                    Ymean(i,j) = mu(:,outdim);    % select desired output dim
+                end
+            end
+
+            % plot data points, and +-2*stddev surfaces (colored by the stddev)
+            figure('Color','w')
+            hold on; grid on;
+            % surf(X1,X2,Y, 'FaceAlpha',0.3)
+            surf(X1,X2,Ymean+2*Ystd ,Ystd, 'FaceAlpha',0.3)
+            surf(X1,X2,Ymean-2*Ystd,Ystd, 'FaceAlpha',0.3)
+            scatter3(obj.X(1,:),obj.X(2,:),obj.Y(:,outdim),'filled','MarkerFaceColor','red')
+            title('mean\pm2*stddev Prediction Curves')
+            shading interp;
+            colormap(gcf,jet);
+            view(30,30)
+
+            % Comparison between true and prediction mean
+            figure('Color','w')
+            subplot(1,2,1); hold on; grid on;
+            surf(X1,X2,Ytrue, 'FaceAlpha',.8, 'EdgeColor', 'none', 'DisplayName', 'True function');
+            % surf(X1,X2,Ymean, 'FaceAlpha',.5, 'FaceColor','g', 'EdgeColor', 'none', 'DisplayName', 'Prediction mean');
+            scatter3(obj.X(1,:),obj.X(2,:),obj.Y(:,outdim),'filled','MarkerFaceColor','red', 'DisplayName', 'Sample points')
+            zlim([ min(obj.Y(:,outdim))-range(obj.Y(:,outdim)),max(obj.Y(:,outdim))+range(obj.Y(:,outdim)) ]);
+            legend;
+            xlabel('X1'); ylabel('X2');
+            title('True Function')
+            view(24,12)
+            subplot(1,2,2); hold on; grid on;
+            % surf(X1,X2,Y, 'FaceAlpha',.5, 'FaceColor','b', 'EdgeColor', 'none', 'DisplayName', 'True function');
+            surf(X1,X2,Ymean, 'FaceAlpha',.8, 'EdgeColor', 'none', 'DisplayName', 'Prediction mean');
+            scatter3(obj.X(1,:),obj.X(2,:),obj.Y(:,outdim),'filled','MarkerFaceColor','red', 'DisplayName', 'Sample points')
+            zlim([ min(obj.Y(:,outdim))-range(obj.Y(:,outdim)),max(obj.Y(:,outdim))+range(obj.Y(:,outdim)) ]);
+            legend;
+            xlabel('X1'); ylabel('X2');
+            title('Prediction Mean')
+            view(24,12)
+
+            % plot bias and variance as filled contours, sample points on top
+            figure('Color','w')
+            subplot(1,2,1); hold on; grid on;
+            contourf(X1,X2, abs(Ymean-Ytrue), 50,'LineColor','none')
+            title('Absolute Prediction Bias')
+            colorbar;
+            scatter(obj.X(1,:),obj.X(2,:),'filled','MarkerFaceColor','red')
+            subplot(1,2,2); hold on; grid on;
+            contourf(X1,X2, Ystd.^2, 50 ,'LineColor','none')
+            title('Prediction Variance')
+            colorbar;
+            scatter(obj.X(1,:),obj.X(2,:),'filled','MarkerFaceColor','red')
+            colormap(gcf,parula);
+         end
         
         function plot1d(obj, truthfun, varargin)
         %------------------------------------------------------------------
diff --git a/MotionModelGP_InvPendulum_deffect.m b/MotionModelGP_InvPendulum_deffect.m
@@ -43,7 +43,7 @@
             xdot = f @ MotionModelGP_InvPendulum_nominal(obj,x,u);
             
             % add deffect
-            %xdot(3) = xdot(3) + (0.1 * x(3) - 0.01*x(4) + deg2rad(3)) *10;
+            xdot(3) = xdot(3) + (0.1 * x(3) - 0.01*x(4) + deg2rad(3)) *10;
             
             % xdot(2) = xdot(2) + ( -0.1 * x(1) + deg2rad(3));
         end
diff --git a/MotionModelGP_InvPendulum_nominal.asv b/MotionModelGP_InvPendulum_nominal.asv
@@ -0,0 +1,173 @@
+%------------------------------------------------------------------
+% Programmed by: 
+%   - Lucas Rath (lucasrm25@gmail.com)
+%   - 
+%   -
+%------------------------------------------------------------------
+
+
+classdef MotionModelGP_InvPendulum_nominal < MotionModelGP
+%--------------------------------------------------------------------------
+%   xk+1 = fd(xk,uk) + Bd * ( d(zk) + w ),
+%
+%       where: zk = [Bz_x*xk ; Bz_u*uk],
+%              d ~ N(mean_d(zk),var_d(zk))
+%              w ~ N(0,sigmaw)
+%
+%
+%   x = [s, ds, th, dth]'   carriage position and pole angle (and derivatives)
+%   u = [F]'                force on the carriage (pole joint torque T is fixed to 0)
+%
+%--------------------------------------------------------------------------
+
+    properties
+        Mc      % mass of the carriage
+        Mp      % mass of the pole
+        b       % friction coefficient between the carriage and the floor
+        I       % inertia matrix of the pole CG
+        l       % pole length
+        g = 9.8 % gravitational acceleration (presumably in m/s^2)
+    end
+
+    properties(Constant)
+        % keep in mind the dimensions:  xk+1 = fd(xk,uk) + Bd*(d(z)+w)),
+        % where z = [Bz_x*x;Bz_u*u] and x = [s, ds, th, dth]'
+
+        Bz_x = [0 0 1 0
+                0 0 0 1]
+        Bz_u = [];
+        Bd = [0;            % xk+1 = fd(xk,uk) + Bd*d(zk)
+              0;
+              1;
+              0]
+        % NOTE: defaults below must reference other constants via the class name
+        n  = 4   % number of outputs x(t)
+        m  = 1   % number of inputs u(t)
+        nz = size(MotionModelGP_InvPendulum_nominal.Bz_x,1)  % dimension of z(t)
+        nd = size(MotionModelGP_InvPendulum_nominal.Bd,2)    % output dimension of d(z)
+    end
+
+
+    methods
+
+        function obj = MotionModelGP_InvPendulum_nominal (Mc, Mp, b, I, l, d, sigmaw)
+        %------------------------------------------------------------------
+        %   object constructor: d and sigmaw are forwarded to MotionModelGP
+        %------------------------------------------------------------------
+            % call superclass constructor
+            obj = obj @ MotionModelGP(d,sigmaw);
+            % store parameters
+            obj.Mc = Mc;
+            obj.Mp = Mp;
+            obj.b = b;
+            obj.I = I;
+            obj.l = l;
+
+            % add folder CODEGEN to path. Here there will be some functions
+            % generated with the method generate_invertedPendulum_functions()
+            addpath(fullfile(pwd,'CODEGEN'))
+        end
+
+        function xdot = f (obj, x, u)
+        %------------------------------------------------------------------
+        %   Continuous time dynamics.
+        %   out:
+        %       xdot: <n,1> time derivative of x given x and u
+        %------------------------------------------------------------------
+            params = [obj.Mc obj.Mp obj.I obj.g obj.l obj.b]';
+            xdot = invertedPendulum_f(x, u, params );
+        end
+
+        function gradx = gradx_f(obj, x, u)
+        %------------------------------------------------------------------
+        %   Gradient of the continuous time dynamics w.r.t. the state x.
+        %   out:
+        %       gradx: <n,n> gradient of xdot w.r.t. x
+        %------------------------------------------------------------------
+            params = [obj.Mc obj.Mp obj.I obj.g obj.l obj.b]';
+            gradx = invertedPendulum_gradx_f(x, u, params );
+        end
+
+        function gradu = gradu_f(obj, x, u)
+        %------------------------------------------------------------------
+        %   Gradient of the continuous time dynamics w.r.t. the input u.
+        %   out:
+        %       gradu: <m,n> gradient of xdot w.r.t. u
+        %------------------------------------------------------------------
+            params = [obj.Mc obj.Mp obj.I obj.g obj.l obj.b]';
+            gradu = invertedPendulum_gradu_f(x, u, params );
+        end
+
+        function [A,B] = linearize (obj)
+        %------------------------------------------------------------------
+        % Return continuous time linearized model parameters A,B
+        %       xdot = A*x + B*u
+        %------------------------------------------------------------------
+            Mc=obj.Mc; Mp=obj.Mp; b=obj.b; I=obj.I; l=obj.l; g=obj.g;
+            p = I*(Mc+Mp)+Mc*Mp*l^2;
+            A = [0      1              0           0;
+                 0 -(I+Mp*l^2)*b/p  (Mp^2*g*l^2)/p   0;
+                 0      0              0           1;
+                 0 -(Mp*l*b)/p       Mp*g*l*(Mc+Mp)/p  0];
+            B = [     0;
+                 (I+Mp*l^2)/p;
+                      0;
+                    Mp*l/p];
+        end
+    end
+
+    methods(Static)
+        function generate_invertedPendulum_functions()
+        %------------------------------------------------------------------
+        %   Generate continuous time dynamics equations of the inverted
+        %   pendulum. This function generates three functions:
+        %       xdot = f(x,u)       - dynamics
+        %       gradx_xdot(x,u)     - gradient of xdot w.r.t. x
+        %       gradu_xdot(x,u)     - gradient of xdot w.r.t. u
+        %
+        %   (Mc+Mp)*dds + b*ds + Mp*l/2*ddth*cos(th) - Mp*l/2*dth^2*sin(th) = F
+        %   (I+Mp*(l/2)^2)*ddth + Mp*g*l/2*sin(th) + Mp*l*dds*cos(th) = T
+        %
+        %   x = [s, ds, th, dth]'
+        %   u = [F]'
+        %
+        %
+        %   Example how to run this function (static, no object is required):
+        %       MotionModelGP_InvPendulum_nominal.generate_invertedPendulum_functions();
+        %
+        %------------------------------------------------------------------
+            syms g Mc Mp b I l F T s ds dds  th dth ddth real
+            T = 0;  % we are not using this input for now
+            fzero = [(Mc+Mp)*dds + b*ds + Mp*l/2*ddth*cos(th) - Mp*l/2*dth^2*sin(th) - F ;
+                   (I+Mp*(l/2)^2)*ddth + Mp*g*l/2*sin(th) + Mp*l*dds*cos(th) - T  ];
+            sol = solve(fzero,[dds,ddth]);
+            dds = simplify(sol.dds);
+            ddth = simplify(sol.ddth);
+
+            u = F;
+            x = [s, ds, th, dth]';
+            xdot = [ds, dds, dth, ddth]';
+            params = [Mc Mp I g l b ]';
+
+            % make sure the output folder exists and is on the MATLAB path
+            folder = fullfile(pwd,'CODEGEN');
+            if ~exist(folder,'dir')
+                mkdir(folder);
+            end
+            addpath(folder)
+
+            % export the dynamics and both gradients into the folder created above
+            matlabFunction( xdot, 'Vars', {x;u;params} ,'File', fullfile(folder,'invertedPendulum_f') );
+
+            gradx_f = simplify(jacobian(xdot,x)');
+            matlabFunction( gradx_f, 'Vars', {x;u;params} ,'File', fullfile(folder,'invertedPendulum_gradx_f') );
+
+            gradu_f = simplify(jacobian(xdot,u)');
+            matlabFunction( gradu_f, 'Vars', {x;u;params} ,'File', fullfile(folder,'invertedPendulum_gradu_f') );
+
+            disp('FINISHED! functions invertedPendulum_f, invertedPendulum_gradx_f and invertedPendulum_gradu_f generated!!')
+
+        end
+    end
+
+end
diff --git a/MotionModelGP_InvPendulum_nominal.m b/MotionModelGP_InvPendulum_nominal.m
@@ -33,18 +33,18 @@
         % keep in mind the dimensions:  xk+1 = fd(xk,uk) + Bd*(d(z)+w)),
         % where z = [Bz_x*x;Bz_u*u] and x = [s, ds, th, dth]' 
         
-        Bz_x = [0 1 0 0
+        Bz_x = [0 0 1 0
                 0 0 0 1] 
         Bz_u = []; 
-        Bd = [0 0 ;            % xk+1 = fd(xk,uk) + Bd*d(zk)
-              1 0;
-              0 0;
-              0 1]
+        Bd = [0;            % xk+1 = fd(xk,uk) + Bd*d(zk)
+              0;
+              1;
+              0]
             
         n  = 4   % number of outputs x(t)
         m  = 1   % number of inputs u(t)
-        nz = 2   % dimension of z(t)
-        nd = 2   % output dimension of d(z)
+        nz = 2 % dimension of z(t)
+        nd = 1   % output dimension of d(z)
     end
     
     
diff --git a/main_invertedPendulum.asv b/main_invertedPendulum.asv
@@ -24,12 +24,12 @@ maxiter = 15;   % max NMPC iterations per time step
 N = 10;         % NMPC prediction horizon
 
 
-loadPreTrainedGP = false;
+loadPreTrainedGP = true;
 GPfile = fullfile(pwd,'/simresults/20-01-17-out-GP-inverted-pendulum.mat');
-useGP = false;
+useGP = true;
 trainGPonline = true;
 useParallel = false;
-optimizeHyperparameters = true;
+optimizeHyperparameters = false;
 
 
 lookahead = dt*N;
@@ -58,10 +58,10 @@ clearvars d_GP
 %------------------------------------------------------------------
 
 % define noise for true disturbance
-var_w = diag([0,0]);
+var_w = diag([0 0 0 0]);
 
 % create true dynamics model
-trueModel = MotionModelGP_InvPendulum_deffect(Mc*0.9, Mp, b*5 , I*0.5, l*0.5, [], var_w);
+trueModel = MotionModelGP_InvPendulum_deffect(Mc, Mp, b , I, l*2, [], var_w);
 
 %% Create Estimation Model and Nominal Model
 
@@ -72,7 +72,7 @@ trueModel = MotionModelGP_InvPendulum_deffect(Mc*0.9, Mp, b*5 , I*0.5, l*0.5, []
 
 % create nominal dynamics model (no disturbance)
 nomModel = MotionModelGP_InvPendulum_nominal(Mc, Mp, b, I, l, [], []); 
-nomModel = trueModel;
+%nomModel = trueModel;
 
 % -------------------------------------------------------------------------
 %  Create adaptive dynamics model 
@@ -86,9 +86,9 @@ gp_n = MotionModelGP_InvPendulum_nominal.nz;
 gp_p = MotionModelGP_InvPendulum_nominal.nd;
 
 % GP hyperparameters
-var_f   = [0.01,0.01]';                     % output variance
-M       = repmat(diag([1e0,1e0].^2),[1,1,gp_p]);     % length scale
-var_n   = [1e-8,1e-8]';                   % measurement noise variance
+var_f   = repmat(0.01,[gp_p,1]);                     % output variance
+M       = repmat(diag(repmat(1e0,[1,gp_n]).^2),[1,1,gp_p]);     % length scale
+var_n   = repmat(1e-8,[gp_p,1]);                   % measurement noise variance
 maxsize = 100;                      % maximum number of points in the dictionary
 
 % create GP object
@@ -100,7 +100,7 @@ end
 
 % create estimation dynamics model (disturbance is the Gaussian Process GP)
 estModel = MotionModelGP_InvPendulum_nominal(Mc, Mp, b, I, l, @d_GP.eval, var_w);
-% estModel = trueModel;
+%estModel = trueModel;
 
 
 %% Controller
@@ -258,7 +258,7 @@ d_GP.M = M
 d_GP.var_f = var_f;
 d_GP.var_n = var_n;
 
-% d_GP.optimizeHyperParams('ga');
+%d_GP.optimizeHyperParams('ga');
 d_GP.optimizeHyperParams('fmincon');
 
 d_GP.M
diff --git a/main_invertedPendulum.m b/main_invertedPendulum.m