Source code for autompc.sysid.model

# Created by William Edwards (wre2@illinois.edu)

import numpy as np

from abc import ABC, abstractmethod
from pdb import set_trace

[docs]class ModelFactory(ABC):
    """
    The ModelFactory creates and trains a System ID model and provides
    information about the model hyperparameters.
    """
    def __init__(self, system, **kwargs):
        """
        Parameters
        ----------
            system : System
                System for which system ID model will be produced.
        """
        self.system = system
        self.kwargs = kwargs

    def __call__(self, cfg, train_trajs, silent=False, skip_train_model=False):
        """
        Returns a model trained for the given 
        system and configuration.

        Parameters
        ----------
            cfg : Configuration
                Configuration of model hyperparameters
            train_trajs : List of Trajectory objects
                Model training data set
            silent : bool
                Whether to produce output during training
            skip_train_model : bool
                Skip model training when True.
        """
        model_args = cfg.get_dictionary()
        model_args.update(self.kwargs)
        model = self.Model(self.system, **model_args)
        model.factory = self
        if not skip_train_model:
            model.train(train_trajs, silent=silent)

        return model

[docs]    @abstractmethod
    def get_configuration_space(self):
        """
        Returns the model configuration space.
        """
        raise NotImplementedError

[docs]class Model(ABC):
    def __init__(self, system):
        self.system = system

[docs]    @abstractmethod
    def traj_to_state(self, traj):
        """
        Parameters
        ----------
            traj : Trajectory
                State and control history up to present time
        Returns
        -------
            state : numpy array of size self.state_dim
               Corresponding model state
        """
        raise NotImplementedError

[docs]    @abstractmethod
    def update_state(self, state, new_ctrl, new_obs):
        """
        Parameters
        ----------
            state : numpy array of size self.state_dim
                Current model state
            new_ctrl : numpy array of size self.system.ctrl_dim
                New control input
            new_obs : numpy array of size self.system.obs_dim
                New observation
        Returns
        -------
            state : numpy array of size self.state_dim
                Model state after observation and control
        """
        raise NotImplementedError

[docs]    @abstractmethod
    def pred(self, state, ctrl):
        """
        Run model prediction.

        Parameters
        ----------
            state : Numpy array of size self.state_dim
                Model state at time t
            ctrl : Numpy array of size self.system.ctrl_dim
                Control applied at time t
        Returns
        -------
            state : Numpy array of size self.state_dim
                Predicted model state at time t+1
        """
        raise NotImplementedError

[docs]    def pred_batch(self, states, ctrls):
        """
        Run batch model predictions.  Depending on the model, this can
        be much faster than repeatedly calling pred.

        Parameters
        ----------
            state : Numpy array of size (N, self.state_dim)
                N model input states
            ctrl : Numpy array of size (N, self.system.ctrl_dim)
                N controls
        Returns
        -------
            state : Numpy array of size (N, self.state_dim)
                N predicted states
        """
        n = self.state_dim
        m = states.shape[0]
        out = np.empty((m, n))
        for i in range(m):
            out[i,:] = self.pred(states[i,:], ctrls[i,:])
        return out

[docs]    def pred_diff(self, state, ctrl):
        """
        Run model prediction and compute gradients.

        Parameters
        ----------
            state : Numpy array of size self.state_dim
                Model state at time t
            ctrl : Numpy array of size self.system.ctrl_dim
                Control at time t
        Returns
        -------
            state : Numpy array of size self.state_dim
                Predicted model state at time t+1
            state_jac : Numpy  array of shape (self.state_dim, 
                        self.state_dim)
                Gradient of predicted model state wrt to state
            ctrl_jac : Numpy  array of shape (self.state_dim, 
                       self.ctrl_dim)
                Gradient of predicted model state wrt to ctrl
        """
        raise NotImplementedError

[docs]    def pred_diff_batch(self, states, ctrls):
        """
        Run model prediction and compute gradients in batch.

        Parameters
        ----------
            state : Numpy array of shape (N, self.state_dim)
                N input model states
            ctrl : Numpy array of size (N, self.system.ctrl_dim)
                N input controls
        Returns
        -------
            state : Numpy array of size (N, self.state_dim)
                N predicted model states
            state_jac : Numpy  array of shape (N, self.state_dim, 
                        self.state_dim)
                Gradient of predicted model states wrt to state
            ctrl_jac : Numpy  array of shape (N, self.state_dim, 
                       self.ctrl_dim)
                Gradient of predicted model states wrt to ctrl
        """
        n = self.state_dim
        m = states.shape[0]
        out = np.empty((m, n))
        state_jacs = np.empty((m, n, n))
        ctrl_jacs = np.empty((m, n, self.system.ctrl_dim))
        for i in range(m):
            out[i,:], state_jacs[i,:,:], ctrl_jacs[i,:,:] = \
                self.pred_diff(states[i,:], ctrls[i,:])
        return out, state_jacs, ctrl_jacs


[docs]    def to_linear(self):
        """
        Returns: (A, B, state_func, cost_func)
            A, B -- Linear system matrices as Numpy arrays.
        Only implemented for linear models.
        """
        raise NotImplementedError

[docs]    def train(self, trajs, silent=False):
        """
        Parameters
        ----------
            trajs : List of pairs (xs, us)
                Training set of trajectories
            silent : bool
                Silence progress bar output
        Only implemented for trainable models.
        """
        raise NotImplementedError

[docs]    def get_parameters(self):
        """
        Returns a dict containing trained model parameters.

        Only implemented for trainable models.
        """
        raise NotImplementedError

[docs]    def set_parameters(self, params):
        """
        Sets trainable model parameters from dict.

        Only implemented for trainable parameters.
        """
        raise NotImplementedError

    @property
    @abstractmethod
    def state_dim(self):
        """
        Returns the size of the model state
        """
        raise NotImplementedError


    @property
    def is_linear(self):
        """
        Returns true for linear models
        """
        return not self.to_linear.__func__ is Model.to_linear

    @property
    def is_diff(self):
        """
        Returns true for differentiable models.
        """
        return not self.pred_diff.__func__ is Model.pred_diff
Source code for autompc.sysid.model

AutoMPC

Navigation

Related Topics