PythonLinearNonlinearControl/PythonLinearNonlinearControl/envs/cost.py

from logging import getLogger

import numpy as np

logger = getLogger(__name__)


def calc_cost(pred_xs, input_sample, g_xs,
              state_cost_fn, input_cost_fn, terminal_state_cost_fn):
    """ calculate the cost

    Args:
        pred_xs (numpy.ndarray): predicted state trajectory,
            shape(pop_size, pred_len+1, state_size)
        input_sample (numpy.ndarray): inputs samples trajectory,
            shape(pop_size, pred_len+1, input_size)
        g_xs (numpy.ndarray): goal state trajectory,
            shape(pop_size, pred_len+1, state_size)
        state_cost_fn (function): state cost fucntion
        input_cost_fn (function): input cost fucntion
        terminal_state_cost_fn (function): terminal state cost fucntion
    Returns:
        cost (numpy.ndarray): cost of the input sample, shape(pop_size, )
    """
    # state cost
    state_cost = 0.
    if state_cost_fn is not None:
        state_pred_par_cost = state_cost_fn(
            pred_xs[:, 1:-1, :], g_xs[:, 1:-1, :])
        state_cost = np.sum(np.sum(state_pred_par_cost, axis=-1), axis=-1)

    # terminal cost
    terminal_state_cost = 0.
    if terminal_state_cost_fn is not None:
        terminal_state_par_cost = terminal_state_cost_fn(pred_xs[:, -1, :],
                                                         g_xs[:, -1, :])
        terminal_state_cost = np.sum(terminal_state_par_cost, axis=-1)

    # act cost
    act_cost = 0.
    if input_cost_fn is not None:
        act_pred_par_cost = input_cost_fn(input_sample)
        act_cost = np.sum(np.sum(act_pred_par_cost, axis=-1), axis=-1)

    return state_cost + terminal_state_cost + act_cost