Zhang, Yuan; Hoffman, Jasper; Boedecker, Joschka
UDUC: An Uncertainty-driven Approach for Learning-based Robust Control Working paper
title = {UDUC: An Uncertainty-driven Approach for Learning-based Robust Control},
author = {Yuan Zhang and Jasper Hoffman and Joschka Boedecker},
url = {https://arxiv.org/abs/2405.02598},
year = {2024},
date = {2024-05-09},
urldate = {2024-05-09},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
Wang, Jianhong; Li, Yang; Zhang, Yuan; Pan, Wei; Kaski, Samuel
Open Ad Hoc Teamwork with Cooperative Game Theory Conference
Forty-first International Conference on Machine Learning, 2024.
title = {Open Ad Hoc Teamwork with Cooperative Game Theory},
author = {Jianhong Wang and Yang Li and Yuan Zhang and Wei Pan and Samuel Kaski},
url = {},
year = {2024},
date = {2024-05-09},
booktitle = {Forty-first International Conference on Machine Learning},
keywords = {},
pubstate = {published},
tppubtype = {conference}
Zhang, Yuan; Deekshith, Umashankar; Wang, Jianhong; Boedecker, Joschka
LCPPO: An Efficient Multi-agent Reinforcement Learning Algorithm on Complex Railway Network Conference
34th International Conference on Automated Planning and Scheduling, 2024.
title = {LCPPO: An Efficient Multi-agent Reinforcement Learning Algorithm on Complex Railway Network},
author = {Yuan Zhang and Umashankar Deekshith and Jianhong Wang and Joschka Boedecker},
url = {},
year = {2024},
date = {2024-05-09},
booktitle = {34th International Conference on Automated Planning and Scheduling},
keywords = {},
pubstate = {published},
tppubtype = {conference}
Yan, Shengchao; Zhang, Yuan; Zhang, Bohe; Boedecker, Joschka; Burgard, Wolfram
Learning Continuous Control with Geometric Regularity from Robot Intrinsic Symmetry Conference
2024 IEEE International Conference on Robotics and Automation ICRA, 2024.
title = {Learning Continuous Control with Geometric Regularity from Robot Intrinsic Symmetry},
author = {Shengchao Yan and Yuan Zhang and Bohe Zhang and Joschka Boedecker and Wolfram Burgard},
url = {},
year = {2024},
date = {2024-05-09},
booktitle = {2024 IEEE International Conference on Robotics and Automation ICRA},
keywords = {},
pubstate = {published},
tppubtype = {conference}
Zhang, Shuhao; Swevers, Jan
Time-optimal Point-to-point Motion Planning: A Two-stage Approach Proceedings Article Forthcoming
In: Forthcoming, (Accepted to the 2024 IFAC Conference on Nonlinear Model Predictive Control (NMPC)).
title = {Time-optimal Point-to-point Motion Planning: A Two-stage Approach},
author = {Shuhao Zhang and Jan Swevers},
url = {},
year = {2024},
date = {2024-04-16},
abstract = {This paper proposes a two-stage approach to formulate the time-optimal point-to-point motion planning problem, involving a first stage with a fixed time grid and a second stage with a variable time grid. The proposed approach brings benefits through its straightforward optimal control problem formulation with a fixed and low number of control steps for manageable computational complexity and the avoidance of interpolation errors associated with time scaling, especially when aiming to reach a distant goal. Additionally, an asynchronous nonlinear model predictive control (NMPC) update scheme is integrated with this two-stage approach to address delayed and fluctuating computation times, facilitating online replanning. The effectiveness of the proposed two-stage approach and NMPC implementation is demonstrated through numerical examples centered on autonomous navigation with collision avoidance.},
note = {Accepted to the 2024 IFAC Conference on Nonlinear Model Predictive Control (NMPC)},
keywords = {},
pubstate = {forthcoming},
tppubtype = {inproceedings}
Løwenstein, Kristoffer Fink; Bernardini, Daniele; Bemporad, Alberto; Fagiano, Lorenzo
Physics-Informed Online Learning by Moving Horizon Estimation: Learning Recurrent Neural Networks in Gray-box Models Proceedings Article
In: 8th IFAC Conference on Nonlinear Model Predictive Control NMPC 2024, pp. 78-85, IFAC-PapersOnLine, 2024, ISSN: 2405-8963.
title = {Physics-Informed Online Learning by Moving Horizon Estimation: Learning Recurrent Neural Networks in Gray-box Models},
author = {Kristoffer Fink Løwenstein and Daniele Bernardini and Alberto Bemporad and Lorenzo Fagiano},
url = {},
doi = {10.1016/j.ifacol.2024.09.013},
issn = {2405-8963},
year = {2024},
date = {2024-04-02},
urldate = {2024-04-02},
booktitle = {8th IFAC Conference on Nonlinear Model Predictive Control NMPC 2024},
volume = {58},
number = {18},
pages = {78-85},
publisher = {IFAC-PapersOnLine},
abstract = {In Model Predictive Control (MPC) closed-loop performance heavily depends on the quality of the underlying prediction model, where such a model must be accurate and yet simple. A key feature in modern MPC applications is the potential for online model adaptation to cope with time-varying changes, part-to-part variations, and complex features of the system dynamics not caught by models derived from first principles. In this paper, we propose to use a physics-informed, or gray-box, model that extends the physics-based model with a data-driven component, namely a Recurrent Neural Network (RNN). Relying on physics-informed models allows for a rather limited size of the RNN, thereby enhancing online applicability compared to pure black-box models. This work presents a method based on Moving Horizon Estimation (MHE) for simultaneous state estimation and learning of the RNN sub-model, a potentially challenging issue due to limited information available in noisy input-output data and lack of knowledge of the internal state of the RNN. We provide a case study on a quadruple tank benchmark showing how the method can cope with part-to-part variations.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
Meza, Gonzalo; Løwenstein, Kristoffer Fink; Fagiano, Lorenzo
Obstacle avoidance for a robotic manipulator with linear-quadratic Model Predictive Control Proceedings Article
In: 2024 IEEE 20th International Conference on Automation Science and Engineering (CASE 2024), pp. 3365-3370, 2024.
title = {Obstacle avoidance for a robotic manipulator with linear-quadratic Model Predictive Control},
author = {Gonzalo Meza and Kristoffer Fink Løwenstein and Lorenzo Fagiano},
doi = {10.1109/CASE59546.2024.10711546},
year = {2024},
date = {2024-04-02},
urldate = {2024-04-02},
booktitle = {2024 IEEE 20th International Conference on Automation Science and Engineering (CASE 2024)},
pages = {3365-3370},
abstract = {The problem of moving a six-degrees-of-freedom manipulator in an environment with unknown obstacles is considered. The manipulator is assumed to be equipped with an exteroceptive sensor that provides a partial sampling of the surroundings. A hierarchical control layout is proposed: in the outer layer, a path planner generates an obstacle free trajectory based on the available local information; in the inner layer, a Model-Predictive Controller formulated in the joint space tracks the trajectory while reactively avoiding unseen obstacles at a higher rate. By constructing a polytopic under-approximation of the free environment and employing a suitable estimate of the Jacobian matrix of the manipulator, the predictive controller features a convex quadratic cost and linear constraints, thus requiring the solution of a quadratic program at each time step. The proposed method is evaluated on the kinematic model of a MyCobot280 robotic arm, showing the potential for real-time feasibility.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
Messerer, Florian; Baumgärtner, Katrin; Lucia, Sergio; Diehl, Moritz
Fourth-order suboptimality of nominal model predictive control in the presence of uncertainty Journal Article
In: IEEE Control Systems Letters, vol. 8, pp. 508-513, 2024.
title = {Fourth-order suboptimality of nominal model predictive control in the presence of uncertainty},
author = {Florian Messerer and Katrin Baumgärtner and Sergio Lucia and Moritz Diehl},
doi = {10.1109/LCSYS.2024.3396611},
year = {2024},
date = {2024-03-08},
urldate = {2024-03-08},
journal = {IEEE Control Systems Letters},
volume = {8},
pages = {508-513},
abstract = {We investigate the suboptimality resulting from the application of nominal model predictive control (MPC) to a nonlinear discrete time stochastic system. The suboptimality is defined with respect to the corresponding stochastic optimal control problem (OCP) that minimizes the expected cost of the closed loop system. In this context, nominal MPC corresponds to a form of certainty-equivalent control (CEC). We prove that, in a smooth and unconstrained setting, the suboptimality growth is of fourth order with respect to the level of uncertainty, a parameter which we can think of as a standard deviation. This implies that the suboptimality does not grow very quickly as the level of uncertainty is increased, providing further insight into the practical success of nominal MPC. Similarly, the difference between the optimal and suboptimal control inputs is of second order. We illustrate the result on a simple numerical example, which we also use to show how the proven relationship may cease to hold in the presence of state constraints.},
keywords = {},
pubstate = {published},
tppubtype = {article}
Xie, Jing; Bonassi, Fabio; Scattolini, Riccardo
Internal Model Control design for systems learned by Control Affine Neural Nonlinear Autoregressive Exogenous Models Working paper Forthcoming
Forthcoming, (Accepted by IEEE Transactions on Automation Science and Engineering).
title = {Internal Model Control design for systems learned by Control Affine Neural Nonlinear Autoregressive Exogenous Models},
author = {Jing Xie and Fabio Bonassi and Riccardo Scattolini},
url = {},
year = {2024},
date = {2024-02-13},
urldate = {2024-02-13},
abstract = {This paper explores the use of Control Affine Neural Nonlinear AutoRegressive eXogenous (CA-NNARX) models for nonlinear system identification and model-based control design. The idea behind this architecture is to match the known control-affine structure of the system to achieve improved performance. Coherently with recent literature of neural networks for data-driven control, we first analyze the stability properties of CA-NNARX models, devising sufficient conditions for their incremental Input-to-State Stability (incremental ISS) that can be enforced at the model training stage. The model's stability property is then leveraged to design a stable Internal Model Control (IMC) architecture. The proposed control scheme is tested on a simulated Quadruple Tank benchmark system to address the output reference tracking problem. The results achieved show that (i) the modeling accuracy of CA-NNARX is superior to the one of a standard NNARX model for given weight size and training epochs, and (ii) the proposed IMC law provides performance comparable to the ones of a standard Model Predictive Controller (MPC) at a significantly lower computational burden.},
note = {Accepted by IEEE Transactions on Automation Science and Engineering},
keywords = {},
pubstate = {forthcoming},
tppubtype = {workingpaper}
Cecchin, Leonardo; Trachte, Adrian; Fagiano, Lorenzo; Diehl, Moritz
Real-time prediction of human-generated reference signals: a case study in advanced digging control Working paper
2024, (Submitted to the 2024 European Control Conference (ECC)).
title = {Real-time prediction of human-generated reference signals: a case study in advanced digging control},
author = {Leonardo Cecchin and Adrian Trachte and Lorenzo Fagiano and Moritz Diehl},
year = {2024},
date = {2024-02-12},
urldate = {2024-02-12},
abstract = {Techniques like Model Predictive Control (MPC) and two-degrees-of-freedom structures (feedforward plus feedback) can improve the control performance by exploiting a prediction of the reference trajectory, which is assumed to be available. This assumption holds true when pre-defined reference trajectories are known a-priori, e.g. constant or piecewise linear, but fails in applications where a human operator chooses the reference at runtime. To cope with this problem, we study different approaches to use the collected data of human-generated reference signals to learn a predictive model of the operator commands. The considered methods are function approximation techniques based on Kriging, Set-Membership, and LSTM Neural Networks.
We summarize the principles and the implementation of each method, and compare their performance using an experimental data-set of operations from a real-world excavator, where four operator-defined reference signals are predicted.},
note = {Submitted to the 2024 European Control Conference (ECC)},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
We summarize the principles and the implementation of each method, and compare their performance using an experimental data-set of operations from a real-world excavator, where four operator-defined reference signals are predicted.
Cecchin, Leonardo; Ohtsuka, Toshiyuki; Trachte, Adrian; Diehl, Moritz
Model Predictive Controller for Hydraulic Cylinders with Independent Metering Control Valves Working paper
2024, (Submitted to the 2024 IFAC Conference on Nonlinear Model Predictive Control (NMPC)).
title = {Model Predictive Controller for Hydraulic Cylinders with Independent Metering Control Valves},
author = {Leonardo Cecchin and Toshiyuki Ohtsuka and Adrian Trachte and Moritz Diehl},
year = {2024},
date = {2024-02-12},
urldate = {2024-02-12},
abstract = {Hydraulic cylinders are pivotal components in various industrial, construction, and off-highway applications, where efficient actuation is crucial for reducing energy consumption, minimizing heat generation, and extending components' lifespan. The integration of Independent Metering Control, a valve topology allowing five valves to independently control the flow, represents a significant advancement in enhancing hydraulic systems' performance. However, the lack of a reliable and flexible control solution remains a challenge. In this paper, we present the implementation of nonlinear Model Predictive Control, using a favorable model formulation and a state-of-the-art solver. We show how it can deliver close-to-optimal performance with real-time capabilities, addressing the current gap in achieving efficient control for hydraulic cylinders with Independent Metering Control.},
note = {Submitted to the 2024 IFAC Conference on Nonlinear Model Predictive Control (NMPC)},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
Zhang, Shuhao; Bos, Mathis; Vandewal, Bastiaan; Decré, Wilm; Gillis, Joris; Swevers, Jan
Robustified Time-optimal Collision-free Motion Planning for Autonomous Mobile Robots under Disturbance Conditions Working paper Forthcoming
Forthcoming, (Accepted to be presented at the 2024 IEEE International Conference on Robotics and Automation (ICRA)).
title = {Robustified Time-optimal Collision-free Motion Planning for Autonomous Mobile Robots under Disturbance Conditions},
author = {Shuhao Zhang and Mathis Bos and Bastiaan Vandewal and Wilm Decré and Joris Gillis and Jan Swevers},
url = {,contains,LIRIAS4141698&offset=0},
year = {2024},
date = {2024-02-07},
urldate = {2024-02-07},
abstract = {This paper presents a robustified time-optimal motion planning approach for navigating an Autonomous Mobile Robot (AMR) from an initial state to a terminal state without colliding with obstacles and while affected by disturbances modeled as random process and measurement noise. The approach iteratively solves the robustified problem by incorporating updated state-dependent safety margins for collision avoidance, the evolution of which is derived separately from the robustified problem. Additionally, a strategy for selecting an alternative terminal state to reach is introduced, which comes into play when the desired terminal state becomes infeasible considering the uncertainties. Both of these contributions are integrated into a robustified motion planning and control pipeline, the efficacy of which is validated through simulation experiments.},
note = {Accepted to be presented at the 2024 IEEE International Conference on Robotics and Automation (ICRA)},
keywords = {},
pubstate = {forthcoming},
tppubtype = {workingpaper}
Zhang, Shuhao; Swevers, Jan
Two-stage Time-optimal Motion Planning Presentation
07.02.2024, (Abstract at the 2024 Benelux Meeting).
title = {Two-stage Time-optimal Motion Planning},
author = {Shuhao Zhang and Jan Swevers},
year = {2024},
date = {2024-02-07},
urldate = {2024-02-07},
note = {Abstract at the 2024 Benelux Meeting},
keywords = {},
pubstate = {published},
tppubtype = {presentation}
Simpson, Léo; Ghezzi, Andrea; Asprion, Jonas; Diehl, Moritz
An Efficient Method for the Joint Estimation of System Parameters and Noise Covariances for Linear Time-Variant Systems Proceedings Article
In: 2023 62nd IEEE Conference on Decision and Control (CDC), pp. 4524-4529, 2024, ISSN: 2576-2370.
title = {An Efficient Method for the Joint Estimation of System Parameters and Noise Covariances for Linear Time-Variant Systems},
author = {Léo Simpson and Andrea Ghezzi and Jonas Asprion and Moritz Diehl},
url = {},
doi = {10.1109/CDC49753.2023.10383686},
issn = {2576-2370},
year = {2024},
date = {2024-01-19},
urldate = {2023-03-20},
booktitle = {2023 62nd IEEE Conference on Decision and Control (CDC)},
pages = {4524-4529},
abstract = {We present an optimization-based method for the joint estimation of system parameters and noise covariances of linear time-variant systems. Given measured data, this method maximizes the likelihood of the parameters. We solve the optimization problem of interest via a novel structure-exploiting solver. We present the advantages of the proposed approach over commonly used methods in the framework of Moving Horizon Estimation. Finally, we show the performance of the method through numerical simulations on a realistic example of a thermal system. In this example, the method can successfully estimate the model parameters in a short computational time.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
Roy, Wim Van; Nurkanovic, Armin; Abbasi-Esfeden, Ramin; Frey, Jonathan; Pozharskiy, Anton; Swevers, Jan; Diehl, Moritz
Continuous Optimization for Control of Finite-State Machines with Cascaded Hysteresis Via Time-Freezing Proceedings Article
In: 2023 62nd IEEE Conference on Decision and Control (CDC), pp. 6261-6266, IEEE, Singapore, Singapore, 2024, ISBN: 979-8-3503-0124-3.
title = {Continuous Optimization for Control of Finite-State Machines with Cascaded Hysteresis Via Time-Freezing},
author = {Wim Van Roy and Armin Nurkanovic and Ramin Abbasi-Esfeden and Jonathan Frey and Anton Pozharskiy and Jan Swevers and Moritz Diehl},
doi = {10.1109/CDC49753.2023.10384083},
isbn = {979-8-3503-0124-3},
year = {2024},
date = {2024-01-19},
urldate = {2023-12-01},
booktitle = {2023 62nd IEEE Conference on Decision and Control (CDC)},
pages = {6261-6266},
publisher = {IEEE},
address = {Singapore, Singapore},
abstract = {Control problems with Finite-State Machines (FSM) are often solved using integer variables, leading to a mixed-integer optimal control problem (MIOCP). This paper proposes an alternative method to describe a subclass of FSMs using complementarity constraints and time-freezing. The FSM from this subclass is built up by a sequence of states where a transition between the states is triggered by a single switching function. This can be looked at as a cascade of hysteresis loops where a memory effect is used to maintain the active state of the state machine. Based on the reformulation for hybrid systems with a hysteresis loop [13], a method is developed to reformulate this subclass in a similar fashion. The approach transforms the original problem into a Piecewise Smooth System (PSS), which can be discretized using the recently developed Finite Elements with Switch Detection [15], allowing for high-accuracy solutions. The reformulation is compared to a mixed-integer formulation from the literature on a time-optimal control problem. This work is a first step towards the general reformulation of FSMs into nonsmooth systems without integer states.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
Bonassi, Fabio; Bella, Alessio La; Farina, Marcello; Scattolini, Riccardo
Nonlinear MPC design for incrementally ISS systems with application to GRU networks Journal Article
In: Automatica, vol. 159, iss. 11381, pp. 111381, 2024.
title = {Nonlinear MPC design for incrementally ISS systems with application to GRU networks},
author = {Fabio Bonassi and Alessio La Bella and Marcello Farina and Riccardo Scattolini},
doi = {},
year = {2024},
date = {2024-01-03},
urldate = {2024-01-03},
journal = {Automatica},
volume = {159},
issue = {11381},
pages = {111381},
keywords = {},
pubstate = {published},
tppubtype = {article}
Bourkhissi, Lahcen El; Necoara, Ion
Complexity of linearized quadratic penalty for optimization with nonlinear equality constraints Working paper
2023, (Under review).
title = {Complexity of linearized quadratic penalty for optimization with nonlinear equality constraints},
author = {Lahcen El Bourkhissi and Ion Necoara},
doi = {},
year = {2023},
date = {2023-12-31},
abstract = {In this paper we consider a nonconvex optimization problem with nonlinear equality constraints. We assume that both, the objective function and the functional constraints, are locally smooth. For solving this problem, we propose a linearized quadratic penalty method, i.e., we linearize the objective function and the functional constraints in the penalty formulation at the current iterate and add a quadratic regularization, thus yielding a subproblem that is easy to solve, and whose solution is the next iterate. Under a dynamic regularization parameter choice, we derive convergence guarantees for the iterates of our method to an $\epsilon$-first-order optimal solution in $\mathcal{O}(1/\epsilon^{3})$ outer iterations. Finally, we show that when the problem data satisfy Kurdyka-Lojasiewicz property, e.g., are semialgebraic, the whole sequence generated by our algorithm converges and we derive convergence rates. We validate the theory and the performance of the proposed algorithm by numerically comparing it with the existing methods from the literature.},
note = {Under review},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
Bourkhissi, Lahcen El; Necoara, Ion; Patrinos, Panagiotis
Linearized ADMM for Nonsmooth Nonconvex Optimization with Nonlinear Equality Constraints Proceedings Article
In: 2023 62nd IEEE Conference on Decision and Control (CDC), pp. 7312-7317, IEEE, Singapore, Singapore, 2023, ISSN: 2576-2370.
title = {Linearized ADMM for Nonsmooth Nonconvex Optimization with Nonlinear Equality Constraints},
author = {Lahcen El Bourkhissi and Ion Necoara and Panagiotis Patrinos},
doi = {10.1109/CDC49753.2023.10384166},
issn = {2576-2370},
year = {2023},
date = {2023-12-13},
urldate = {2023-12-13},
booktitle = {2023 62nd IEEE Conference on Decision and Control (CDC)},
pages = {7312-7317},
publisher = {IEEE},
address = {Singapore, Singapore},
abstract = {This paper proposes a new approach for solving a structured nonsmooth nonconvex optimization problem with nonlinear equality constraints, where both the objective function and constraints are 2-blocks separable. Our method is based on a 2-block linearized ADMM, where we linearize the smooth part of the cost function and the nonlinear term of the functional constraints in the augmented Lagrangian at each outer iteration. This results in simple subproblems, whose solutions are used to update the iterates of the 2 blocks variables. We prove global convergence for the sequence generated by our method to a stationary point of the original problem. To demonstrate its effectiveness, we apply our proposed algorithm as a solver for the nonlinear model predictive control problem of an inverted pendulum on a cart.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
Voogd, Kevin; Allamaa, Jean Pierre; Alonso-Mora, Javier; Son, Tong Duy
Reinforcement Learning from Simulation to Real World Autonomous Driving using Digital Twin Proceedings Article
In: 22nd IFAC World Congress 2023, pp. 1510-1515, Elsevier Ltd, Yokohama, Japan, 2023, ISSN: 2405-8963.
title = {Reinforcement Learning from Simulation to Real World Autonomous Driving using Digital Twin},
author = {Kevin Voogd and Jean Pierre Allamaa and Javier Alonso-Mora and Tong Duy Son},
url = {},
doi = {},
issn = {2405-8963},
year = {2023},
date = {2023-11-30},
urldate = {2023-11-30},
booktitle = {22nd IFAC World Congress 2023},
journal = {IFAC-PapersOnLine},
volume = {56},
number = {2},
pages = {1510-1515},
publisher = {Elsevier Ltd},
address = {Yokohama, Japan},
abstract = {Reinforcement learning (RL) is a promising solution for autonomous vehicles to deal with complex and uncertain traffic environments. The RL training process is however expensive, unsafe, and time-consuming. Algorithms are often developed first in simulation and then transferred to the real-world, leading to a common sim2real challenge where performance decreases when the domain changes. In this paper, we propose a transfer learning process to minimize the gap by exploiting digital twin technology, relying on a systematic and simultaneous combination of virtual and real world data coming from vehicle dynamics and traffic scenarios. The model and testing environment is evolved from model, hardware to vehicle in the loop and proving ground testing stages, similar to standard development cycle in the automotive industry. In particular, we also integrate other transfer learning techniques such as domain randomization and adaptation in each stage. The simulation and real data are gradually incorporated to accelerate and make the transfer learning process more robust. The proposed RL methodology is applied to develop a path-following steering controller for an autonomous electric vehicle. After learning and deploying the real-time RL control policy on the vehicle, we obtained satisfactory and safe control performance already from the first deployment, demonstrating the advantages of the proposed digital twin based learning process.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
Acerbo, Flavia Sofia; Swevers, Jan; Tuytelaars, Tinne; Son, Tong Duy
Evaluation of MPC-based Imitation Learning for Human-like Autonomous Driving Proceedings Article
In: 22nd IFAC World Congress, pp. 4871-4876, Elsevier Ltd, Yokohama, Japan, 2023, ISSN: 2405-8963.
title = {Evaluation of MPC-based Imitation Learning for Human-like Autonomous Driving},
author = {Flavia Sofia Acerbo and Jan Swevers and Tinne Tuytelaars and Tong Duy Son},
url = {},
doi = {},
issn = {2405-8963},
year = {2023},
date = {2023-11-30},
urldate = {2023-11-30},
booktitle = {22nd IFAC World Congress},
journal = {IFAC-PapersOnLine},
volume = {56},
number = {2},
pages = {4871-4876},
publisher = {Elsevier Ltd},
address = {Yokohama, Japan},
abstract = {This work evaluates and analyzes the combination of imitation learning (IL) and differentiable model predictive control (MPC) for the application of human-like autonomous driving. We combine MPC with a hierarchical learning-based policy, and measure its performance in open-loop and closed-loop with metrics related to safety, comfort and similarity to human driving characteristics. We also demonstrate the value of augmenting open-loop behavioral cloning with closed-loop training for a more robust learning, approximating the policy gradient through time with the state space model used by the MPC. We perform experimental evaluations on a lane keeping control system, learned from demonstrations collected on a fixed-base driving simulator, and show that our imitative policies approach the human driving style preferences.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}