Publications
Simpson, Léo; Nurkanovic, Armin; Diehl, Moritz
Direct Collocation for Numerical Optimal Control of Second-Order ODE Inproceedings Forthcoming
In: 2023 European Conference of Control (ECC), Forthcoming.
@inproceedings{Simpson2023DCSODE,
title = {Direct Collocation for Numerical Optimal Control of Second-Order ODE},
author = {Léo Simpson and Armin Nurkanovic and Moritz Diehl},
url = {https://arxiv.org/abs/2211.12308},
year = {2023},
date = {2023-04-25},
urldate = {2023-04-25},
booktitle = {2023 European Conference of Control (ECC)},
abstract = {Mechanical systems are usually modeled by second-order Ordinary Differential Equations (ODE) which take the form q¨=f(t,q,q˙). While simulation methods tailored to these equations have been studied, using them in direct optimal control methods is rare. Indeed, the standard approach is to perform a state augmentation, adding the velocities to the state. The main drawback of this approach is that the number of decision variables is doubled, which could harm the performance of the resulting optimization problem. In this paper, we present an approach tailored to second-order ODE. We compare it with the standard one, both on theoretical aspects and in a numerical example. Notably, we show that the tailored formulation is likely to improve the performance of a direct collocation method, for solving optimal control problems with second-order ODE of the more restrictive form q¨=f(t,q).},
keywords = {},
pubstate = {forthcoming},
tppubtype = {inproceedings}
}
Roy, Wim Van; Abbasi-Esfeden, Ramin; Swevers, Jan
Online Unit Commitment Problem Solving using Extended Dynamic Programming Presentation
22.03.2023.
@misc{vanRoy2023EDP,
title = {Online Unit Commitment Problem Solving using Extended Dynamic Programming},
author = {Wim Van Roy and Ramin Abbasi-Esfeden and Jan Swevers},
year = {2023},
date = {2023-03-22},
urldate = {2023-03-22},
keywords = {},
pubstate = {published},
tppubtype = {presentation}
}
Simpson, Léo; Ghezzi, Andrea; Asprion, Jonas; Diehl, Moritz
An Efficient Method for the Joint Estimation of System Parameters and Noise Covariances for Linear Time-Variant Systems Inproceedings Forthcoming
In: 2023 Conference of Decision and Control (CDC) , Forthcoming.
@inproceedings{Simpson2023EMJE,
title = {An Efficient Method for the Joint Estimation of System Parameters and Noise Covariances for Linear Time-Variant Systems },
author = {Léo Simpson and Andrea Ghezzi and Jonas Asprion and Moritz Diehl},
url = {https://arxiv.org/abs/2211.12302},
year = {2023},
date = {2023-03-20},
booktitle = {2023 Conference of Decision and Control (CDC) },
abstract = {We present an optimization-based method for the joint estimation of system parameters and noise covariances of linear time-variant systems. Given measured data, this method maximizes the likelihood of the parameters. We solve the optimization problem of interest via a novel structure-exploiting solver. We present the advantages of the proposed approach over commonly used methods in the framework of Moving Horizon Estimation. Finally, we show the performance of the method through numerical simulations on a realistic example of a thermal system. In this example, the method can successfully estimate the model parameters in a short computational time.},
keywords = {},
pubstate = {forthcoming},
tppubtype = {inproceedings}
}
Roy, Wim Van; Abbasi-Esfeden, Ramin; Swevers, Jan
A Dynamic Programming-based Heuristic Approach for Unit Commitment Problems Inproceedings Forthcoming
In: 2023 European Control Conference (ECC), Forthcoming.
@inproceedings{vanRoy2023ADP,
title = {A Dynamic Programming-based Heuristic Approach for Unit Commitment Problems},
author = {Wim Van Roy and Ramin Abbasi-Esfeden and Jan Swevers},
year = {2023},
date = {2023-03-10},
urldate = {2023-03-10},
booktitle = {2023 European Control Conference (ECC)},
abstract = {Unit Commitment (UC) problems are an essential set of problems in the power industry with applications in energy grid or heating systems management and control. The engineering goal is to balance the demand with the production of a network of production units, called generators, by providing a schedule and operating points for each generator cost-effectively while considering constraints. The constraints are caused by the dynamics of the system, the limits on the reserves, and possible robustness requirements. Due to the appearance of the on/off states from the generators, the resulting problems are NP-hard to solve. Thus, existing techniques to achieve a cost-efficient solution are computationally expensive. This paper proposes a dynamic programming-based heuristic to solve a UC problem. The heuristic focuses on finding a feasible and cost-effective solution within a limited calculation time for systems with a limited number of generators where a long time horizon is important. This method is compared to a Mixed Integer Linear Program (MILP) implementation for a micro-grid where it achieves a computation time that is an order of magnitude smaller than MILP programs for problems with a limited number of generators but a long time horizon.},
keywords = {},
pubstate = {forthcoming},
tppubtype = {inproceedings}
}
Abbasi-Esfeden, Ramin; Roy, Wim Van; Swevers, Jan
Iterative Switching Time Optimization for Mixed-integer Optimal Control Problems Inproceedings Forthcoming
In: 2023 European Control Conference (ECC), Forthcoming.
@inproceedings{AbbasiEsfeden2023STO,
title = {Iterative Switching Time Optimization for Mixed-integer Optimal Control Problems},
author = {Ramin Abbasi-Esfeden and Wim Van Roy and Jan Swevers},
year = {2023},
date = {2023-03-10},
urldate = {2023-03-10},
booktitle = {2023 European Control Conference (ECC)},
abstract = {This paper proposes an iterative method to solve Mixed-Integer Optimal Control Problems arising from systems with switched dynamics. The so-called relaxed problem plays a central role within this context. Through a numerical example, it is shown why relying on the relaxed problem can lead the solution astray. As an alternative, an iterative Switching Time Optimization method is proposed. The method consists of two components that iteratively interact: a Switching Time Optimization (STO) problem and a sequence optimization. Each component is explained in detail, and the numerical example is resolved, the results of which shows the efficiency of the proposed algorithm. Finally, the advantages and disadvantages of the method are discussed and future lines of research are sketched.},
keywords = {},
pubstate = {forthcoming},
tppubtype = {inproceedings}
}
Messerer, Florian; Baumgärtner, Katrin; Diehl, Moritz
A Dual-Control Effect Preserving Formulation for Nonlinear Output-Feedback Stochastic Model Predictive Control With Constraints Journal Article
In: IEEE Control Systems Letters, vol. 7, no. 1171--1176, 2023.
@article{Messerer2023,
title = {A Dual-Control Effect Preserving Formulation for Nonlinear Output-Feedback Stochastic Model Predictive Control With Constraints},
author = {Florian Messerer and Katrin Baumgärtner and Moritz Diehl},
url = {https://ieeexplore.ieee.org/document/9993720},
doi = {10.1109/LCSYS.2022.3230552},
year = {2023},
date = {2023-01-01},
urldate = {2023-01-01},
journal = {IEEE Control Systems Letters},
volume = {7},
number = {1171--1176},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Reiter, Rudolf; Messerer, Florian; Schratter, Markus; Watzenig, Daniel; Diehl, Moritz
An Inverse Optimal Control Approach for Trajectory Prediction of Autonomous Race Cars Inproceedings
In: 2022 European Control Conference (ECC), pp. 146–153, IEEE, London, United Kingdom, 2022, ISBN: 978-3-907144-07-7.
@inproceedings{reiter_inverse_2022,
title = {An Inverse Optimal Control Approach for Trajectory Prediction of Autonomous Race Cars},
author = {Rudolf Reiter and Florian Messerer and Markus Schratter and Daniel Watzenig and Moritz Diehl},
url = {https://ieeexplore.ieee.org/document/9838100/},
doi = {10.23919/ECC55457.2022.9838100},
isbn = {978-3-907144-07-7},
year = {2022},
date = {2022-07-01},
urldate = {2022-09-09},
booktitle = {2022 European Control Conference (ECC)},
pages = {146--153},
publisher = {IEEE},
address = {London, United Kingdom},
abstract = {This paper proposes an optimization-based approach to predict trajectories of autonomous race cars. We assume that the observed trajectory is the result of an optimization problem that trades off path progress against acceleration and jerk smoothness, and which is restricted by constraints. The algorithm predicts a trajectory by solving a parameterized nonlinear program (NLP) which contains path progress and smoothness in cost terms. By observing the actual motion of a vehicle, the parameters of prediction are updated by means of solving an inverse optimal control problem that contains the parameters of the predicting NLP as optimization variables. The algorithm therefore learns to predict the observed vehicle trajectory in a least-squares relation to measurement data and to the presumed structure of the predicting NLP. This work contributes with an algorithm that allows for accurate and interpretable predictions with sparse data. The algorithm is implemented on embedded hardware in an autonomous real-world race car that is competing in the challenge Roborace and analyzed with respect to recorded data.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Allamaa, Jean Pierre; Listov, Petr; Auweraer, Herman Van; Jones, Colin; Son, Tong Duy
Real-time Nonlinear MPC Strategy with Full Vehicle Validation for Autonomous Driving Inproceedings
In: 2022 American Control Conference (ACC), pp. 1982-1987, IEEE, Atlanta, GA, USA, 2022, ISBN: 978-1-6654-5196-3.
@inproceedings{Allamaa2022RTNMPCStrategy,
title = {Real-time Nonlinear MPC Strategy with Full Vehicle Validation for Autonomous Driving},
author = {Jean Pierre Allamaa and Petr Listov and Herman Van Auweraer and Colin Jones and Tong Duy Son},
url = {https://ieeexplore.ieee.org/document/9867514},
doi = {10.23919/ACC53348.2022.9867514},
isbn = {978-1-6654-5196-3},
year = {2022},
date = {2022-06-09},
booktitle = {2022 American Control Conference (ACC)},
pages = {1982-1987},
publisher = {IEEE},
address = {Atlanta, GA, USA},
abstract = {In this paper, we present the development and deployment of an embedded optimal control strategy for autonomous driving applications on a Ford Focus road vehicle. Non-linear model predictive control (NMPC) is designed and deployed on a system with hard real-time constraints. We show the properties of sequential quadratic programming (SQP) optimization solvers that are suitable for driving tasks. Importantly, the designed algorithms are validated based on a standard automotive XiL development cycle: model-in-the-loop (MiL) with high fidelity vehicle dynamics, hardware-in-the-loop (HiL) with vehicle actuation and embedded platform, and full vehicle-hardware-in-the-loop (VeHiL). The autonomous driving environment contains both virtual simulation and physical proving ground tracks. NMPC algorithms and optimal control problem formulation are fine-tuned using a deployable C code via code generation compatible with the target embedded toolchains. Finally, the developed systems are applied to autonomous collision avoidance, trajectory tracking, and lane change at high speed on city/highway and low speed at a parking environment.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Ghezzi, Andrea; Messerer, Florian; Balocco, Jacopo; Manzoni, Vincenzo; Diehl, Moritz
Implicit and Explicit Dual Model Predictive Control with an Application to Steel Recycling Inproceedings Forthcoming
In: Forthcoming.
@inproceedings{ghezzi2022implicit,
title = {Implicit and Explicit Dual Model Predictive Control with an Application to Steel Recycling},
author = {Andrea Ghezzi and Florian Messerer and Jacopo Balocco and Vincenzo Manzoni and Moritz Diehl},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
journal = {arXiv preprint arXiv:2204.02282},
keywords = {},
pubstate = {forthcoming},
tppubtype = {inproceedings}
}
Bonassi, Fabio; Farina, Marcello; Xie, Jing; Scattolini, Riccardo
An Offset-Free Nonlinear MPC scheme for systems learned by Neural NARX models Working paper
2022, (Under review).
@workingpaper{bonassi2022offset,
title = {An Offset-Free Nonlinear MPC scheme for systems learned by Neural NARX models},
author = {Fabio Bonassi and Marcello Farina and Jing Xie and Riccardo Scattolini},
url = {https://arxiv.org/abs/2203.16290},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
journal = {arXiv preprint arXiv:2203.16290},
abstract = {This paper deals with the design of nonlinear MPC controllers that provide offset-free setpoint tracking for models described by Neural Nonlinear AutoRegressive eXogenous (NNARX) networks. The NNARX model is identified from input-output data collected from the plant, and can be given a state-space representation with known measurable states made by past input and output variables, so that a state observer is not required. In the training phase, the Incremental Input-to-State Stability (deltaISS) property can be forced when consistent with the behavior of the plant. The deltaISS property is then leveraged to augment the model with an explicit integral action on the output tracking error, which allows to achieve offset-free tracking capabilities to the designed control scheme. The proposed control architecture is numerically tested on a water heating system and the achieved results are compared to those scored by another popular offset-free MPC method, showing that the proposed scheme attains remarkable performances even in presence of disturbances acting on the plant.},
note = {Under review},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
}
Bonassi, Fabio; Farina, Marcello; Xie, Jing; Scattolini, Riccardo
On Recurrent Neural Networks for learning-based control: recent results and ideas for future developments Journal Article
In: Journal of Process Control, vol. 114, pp. 92-104, 2022, ISSN: 0959-1524.
@article{bonassi2022survey,
title = {On Recurrent Neural Networks for learning-based control: recent results and ideas for future developments},
author = {Fabio Bonassi and Marcello Farina and Jing Xie and Riccardo Scattolini},
url = {https://arxiv.org/abs/2111.13557},
doi = {10.1016/j.jprocont.2022.04.011},
issn = {0959-1524},
year = {2022},
date = {2022-01-01},
journal = {Journal of Process Control},
volume = {114},
pages = {92-104},
abstract = {This paper aims to discuss and analyze the potentialities of Recurrent Neural Networks (RNN) in control design applications. The main families of RNN are considered, namely Neural Nonlinear AutoRegressive eXogenous, Echo State Networks, Long Short Term Memory, and Gated Recurrent Units. The goal is twofold. Firstly, to survey recent results concerning the training of RNN that enjoy Input-to-State Stability (ISS) and Incremental Input-to-State Stability (𝛿ISS) guarantees. Secondly, to discuss the issues that still hinder the widespread use of RNN for control, namely their robustness, verifiability, and interpretability. The former properties are related to the so-called generalization capabilities of the networks, i.e. their consistency with the underlying real plants, even in presence of unseen or perturbed input trajectories. The latter is instead related to the possibility of providing a clear formal connection between the RNN model and the plant. In this context, we illustrate how ISS and 𝛿ISS represent a significant step towards the robustness and verifiability of the RNN models, while the requirement of interpretability paves the way to the use of physics-based networks. The design of model predictive controllers with RNN as plant’s model is also briefly discussed. Lastly, some of the main topics of the paper are illustrated on a simulated chemical system.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Bonassi, Fabio; Scattolini, Riccardo
Recurrent neural network-based Internal Model Control of unknown nonlinear stable systems Journal Article
In: European Journal of Control, pp. 100632, 2022, ISSN: 0947-3580.
@article{bonassi2022imc,
title = {Recurrent neural network-based Internal Model Control of unknown nonlinear stable systems},
author = {Fabio Bonassi and Riccardo Scattolini},
doi = {10.1016/j.ejcon.2022.100632},
issn = {0947-3580},
year = {2022},
date = {2022-01-01},
journal = {European Journal of Control},
pages = {100632},
abstract = {Owing to their superior modeling capabilities, gated Recurrent Neural Networks (RNNs), such as Gated Recurrent Units (GRUs) and Long Short-Term Memory networks (LSTMs), have become popular tools for learning dynamical systems. This paper aims to discuss how these networks can be adopted for the synthesis of Internal Model Control (IMC) architectures. To this end, a first gated RNN is used to learn a model of the unknown input-output stable plant. Then, another gated RNN approximating the model inverse is trained. The proposed scheme is able to cope with the saturation of the control variables, and it can be deployed on low-power embedded controllers since it does not require any online computation. The approach is then tested on the Quadruple Tank benchmark system, resulting in satisfactory closed-loop performances.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Acerbo, Flavia Sofia; Swevers, Jan; Tuytelaars, Tinne; Son, Tong Duy
MPC-based Imitation Learning for Safe and Human-like Autonomous Driving Working paper
2022.
@workingpaper{acerbo2022mpc,
title = {MPC-based Imitation Learning for Safe and Human-like Autonomous Driving},
author = {Flavia Sofia Acerbo and Jan Swevers and Tinne Tuytelaars and Tong Duy Son},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
journal = {arXiv preprint arXiv:2206.12348},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
}
Zhang, Yuan; Wang, Jianhong; Boedecker, Joschka
Robust Reinforcement Learning in Continuous Control Tasks with Uncertainty Set Regularization Working paper
2022.
@workingpaper{zhang2022robust,
title = {Robust Reinforcement Learning in Continuous Control Tasks with Uncertainty Set Regularization},
author = {Yuan Zhang and Jianhong Wang and Joschka Boedecker},
url = {https://arxiv.org/abs/2207.02016},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
journal = {arXiv preprint arXiv:2207.02016},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
}
Xie, Jing; Bonassi, Fabio; Farina, Marcello; Scattolini, Riccardo
Robust offset-free nonlinear model predictive control for systems learned by neural nonlinear autoregressive exogenous models Working paper
2022.
@workingpaper{https://doi.org/10.48550/arxiv.2210.06801,
title = {Robust offset-free nonlinear model predictive control for systems learned by neural nonlinear autoregressive exogenous models},
author = {Jing Xie and Fabio Bonassi and Marcello Farina and Riccardo Scattolini},
url = {https://arxiv.org/abs/2210.06801},
doi = {10.48550/ARXIV.2210.06801},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
publisher = {arXiv},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
}
Saccani, Danilo; Cecchin, Leonardo; Fagiano, Lorenzo
Multitrajectory Model Predictive Control for Safe UAV Navigation in an Unknown Environment Journal Article
In: IEEE Transactions on Control Systems Technology, pp. 1-16, 2022.
@article{9938397,
title = {Multitrajectory Model Predictive Control for Safe UAV Navigation in an Unknown Environment},
author = {Danilo Saccani and Leonardo Cecchin and Lorenzo Fagiano},
doi = {10.1109/TCST.2022.3216989},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
journal = {IEEE Transactions on Control Systems Technology},
pages = {1-16},
abstract = {The problem of navigating an unmanned aerial vehicle (UAV) in an unknown environment is addressed with a novel model predictive control (MPC) formulation, named multitrajectory MPC (mt-MPC). The objective is to safely drive the vehicle to the desired target location by relying only on the partial description of the surroundings provided by an exteroceptive sensor. This information results in time-varying constraints during the navigation among obstacles. The proposed mt-MPC generates a sequence of position set points that are fed to control loops at lower hierarchical levels. To do so, the mt-MPC predicts two different state trajectories, a safe one and an exploiting one, in the same finite horizon optimal control problem (FHOCP). This formulation, particularly suitable for problems with uncertain time-varying constraints, allows one to partially decouple constraint satisfaction (safety) from cost function minimization (exploitation). Uncertainty due to modeling errors and sensors noise is taken into account as well, in a set membership (SM) framework. Theoretical guarantees of persistent obstacle avoidance are derived under suitable assumptions, and the approach is demonstrated experimentally out-of-the-laboratory on a prototype built with off-the-shelf components.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Allamaa, Jean Pierre; Patrinos, Panagiotis; Auweraer, Herman Van; Son, Tong Duy
Safety Envelope for Orthogonal Collocation Methods in Embedded Optimal Control Inproceedings Forthcoming
In: 2023 European Control Conference (ECC), Forthcoming.
@inproceedings{Allamaa2022SafetyEF,
title = {Safety Envelope for Orthogonal Collocation Methods in Embedded Optimal Control},
author = {Jean Pierre Allamaa and Panagiotis Patrinos and Herman Van Auweraer and Tong Duy Son},
url = {https://arxiv.org/abs/2211.14853},
doi = {10.48550/ARXIV.2211.14853},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
booktitle = {2023 European Control Conference (ECC)},
abstract = {Orthogonal collocation methods are direct simultaneous approaches for solving optimal control problems (OCP). A high solution accuracy is achieved with few optimization variables, making it more favorable for embedded and real-time NMPC applications. However, collocation approaches lack a guarantee about the safety of the resulting continuous trajectory as inequality constraints are only set on a finite number of collocation points. In this paper we propose a method to efficiently create a convex safety envelope containing the full trajectory such that the solution fully satisfies the OCP constraints. We make use of the Bernstein approximations of a polynomial's extrema and span the solution over an orthogonal basis using the Legendre polynomials. The tightness of the safety envelope estimation, high spectral accuracy of the method in solving the underlying differential equations, fast rate of convergence and little conservatism are properties of the presented approach making it a suitable method for safe real-time NMPC deployment. We show that our method has comparable computational performance to the pseudospectral approaches and can approximate the original OCP more accurately and up to 9 times more quickly than standard multiple-shooting methods in autonomous driving applications, without adding complexity to the formulation.},
keywords = {},
pubstate = {forthcoming},
tppubtype = {inproceedings}
}
Allamaa, Jean Pierre; Patrinos, Panagiotis; Auweraer, Herman Van; Son, Tong Duy
Sim2real for Autonomous Vehicle Control using Executable Digital Twin Journal Article
In: IFAC-PapersOnLine, vol. 55, no. 24, pp. 385-391, 2022, ISSN: 2405-8963, (10th IFAC Symposium on Advances in Automotive Control AAC 2022).
@article{ALLAMAA2022385,
title = {Sim2real for Autonomous Vehicle Control using Executable Digital Twin},
author = {Jean Pierre Allamaa and Panagiotis Patrinos and Herman Van Auweraer and Tong Duy Son},
url = {https://www.sciencedirect.com/science/article/pii/S2405896322023461},
doi = {https://doi.org/10.1016/j.ifacol.2022.10.314},
issn = {2405-8963},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
journal = {IFAC-PapersOnLine},
volume = {55},
number = {24},
pages = {385-391},
abstract = {In this work, we propose a sim2real method to transfer and adapt a nonlinear model predictive controller (NMPC) from simulation to the real target system based on executable digital twin (xDT). The xDT model is a high fidelity vehicle dynamics simulator, executable online in the control parameter randomization and learning process. The parameters are adapted to gradually improve control performance and deal with changing real-world environment. In particular, the performance metric is not required to be differentiable nor analytical with respect to the control parameters and system dynamics are not necessary linearized. Eventually, the proposed sim2real framework leverages altogether online high fidelity simulator, data-driven estimations, and simulation based optimization to transfer and adapt efficiently a controller developed in simulation environment to the real platform. Our experiment demonstrates that a high control performance is achieved without tedious time and labor consuming tuning.},
note = {10th IFAC Symposium on Advances in Automotive Control AAC 2022},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Voogd, Kevin; Allamaa, Jean Pierre; Alonso-Mora, Javier; Son, Tong Duy
Reinforcement Learning from Simulation to Real World Autonomous Driving using Digital Twin Working paper
2022, (Under review).
@workingpaper{Voogd2022ReinforcementLF,
title = {Reinforcement Learning from Simulation to Real World Autonomous Driving using Digital Twin},
author = {Kevin Voogd and Jean Pierre Allamaa and Javier Alonso-Mora and Tong Duy Son},
url = {https://arxiv.org/abs/2211.14874},
doi = {10.48550/ARXIV.2211.14874},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
publisher = {arXiv},
abstract = {Reinforcement learning (RL) is a promising solution for autonomous vehicles to deal with complex and uncertain traffic environments. The RL training process is however expensive, unsafe, and time consuming. Algorithms are often developed first in simulation and then transferred to the real world, leading to a common sim2real challenge that performance decreases when the domain changes. In this paper, we propose a transfer learning process to minimize the gap by exploiting digital twin technology, relying on a systematic and simultaneous combination of virtual and real world data coming from vehicle dynamics and traffic scenarios. The model and testing environment are evolved from model, hardware to vehicle in the loop and proving ground testing stages, similar to standard development cycle in automotive industry. In particular, we also integrate other transfer learning techniques such as domain randomization and adaptation in each stage. The simulation and real data are gradually incorporated to accelerate and make the transfer learning process more robust. The proposed RL methodology is applied to develop a path following steering controller for an autonomous electric vehicle. After learning and deploying the real-time RL control policy on the vehicle, we obtained satisfactory and safe control performance already from the first deployment, demonstrating the advantages of the proposed digital twin based learning process.},
note = {Under review},
keywords = {},
pubstate = {published},
tppubtype = {workingpaper}
}
Wang, Renzi; Schuurmans, Mathijs; Patrinos, Panagiotis
Interaction-aware Model Predictive Control for Autonomous Driving Inproceedings Forthcoming
In: 2023 European Control Conference (ECC), Forthcoming.
@inproceedings{Wang2022,
title = {Interaction-aware Model Predictive Control for Autonomous Driving},
author = {Renzi Wang and Mathijs Schuurmans and Panagiotis Patrinos},
url = {https://arxiv.org/abs/2211.17053},
doi = {10.48550/ARXIV.2211.17053},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
booktitle = {2023 European Control Conference (ECC)},
keywords = {},
pubstate = {forthcoming},
tppubtype = {inproceedings}
}