@conference{Data_Augmentation_caepia_2024, author = "Marta Vega-Bayo and Antonio Manuel G{\'o}mez-Orellana and V{\'i}ctor Manuel Vargas and David Guijo-Rubio and Laura Cornejo-Bueno and Jorge P{\'e}rez-Aracil and Sancho Salcedo-Sanz", abstract = "Predicting extreme winds (i.e. winds speed equal to or greater than 25 m/s), is essential to predict wind power and accomplish safe and efficient management of wind farms. Although feasible, predicting extreme wind with supervised classifiers and deep learning models is particularly difficult because of the low frequency of these events, which leads to highly unbalanced training datasets. To tackle this challenge, in this paper different traditional data augmentation techniques, such as random oversampling, SMOTE, time series data warping and multidimensional data warping, are used to generate synthetic samples of extreme wind and its predictors, such as previous samples of wind speed and meteorological variables of the surroundings. Results show that using data augmentation techniques with the right oversampling ratio leads to improvement in extreme wind prediction with most machine learning and deep learning models tested. In this paper, advanced data augmentation techniques, such as Variational Autoencoders (VAE), are also applied and evaluated when inputs are time series.", booktitle = "Bioinspired Systems for Translational Applications: From Robotics to Social Engineering", doi = "https://link.springer.com/chapter/10.1007/978-3-031-61137-7_28", issn = "1611-3349", keywords = "Extreme wind speed classification, data augmentation, machine learning, deep learning", month = "Mayo", organization = "IWINAC", pages = "303–313", title = "{D}ata {A}ugmentation {T}echniques for {E}xtreme {W}ind {P}rediction {I}mprovement", url = "doi.org/10.1007/978-3-031-61137-7_28", volume = "14675", year = "2024", }