Publications
2024 |
D. Gutiérrez-Avilés and J. F. Torres and F. Martínez-Álvarez and J. Cugliari An evolutionary triclustering approach to discover electricity consumption patterns in France (Conference) SAC 39th Annual ACM Symposium on Applied Computing, 2024. (Abstract | BibTeX | Tags: clustering, energy, time series) @conference{GUTIERREZ24_SAC, title = {An evolutionary triclustering approach to discover electricity consumption patterns in France}, author = {D. Gutiérrez-Avilés and J. F. Torres and F. Martínez-Álvarez and J. Cugliari}, year = {2024}, date = {2024-02-04}, booktitle = {SAC 39th Annual ACM Symposium on Applied Computing}, pages = {386-394}, abstract = {Electricity consumption patterns are critical in shaping energy policies and optimizing resource allocation. In pursuing a more sustainable and efficient energy future, uncovering hidden consumption patterns is paramount. This paper introduces an innovative approach, leveraging evolutionary triclustering techniques, to unveil previously undisclosed electricity consumption patterns in France. By harnessing the power of triclustering algorithms, this research provides a comprehensive analysis of electricity usage across various dimensions, shedding light on intricate relationships among variables. Using this novel method, the study reveals concealed patterns and offers insights that can inform decision-makers and stakeholders in the energy sector. The findings contribute to a better understanding of electricity consumption dynamics, aiding in developing more targeted and effective energy management strategies. This research represents a significant step forward in the quest for sustainable energy solutions and underscores the potential of evolutionary triclustering as a valuable tool in uncovering complex consumption patterns.}, keywords = {clustering, energy, time series}, pubstate = {published}, tppubtype = {conference} } Electricity consumption patterns are critical in shaping energy policies and optimizing resource allocation. In pursuing a more sustainable and efficient energy future, uncovering hidden consumption patterns is paramount. This paper introduces an innovative approach, leveraging evolutionary triclustering techniques, to unveil previously undisclosed electricity consumption patterns in France. By harnessing the power of triclustering algorithms, this research provides a comprehensive analysis of electricity usage across various dimensions, shedding light on intricate relationships among variables. Using this novel method, the study reveals concealed patterns and offers insights that can inform decision-makers and stakeholders in the energy sector. The findings contribute to a better understanding of electricity consumption dynamics, aiding in developing more targeted and effective energy management strategies. This research represents a significant step forward in the quest for sustainable energy solutions and underscores the potential of evolutionary triclustering as a valuable tool in uncovering complex consumption patterns. |
R. Pérez-Chacón and G. Asencio-Cortés and A. Troncoso and F. Martínez-Álvarez Pattern sequence-based algorithm for multivariate big data time series forecasting: Application to electricity consumption (Journal Article) Future Generation Computer Systems, 154 , pp. 397-412, 2024. (Abstract | Links | BibTeX | Tags: big data, energy, forecasting, time series) @article{PEREZ24, title = {Pattern sequence-based algorithm for multivariate big data time series forecasting: Application to electricity consumption}, author = {R. Pérez-Chacón and G. Asencio-Cortés and A. Troncoso and F. Martínez-Álvarez}, url = {https://www.sciencedirect.com/science/article/pii/S0167739X23004752}, doi = {https://doi.org/10.1016/j.future.2023.12.021}, year = {2024}, date = {2024-01-29}, journal = {Future Generation Computer Systems}, volume = {154}, pages = {397-412}, abstract = {Several interrelated variables typically characterize real-world processes, and a time series cannot be predicted without considering the influence that other time series might have on the target time series. This work proposes a novel algorithm to forecast multivariate big data time series. This new general-purpose approach consists first of a previous pattern recognition performed jointly using all time series that form the multivariate time series and then predicts the target time series by searching for similarities between pattern sequences. The proposed algorithm is designed to tackle multivariate time series forecasting problems within the context of big data. In particular, the algorithm has been developed with a distributed nature to enhance its efficiency in analyzing and processing large volumes of data. Moreover, the algorithm is straightforward to use, with only two parameters needing adjustment. Another advantage of the MV-bigPSF algorithm is its ability to perform multi-step forecasting, which is particularly useful in many practical applications. To evaluate the algorithm’s performance, real-world data from Uruguay’s power consumption has been utilized. Specifically, MV-bigPSF has been compared with both univariate and multivariate methods. Regarding the univariate ones, MV-bigPSF improved 12.8% in MAPE compared to the second-best method. Regarding the multivariate comparison, MV-bigPSF improved 44.8% in MAPE with respect to the second most accurate method. Regarding efficiency, the execution time of MV-bigPSF was 1.83 times faster than the second-fastest multivariate method, both in a single-core environment. Therefore, the proposed algorithm can be a valuable tool for practitioners and researchers working in multivariate time series forecasting, particularly in big data applications.}, keywords = {big data, energy, forecasting, time series}, pubstate = {published}, tppubtype = {article} } Several interrelated variables typically characterize real-world processes, and a time series cannot be predicted without considering the influence that other time series might have on the target time series. This work proposes a novel algorithm to forecast multivariate big data time series. This new general-purpose approach consists first of a previous pattern recognition performed jointly using all time series that form the multivariate time series and then predicts the target time series by searching for similarities between pattern sequences. The proposed algorithm is designed to tackle multivariate time series forecasting problems within the context of big data. In particular, the algorithm has been developed with a distributed nature to enhance its efficiency in analyzing and processing large volumes of data. Moreover, the algorithm is straightforward to use, with only two parameters needing adjustment. Another advantage of the MV-bigPSF algorithm is its ability to perform multi-step forecasting, which is particularly useful in many practical applications. To evaluate the algorithm’s performance, real-world data from Uruguay’s power consumption has been utilized. Specifically, MV-bigPSF has been compared with both univariate and multivariate methods. Regarding the univariate ones, MV-bigPSF improved 12.8% in MAPE compared to the second-best method. Regarding the multivariate comparison, MV-bigPSF improved 44.8% in MAPE with respect to the second most accurate method. Regarding efficiency, the execution time of MV-bigPSF was 1.83 times faster than the second-fastest multivariate method, both in a single-core environment. Therefore, the proposed algorithm can be a valuable tool for practitioners and researchers working in multivariate time series forecasting, particularly in big data applications. |
C. G. García-Soto and J. F. Torres and M. A. Zamora-Izquierdo and J. Palma and A. Troncoso Water consumption time series forecasting in urban centers using deep neural networks (Journal Article) Applied Water Science, 14 , pp. 1-14, 2024. (Abstract | Links | BibTeX | Tags: deep learning, forecasting, time series) @article{GARCIA-SOTO24, title = {Water consumption time series forecasting in urban centers using deep neural networks}, author = {C. G. García-Soto and J. F. Torres and M. A. Zamora-Izquierdo and J. Palma and A. Troncoso}, url = {https://link.springer.com/article/10.1007/s13201-023-02072-4}, doi = {https://doi.org/10.1007/s13201-023-02072-4}, year = {2024}, date = {2024-01-12}, journal = {Applied Water Science}, volume = {14}, pages = {1-14}, abstract = {The time series analysis and prediction techniques are highly valued in many application felds, such as economy, medicine and biology, environmental sciences or meteorology, among others. In the last years, there is a growing interest in the sustainable and optimal management of a resource as scarce as essential: the water. Forecasting techniques for water management can be used for diferent time horizons from the planning of constructions that can respond to long-term needs, to the detection of anomalies in the operation of facilities or the optimization of the operation in the short and medium term. In this paper, a deep neural network is specifcally designed to predict water consumption in the short-term. Results are reported using the time series of water consumption for a year and a half measured with 10-min frequency in the city of Murcia, the seventh largest city in Spain by number of inhabitants. The results are compared with K Nearest Neighbors, Random Forest, Extreme Gradient Boosting, Seasonal Autoregressive Integrated Moving Average and two persistence models as naive methods, showing the proposed deep learning model the most accurate results.}, keywords = {deep learning, forecasting, time series}, pubstate = {published}, tppubtype = {article} } The time series analysis and prediction techniques are highly valued in many application felds, such as economy, medicine and biology, environmental sciences or meteorology, among others. In the last years, there is a growing interest in the sustainable and optimal management of a resource as scarce as essential: the water. Forecasting techniques for water management can be used for diferent time horizons from the planning of constructions that can respond to long-term needs, to the detection of anomalies in the operation of facilities or the optimization of the operation in the short and medium term. In this paper, a deep neural network is specifcally designed to predict water consumption in the short-term. Results are reported using the time series of water consumption for a year and a half measured with 10-min frequency in the city of Murcia, the seventh largest city in Spain by number of inhabitants. The results are compared with K Nearest Neighbors, Random Forest, Extreme Gradient Boosting, Seasonal Autoregressive Integrated Moving Average and two persistence models as naive methods, showing the proposed deep learning model the most accurate results. |
F. Martínez-Álvarez and R. Scitovski and C. Rubio-Escudero and A. Morales-Esteban Emerging trends in big data analytics and natural disasters (Editorial) (Journal Article) Computers and Geosciences, 182 , pp. 105465, 2024. (Links | BibTeX | Tags: big data, natural disasters, time series) @article{MARTINEZ24, title = {Emerging trends in big data analytics and natural disasters (Editorial)}, author = {F. Martínez-Álvarez and R. Scitovski and C. Rubio-Escudero and A. Morales-Esteban}, url = {https://www.sciencedirect.com/science/article/pii/S0098300423001693}, doi = {https://doi.org/10.1016/j.cageo.2023.105465}, year = {2024}, date = {2024-01-01}, journal = {Computers and Geosciences}, volume = {182}, pages = {105465}, keywords = {big data, natural disasters, time series}, pubstate = {published}, tppubtype = {article} } |
2023 |
D. Hadjout and A. Sebaa and J. F. Torres and F. Mártinez-Álvarez Electricity consumption forecasting with outliers handling based on clustering and deep learning with application to the Algerian market (Journal Article) Expert Systems with Applications, 227 , pp. 120123, 2023. (Abstract | Links | BibTeX | Tags: clustering, deep learning, energy, time series) @article{HADJOUT23, title = {Electricity consumption forecasting with outliers handling based on clustering and deep learning with application to the Algerian market}, author = {D. Hadjout and A. Sebaa and J. F. Torres and F. Mártinez-Álvarez}, url = {https://www.sciencedirect.com/science/article/abs/pii/S0957417423006255}, doi = {https://doi.org/10.1016/j.eswa.2023.120123}, year = {2023}, date = {2023-10-01}, journal = {Expert Systems with Applications}, volume = {227}, pages = {120123}, abstract = {The reduction of electricity loss and the effective management of electricity demand are vital operations for production and distribution electricity enterprises. To achieve these goals, accurate forecasts of aggregate and individual electricity consumers are necessary. A novel multistep forecasting method is developed to forecast medium-term electricity consumption of the Algerian economic sector. The proposed method goes through the following three steps: cleaning steps, clustering steps and forecasting step of each cluster. The aim of the first step is to detect and then replace outliers. To complete the first phase, Robust Exponential and Holt-Winters Smoothing algorithms are adapted. Then, to carry out accurate forecasting at a lowest level, K-Shape and K-Means clustering methods are utilized to extract similarities and identify customer consumption patterns as a second step. The third step entails developing a deep learning model based on Gated Recurrent Units to forecast the electricity consumption in each cluster. To validate the proposed method, we compared our results to the most known methods in literature like Autoregressive Integrated Moving Average, Seasonal Grey Model, LSTM networks, Temporal Convolutional Networks and two ensemble models. The results of several experiments conducted with 2000 electricity consumers during 14 years from an Algeria province (Bejaia) demonstrate that the proposed method provides remarkable prediction performances. Thus, prediction performances of the K-Shape-based clustering method reach much higher prediction accuracy. According to the MAPE metric, the results of the best predictions are equal to 2.04%. It is also notable that 87% of the clients have a considerably low prediction error.}, keywords = {clustering, deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } The reduction of electricity loss and the effective management of electricity demand are vital operations for production and distribution electricity enterprises. To achieve these goals, accurate forecasts of aggregate and individual electricity consumers are necessary. A novel multistep forecasting method is developed to forecast medium-term electricity consumption of the Algerian economic sector. The proposed method goes through the following three steps: cleaning steps, clustering steps and forecasting step of each cluster. The aim of the first step is to detect and then replace outliers. To complete the first phase, Robust Exponential and Holt-Winters Smoothing algorithms are adapted. Then, to carry out accurate forecasting at a lowest level, K-Shape and K-Means clustering methods are utilized to extract similarities and identify customer consumption patterns as a second step. The third step entails developing a deep learning model based on Gated Recurrent Units to forecast the electricity consumption in each cluster. To validate the proposed method, we compared our results to the most known methods in literature like Autoregressive Integrated Moving Average, Seasonal Grey Model, LSTM networks, Temporal Convolutional Networks and two ensemble models. The results of several experiments conducted with 2000 electricity consumers during 14 years from an Algeria province (Bejaia) demonstrate that the proposed method provides remarkable prediction performances. Thus, prediction performances of the K-Shape-based clustering method reach much higher prediction accuracy. According to the MAPE metric, the results of the best predictions are equal to 2.04%. It is also notable that 87% of the clients have a considerably low prediction error. |
J. F. Torres and S. Valencia and F. Martínez-Álvarez and N. Hoyos Predicting Wildfires in the Caribbean Using Multi-source Satellite Data and Deep Learning (Conference) IWANN 17th International Work-Conference on Artificial Neural Networks, 14135 , Lecture Notes in Computer Science 2023. (Links | BibTeX | Tags: deep learning, natural disasters, time series) @conference{TORRES23_IWANN, title = {Predicting Wildfires in the Caribbean Using Multi-source Satellite Data and Deep Learning}, author = {J. F. Torres and S. Valencia and F. Martínez-Álvarez and N. Hoyos}, url = {https://link.springer.com/chapter/10.1007/978-3-031-43078-7_1}, doi = {https://doi.org/10.1007/978-3-031-43078-7_1}, year = {2023}, date = {2023-09-30}, booktitle = {IWANN 17th International Work-Conference on Artificial Neural Networks}, volume = {14135}, pages = {3-14}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, natural disasters, time series}, pubstate = {published}, tppubtype = {conference} } |
A. R. Troncoso-García and M. Martínez-Ballesteros and F. Martínez-Álvarez and A. Troncoso Deep Learning-Based Approach for Sleep Apnea Detection Using Physiological Signals (Conference) IWANN 17th International Work-Conference on Artificial Neural Networks, 14134 , Lecture Notes in Computer Science 2023. (Links | BibTeX | Tags: deep learning, forecasting, time series) @conference{TRONCOSO-GARCIA23_IWANN, title = {Deep Learning-Based Approach for Sleep Apnea Detection Using Physiological Signals}, author = {A. R. Troncoso-García and M. Martínez-Ballesteros and F. Martínez-Álvarez and A. Troncoso}, url = {https://link.springer.com/chapter/10.1007/978-3-030-20521-8_22}, doi = {https://doi.org/10.1007/978-3-030-20521-8_22}, year = {2023}, date = {2023-09-30}, booktitle = {IWANN 17th International Work-Conference on Artificial Neural Networks}, volume = {14134}, pages = {626–637}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, forecasting, time series}, pubstate = {published}, tppubtype = {conference} } |
M. J. Jiménez-Navarro and M. Martínez-Ballesteros and F. Martínez-Álvarez and G. Asencio-Cortés Embedded Temporal Feature Selection for Time Series Forecasting Using Deep Learning (Conference) IWANN 17th International Work-Conference on Artificial Neural Networks, 14135 , Lecture Notes in Computer Science 2023. (Links | BibTeX | Tags: deep learning, feature selection, time series) @conference{JIMENEZ-NAVARRO23_IWANN, title = {Embedded Temporal Feature Selection for Time Series Forecasting Using Deep Learning}, author = {M. J. Jiménez-Navarro and M. Martínez-Ballesteros and F. Martínez-Álvarez and G. Asencio-Cortés}, url = {https://link.springer.com/chapter/10.1007/978-3-031-43078-7_2}, doi = {https://doi.org/10.1007/978-3-031-43078-7_2}, year = {2023}, date = {2023-09-30}, booktitle = {IWANN 17th International Work-Conference on Artificial Neural Networks}, volume = {14135}, pages = {15-26}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, feature selection, time series}, pubstate = {published}, tppubtype = {conference} } |
A. Vellinger and J. F. Torres and F. Divina and W. Vanhoof Neuroevolutionary Transfer Learning for Time Series Forecasting (Conference) SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications, 749 , Lecture Notes in Networks and Systems 2023. (Links | BibTeX | Tags: deep learning, forecasting, time series, transfer learning) @conference{VELLINGER23, title = {Neuroevolutionary Transfer Learning for Time Series Forecasting}, author = {A. Vellinger and J. F. Torres and F. Divina and W. Vanhoof}, doi = {https://doi.org/10.1007/978-3-031-42529-5_21}, year = {2023}, date = {2023-08-31}, booktitle = {SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications}, volume = {749}, pages = {219-228}, series = {Lecture Notes in Networks and Systems}, keywords = {deep learning, forecasting, time series, transfer learning}, pubstate = {published}, tppubtype = {conference} } |
M. J. Jiménez-Navarro and M. Martínez-Ballesteros and F. Martínez-Álvarez and G. Asencio-Cortés A New Deep Learning Architecture with Inductive Bias Balance for Oil Temperature Forecasting (Journal Article) Journal of Big Data, 10 , pp. 80, 2023. (Abstract | Links | BibTeX | Tags: deep learning, time series) @article{JIMENEZ-NAVARRO23c, title = {A New Deep Learning Architecture with Inductive Bias Balance for Oil Temperature Forecasting}, author = {M. J. Jiménez-Navarro and M. Martínez-Ballesteros and F. Martínez-Álvarez and G. Asencio-Cortés}, url = {https://journalofbigdata.springeropen.com/articles/10.1186/s40537-023-00745-0}, doi = {https://doi.org/10.1186/s40537-023-00745-0}, year = {2023}, date = {2023-05-28}, journal = {Journal of Big Data}, volume = {10}, pages = {80}, abstract = {Ensuring the optimal performance of power transformers is a laborious task in which the insulation system plays a vital role in decreasing their deterioration. The insulation system uses insulating oil to control temperature, as high temperatures can reduce the lifetime of the transformers and lead to expensive maintenance. Deep learning architectures have been demonstrated remarkable results in various fields. However, this improvement often comes at the cost of increased computing resources, which, in turn, increases the carbon footprint and hinders the optimization of architectures. In this study, we introduce a novel deep learning architecture that achieves a comparable efficacy to the best existing architectures in transformer oil temperature forecasting while improving efficiency. Effective forecasting can help prevent high temperatures and monitor the future condition of power transformers, thereby reducing unnecessary waste. To balance the inductive bias in our architecture, we propose the Smooth Residual Block, which divides the original problem into multiple subproblems to obtain different representations of the time series, collaboratively achieving the final forecasting. We applied our architecture to the Electricity Transformer datasets, which obtain transformer insulating oil temperature measures from two transformers in China. The results showed a 13% improvement in MSE and a 57% improvement in performance compared to the best current architectures, to the best of our knowledge. Moreover, we analyzed the architecture behavior to gain an intuitive understanding of the achieved solution.}, keywords = {deep learning, time series}, pubstate = {published}, tppubtype = {article} } Ensuring the optimal performance of power transformers is a laborious task in which the insulation system plays a vital role in decreasing their deterioration. The insulation system uses insulating oil to control temperature, as high temperatures can reduce the lifetime of the transformers and lead to expensive maintenance. Deep learning architectures have been demonstrated remarkable results in various fields. However, this improvement often comes at the cost of increased computing resources, which, in turn, increases the carbon footprint and hinders the optimization of architectures. In this study, we introduce a novel deep learning architecture that achieves a comparable efficacy to the best existing architectures in transformer oil temperature forecasting while improving efficiency. Effective forecasting can help prevent high temperatures and monitor the future condition of power transformers, thereby reducing unnecessary waste. To balance the inductive bias in our architecture, we propose the Smooth Residual Block, which divides the original problem into multiple subproblems to obtain different representations of the time series, collaboratively achieving the final forecasting. We applied our architecture to the Electricity Transformer datasets, which obtain transformer insulating oil temperature measures from two transformers in China. The results showed a 13% improvement in MSE and a 57% improvement in performance compared to the best current architectures, to the best of our knowledge. Moreover, we analyzed the architecture behavior to gain an intuitive understanding of the achieved solution. |
M. J. Jiménez-Navarro and M. Martínez-Ballesteros and F. Martínez-Álvarez and G. Asencio-Cortés PHILNet: A Novel Efficient Approach for Time Series Forecasting using Deep Learning (Journal Article) Information Sciences, 632 , pp. 815-832, 2023. (Abstract | Links | BibTeX | Tags: deep learning, time series) @article{JIMENEZ-NAVARRO23b, title = {PHILNet: A Novel Efficient Approach for Time Series Forecasting using Deep Learning}, author = {M. J. Jiménez-Navarro and M. Martínez-Ballesteros and F. Martínez-Álvarez and G. Asencio-Cortés}, url = {https://doi.org/10.1016/j.ins.2023.03.021}, doi = {https://www.sciencedirect.com/science/article/pii/S0020025523003183?via%3Dihub}, year = {2023}, date = {2023-03-03}, journal = {Information Sciences}, volume = {632}, pages = {815-832}, abstract = {Time series is one of the most common data types in the industry nowadays. Forecasting the future of a time series behavior can be useful in planning ahead, saving time, resources, and helping avoid undesired scenarios. To make the forecasting, historical data is utilized due to the causal nature of the time series. Several deep learning algorithms have been presented in this area, where the input is processed through a series of non-linear functions to produce the output. We present a novel strategy to improve the performance of deep learning models in time series forecasting in terms of efficiency while reaching similar effectiveness. This approach separates the model into levels, starting with the easiest and continuing to the most difficult. The simpler levels deal with smoothed versions of the input, whereas the most sophisticated level deals with the raw data. This strategy seeks to mimic the human learning process, in which basic tasks are completed initially, followed by more precise and sophisticated ones. Our method achieved promising results, obtaining a 35% improvement in mean squared error and a 2.6 time decrease in training time compared with the best models found in a variety of time series.}, keywords = {deep learning, time series}, pubstate = {published}, tppubtype = {article} } Time series is one of the most common data types in the industry nowadays. Forecasting the future of a time series behavior can be useful in planning ahead, saving time, resources, and helping avoid undesired scenarios. To make the forecasting, historical data is utilized due to the causal nature of the time series. Several deep learning algorithms have been presented in this area, where the input is processed through a series of non-linear functions to produce the output. We present a novel strategy to improve the performance of deep learning models in time series forecasting in terms of efficiency while reaching similar effectiveness. This approach separates the model into levels, starting with the easiest and continuing to the most difficult. The simpler levels deal with smoothed versions of the input, whereas the most sophisticated level deals with the raw data. This strategy seeks to mimic the human learning process, in which basic tasks are completed initially, followed by more precise and sophisticated ones. Our method achieved promising results, obtaining a 35% improvement in mean squared error and a 2.6 time decrease in training time compared with the best models found in a variety of time series. |
D. Azzouguer and A. Sebaa and D. Hadjout and F. Martínez-Álvarez Fraud Detection of Electricity Consumption using Robust Exponential and Holt-Winters Smoothing method (Conference) IEEE International Conference on Advanced Systems and Emergent Technologies, 2023. (Abstract | Links | BibTeX | Tags: energy, time series) @conference{AZZOUGUER23, title = {Fraud Detection of Electricity Consumption using Robust Exponential and Holt-Winters Smoothing method}, author = {D. Azzouguer and A. Sebaa and D. Hadjout and F. Martínez-Álvarez}, url = {https://ieeexplore.ieee.org/document/10150645}, doi = {10.1109/IC_ASET58101.2023.10150645}, year = {2023}, date = {2023-02-20}, booktitle = {IEEE International Conference on Advanced Systems and Emergent Technologies}, abstract = {Non-technical losses (NTL), especially fraud detection is very important for electricity distribution enterprises. Fraud detection allows for maximizing the effective economic return for such enterprises. This paper provides an electricity fraud detection approach based on robust exponential and Holt-Winters Smoothing methods. The proposed approach is a procedure that aims to discover the fraudulent behavior of electricity consumers and goes through three crucial steps: (1) the prediction of monthly consumption, (2) the detection of abnormal consumption of electrical meters, and (3) the detection of fraud cases of economic customers. The proposed model was trained and evaluated. Its experimental validation is achieved by using a large dataset of real users from the Algerian economic sector with almost 2000 clients and 14 years of monthly electricity consumption. The proposed solution revealed good performance compared to the literature and the comparison with the models implemented in this article: SARIMA for prediction and two sigma for anomaly detection. The results show highly efficient and realistic countermeasures to fraud detection, which leads us to say that this method is robust and can enhance company profit.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {conference} } Non-technical losses (NTL), especially fraud detection is very important for electricity distribution enterprises. Fraud detection allows for maximizing the effective economic return for such enterprises. This paper provides an electricity fraud detection approach based on robust exponential and Holt-Winters Smoothing methods. The proposed approach is a procedure that aims to discover the fraudulent behavior of electricity consumers and goes through three crucial steps: (1) the prediction of monthly consumption, (2) the detection of abnormal consumption of electrical meters, and (3) the detection of fraud cases of economic customers. The proposed model was trained and evaluated. Its experimental validation is achieved by using a large dataset of real users from the Algerian economic sector with almost 2000 clients and 14 years of monthly electricity consumption. The proposed solution revealed good performance compared to the literature and the comparison with the models implemented in this article: SARIMA for prediction and two sigma for anomaly detection. The results show highly efficient and realistic countermeasures to fraud detection, which leads us to say that this method is robust and can enhance company profit. |
E. T. Habtemariam and K. Kekeba and M. Martínez-Ballesteros and F. Mártinez-Álvarez A Bayesian Optimization-Based LSTM Model for Wind Power Forecasting in the Adama District, Ethiopia (Journal Article) Energies, 16 , pp. 2317, 2023. (Abstract | Links | BibTeX | Tags: deep learning, time series) @article{EJIGU23, title = {A Bayesian Optimization-Based LSTM Model for Wind Power Forecasting in the Adama District, Ethiopia}, author = {E. T. Habtemariam and K. Kekeba and M. Martínez-Ballesteros and F. Mártinez-Álvarez}, url = {https://www.mdpi.com/1996-1073/16/5/2317}, doi = {https://doi.org/10.3390/en16052317}, year = {2023}, date = {2023-02-19}, journal = {Energies}, volume = {16}, pages = {2317}, abstract = {Renewable energies such as solar and wind power have become promising sources of energy to address the increase in greenhouse gases caused by the use of fossil fuels and to resolve current energy crises. Integrating wind energy into a large-scale electric grid presents a significant challenge due to the high intermittency and nonlinear behavior of wind power. Accurate wind power forecasting is essential for safe and efficient integration into the grid system. Many prediction models have been developed to predict the uncertain and nonlinear time series of wind power, but most neglect the use of Bayesian optimization to optimize the hyperparameters while training deep learning algorithms. The efficiency of grid search strategies decreases as the number of hyperparameters increases, and computation time complexity becomes an issue. This paper presents a robust and optimized Long-Short Term Memory network for forecasting wind power generation in the day ahead in the context of Ethiopia's renewable energy sector. The proposal uses Bayesian optimization to find the best hyperparameter combination in a reasonable computation time. The results indicate that tuning hyperparameters using this metaheuristic prior to building deep learning models significantly improves the predictive performance of the models. The proposed models were evaluated using MAE, RMSE, and MAPE metrics and outperformed both the baseline models and the optimized Gated Recurrent Unit architecture.}, keywords = {deep learning, time series}, pubstate = {published}, tppubtype = {article} } Renewable energies such as solar and wind power have become promising sources of energy to address the increase in greenhouse gases caused by the use of fossil fuels and to resolve current energy crises. Integrating wind energy into a large-scale electric grid presents a significant challenge due to the high intermittency and nonlinear behavior of wind power. Accurate wind power forecasting is essential for safe and efficient integration into the grid system. Many prediction models have been developed to predict the uncertain and nonlinear time series of wind power, but most neglect the use of Bayesian optimization to optimize the hyperparameters while training deep learning algorithms. The efficiency of grid search strategies decreases as the number of hyperparameters increases, and computation time complexity becomes an issue. This paper presents a robust and optimized Long-Short Term Memory network for forecasting wind power generation in the day ahead in the context of Ethiopia's renewable energy sector. The proposal uses Bayesian optimization to find the best hyperparameter combination in a reasonable computation time. The results indicate that tuning hyperparameters using this metaheuristic prior to building deep learning models significantly improves the predictive performance of the models. The proposed models were evaluated using MAE, RMSE, and MAPE metrics and outperformed both the baseline models and the optimized Gated Recurrent Unit architecture. |
A. R. Troncoso-García and M. Martínez-Ballesteros and F. Mártinez-Álvarez and A. Troncoso A new approach based on association rules to add explainability to time series forecasting models (Journal Article) Information Fusion, 94 , pp. 169-180, 2023. (Abstract | Links | BibTeX | Tags: association rules, time series, XAI) @article{TRONCOSO-GARCIA23, title = {A new approach based on association rules to add explainability to time series forecasting models}, author = {A. R. Troncoso-García and M. Martínez-Ballesteros and F. Mártinez-Álvarez and A. Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S1566253523000295}, doi = {10.1016/j.inffus.2023.01.021}, year = {2023}, date = {2023-01-22}, journal = {Information Fusion}, volume = {94}, pages = {169-180}, abstract = {Machine learning and deep learning have become the most useful and powerful tools in the last years to mine information from large datasets. Despite the successful application to many research fields, it is widely known that some of these solutions based on artificial intelligence are considered black-box models, meaning that most experts find difficult to explain and interpret the models and why they generate such outputs. In this context, explainable artificial intelligence is emerging with the aim of providing black-box models with sufficient interpretability. Thus, models could be easily understood and further applied. This work proposes a novel method to explain black-box models, by using numeric association rules to explain and interpret multi-step time series forecasting models. Thus, a multi-objective algorithm is used to discover quantitative association rules from the target model. Then, visual explanation techniques are applied to make the rules more interpretable. Data from Spanish electricity energy consumption has been used to assess the suitability of the proposal.}, keywords = {association rules, time series, XAI}, pubstate = {published}, tppubtype = {article} } Machine learning and deep learning have become the most useful and powerful tools in the last years to mine information from large datasets. Despite the successful application to many research fields, it is widely known that some of these solutions based on artificial intelligence are considered black-box models, meaning that most experts find difficult to explain and interpret the models and why they generate such outputs. In this context, explainable artificial intelligence is emerging with the aim of providing black-box models with sufficient interpretability. Thus, models could be easily understood and further applied. This work proposes a novel method to explain black-box models, by using numeric association rules to explain and interpret multi-step time series forecasting models. Thus, a multi-objective algorithm is used to discover quantitative association rules from the target model. Then, visual explanation techniques are applied to make the rules more interpretable. Data from Spanish electricity energy consumption has been used to assess the suitability of the proposal. |
M. J. Jiménez-Navarro and M. Martínez-Ballesteros and F. Mártinez-Álvarez and A. Troncoso and G. Asencio-Cortés From Simple to Complex: A Sequential Method for Enhancing Time Series Forecasting with Deep Learning (Journal Article) Logic Journal of the IGPL, in press , 2023. (Abstract | BibTeX | Tags: deep learning, time series) @article{JIMENEZ-NAVARRO23a, title = {From Simple to Complex: A Sequential Method for Enhancing Time Series Forecasting with Deep Learning}, author = {M. J. Jiménez-Navarro and M. Martínez-Ballesteros and F. Mártinez-Álvarez and A. Troncoso and G. Asencio-Cortés}, year = {2023}, date = {2023-01-20}, journal = {Logic Journal of the IGPL}, volume = {in press}, abstract = {Time series forecasting is a well-known deep learning application field in which previous data are used to predict the future behavior of the series. Recently, several deep learning approaches have been proposed in which several nonlinear functions are applied to the input to obtain the output. In this paper, we introduce a novel method to improve the performance of deep learning models in time series forecasting. This method divides the model into hierarchies or levels from simpler to more complex ones. Simpler levels handle smoothed versions of the input, whereas the most complex level processes the original time series. This method follows the human learning process where general/simpler tasks are performed first, and afterward, more precise/harder ones are accomplished.Our proposed methodology has been applied to the LSTM architecture, showing remarkable performance in various time series. In addition, a comparison is reported including a standard LSTM and novel methods such as DeepAR, Temporal Fusion Transformer (TFT), NBEATS and Echo State Network (ESN).}, keywords = {deep learning, time series}, pubstate = {published}, tppubtype = {article} } Time series forecasting is a well-known deep learning application field in which previous data are used to predict the future behavior of the series. Recently, several deep learning approaches have been proposed in which several nonlinear functions are applied to the input to obtain the output. In this paper, we introduce a novel method to improve the performance of deep learning models in time series forecasting. This method divides the model into hierarchies or levels from simpler to more complex ones. Simpler levels handle smoothed versions of the input, whereas the most complex level processes the original time series. This method follows the human learning process where general/simpler tasks are performed first, and afterward, more precise/harder ones are accomplished.Our proposed methodology has been applied to the LSTM architecture, showing remarkable performance in various time series. In addition, a comparison is reported including a standard LSTM and novel methods such as DeepAR, Temporal Fusion Transformer (TFT), NBEATS and Echo State Network (ESN). |
P. Jiménez-Herrera and L. Melgar-García and G. Asencio-Cortés and A. Troncoso Streaming big time series forecasting based on nearest similar patterns with application to energy consumption (Journal Article) Logic Journal of the IGPL, 31 (2), pp. 255-270, 2023. (Abstract | Links | BibTeX | Tags: energy, IoT, time series) @article{jimenez2023, title = {Streaming big time series forecasting based on nearest similar patterns with application to energy consumption}, author = {P. Jiménez-Herrera and L. Melgar-García and G. Asencio-Cortés and A. Troncoso}, url = {https://academic.oup.com/jigpal/advance-article-abstract/doi/10.1093/jigpal/jzac017/6534493?redirectedFrom=fulltext}, doi = {https://doi.org/10.1093/jigpal/jzac017}, year = {2023}, date = {2023-01-01}, journal = {Logic Journal of the IGPL}, volume = {31}, number = {2}, pages = {255-270}, abstract = {This work presents a novel approach to forecast streaming big time series based on nearest similar patterns. This approach combines a clustering algorithm with a classifier and the nearest neighbors algorithm. It presents two separate stages: offline and online. The offline phase is for training and finding the best models for clustering, classification and the nearest neighbors algorithm. The online phase is to predict big time series in real time. In the offline phase, data are divided into clusters and a forecasting model based on the nearest neighbors is trained for each cluster. In addition, a classifier is trained using the cluster assignments previously generated by the clustering algorithm. In the online phase, the classifier predicts the cluster label of an instance, and the proper nearest neighbors model according to the predicted cluster label is applied to obtain the final prediction using the similar patterns. The algorithm is able to be updated incrementally for online learning from data streams. Results are reported using electricity consumption with a granularity of 10 minutes for 4-hour-ahead forecasting and compared with well-known online benchmark learners, showing a remarkable improvement in prediction accuracy.}, keywords = {energy, IoT, time series}, pubstate = {published}, tppubtype = {article} } This work presents a novel approach to forecast streaming big time series based on nearest similar patterns. This approach combines a clustering algorithm with a classifier and the nearest neighbors algorithm. It presents two separate stages: offline and online. The offline phase is for training and finding the best models for clustering, classification and the nearest neighbors algorithm. The online phase is to predict big time series in real time. In the offline phase, data are divided into clusters and a forecasting model based on the nearest neighbors is trained for each cluster. In addition, a classifier is trained using the cluster assignments previously generated by the clustering algorithm. In the online phase, the classifier predicts the cluster label of an instance, and the proper nearest neighbors model according to the predicted cluster label is applied to obtain the final prediction using the similar patterns. The algorithm is able to be updated incrementally for online learning from data streams. Results are reported using electricity consumption with a granularity of 10 minutes for 4-hour-ahead forecasting and compared with well-known online benchmark learners, showing a remarkable improvement in prediction accuracy. |
L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A.Troncoso Identifying novelties and anomalies for incremental learning in streaming time series forecasting (Journal Article) Engineering Applications of Artificial Intelligence, 123 , pp. 106326, 2023. (Links | BibTeX | Tags: energy, IoT, time series) @article{Melgar2023b, title = {Identifying novelties and anomalies for incremental learning in streaming time series forecasting}, author = {L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A.Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S0952197623005109}, doi = {https://doi.org/10.1016/j.engappai.2023.106326}, year = {2023}, date = {2023-01-01}, journal = {Engineering Applications of Artificial Intelligence}, volume = {123}, pages = {106326}, keywords = {energy, IoT, time series}, pubstate = {published}, tppubtype = {article} } |
L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso A novel distributed forecasting method based on information fusion and incremental learning for streaming time series (Journal Article) Information Fusion, 95 , pp. 163-173, 2023. (Links | BibTeX | Tags: energy, IoT, time series) @article{Melgar2023a, title = {A novel distributed forecasting method based on information fusion and incremental learning for streaming time series}, author = {L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S1566253523000635}, doi = {https://doi.org/10.1016/j.inffus.2023.02.023}, year = {2023}, date = {2023-01-01}, journal = {Information Fusion}, volume = {95}, pages = {163-173}, keywords = {energy, IoT, time series}, pubstate = {published}, tppubtype = {article} } |
A. R. Troncoso-García and m. Martínez-Ballesteros and F. Martínez-Álvarez and A. Troncoso Evolutionary computation to explain deep learning models for time series forecasting (Conference) SAC 38th Annual ACM Symposium on Applied Computing, 2023. (Links | BibTeX | Tags: deep learning, time series, XAI) @conference{SAC2023, title = {Evolutionary computation to explain deep learning models for time series forecasting}, author = {A. R. Troncoso-García and m. Martínez-Ballesteros and F. Martínez-Álvarez and A. Troncoso}, url = {https://dl.acm.org/doi/abs/10.1145/3555776.3578994}, year = {2023}, date = {2023-01-01}, booktitle = {SAC 38th Annual ACM Symposium on Applied Computing}, keywords = {deep learning, time series, XAI}, pubstate = {published}, tppubtype = {conference} } |
A. R. Troncoso-García and M. Martínez-Ballesteros and F. Martínez-Álvarez and A. Troncoso Deep Learning-Based Approach for Sleep Apnea Detection Using Physiological Signals (Conference) IWANN International Work-conference on Artificial Intelligence, Lecture Notes in Computer Science 2023. (BibTeX | Tags: deep learning, feature selection, time series) @conference{IWANN2023, title = {Deep Learning-Based Approach for Sleep Apnea Detection Using Physiological Signals}, author = {A. R. Troncoso-García and M. Martínez-Ballesteros and F. Martínez-Álvarez and A. Troncoso}, year = {2023}, date = {2023-01-01}, booktitle = {IWANN International Work-conference on Artificial Intelligence}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, feature selection, time series}, pubstate = {published}, tppubtype = {conference} } |
M. J. Jiménez-Navarro and M. Martínez-Ballesteros and I. S. Brito and F. Martínez-Álvarez and G. Asencio-Cortés A bioinspired ensemble approach for multi-horizon reference evapotranspiration forecasting in Portugal (Conference) SAC 38th Annual ACM Symposium on Applied Computing, 2023. (Abstract | Links | BibTeX | Tags: deep learning, precision agriculture, time series) @conference{EVAPOCVOA23, title = {A bioinspired ensemble approach for multi-horizon reference evapotranspiration forecasting in Portugal}, author = {M. J. Jiménez-Navarro and M. Martínez-Ballesteros and I. S. Brito and F. Martínez-Álvarez and G. Asencio-Cortés}, url = {https://dl.acm.org/doi/abs/10.1145/3555776.3578634}, doi = {https://doi.org/10.1145/3555776.3578634}, year = {2023}, date = {2023-01-01}, booktitle = {SAC 38th Annual ACM Symposium on Applied Computing}, pages = {441-448}, abstract = {The year 2022 was the driest year in Portugal since 1931 with 97% of territory in severe drought. Water is especially important for the agricultural sector in Portugal, as it represents 78% total consumption according to the Water Footprint report published in 2010. Reference evapotranspiration is essential due to its importance in optimal irrigation planning that reduces water consumption. This study analyzes and proposes a framework to forecast daily reference evapotranspiration at eight stations in Portugal from 2012 to 2022 without relying on public meteorological forecasts. The data include meteorological data obtained from sensors included in the stations. The goal is to perform a multi-horizon forecasting of reference evapotranspiration using the multiple related covariates. The framework combines the data processing and the analysis of several state-of-the-art forecasting methods including classical, linear, tree-based, artificial neural network and ensembles. Then, an ensemble of all trained models is proposed using a recent bioinspired metaheuristic named Coronavirus Optimization Algorithm to weight the predictions. The results in terms of MAE and MSE are reported, indicating that our approach achieved a MAE of 0.658.}, keywords = {deep learning, precision agriculture, time series}, pubstate = {published}, tppubtype = {conference} } The year 2022 was the driest year in Portugal since 1931 with 97% of territory in severe drought. Water is especially important for the agricultural sector in Portugal, as it represents 78% total consumption according to the Water Footprint report published in 2010. Reference evapotranspiration is essential due to its importance in optimal irrigation planning that reduces water consumption. This study analyzes and proposes a framework to forecast daily reference evapotranspiration at eight stations in Portugal from 2012 to 2022 without relying on public meteorological forecasts. The data include meteorological data obtained from sensors included in the stations. The goal is to perform a multi-horizon forecasting of reference evapotranspiration using the multiple related covariates. The framework combines the data processing and the analysis of several state-of-the-art forecasting methods including classical, linear, tree-based, artificial neural network and ensembles. Then, an ensemble of all trained models is proposed using a recent bioinspired metaheuristic named Coronavirus Optimization Algorithm to weight the predictions. The results in terms of MAE and MSE are reported, indicating that our approach achieved a MAE of 0.658. |
L. Melgar-García, M. Hosseini and A. Troncoso Identification of anomalies in urban sound data with Autoencoders (Conference) HAIS 18th International Conference on Hybrid Artificial Intelligence Systems, Lecture Notes in Computer Science 2023. (BibTeX | Tags: deep learning, IoT, time series) @conference{HAIS23_Laura, title = {Identification of anomalies in urban sound data with Autoencoders}, author = {L. Melgar-García, M. Hosseini and A. Troncoso}, year = {2023}, date = {2023-01-01}, booktitle = {HAIS 18th International Conference on Hybrid Artificial Intelligence Systems}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, IoT, time series}, pubstate = {published}, tppubtype = {conference} } |
E. Tefera and A. Troncoso and M. Martínez Ballesteros and F. Martínez-Álvarez A New Hybrid CNN-LSTM for Wind Power Forecasting in Ethiopia (Conference) HAIS 18th International Conference on Hybrid Artificial Intelligence Systems, Lecture Notes in Computer Science 2023. (BibTeX | Tags: deep learning, energy, time series) @conference{HAIS23_Ejigu, title = {A New Hybrid CNN-LSTM for Wind Power Forecasting in Ethiopia}, author = {E. Tefera and A. Troncoso and M. Martínez Ballesteros and F. Martínez-Álvarez}, year = {2023}, date = {2023-01-01}, booktitle = {HAIS 18th International Conference on Hybrid Artificial Intelligence Systems}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
P. Casas-Gómez and F. Martínez-Álvarez and A. Troncoso and J. C. Linares-Calderón Machine Learning Approaches for Predicting Tree Growth Trends based on Basal Area Increment (Conference) SOCO 18th International Conference on Soft Computing Models in Industrial and Environmental Applications, Lecture Notes in Networks and Systems 2023. (BibTeX | Tags: time series) @conference{SOCO22_Pablo, title = {Machine Learning Approaches for Predicting Tree Growth Trends based on Basal Area Increment}, author = {P. Casas-Gómez and F. Martínez-Álvarez and A. Troncoso and J. C. Linares-Calderón}, year = {2023}, date = {2023-01-01}, booktitle = {SOCO 18th International Conference on Soft Computing Models in Industrial and Environmental Applications}, series = {Lecture Notes in Networks and Systems}, keywords = {time series}, pubstate = {published}, tppubtype = {conference} } |
2022 |
M. Á. Molina and M. J. Jiménez-Navarro and R. Arjona and F. Mártinez-Álvarez and G. Asencio-Cortés DIAFAN-TL: An instance weighting-based transfer learning algorithm with application to phenology forecasting (Journal Article) Knowledge-Based Systems, 254 , pp. 109644, 2022. (Abstract | Links | BibTeX | Tags: time series, transfer learning) @article{MOLINA22, title = {DIAFAN-TL: An instance weighting-based transfer learning algorithm with application to phenology forecasting}, author = {M. Á. Molina and M. J. Jiménez-Navarro and R. Arjona and F. Mártinez-Álvarez and G. Asencio-Cortés}, url = {https://www.sciencedirect.com/science/article/pii/S0950705122008322}, doi = {https://doi.org/10.1016/j.knosys.2022.109644}, year = {2022}, date = {2022-10-22}, journal = {Knowledge-Based Systems}, volume = {254}, pages = {109644}, abstract = {The agricultural sector has been, and still is, the most important economic sector in many countries. Due to advances in technology, the amount and variety of available data have been increasing over the years. However, compared to other economic sectors, there is not always enough quality data for one particular domain (crops, plantations, plots) to obtain acceptable forecasting results with machine learning algorithms. In this context, transfer learning can help extract knowledge from different but related domains with enough data to transfer it to a target domain with scarce data. This process can overcome forecasting accuracy compared to training models uniquely with data from the target domain. In this work, a novel instance weighting-based transfer learning algorithm is proposed and applied to the phenology forecasting problem. A new metric named DIAFAN is proposed to weight samples from different source domains according to their relationship with the target domain, promoting the diversity of the information and avoiding inconsistent samples. Additionally, a set of validation schemes is specifically designed to ensure fair comparisons in terms of data volume with other benchmark transfer learning algorithms. The proposed algorithm, DIAFAN-TL, is tested with a proposed dataset of 16 plots of olive groves from different places, including information fusion from satellite images, meteorological stations and human field sampling of crop phenology. DIAFAN-TL achieves a remarkable improvement with respect to 15 other well-known transfer learning algorithms and three nontransfer learning scenarios. Finally, several performance analyses according to the different phenological states, prediction horizons and source domains are also performed.}, keywords = {time series, transfer learning}, pubstate = {published}, tppubtype = {article} } The agricultural sector has been, and still is, the most important economic sector in many countries. Due to advances in technology, the amount and variety of available data have been increasing over the years. However, compared to other economic sectors, there is not always enough quality data for one particular domain (crops, plantations, plots) to obtain acceptable forecasting results with machine learning algorithms. In this context, transfer learning can help extract knowledge from different but related domains with enough data to transfer it to a target domain with scarce data. This process can overcome forecasting accuracy compared to training models uniquely with data from the target domain. In this work, a novel instance weighting-based transfer learning algorithm is proposed and applied to the phenology forecasting problem. A new metric named DIAFAN is proposed to weight samples from different source domains according to their relationship with the target domain, promoting the diversity of the information and avoiding inconsistent samples. Additionally, a set of validation schemes is specifically designed to ensure fair comparisons in terms of data volume with other benchmark transfer learning algorithms. The proposed algorithm, DIAFAN-TL, is tested with a proposed dataset of 16 plots of olive groves from different places, including information fusion from satellite images, meteorological stations and human field sampling of crop phenology. DIAFAN-TL achieves a remarkable improvement with respect to 15 other well-known transfer learning algorithms and three nontransfer learning scenarios. Finally, several performance analyses according to the different phenological states, prediction horizons and source domains are also performed. |
A. M. Chacón-Maldonado and M. A. Molina and A. Troncoso and F. Martínez-Álvarez and G. Asencio-Cortés Olive Phenology Forecasting Using Information Fusion-Based Imbalanced Preprocessing and Automated Deep Learning (Conference) HAIS 17th International Conference on Hybrid Artificial Intelligence Systems, Lecture Notes in Computer Science 2022. (Links | BibTeX | Tags: deep learning, pattern recognition, time series) @conference{HAIS22_Andres, title = {Olive Phenology Forecasting Using Information Fusion-Based Imbalanced Preprocessing and Automated Deep Learning}, author = {A. M. Chacón-Maldonado and M. A. Molina and A. Troncoso and F. Martínez-Álvarez and G. Asencio-Cortés}, url = {https://link.springer.com/chapter/10.1007/978-3-031-15471-3_24}, year = {2022}, date = {2022-09-12}, booktitle = {HAIS 17th International Conference on Hybrid Artificial Intelligence Systems}, journal = {HAIS 17th International Conference on Hybrid Artificial Intelligence Systems, Lecture Notes in Computer Science 2022}, pages = {274-285}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, pattern recognition, time series}, pubstate = {published}, tppubtype = {conference} } |
A. R. Troncoso-García and M. Martínez-Ballesteros and F. Martínez-Álvarez and A. Troncoso Explainable machine learning for sleep apnea prediction (Conference) KES International Conference on Knowledge Based and Intelligent information and Engineering Systems, 2022. (Abstract | Links | BibTeX | Tags: association rules, deep learning, time series, XAI) @conference{TRONCOSO-GARCIA22, title = {Explainable machine learning for sleep apnea prediction}, author = {A. R. Troncoso-García and M. Martínez-Ballesteros and F. Martínez-Álvarez and A. Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S1877050922012406}, doi = {https://doi.org/10.1016/j.procs.2022.09.351}, year = {2022}, date = {2022-09-10}, booktitle = {KES International Conference on Knowledge Based and Intelligent information and Engineering Systems}, pages = {2930-2939}, abstract = {Machine and deep learning has become one of the most useful tools in the last years as a diagnosis-decision-support tool in the health area. However, it is widely known that artificial intelligence models are considered a black box and most experts experience difficulties explaining and interpreting the models and their results. In this context, explainable artificial intelligence is emerging with the aim of providing black-box models with sufficient interpretability so that models can be easily understood and further applied. Obstructive sleep apnea is a common chronic respiratory disease related to sleep. Its diagnosis nowadays is done by processing different data signals, such as electrocardiogram or respiratory rate. The waveform of the respiratory signal is of importance too. Machine learning models could be applied to the signal's analysis. Data from a polysomnography study for automatic sleep apnea detection have been used to evaluate the use of the Local Interpretable Model-Agnostic (LIME) library for explaining the health data models. Results obtained help to understand how several features have been used in the model and their influence in the quality of sleep.}, keywords = {association rules, deep learning, time series, XAI}, pubstate = {published}, tppubtype = {conference} } Machine and deep learning has become one of the most useful tools in the last years as a diagnosis-decision-support tool in the health area. However, it is widely known that artificial intelligence models are considered a black box and most experts experience difficulties explaining and interpreting the models and their results. In this context, explainable artificial intelligence is emerging with the aim of providing black-box models with sufficient interpretability so that models can be easily understood and further applied. Obstructive sleep apnea is a common chronic respiratory disease related to sleep. Its diagnosis nowadays is done by processing different data signals, such as electrocardiogram or respiratory rate. The waveform of the respiratory signal is of importance too. Machine learning models could be applied to the signal's analysis. Data from a polysomnography study for automatic sleep apnea detection have been used to evaluate the use of the Local Interpretable Model-Agnostic (LIME) library for explaining the health data models. Results obtained help to understand how several features have been used in the model and their influence in the quality of sleep. |
D. Hadjout and J. F. Torres and A. Troncoso and A. Sebaa and F. Martínez-Álvarez Electricity consumption forecasting based on ensemble deep learning with application to the Algerian market (Journal Article) Energy, 243 , pp. 123060, 2022. (Abstract | Links | BibTeX | Tags: deep learning, energy, time series) @article{HADJOUT22, title = {Electricity consumption forecasting based on ensemble deep learning with application to the Algerian market}, author = {D. Hadjout and J. F. Torres and A. Troncoso and A. Sebaa and F. Martínez-Álvarez}, url = {https://www.sciencedirect.com/science/article/pii/S0360544221033090}, doi = {https://doi.org/10.1016/j.energy.2021.123060}, year = {2022}, date = {2022-03-15}, journal = {Energy}, volume = {243}, pages = {123060}, abstract = {The economic sector is one of the most important pillars of countries. Economic activities of industry are intimately linked with the ability to meet their needs for electricity. Therefore, electricity forecasting is a very important task. It allows for better planning and management of energy resources. Several methods have been proposed to forecast energy consumption. In this work, to predict monthly electricity consumption for the economic sector, we develop a novel approach based on ensemble learning. Our approach combines three models that proved successful in the field, namely: Long Short Term Memory and Gated Recurrent Unit neural networks, and Temporal Convolutional Networks. The experiments have been conducted with almost 2000 clients and 14 years of monthly electricity consumption from Bejaia, Algeria. The results show that the proposed ensemble models achieve better performance than both the company's requirements and the prediction of the traditional individual models. Finally, statistical tests have been carried out to prove that significance of the ensemble models developed.}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } The economic sector is one of the most important pillars of countries. Economic activities of industry are intimately linked with the ability to meet their needs for electricity. Therefore, electricity forecasting is a very important task. It allows for better planning and management of energy resources. Several methods have been proposed to forecast energy consumption. In this work, to predict monthly electricity consumption for the economic sector, we develop a novel approach based on ensemble learning. Our approach combines three models that proved successful in the field, namely: Long Short Term Memory and Gated Recurrent Unit neural networks, and Temporal Convolutional Networks. The experiments have been conducted with almost 2000 clients and 14 years of monthly electricity consumption from Bejaia, Algeria. The results show that the proposed ensemble models achieve better performance than both the company's requirements and the prediction of the traditional individual models. Finally, statistical tests have been carried out to prove that significance of the ensemble models developed. |
A. Gómez-Losada and G. Asencio-Cortés and N. Duch-Brown Automatic Eligibility of Sellers in an Online Marketplace: A Case Study of Amazon Algorithm (Journal Article) Information, 13 (44), pp. 1–16, 2022. (Abstract | Links | BibTeX | Tags: feature selection, time series) @article{losada2022, title = {Automatic Eligibility of Sellers in an Online Marketplace: A Case Study of Amazon Algorithm}, author = {A. Gómez-Losada and G. Asencio-Cortés and N. Duch-Brown}, url = {https://www.mdpi.com/2078-2489/13/2/44}, doi = {10.3390/info13020044}, year = {2022}, date = {2022-01-01}, journal = {Information}, volume = {13}, number = {44}, pages = {1--16}, abstract = {Purchase processes on Amazon Marketplace begin at the Buy Box, which represents the buy click process through which numerous sellers compete. This study aimed to estimate empirically the relevant seller characteristics that Amazon could consider featuring in the Buy Box. To that end, 22 product categories from Italy’s Amazon web page were studied over a ten-month period, and the sellers were analyzed through their products featured in the Buy Box. Two different experiments were proposed and the results were analyzed using four classification algorithms (a neural network, random forest, support vector machine, and C5.0 decision trees) and a rule-based classification. The first experiment aimed to characterize sellers unspecifically by predicting their change at the Buy Box. The second one aimed to predict which seller would be featured in it. Both experiments revealed that the customer experience and the dynamics of the sellers’ prices were important features of the Buy Box. Additionally, we proposed a set of default features that Amazon could consider when no information about sellers was available. We also proposed the possible existence of a relationship or composition among important features that could be used for sellers to be featured in the Buy Box.}, keywords = {feature selection, time series}, pubstate = {published}, tppubtype = {article} } Purchase processes on Amazon Marketplace begin at the Buy Box, which represents the buy click process through which numerous sellers compete. This study aimed to estimate empirically the relevant seller characteristics that Amazon could consider featuring in the Buy Box. To that end, 22 product categories from Italy’s Amazon web page were studied over a ten-month period, and the sellers were analyzed through their products featured in the Buy Box. Two different experiments were proposed and the results were analyzed using four classification algorithms (a neural network, random forest, support vector machine, and C5.0 decision trees) and a rule-based classification. The first experiment aimed to characterize sellers unspecifically by predicting their change at the Buy Box. The second one aimed to predict which seller would be featured in it. Both experiments revealed that the customer experience and the dynamics of the sellers’ prices were important features of the Buy Box. Additionally, we proposed a set of default features that Amazon could consider when no information about sellers was available. We also proposed the possible existence of a relationship or composition among important features that could be used for sellers to be featured in the Buy Box. |
M.A. Castán-Lascorz and P. Jiménez-Herrera and A. Troncoso and G. Asencio-Cortés A new hybrid method for predicting univariate and multivariate time series based on pattern forecasting (Journal Article) Information Sciences, 586 , pp. 611–627, 2022. (Abstract | Links | BibTeX | Tags: energy, pattern recognition, time series) @article{castan2022, title = {A new hybrid method for predicting univariate and multivariate time series based on pattern forecasting}, author = {M.A. Castán-Lascorz and P. Jiménez-Herrera and A. Troncoso and G. Asencio-Cortés}, url = {https://www.sciencedirect.com/science/article/pii/S0020025521012226?via%3Dihub}, doi = {10.1016/j.ins.2021.12.001}, year = {2022}, date = {2022-01-01}, journal = {Information Sciences}, volume = {586}, pages = {611--627}, abstract = {Time series forecasting has become indispensable for multiple applications and industrial processes. Currently, a large number of algorithms have been developed to forecast time series, all of which are suitable depending on the characteristics and patterns to be inferred in each case. In this work, a new algorithm is proposed to predict both univariate and multivariate time series based on a combination of clustering, classification and forecasting techniques. The main goal of the proposed algorithm is first to group windows of time series values with similar patterns by applying a clustering process. Then, a specific forecasting model for each pattern is built and training is only conducted with the time windows corresponding to that pattern. The new algorithm has been designed using a flexible framework that allows the model to be generated using any combination of approaches within multiple machine learning techniques. To evaluate the model, several experiments are carried out using different configurations of the clustering, classification and forecasting methods that the model consists of. The results are analyzed and compared to classical prediction models, such as autoregressive, integrated, moving average and Holt-Winters models, to very recent forecasting methods, including deep, long short-term memory neural networks, and to well-known methods in the literature, such as k nearest neighbors, classification and regression trees, as well as random forest.}, keywords = {energy, pattern recognition, time series}, pubstate = {published}, tppubtype = {article} } Time series forecasting has become indispensable for multiple applications and industrial processes. Currently, a large number of algorithms have been developed to forecast time series, all of which are suitable depending on the characteristics and patterns to be inferred in each case. In this work, a new algorithm is proposed to predict both univariate and multivariate time series based on a combination of clustering, classification and forecasting techniques. The main goal of the proposed algorithm is first to group windows of time series values with similar patterns by applying a clustering process. Then, a specific forecasting model for each pattern is built and training is only conducted with the time windows corresponding to that pattern. The new algorithm has been designed using a flexible framework that allows the model to be generated using any combination of approaches within multiple machine learning techniques. To evaluate the model, several experiments are carried out using different configurations of the clustering, classification and forecasting methods that the model consists of. The results are analyzed and compared to classical prediction models, such as autoregressive, integrated, moving average and Holt-Winters models, to very recent forecasting methods, including deep, long short-term memory neural networks, and to well-known methods in the literature, such as k nearest neighbors, classification and regression trees, as well as random forest. |
G. Velázquez and F. Morales and M. García-Torres and F. Gómez-Vela and F. Divina and J.L. Vázquez Noguera and F. Daumas-Ladouce and C. Ayala and D. Pinto-Roaand P. Gardel-Sotomayor Distribution level Electric current consumption and meteorological data set of the East region of Paraguay (Journal Article) Data in Brief, 40 , pp. 107699, 2022. (Abstract | Links | BibTeX | Tags: energy, time series) @article{velazquez2022distribution, title = {Distribution level Electric current consumption and meteorological data set of the East region of Paraguay}, author = {G. Velázquez and F. Morales and M. García-Torres and F. Gómez-Vela and F. Divina and J.L. Vázquez Noguera and F. Daumas-Ladouce and C. Ayala and D. Pinto-Roaand P. Gardel-Sotomayor}, url = {https://www.sciencedirect.com/science/article/pii/S2352340921009744}, doi = {10.1016/j.dib.2021.107699}, year = {2022}, date = {2022-01-01}, journal = {Data in Brief}, volume = {40}, pages = {107699}, publisher = {Elsevier pubstate = published}, abstract = {This paper presents a data set with information on meteorological data and electricity consumption in the department of Alto Paraná, Paraguay. The meteorological data were registered every three hours at the Aeropuerto Guarani, Department of Alto Paraná, which belongs to the Dirección Nacional de Aeronáutica Civil of Paraguay. The final data consists of a total of 22.445 records of temperature, relative humidity, wind speed and atmospheric pressure. On the other hand, the electrical energy consumption data set contains a total of 1.848.947 records, all of them coming from the one hundred and fifteen feeders located throughout the Alto Paraná region of Paraguay. Electrical energy consumption data was provided by Administración Nacional de Electricidad (ANDE). The analysis of this data can yield insights regarding the energy consumption in the area.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } This paper presents a data set with information on meteorological data and electricity consumption in the department of Alto Paraná, Paraguay. The meteorological data were registered every three hours at the Aeropuerto Guarani, Department of Alto Paraná, which belongs to the Dirección Nacional de Aeronáutica Civil of Paraguay. The final data consists of a total of 22.445 records of temperature, relative humidity, wind speed and atmospheric pressure. On the other hand, the electrical energy consumption data set contains a total of 1.848.947 records, all of them coming from the one hundred and fifteen feeders located throughout the Alto Paraná region of Paraguay. Electrical energy consumption data was provided by Administración Nacional de Electricidad (ANDE). The analysis of this data can yield insights regarding the energy consumption in the area. |
J. A. Gallardo-Gómez and F. Divina and A. Troncoso and F. Martínez-Álvarez Explainable Artificial Intelligence for the Electric Vehicle Load Demand Forecasting Problem (Conference) SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications, Advances in Intelligent Systems and Computing 2022. (Links | BibTeX | Tags: big data, energy, time series) @conference{gallardo2022explainable, title = {Explainable Artificial Intelligence for the Electric Vehicle Load Demand Forecasting Problem}, author = {J. A. Gallardo-Gómez and F. Divina and A. Troncoso and F. Martínez-Álvarez }, url = {https://link.springer.com/chapter/10.1007/978-3-030-87869-6_65}, year = {2022}, date = {2022-01-01}, booktitle = {SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications}, pages = {413-422}, series = { Advances in Intelligent Systems and Computing}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
F. Morales and M. García-Torres and G. Velázquez and F. Daumas-Ladouce and P. Gardel-Sotomayor and F. Gómez-Vela and F. Divina and J. L. Vázquez Noguera and C. Sauer Ayala and D. Pinto-Roa Analysis of Electric Energy Consumption Profiles Using a Machine Learning Approach: A Paraguayan Case Study (Journal Article) Electronics, 11 (2), pp. 267, 2022. (Abstract | Links | BibTeX | Tags: big data, energy, time series) @article{morales2022analysisb, title = {Analysis of Electric Energy Consumption Profiles Using a Machine Learning Approach: A Paraguayan Case Study}, author = {F. Morales and M. García-Torres and G. Velázquez and F. Daumas-Ladouce and P. Gardel-Sotomayor and F. Gómez-Vela and F. Divina and J. L. Vázquez Noguera and C. Sauer Ayala and D. Pinto-Roa}, url = {https://www.mdpi.com/2079-9292/11/2/267}, doi = {10.3390/electronics11020267}, year = {2022}, date = {2022-01-01}, journal = {Electronics}, volume = {11}, number = {2}, pages = {267}, abstract = {Correctly defining and grouping electrical feeders is of great importance for electrical system operators. In this paper, we compare two different clustering techniques, K-means and hierarchical agglomerative clustering, applied to real data from the east region of Paraguay. The raw data were pre-processed, resulting in four data sets, namely, (i) a weekly feeder demand, (ii) a monthly feeder demand, (iii) a statistical feature set extracted from the original data and (iv) a seasonal and daily consumption feature set obtained considering the characteristics of the Paraguayan load curve. Considering the four data sets, two clustering algorithms, two distance metrics and five linkage criteria a total of 36 models with the Silhouette, Davies–Bouldin and Calinski–Harabasz index scores was assessed. The K-means algorithms with the seasonal feature data sets showed the best performance considering the Silhouette, Calinski–Harabasz and Davies–Bouldin validation index scores with a configuration of six clusters.}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {article} } Correctly defining and grouping electrical feeders is of great importance for electrical system operators. In this paper, we compare two different clustering techniques, K-means and hierarchical agglomerative clustering, applied to real data from the east region of Paraguay. The raw data were pre-processed, resulting in four data sets, namely, (i) a weekly feeder demand, (ii) a monthly feeder demand, (iii) a statistical feature set extracted from the original data and (iv) a seasonal and daily consumption feature set obtained considering the characteristics of the Paraguayan load curve. Considering the four data sets, two clustering algorithms, two distance metrics and five linkage criteria a total of 36 models with the Silhouette, Davies–Bouldin and Calinski–Harabasz index scores was assessed. The K-means algorithms with the seasonal feature data sets showed the best performance considering the Silhouette, Calinski–Harabasz and Davies–Bouldin validation index scores with a configuration of six clusters. |
E. T. Habtermariam and K. Kekeba and A. Troncoso and F. Martínez-Álvarez A Cluster-Based Deep Learning Model for Energy Consumption Forecasting in Ethiopia (Conference) SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications , 531 , Lecture Notes in Networks and Systems 2022. (Links | BibTeX | Tags: deep learning, energy, pattern recognition, time series) @conference{SOCO22_Ejigu, title = {A Cluster-Based Deep Learning Model for Energy Consumption Forecasting in Ethiopia}, author = {E. T. Habtermariam and K. Kekeba and A. Troncoso and F. Martínez-Álvarez}, url = {https://link.springer.com/chapter/10.1007/978-3-031-18050-7_41}, year = {2022}, date = {2022-01-01}, booktitle = {SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications }, journal = {SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications, Lecture Notes in Networks Systems, Vol. 531.}, volume = {531}, pages = {423-432}, series = {Lecture Notes in Networks and Systems}, keywords = {deep learning, energy, pattern recognition, time series}, pubstate = {published}, tppubtype = {conference} } |
L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso Nearest neighbors with incremental learning for real-time forecasting of electricity demand (Conference) IEEE International Conference on Data Mining Workshops, 2022. (Links | BibTeX | Tags: energy, IoT, time series) @conference{MelgarICDM2022, title = {Nearest neighbors with incremental learning for real-time forecasting of electricity demand}, author = {L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso}, url = {https://ieeexplore.ieee.org/document/10031211}, year = {2022}, date = {2022-01-01}, booktitle = {IEEE International Conference on Data Mining Workshops}, keywords = {energy, IoT, time series}, pubstate = {published}, tppubtype = {conference} } |
2021 |
K.-T. T. Bui and J. F. Torres and D. Gutiérrez-Avilés and V. H. Nhu and F. Martínez-Álvarez and D. T. Bui Deformation forecasting of a hydropower dam by hybridizing a Long Short-Term Memory deep learning network with the Coronavirus Optimization Algorithm (Journal Article) Computer-Aided Civil and Infrastructure Engineering, 37 , pp. 1368-1386, 2021. (Abstract | Links | BibTeX | Tags: deep learning, time series) @article{BUI22b, title = {Deformation forecasting of a hydropower dam by hybridizing a Long Short-Term Memory deep learning network with the Coronavirus Optimization Algorithm}, author = {K.-T. T. Bui and J. F. Torres and D. Gutiérrez-Avilés and V. H. Nhu and F. Martínez-Álvarez and D. T. Bui}, url = {https://onlinelibrary.wiley.com/doi/abs/10.1111/mice.12810}, doi = {https://doi.org/10.1111/mice.12810}, year = {2021}, date = {2021-11-24}, journal = {Computer-Aided Civil and Infrastructure Engineering}, volume = {37}, pages = {1368-1386}, abstract = {The safety operation and management of hydropower dam play a critical role in social-economic development and ensure people's safety in many countries; therefore, modeling and forecasting the hydropower dam's deformations with high accuracy is crucial. This research aims to propose and validate a new model based on deep learning long short-term memory (LSTM) and the coronavirus optimization algorithm (CVOA), named CVOA-LSTM, for forecasting the deformations of the hydropower dam. The second-largest hydropower dam of Vietnam, located in the Hoa Binh province, is focused. Herein, we used the LSTM to establish the deformation model, whereas the CVOA was utilized to optimize the three parameters of the LSTM, the number of hidden layers, the learning rate, and the dropout. The efficacy of the proposed CVOA-LSTM model is assessed by comparing its forecasting performance with state-of-the-art benchmarks, sequential minimal optimization for support vector regression, Gaussian process, M5' model tree, multilayer perceptron neural network, reduced error pruning tree, random tree, random forest, and radial basis function neural network. The result shows that the proposed CVOA-LSTM model has high forecasting capability (R2 = 0.874, root mean square error = 0.34, mean absolute error = 0.23) and outperforms the benchmarks. We conclude that CVOA-LSTM is a new tool that can be considered to forecast the hydropower dam's deformations.}, keywords = {deep learning, time series}, pubstate = {published}, tppubtype = {article} } The safety operation and management of hydropower dam play a critical role in social-economic development and ensure people's safety in many countries; therefore, modeling and forecasting the hydropower dam's deformations with high accuracy is crucial. This research aims to propose and validate a new model based on deep learning long short-term memory (LSTM) and the coronavirus optimization algorithm (CVOA), named CVOA-LSTM, for forecasting the deformations of the hydropower dam. The second-largest hydropower dam of Vietnam, located in the Hoa Binh province, is focused. Herein, we used the LSTM to establish the deformation model, whereas the CVOA was utilized to optimize the three parameters of the LSTM, the number of hidden layers, the learning rate, and the dropout. The efficacy of the proposed CVOA-LSTM model is assessed by comparing its forecasting performance with state-of-the-art benchmarks, sequential minimal optimization for support vector regression, Gaussian process, M5' model tree, multilayer perceptron neural network, reduced error pruning tree, random tree, random forest, and radial basis function neural network. The result shows that the proposed CVOA-LSTM model has high forecasting capability (R2 = 0.874, root mean square error = 0.34, mean absolute error = 0.23) and outperforms the benchmarks. We conclude that CVOA-LSTM is a new tool that can be considered to forecast the hydropower dam's deformations. |
J. F. Torres and M. J. Jiménez-Navarro and F. Martínez-Álvarez and A. Troncoso Electricity consumption time series forecasting using Temporal Convolutional Networks (Conference) CAEPIA Conference of the Spanish Association for Artificial Intelligence , Lecture Notes in Artificial Intelligence 2021. (BibTeX | Tags: deep learning, time series) @conference{TORRES21b, title = {Electricity consumption time series forecasting using Temporal Convolutional Networks}, author = {J. F. Torres and M. J. Jiménez-Navarro and F. Martínez-Álvarez and A. Troncoso}, year = {2021}, date = {2021-09-01}, booktitle = {CAEPIA Conference of the Spanish Association for Artificial Intelligence }, series = {Lecture Notes in Artificial Intelligence}, keywords = {deep learning, time series}, pubstate = {published}, tppubtype = {conference} } |
A. Melara and J. F. Torres and A. Troncoso and F. Martínez-Álvarez Electricity Generation Forecasting in Concentrating Solar-Thermal Power Plants with Ensemble Learning (Conference) SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications, 1401 , Advances in Intelligent Systems and Computing 2021. (Links | BibTeX | Tags: deep learning, energy, time series) @conference{MELARA21, title = {Electricity Generation Forecasting in Concentrating Solar-Thermal Power Plants with Ensemble Learning}, author = {A. Melara and J. F. Torres and A. Troncoso and F. Martínez-Álvarez}, doi = {https://doi.org/10.1007/978-3-030-87869-6_63}, year = {2021}, date = {2021-09-01}, booktitle = {SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications}, volume = {1401}, pages = {665-674}, series = {Advances in Intelligent Systems and Computing}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
D. Hadjout and J. F. Torres and A. Sebaa and F. Martínez-Álvarez SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications, 1401 , Advances in Intelligent Systems and Computing 2021. (Links | BibTeX | Tags: deep learning, energy, time series) @conference{HADJOUT21, title = {Medium-Term Electricity Consumption Forecasting in Algeria Based on Clustering, Deep Learning and Bayesian Optimization Methods}, author = {D. Hadjout and J. F. Torres and A. Sebaa and F. Martínez-Álvarez}, doi = {https://doi.org/10.1007/978-3-030-87869-6_70}, year = {2021}, date = {2021-09-01}, booktitle = {SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications}, volume = {1401}, pages = {739-748}, series = {Advances in Intelligent Systems and Computing}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
M. J. Jiménez-Navarro and F. Martínez-Álvarez and A. Troncoso and G. Asencio-Cortés HLNet: A Novel Hierarchical Deep Neural Network for Time Series Forecasting (Conference) SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications, 1401 , Advances in Intelligent Systems and Computing 2021. (Links | BibTeX | Tags: deep learning, time series) @conference{JIMENEZ-NAVARRO21, title = {HLNet: A Novel Hierarchical Deep Neural Network for Time Series Forecasting}, author = {M. J. Jiménez-Navarro and F. Martínez-Álvarez and A. Troncoso and G. Asencio-Cortés}, doi = {https://doi.org/10.1007/978-3-030-87869-6_68}, year = {2021}, date = {2021-09-01}, booktitle = {SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications}, volume = {1401}, pages = {717-727}, series = {Advances in Intelligent Systems and Computing}, keywords = {deep learning, time series}, pubstate = {published}, tppubtype = {conference} } |
M. A. Molina and M. J. Jiménez-Navarro and F. Martínez-Álvarez and G. Asencio-Cortés A Model-Based Deep Transfer Learning Algorithm for Phenology Forecasting Using Satellite Imagery (Conference) HAIS 16th International Conference on Hybrid Artificial Intelligence Systems, 12886 , Lecture Notes in Computer Science 2021. (Links | BibTeX | Tags: deep learning, time series) @conference{MOLINA21, title = {A Model-Based Deep Transfer Learning Algorithm for Phenology Forecasting Using Satellite Imagery}, author = {M. A. Molina and M. J. Jiménez-Navarro and F. Martínez-Álvarez and G. Asencio-Cortés}, url = {https://link.springer.com/chapter/10.1007/978-3-030-86271-8_43}, doi = {https://doi.org/10.1007/978-3-030-86271-8_43}, year = {2021}, date = {2021-09-01}, booktitle = {HAIS 16th International Conference on Hybrid Artificial Intelligence Systems}, volume = {12886}, pages = {511-523}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, time series}, pubstate = {published}, tppubtype = {conference} } |
J. F. Torres and D. Hadjout and A. Sebaa and F. Martínez-Álvarez and A. Troncoso Deep Learning for Time Series Forecasting: A Survey (Journal Article) Big Data, 9 (1), pp. 3-21, 2021. (Abstract | Links | BibTeX | Tags: big data, deep learning, time series) @article{TORRES21, title = {Deep Learning for Time Series Forecasting: A Survey}, author = {J. F. Torres and D. Hadjout and A. Sebaa and F. Martínez-Álvarez and A. Troncoso}, url = {https://www.liebertpub.com/doi/10.1089/big.2020.0159}, doi = {10.1089/big.2020.0159}, year = {2021}, date = {2021-02-05}, journal = {Big Data}, volume = {9}, number = {1}, pages = {3-21}, abstract = {Deep learning, one of the most remarkable techniques of machine learning, has been a major success in many fields, including image processing, speech recognition, and text understanding. It is powerful engines capable of learning arbitrary mapping functions, not require a scaled or stationary time series as input, support multivariate inputs, and support multi-step outputs. All of these features together make deep learning useful tools when dealing with more complex time series prediction problems involving large amounts of data, and multiple variables with complex relationships. This paper provides an overview of the most common Deep Learning types for time series forecasting, Explain the relationships between deep learning models and classical approaches to time series forecasting. A brief background of the particular challenges presents in time-series data and the most common deep learning techniques that are often used for time series forecasting is provided. Previous studies that applied deep learning to time series are reviewed.}, keywords = {big data, deep learning, time series}, pubstate = {published}, tppubtype = {article} } Deep learning, one of the most remarkable techniques of machine learning, has been a major success in many fields, including image processing, speech recognition, and text understanding. It is powerful engines capable of learning arbitrary mapping functions, not require a scaled or stationary time series as input, support multivariate inputs, and support multi-step outputs. All of these features together make deep learning useful tools when dealing with more complex time series prediction problems involving large amounts of data, and multiple variables with complex relationships. This paper provides an overview of the most common Deep Learning types for time series forecasting, Explain the relationships between deep learning models and classical approaches to time series forecasting. A brief background of the particular challenges presents in time-series data and the most common deep learning techniques that are often used for time series forecasting is provided. Previous studies that applied deep learning to time series are reviewed. |
J. Roiz-Pagador and A. M. Chacon-Maldonado and R. Ruiz and G. Asencio-Cortes Earthquake Prediction in California using Feature Selection techniques (Conference) SOCO 16th International Conference on Soft Computing Models in Industrial and Environmental Applications, Advances in Intelligent Systems and Computing 2021. (Links | BibTeX | Tags: feature selection, natural disasters, time series) @conference{roiz2022, title = {Earthquake Prediction in California using Feature Selection techniques}, author = {J. Roiz-Pagador and A. M. Chacon-Maldonado and R. Ruiz and G. Asencio-Cortes}, url = {https://link.springer.com/chapter/10.1007/978-3-030-87869-6_69}, year = {2021}, date = {2021-01-01}, booktitle = {SOCO 16th International Conference on Soft Computing Models in Industrial and Environmental Applications}, series = {Advances in Intelligent Systems and Computing}, keywords = {feature selection, natural disasters, time series}, pubstate = {published}, tppubtype = {conference} } |
L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso Nearest neighbours-based forecasting for electricity demand time series in streaming (Conference) CAEPIA Conference of the Spanish Association for Artificial Intelligence , Lecture Notes in Artificial Intelligence 2021. (Abstract | BibTeX | Tags: IoT, time series) @conference{CAEPIA21_Laura, title = {Nearest neighbours-based forecasting for electricity demand time series in streaming}, author = {L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso }, year = {2021}, date = {2021-01-01}, booktitle = {CAEPIA Conference of the Spanish Association for Artificial Intelligence }, series = {Lecture Notes in Artificial Intelligence}, abstract = {This paper presents a forecasting algorithm for time series in streaming. The methodology has two well-differentiated stages: the algorithm searches for the nearest neighbors to generate an initial prediction model in the batch phase. Then, an online phase is carried out when the time series arrives in streaming. In particular, the nearest neighbor of the streaming data from the training set is computed and the nearest neighbors, previously computed in the batch phase, of this nearest neighbor are used to obtain the predictions. Results using the electricity consumption time series are reported, showing a remarkable performance of the proposed algorithm in terms of forecasting errors when compared to a nearest neighbors-based benchmark algorithm. The running times for the predictions are also remarkable.}, keywords = {IoT, time series}, pubstate = {published}, tppubtype = {conference} } This paper presents a forecasting algorithm for time series in streaming. The methodology has two well-differentiated stages: the algorithm searches for the nearest neighbors to generate an initial prediction model in the batch phase. Then, an online phase is carried out when the time series arrives in streaming. In particular, the nearest neighbor of the streaming data from the training set is computed and the nearest neighbors, previously computed in the batch phase, of this nearest neighbor are used to obtain the predictions. Results using the electricity consumption time series are reported, showing a remarkable performance of the proposed algorithm in terms of forecasting errors when compared to a nearest neighbors-based benchmark algorithm. The running times for the predictions are also remarkable. |
J. A. Gallardo and M. García-Torres and F. Gómez-Vela and F. Morales and F. Divina and D. Becerra-Alonso and G. Velázquez and F. Daumas-Ladouce and J. L. Vázquez Noguera and C. Ayala Sauer Forecasting Electricity Consumption Data from Paraguay Using a Machine Learning Approach (Conference) SOCO 16th International Conference on Soft Computing Models in Industrial and Environmental Applications, 1401 , Advances in Intelligent Systems and Computing 2021. (Links | BibTeX | Tags: big data, energy, time series) @conference{gallardo2022forecasting, title = {Forecasting Electricity Consumption Data from Paraguay Using a Machine Learning Approach}, author = {J. A. Gallardo and M. García-Torres and F. Gómez-Vela and F. Morales and F. Divina and D. Becerra-Alonso and G. Velázquez and F. Daumas-Ladouce and J. L. Vázquez Noguera and C. Ayala Sauer}, url = {https://link.springer.com/chapter/10.1007/978-3-030-87869-6_65}, year = {2021}, date = {2021-01-01}, booktitle = {SOCO 16th International Conference on Soft Computing Models in Industrial and Environmental Applications}, volume = {1401}, pages = {685-694}, series = {Advances in Intelligent Systems and Computing}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
2020 |
P. Jiménez-Herrera and L. Melgar-García and G. Asencio-Cortés and A. Troncoso A New Forecasting Algorithm Based on Neighbors for Streaming Electricity Time Series (Conference) HAIS 15th International Conference on Hybrid Artificial Intelligence Systems, Lecture Notes in Computer Science 2020. (Links | BibTeX | Tags: big data, energy, IoT, time series) @conference{HAIS2020, title = {A New Forecasting Algorithm Based on Neighbors for Streaming Electricity Time Series}, author = {P. Jiménez-Herrera and L. Melgar-García and G. Asencio-Cortés and A. Troncoso}, url = {https://link.springer.com/chapter/10.1007/978-3-030-61705-9_43}, year = {2020}, date = {2020-11-04}, booktitle = {HAIS 15th International Conference on Hybrid Artificial Intelligence Systems}, pages = {522-533}, series = {Lecture Notes in Computer Science}, keywords = {big data, energy, IoT, time series}, pubstate = {published}, tppubtype = {conference} } |
Y. Lin and I. Koprinska and M. Rana and A. Troncoso Solar Power Forecasting Based on Pattern Sequence Similarity and Meta-learning (Conference) ICANN 29th International Conference on Artificial Neural Networks, Lecture Notes in Computer Science 2020. (Links | BibTeX | Tags: energy, time series) @conference{ICANN20, title = {Solar Power Forecasting Based on Pattern Sequence Similarity and Meta-learning}, author = {Y. Lin and I. Koprinska and M. Rana and A. Troncoso}, url = {https://link.springer.com/chapter/10.1007/978-3-030-61609-0_22}, year = {2020}, date = {2020-10-14}, booktitle = {ICANN 29th International Conference on Artificial Neural Networks}, pages = {271-283}, series = {Lecture Notes in Computer Science }, keywords = {energy, time series}, pubstate = {published}, tppubtype = {conference} } |
F. Divina and J. F. Torres and M. García-Torres and F. Martínez-Álvarez and A. Troncoso Hybridizing deep learning and neuroevolution: Application to the Spanish short-term electric energy consumption forecasting (Journal Article) Applied Sciences, 10 (16), pp. 5487, 2020. (Abstract | Links | BibTeX | Tags: big data, deep learning, energy, time series) @article{DIVINA2020, title = {Hybridizing deep learning and neuroevolution: Application to the Spanish short-term electric energy consumption forecasting}, author = {F. Divina and J. F. Torres and M. García-Torres and F. Martínez-Álvarez and A. Troncoso}, url = {https://www.mdpi.com/2076-3417/10/16/5487}, doi = {https://doi.org/10.3390/app10165487}, year = {2020}, date = {2020-07-30}, journal = {Applied Sciences}, volume = {10}, number = {16}, pages = {5487}, abstract = {The electric energy production would be much more efficient if accurate estimations of the future demand were available, since these would allow allocating only the resources needed for the production of the right amount of energy required. With this motivation in mind, we propose a strategy, based on neuroevolution, that can be used to this aim. Our proposal uses a genetic algorithm in order to find a sub-optimal set of hyper-parameters for configuring a deep neural network, which can then be used for obtaining the forecasting. Such a strategy is justified by the observation that the performances achieved by deep neural networks are strongly dependent on the right setting of the hyper-parameters, and genetic algorithms have shown excellent search capabilities in huge search spaces. Moreover, we base our proposal on a distributed computing platform, which allows its use on a large time-series. In order to assess the performances of our approach, we have applied it to a large dataset, related to the electric energy consumption registered in Spain over almost 10 years. Experimental results confirm the validity of our proposal since it outperforms all other forecasting techniques to which it has been compared.}, keywords = {big data, deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } The electric energy production would be much more efficient if accurate estimations of the future demand were available, since these would allow allocating only the resources needed for the production of the right amount of energy required. With this motivation in mind, we propose a strategy, based on neuroevolution, that can be used to this aim. Our proposal uses a genetic algorithm in order to find a sub-optimal set of hyper-parameters for configuring a deep neural network, which can then be used for obtaining the forecasting. Such a strategy is justified by the observation that the performances achieved by deep neural networks are strongly dependent on the right setting of the hyper-parameters, and genetic algorithms have shown excellent search capabilities in huge search spaces. Moreover, we base our proposal on a distributed computing platform, which allows its use on a large time-series. In order to assess the performances of our approach, we have applied it to a large dataset, related to the electric energy consumption registered in Spain over almost 10 years. Experimental results confirm the validity of our proposal since it outperforms all other forecasting techniques to which it has been compared. |
F. Martínez-Álvarez and G. Asencio-Cortés and J. F. Torres and D. Gutiérrez-Avilés and L. Melgar-García and R. Pérez-Chacón and C. Rubio-Escudero and A. Troncoso and J. C. Riquelme Coronavirus Optimization Algorithm: A bioinspired metaheuristic based on the COVID-19 propagation model (Journal Article) Big Data, 8 (4), pp. 308-322, 2020. (Abstract | Links | BibTeX | Tags: big data, deep learning, energy, time series) @article{MARTINEZ-ALVAREZ20, title = {Coronavirus Optimization Algorithm: A bioinspired metaheuristic based on the COVID-19 propagation model}, author = {F. Martínez-Álvarez and G. Asencio-Cortés and J. F. Torres and D. Gutiérrez-Avilés and L. Melgar-García and R. Pérez-Chacón and C. Rubio-Escudero and A. Troncoso and J. C. Riquelme}, url = {https://www.liebertpub.com/doi/full/10.1089/big.2020.0051}, doi = {10.1089/big.2020.0051}, year = {2020}, date = {2020-07-22}, journal = {Big Data}, volume = {8}, number = {4}, pages = {308-322}, abstract = {This work proposes a novel bioinspired metaheuristic, simulating how the coronavirus spreads and infects healthy people. From a primary infected individual (patient zero), the coronavirus rapidly infects new victims, creating large populations of infected people who will either die or spread infection. Relevant terms such as reinfection probability, super-spreading rate, social distancing measures or traveling rate are introduced into the model in order to simulate the coronavirus activity as accurately as possible. The infected population initially grows exponentially over time, but taking into consideration social isolation measures, the mortality rate and number of recoveries, the infected population gradually decreases. The Coronavirus Optimization Algorithm has two major advantages when compared to other similar strategies. Firstly, the input parameters are already set according to the disease statistics, preventing researchers from initializing them with arbitrary values. Secondly, the approach has the ability to end after several iterations, without setting this value either. Furthermore, a parallel multi-virus version is proposed, where several coronavirus strains evolve over time and explore wider search space areas in less iterations. Finally, the metaheuristic has been combined with deep learning models, in order to find optimal hyperparameters during the training phase. As application case, the problem of electricity load time series forecasting has been addressed, showing quite remarkable performance.}, keywords = {big data, deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } This work proposes a novel bioinspired metaheuristic, simulating how the coronavirus spreads and infects healthy people. From a primary infected individual (patient zero), the coronavirus rapidly infects new victims, creating large populations of infected people who will either die or spread infection. Relevant terms such as reinfection probability, super-spreading rate, social distancing measures or traveling rate are introduced into the model in order to simulate the coronavirus activity as accurately as possible. The infected population initially grows exponentially over time, but taking into consideration social isolation measures, the mortality rate and number of recoveries, the infected population gradually decreases. The Coronavirus Optimization Algorithm has two major advantages when compared to other similar strategies. Firstly, the input parameters are already set according to the disease statistics, preventing researchers from initializing them with arbitrary values. Secondly, the approach has the ability to end after several iterations, without setting this value either. Furthermore, a parallel multi-virus version is proposed, where several coronavirus strains evolve over time and explore wider search space areas in less iterations. Finally, the metaheuristic has been combined with deep learning models, in order to find optimal hyperparameters during the training phase. As application case, the problem of electricity load time series forecasting has been addressed, showing quite remarkable performance. |
R. Pérez-Chacón and G. Asencio-Cortés and F. Martínez-Álvarez and A. Troncoso Big data time series forecasting based on pattern sequence similarity and its application to the electricity demand (Journal Article) Information Sciences, 540 , pp. 160-174, 2020. (Abstract | Links | BibTeX | Tags: big data, energy, time series) @article{PEREZ20, title = {Big data time series forecasting based on pattern sequence similarity and its application to the electricity demand}, author = {R. Pérez-Chacón and G. Asencio-Cortés and F. Martínez-Álvarez and A. Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S0020025520306010}, doi = {10.1016/j.ins.2020.06.014}, year = {2020}, date = {2020-06-06}, journal = {Information Sciences}, volume = {540}, pages = {160-174}, abstract = {This work proposes a novel algorithm to forecast big data time series. Based on the well-established Pattern Sequence Forecasting algorithm, this new approach has two major contributions to the literature. First, the improvement of the aforementioned algorithm with respect to the accuracy of predictions, and second, its transformation into the big data context, having reached meaningful results in terms of scalability. The algorithm uses the Apache Spark distributed computation framework and it is a ready-to-use application with few parameters to adjust. Physical and cloud clusters have been used to carry out the experimentation, which consisted in applying the algorithm to real-world data from Uruguay electricity demand.}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {article} } This work proposes a novel algorithm to forecast big data time series. Based on the well-established Pattern Sequence Forecasting algorithm, this new approach has two major contributions to the literature. First, the improvement of the aforementioned algorithm with respect to the accuracy of predictions, and second, its transformation into the big data context, having reached meaningful results in terms of scalability. The algorithm uses the Apache Spark distributed computation framework and it is a ready-to-use application with few parameters to adjust. Physical and cloud clusters have been used to carry out the experimentation, which consisted in applying the algorithm to real-world data from Uruguay electricity demand. |