Publications
2024 |
D. Gutiérrez-Avilés and J. F. Torres and F. Martínez-Álvarez and J. Cugliari An evolutionary triclustering approach to discover electricity consumption patterns in France (Conference) SAC 39th Annual ACM Symposium on Applied Computing, 2024. (Abstract | BibTeX | Tags: clustering, energy, time series) @conference{GUTIERREZ24_SAC, title = {An evolutionary triclustering approach to discover electricity consumption patterns in France}, author = {D. Gutiérrez-Avilés and J. F. Torres and F. Martínez-Álvarez and J. Cugliari}, year = {2024}, date = {2024-02-04}, booktitle = {SAC 39th Annual ACM Symposium on Applied Computing}, pages = {386-394}, abstract = {Electricity consumption patterns are critical in shaping energy policies and optimizing resource allocation. In pursuing a more sustainable and efficient energy future, uncovering hidden consumption patterns is paramount. This paper introduces an innovative approach, leveraging evolutionary triclustering techniques, to unveil previously undisclosed electricity consumption patterns in France. By harnessing the power of triclustering algorithms, this research provides a comprehensive analysis of electricity usage across various dimensions, shedding light on intricate relationships among variables. Using this novel method, the study reveals concealed patterns and offers insights that can inform decision-makers and stakeholders in the energy sector. The findings contribute to a better understanding of electricity consumption dynamics, aiding in developing more targeted and effective energy management strategies. This research represents a significant step forward in the quest for sustainable energy solutions and underscores the potential of evolutionary triclustering as a valuable tool in uncovering complex consumption patterns.}, keywords = {clustering, energy, time series}, pubstate = {published}, tppubtype = {conference} } Electricity consumption patterns are critical in shaping energy policies and optimizing resource allocation. In pursuing a more sustainable and efficient energy future, uncovering hidden consumption patterns is paramount. This paper introduces an innovative approach, leveraging evolutionary triclustering techniques, to unveil previously undisclosed electricity consumption patterns in France. By harnessing the power of triclustering algorithms, this research provides a comprehensive analysis of electricity usage across various dimensions, shedding light on intricate relationships among variables. Using this novel method, the study reveals concealed patterns and offers insights that can inform decision-makers and stakeholders in the energy sector. The findings contribute to a better understanding of electricity consumption dynamics, aiding in developing more targeted and effective energy management strategies. This research represents a significant step forward in the quest for sustainable energy solutions and underscores the potential of evolutionary triclustering as a valuable tool in uncovering complex consumption patterns. |
R. Pérez-Chacón and G. Asencio-Cortés and A. Troncoso and F. Martínez-Álvarez Pattern sequence-based algorithm for multivariate big data time series forecasting: Application to electricity consumption (Journal Article) Future Generation Computer Systems, 154 , pp. 397-412, 2024. (Abstract | Links | BibTeX | Tags: big data, energy, forecasting, time series) @article{PEREZ24, title = {Pattern sequence-based algorithm for multivariate big data time series forecasting: Application to electricity consumption}, author = {R. Pérez-Chacón and G. Asencio-Cortés and A. Troncoso and F. Martínez-Álvarez}, url = {https://www.sciencedirect.com/science/article/pii/S0167739X23004752}, doi = {https://doi.org/10.1016/j.future.2023.12.021}, year = {2024}, date = {2024-01-29}, journal = {Future Generation Computer Systems}, volume = {154}, pages = {397-412}, abstract = {Several interrelated variables typically characterize real-world processes, and a time series cannot be predicted without considering the influence that other time series might have on the target time series. This work proposes a novel algorithm to forecast multivariate big data time series. This new general-purpose approach consists first of a previous pattern recognition performed jointly using all time series that form the multivariate time series and then predicts the target time series by searching for similarities between pattern sequences. The proposed algorithm is designed to tackle multivariate time series forecasting problems within the context of big data. In particular, the algorithm has been developed with a distributed nature to enhance its efficiency in analyzing and processing large volumes of data. Moreover, the algorithm is straightforward to use, with only two parameters needing adjustment. Another advantage of the MV-bigPSF algorithm is its ability to perform multi-step forecasting, which is particularly useful in many practical applications. To evaluate the algorithm’s performance, real-world data from Uruguay’s power consumption has been utilized. Specifically, MV-bigPSF has been compared with both univariate and multivariate methods. Regarding the univariate ones, MV-bigPSF improved 12.8% in MAPE compared to the second-best method. Regarding the multivariate comparison, MV-bigPSF improved 44.8% in MAPE with respect to the second most accurate method. Regarding efficiency, the execution time of MV-bigPSF was 1.83 times faster than the second-fastest multivariate method, both in a single-core environment. Therefore, the proposed algorithm can be a valuable tool for practitioners and researchers working in multivariate time series forecasting, particularly in big data applications.}, keywords = {big data, energy, forecasting, time series}, pubstate = {published}, tppubtype = {article} } Several interrelated variables typically characterize real-world processes, and a time series cannot be predicted without considering the influence that other time series might have on the target time series. This work proposes a novel algorithm to forecast multivariate big data time series. This new general-purpose approach consists first of a previous pattern recognition performed jointly using all time series that form the multivariate time series and then predicts the target time series by searching for similarities between pattern sequences. The proposed algorithm is designed to tackle multivariate time series forecasting problems within the context of big data. In particular, the algorithm has been developed with a distributed nature to enhance its efficiency in analyzing and processing large volumes of data. Moreover, the algorithm is straightforward to use, with only two parameters needing adjustment. Another advantage of the MV-bigPSF algorithm is its ability to perform multi-step forecasting, which is particularly useful in many practical applications. To evaluate the algorithm’s performance, real-world data from Uruguay’s power consumption has been utilized. Specifically, MV-bigPSF has been compared with both univariate and multivariate methods. Regarding the univariate ones, MV-bigPSF improved 12.8% in MAPE compared to the second-best method. Regarding the multivariate comparison, MV-bigPSF improved 44.8% in MAPE with respect to the second most accurate method. Regarding efficiency, the execution time of MV-bigPSF was 1.83 times faster than the second-fastest multivariate method, both in a single-core environment. Therefore, the proposed algorithm can be a valuable tool for practitioners and researchers working in multivariate time series forecasting, particularly in big data applications. |
2023 |
D. Hadjout and A. Sebaa and J. F. Torres and F. Mártinez-Álvarez Electricity consumption forecasting with outliers handling based on clustering and deep learning with application to the Algerian market (Journal Article) Expert Systems with Applications, 227 , pp. 120123, 2023. (Abstract | Links | BibTeX | Tags: clustering, deep learning, energy, time series) @article{HADJOUT23, title = {Electricity consumption forecasting with outliers handling based on clustering and deep learning with application to the Algerian market}, author = {D. Hadjout and A. Sebaa and J. F. Torres and F. Mártinez-Álvarez}, url = {https://www.sciencedirect.com/science/article/abs/pii/S0957417423006255}, doi = {https://doi.org/10.1016/j.eswa.2023.120123}, year = {2023}, date = {2023-10-01}, journal = {Expert Systems with Applications}, volume = {227}, pages = {120123}, abstract = {The reduction of electricity loss and the effective management of electricity demand are vital operations for production and distribution electricity enterprises. To achieve these goals, accurate forecasts of aggregate and individual electricity consumers are necessary. A novel multistep forecasting method is developed to forecast medium-term electricity consumption of the Algerian economic sector. The proposed method goes through the following three steps: cleaning steps, clustering steps and forecasting step of each cluster. The aim of the first step is to detect and then replace outliers. To complete the first phase, Robust Exponential and Holt-Winters Smoothing algorithms are adapted. Then, to carry out accurate forecasting at a lowest level, K-Shape and K-Means clustering methods are utilized to extract similarities and identify customer consumption patterns as a second step. The third step entails developing a deep learning model based on Gated Recurrent Units to forecast the electricity consumption in each cluster. To validate the proposed method, we compared our results to the most known methods in literature like Autoregressive Integrated Moving Average, Seasonal Grey Model, LSTM networks, Temporal Convolutional Networks and two ensemble models. The results of several experiments conducted with 2000 electricity consumers during 14 years from an Algeria province (Bejaia) demonstrate that the proposed method provides remarkable prediction performances. Thus, prediction performances of the K-Shape-based clustering method reach much higher prediction accuracy. According to the MAPE metric, the results of the best predictions are equal to 2.04%. It is also notable that 87% of the clients have a considerably low prediction error.}, keywords = {clustering, deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } The reduction of electricity loss and the effective management of electricity demand are vital operations for production and distribution electricity enterprises. To achieve these goals, accurate forecasts of aggregate and individual electricity consumers are necessary. A novel multistep forecasting method is developed to forecast medium-term electricity consumption of the Algerian economic sector. The proposed method goes through the following three steps: cleaning steps, clustering steps and forecasting step of each cluster. The aim of the first step is to detect and then replace outliers. To complete the first phase, Robust Exponential and Holt-Winters Smoothing algorithms are adapted. Then, to carry out accurate forecasting at a lowest level, K-Shape and K-Means clustering methods are utilized to extract similarities and identify customer consumption patterns as a second step. The third step entails developing a deep learning model based on Gated Recurrent Units to forecast the electricity consumption in each cluster. To validate the proposed method, we compared our results to the most known methods in literature like Autoregressive Integrated Moving Average, Seasonal Grey Model, LSTM networks, Temporal Convolutional Networks and two ensemble models. The results of several experiments conducted with 2000 electricity consumers during 14 years from an Algeria province (Bejaia) demonstrate that the proposed method provides remarkable prediction performances. Thus, prediction performances of the K-Shape-based clustering method reach much higher prediction accuracy. According to the MAPE metric, the results of the best predictions are equal to 2.04%. It is also notable that 87% of the clients have a considerably low prediction error. |
D. Azzouguer and A. Sebaa and D. Hadjout and F. Martínez-Álvarez Fraud Detection of Electricity Consumption using Robust Exponential and Holt-Winters Smoothing method (Conference) IEEE International Conference on Advanced Systems and Emergent Technologies, 2023. (Abstract | Links | BibTeX | Tags: energy, time series) @conference{AZZOUGUER23, title = {Fraud Detection of Electricity Consumption using Robust Exponential and Holt-Winters Smoothing method}, author = {D. Azzouguer and A. Sebaa and D. Hadjout and F. Martínez-Álvarez}, url = {https://ieeexplore.ieee.org/document/10150645}, doi = {10.1109/IC_ASET58101.2023.10150645}, year = {2023}, date = {2023-02-20}, booktitle = {IEEE International Conference on Advanced Systems and Emergent Technologies}, abstract = {Non-technical losses (NTL), especially fraud detection is very important for electricity distribution enterprises. Fraud detection allows for maximizing the effective economic return for such enterprises. This paper provides an electricity fraud detection approach based on robust exponential and Holt-Winters Smoothing methods. The proposed approach is a procedure that aims to discover the fraudulent behavior of electricity consumers and goes through three crucial steps: (1) the prediction of monthly consumption, (2) the detection of abnormal consumption of electrical meters, and (3) the detection of fraud cases of economic customers. The proposed model was trained and evaluated. Its experimental validation is achieved by using a large dataset of real users from the Algerian economic sector with almost 2000 clients and 14 years of monthly electricity consumption. The proposed solution revealed good performance compared to the literature and the comparison with the models implemented in this article: SARIMA for prediction and two sigma for anomaly detection. The results show highly efficient and realistic countermeasures to fraud detection, which leads us to say that this method is robust and can enhance company profit.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {conference} } Non-technical losses (NTL), especially fraud detection is very important for electricity distribution enterprises. Fraud detection allows for maximizing the effective economic return for such enterprises. This paper provides an electricity fraud detection approach based on robust exponential and Holt-Winters Smoothing methods. The proposed approach is a procedure that aims to discover the fraudulent behavior of electricity consumers and goes through three crucial steps: (1) the prediction of monthly consumption, (2) the detection of abnormal consumption of electrical meters, and (3) the detection of fraud cases of economic customers. The proposed model was trained and evaluated. Its experimental validation is achieved by using a large dataset of real users from the Algerian economic sector with almost 2000 clients and 14 years of monthly electricity consumption. The proposed solution revealed good performance compared to the literature and the comparison with the models implemented in this article: SARIMA for prediction and two sigma for anomaly detection. The results show highly efficient and realistic countermeasures to fraud detection, which leads us to say that this method is robust and can enhance company profit. |
P. Jiménez-Herrera and L. Melgar-García and G. Asencio-Cortés and A. Troncoso Streaming big time series forecasting based on nearest similar patterns with application to energy consumption (Journal Article) Logic Journal of the IGPL, 31 (2), pp. 255-270, 2023. (Abstract | Links | BibTeX | Tags: energy, IoT, time series) @article{jimenez2023, title = {Streaming big time series forecasting based on nearest similar patterns with application to energy consumption}, author = {P. Jiménez-Herrera and L. Melgar-García and G. Asencio-Cortés and A. Troncoso}, url = {https://academic.oup.com/jigpal/advance-article-abstract/doi/10.1093/jigpal/jzac017/6534493?redirectedFrom=fulltext}, doi = {https://doi.org/10.1093/jigpal/jzac017}, year = {2023}, date = {2023-01-01}, journal = {Logic Journal of the IGPL}, volume = {31}, number = {2}, pages = {255-270}, abstract = {This work presents a novel approach to forecast streaming big time series based on nearest similar patterns. This approach combines a clustering algorithm with a classifier and the nearest neighbors algorithm. It presents two separate stages: offline and online. The offline phase is for training and finding the best models for clustering, classification and the nearest neighbors algorithm. The online phase is to predict big time series in real time. In the offline phase, data are divided into clusters and a forecasting model based on the nearest neighbors is trained for each cluster. In addition, a classifier is trained using the cluster assignments previously generated by the clustering algorithm. In the online phase, the classifier predicts the cluster label of an instance, and the proper nearest neighbors model according to the predicted cluster label is applied to obtain the final prediction using the similar patterns. The algorithm is able to be updated incrementally for online learning from data streams. Results are reported using electricity consumption with a granularity of 10 minutes for 4-hour-ahead forecasting and compared with well-known online benchmark learners, showing a remarkable improvement in prediction accuracy.}, keywords = {energy, IoT, time series}, pubstate = {published}, tppubtype = {article} } This work presents a novel approach to forecast streaming big time series based on nearest similar patterns. This approach combines a clustering algorithm with a classifier and the nearest neighbors algorithm. It presents two separate stages: offline and online. The offline phase is for training and finding the best models for clustering, classification and the nearest neighbors algorithm. The online phase is to predict big time series in real time. In the offline phase, data are divided into clusters and a forecasting model based on the nearest neighbors is trained for each cluster. In addition, a classifier is trained using the cluster assignments previously generated by the clustering algorithm. In the online phase, the classifier predicts the cluster label of an instance, and the proper nearest neighbors model according to the predicted cluster label is applied to obtain the final prediction using the similar patterns. The algorithm is able to be updated incrementally for online learning from data streams. Results are reported using electricity consumption with a granularity of 10 minutes for 4-hour-ahead forecasting and compared with well-known online benchmark learners, showing a remarkable improvement in prediction accuracy. |
L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A.Troncoso Identifying novelties and anomalies for incremental learning in streaming time series forecasting (Journal Article) Engineering Applications of Artificial Intelligence, 123 , pp. 106326, 2023. (Links | BibTeX | Tags: energy, IoT, time series) @article{Melgar2023b, title = {Identifying novelties and anomalies for incremental learning in streaming time series forecasting}, author = {L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A.Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S0952197623005109}, doi = {https://doi.org/10.1016/j.engappai.2023.106326}, year = {2023}, date = {2023-01-01}, journal = {Engineering Applications of Artificial Intelligence}, volume = {123}, pages = {106326}, keywords = {energy, IoT, time series}, pubstate = {published}, tppubtype = {article} } |
L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso A novel distributed forecasting method based on information fusion and incremental learning for streaming time series (Journal Article) Information Fusion, 95 , pp. 163-173, 2023. (Links | BibTeX | Tags: energy, IoT, time series) @article{Melgar2023a, title = {A novel distributed forecasting method based on information fusion and incremental learning for streaming time series}, author = {L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S1566253523000635}, doi = {https://doi.org/10.1016/j.inffus.2023.02.023}, year = {2023}, date = {2023-01-01}, journal = {Information Fusion}, volume = {95}, pages = {163-173}, keywords = {energy, IoT, time series}, pubstate = {published}, tppubtype = {article} } |
E. Tefera and A. Troncoso and M. Martínez Ballesteros and F. Martínez-Álvarez A New Hybrid CNN-LSTM for Wind Power Forecasting in Ethiopia (Conference) HAIS 18th International Conference on Hybrid Artificial Intelligence Systems, Lecture Notes in Computer Science 2023. (BibTeX | Tags: deep learning, energy, time series) @conference{HAIS23_Ejigu, title = {A New Hybrid CNN-LSTM for Wind Power Forecasting in Ethiopia}, author = {E. Tefera and A. Troncoso and M. Martínez Ballesteros and F. Martínez-Álvarez}, year = {2023}, date = {2023-01-01}, booktitle = {HAIS 18th International Conference on Hybrid Artificial Intelligence Systems}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
2022 |
D. Hadjout and J. F. Torres and A. Troncoso and A. Sebaa and F. Martínez-Álvarez Electricity consumption forecasting based on ensemble deep learning with application to the Algerian market (Journal Article) Energy, 243 , pp. 123060, 2022. (Abstract | Links | BibTeX | Tags: deep learning, energy, time series) @article{HADJOUT22, title = {Electricity consumption forecasting based on ensemble deep learning with application to the Algerian market}, author = {D. Hadjout and J. F. Torres and A. Troncoso and A. Sebaa and F. Martínez-Álvarez}, url = {https://www.sciencedirect.com/science/article/pii/S0360544221033090}, doi = {https://doi.org/10.1016/j.energy.2021.123060}, year = {2022}, date = {2022-03-15}, journal = {Energy}, volume = {243}, pages = {123060}, abstract = {The economic sector is one of the most important pillars of countries. Economic activities of industry are intimately linked with the ability to meet their needs for electricity. Therefore, electricity forecasting is a very important task. It allows for better planning and management of energy resources. Several methods have been proposed to forecast energy consumption. In this work, to predict monthly electricity consumption for the economic sector, we develop a novel approach based on ensemble learning. Our approach combines three models that proved successful in the field, namely: Long Short Term Memory and Gated Recurrent Unit neural networks, and Temporal Convolutional Networks. The experiments have been conducted with almost 2000 clients and 14 years of monthly electricity consumption from Bejaia, Algeria. The results show that the proposed ensemble models achieve better performance than both the company's requirements and the prediction of the traditional individual models. Finally, statistical tests have been carried out to prove that significance of the ensemble models developed.}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } The economic sector is one of the most important pillars of countries. Economic activities of industry are intimately linked with the ability to meet their needs for electricity. Therefore, electricity forecasting is a very important task. It allows for better planning and management of energy resources. Several methods have been proposed to forecast energy consumption. In this work, to predict monthly electricity consumption for the economic sector, we develop a novel approach based on ensemble learning. Our approach combines three models that proved successful in the field, namely: Long Short Term Memory and Gated Recurrent Unit neural networks, and Temporal Convolutional Networks. The experiments have been conducted with almost 2000 clients and 14 years of monthly electricity consumption from Bejaia, Algeria. The results show that the proposed ensemble models achieve better performance than both the company's requirements and the prediction of the traditional individual models. Finally, statistical tests have been carried out to prove that significance of the ensemble models developed. |
J. F. Torres and F. Martínez-Álvarez and A. Troncoso A deep LSTM network for the Spanish electricity consumption forecasting (Journal Article) Neural Computing and Applications, 34 , pp. 10533-10545, 2022. (Abstract | Links | BibTeX | Tags: deep learning, energy) @article{TORRES22b, title = {A deep LSTM network for the Spanish electricity consumption forecasting}, author = {J. F. Torres and F. Martínez-Álvarez and A. Troncoso}, url = {https://link.springer.com/article/10.1007/s00521-021-06773-2}, doi = {https://doi.org/10.1007/s00521-021-06773-2}, year = {2022}, date = {2022-02-05}, journal = {Neural Computing and Applications}, volume = {34}, pages = {10533-10545}, abstract = {Nowadays, electricity is a basic commodity necessary for the well-being of any modern society. Due to the growth in electricity consumption in recent years, mainly in large cities, electricity forecasting is key to the management of an efficient, sustainable and safe smart grid for the consumer. In this work, a deep neural network is proposed to address the electricity consumption forecasting in the short-term, namely, a long short-term memory (LSTM) network due to its ability to deal with sequential data such as time-series data. First, the optimal values for certain hyper-parameters have been obtained by a random search and a metaheuristic, called coronavirus optimization algorithm (CVOA), based on the propagation of the SARS-Cov-2 virus. Then, the optimal LSTM has been applied to predict the electricity demand with 4-h forecast horizon. Results using Spanish electricity data during nine years and half measured with 10-min frequency are presented and discussed. Finally, the performance of the proposed LSTM using random search and the LSTM using CVOA is compared, on the one hand, with that of recently published deep neural networks (such as a deep feed-forward neural network optimized with a grid search) and temporal fusion transformers optimized with a sampling algorithm, and, on the other hand, with traditional machine learning techniques, such as a linear regression, decision trees and tree-based ensemble techniques (gradient-boosted trees and random forest), achieving the smallest prediction error below 1.5%.}, keywords = {deep learning, energy}, pubstate = {published}, tppubtype = {article} } Nowadays, electricity is a basic commodity necessary for the well-being of any modern society. Due to the growth in electricity consumption in recent years, mainly in large cities, electricity forecasting is key to the management of an efficient, sustainable and safe smart grid for the consumer. In this work, a deep neural network is proposed to address the electricity consumption forecasting in the short-term, namely, a long short-term memory (LSTM) network due to its ability to deal with sequential data such as time-series data. First, the optimal values for certain hyper-parameters have been obtained by a random search and a metaheuristic, called coronavirus optimization algorithm (CVOA), based on the propagation of the SARS-Cov-2 virus. Then, the optimal LSTM has been applied to predict the electricity demand with 4-h forecast horizon. Results using Spanish electricity data during nine years and half measured with 10-min frequency are presented and discussed. Finally, the performance of the proposed LSTM using random search and the LSTM using CVOA is compared, on the one hand, with that of recently published deep neural networks (such as a deep feed-forward neural network optimized with a grid search) and temporal fusion transformers optimized with a sampling algorithm, and, on the other hand, with traditional machine learning techniques, such as a linear regression, decision trees and tree-based ensemble techniques (gradient-boosted trees and random forest), achieving the smallest prediction error below 1.5%. |
M.A. Castán-Lascorz and P. Jiménez-Herrera and A. Troncoso and G. Asencio-Cortés A new hybrid method for predicting univariate and multivariate time series based on pattern forecasting (Journal Article) Information Sciences, 586 , pp. 611–627, 2022. (Abstract | Links | BibTeX | Tags: energy, pattern recognition, time series) @article{castan2022, title = {A new hybrid method for predicting univariate and multivariate time series based on pattern forecasting}, author = {M.A. Castán-Lascorz and P. Jiménez-Herrera and A. Troncoso and G. Asencio-Cortés}, url = {https://www.sciencedirect.com/science/article/pii/S0020025521012226?via%3Dihub}, doi = {10.1016/j.ins.2021.12.001}, year = {2022}, date = {2022-01-01}, journal = {Information Sciences}, volume = {586}, pages = {611--627}, abstract = {Time series forecasting has become indispensable for multiple applications and industrial processes. Currently, a large number of algorithms have been developed to forecast time series, all of which are suitable depending on the characteristics and patterns to be inferred in each case. In this work, a new algorithm is proposed to predict both univariate and multivariate time series based on a combination of clustering, classification and forecasting techniques. The main goal of the proposed algorithm is first to group windows of time series values with similar patterns by applying a clustering process. Then, a specific forecasting model for each pattern is built and training is only conducted with the time windows corresponding to that pattern. The new algorithm has been designed using a flexible framework that allows the model to be generated using any combination of approaches within multiple machine learning techniques. To evaluate the model, several experiments are carried out using different configurations of the clustering, classification and forecasting methods that the model consists of. The results are analyzed and compared to classical prediction models, such as autoregressive, integrated, moving average and Holt-Winters models, to very recent forecasting methods, including deep, long short-term memory neural networks, and to well-known methods in the literature, such as k nearest neighbors, classification and regression trees, as well as random forest.}, keywords = {energy, pattern recognition, time series}, pubstate = {published}, tppubtype = {article} } Time series forecasting has become indispensable for multiple applications and industrial processes. Currently, a large number of algorithms have been developed to forecast time series, all of which are suitable depending on the characteristics and patterns to be inferred in each case. In this work, a new algorithm is proposed to predict both univariate and multivariate time series based on a combination of clustering, classification and forecasting techniques. The main goal of the proposed algorithm is first to group windows of time series values with similar patterns by applying a clustering process. Then, a specific forecasting model for each pattern is built and training is only conducted with the time windows corresponding to that pattern. The new algorithm has been designed using a flexible framework that allows the model to be generated using any combination of approaches within multiple machine learning techniques. To evaluate the model, several experiments are carried out using different configurations of the clustering, classification and forecasting methods that the model consists of. The results are analyzed and compared to classical prediction models, such as autoregressive, integrated, moving average and Holt-Winters models, to very recent forecasting methods, including deep, long short-term memory neural networks, and to well-known methods in the literature, such as k nearest neighbors, classification and regression trees, as well as random forest. |
G. Velázquez and F. Morales and M. García-Torres and F. Gómez-Vela and F. Divina and J.L. Vázquez Noguera and F. Daumas-Ladouce and C. Ayala and D. Pinto-Roaand P. Gardel-Sotomayor Distribution level Electric current consumption and meteorological data set of the East region of Paraguay (Journal Article) Data in Brief, 40 , pp. 107699, 2022. (Abstract | Links | BibTeX | Tags: energy, time series) @article{velazquez2022distribution, title = {Distribution level Electric current consumption and meteorological data set of the East region of Paraguay}, author = {G. Velázquez and F. Morales and M. García-Torres and F. Gómez-Vela and F. Divina and J.L. Vázquez Noguera and F. Daumas-Ladouce and C. Ayala and D. Pinto-Roaand P. Gardel-Sotomayor}, url = {https://www.sciencedirect.com/science/article/pii/S2352340921009744}, doi = {10.1016/j.dib.2021.107699}, year = {2022}, date = {2022-01-01}, journal = {Data in Brief}, volume = {40}, pages = {107699}, publisher = {Elsevier pubstate = published}, abstract = {This paper presents a data set with information on meteorological data and electricity consumption in the department of Alto Paraná, Paraguay. The meteorological data were registered every three hours at the Aeropuerto Guarani, Department of Alto Paraná, which belongs to the Dirección Nacional de Aeronáutica Civil of Paraguay. The final data consists of a total of 22.445 records of temperature, relative humidity, wind speed and atmospheric pressure. On the other hand, the electrical energy consumption data set contains a total of 1.848.947 records, all of them coming from the one hundred and fifteen feeders located throughout the Alto Paraná region of Paraguay. Electrical energy consumption data was provided by Administración Nacional de Electricidad (ANDE). The analysis of this data can yield insights regarding the energy consumption in the area.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } This paper presents a data set with information on meteorological data and electricity consumption in the department of Alto Paraná, Paraguay. The meteorological data were registered every three hours at the Aeropuerto Guarani, Department of Alto Paraná, which belongs to the Dirección Nacional de Aeronáutica Civil of Paraguay. The final data consists of a total of 22.445 records of temperature, relative humidity, wind speed and atmospheric pressure. On the other hand, the electrical energy consumption data set contains a total of 1.848.947 records, all of them coming from the one hundred and fifteen feeders located throughout the Alto Paraná region of Paraguay. Electrical energy consumption data was provided by Administración Nacional de Electricidad (ANDE). The analysis of this data can yield insights regarding the energy consumption in the area. |
J. A. Gallardo-Gómez and F. Divina and A. Troncoso and F. Martínez-Álvarez Explainable Artificial Intelligence for the Electric Vehicle Load Demand Forecasting Problem (Conference) SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications, Advances in Intelligent Systems and Computing 2022. (Links | BibTeX | Tags: big data, energy, time series) @conference{gallardo2022explainable, title = {Explainable Artificial Intelligence for the Electric Vehicle Load Demand Forecasting Problem}, author = {J. A. Gallardo-Gómez and F. Divina and A. Troncoso and F. Martínez-Álvarez }, url = {https://link.springer.com/chapter/10.1007/978-3-030-87869-6_65}, year = {2022}, date = {2022-01-01}, booktitle = {SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications}, pages = {413-422}, series = { Advances in Intelligent Systems and Computing}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
F. Morales and M. García-Torres and G. Velázquez and F. Daumas-Ladouce and P. Gardel-Sotomayor and F. Gómez-Vela and F. Divina and J. L. Vázquez Noguera and C. Sauer Ayala and D. Pinto-Roa Analysis of Electric Energy Consumption Profiles Using a Machine Learning Approach: A Paraguayan Case Study (Journal Article) Electronics, 11 (2), pp. 267, 2022. (Abstract | Links | BibTeX | Tags: big data, energy, time series) @article{morales2022analysisb, title = {Analysis of Electric Energy Consumption Profiles Using a Machine Learning Approach: A Paraguayan Case Study}, author = {F. Morales and M. García-Torres and G. Velázquez and F. Daumas-Ladouce and P. Gardel-Sotomayor and F. Gómez-Vela and F. Divina and J. L. Vázquez Noguera and C. Sauer Ayala and D. Pinto-Roa}, url = {https://www.mdpi.com/2079-9292/11/2/267}, doi = {10.3390/electronics11020267}, year = {2022}, date = {2022-01-01}, journal = {Electronics}, volume = {11}, number = {2}, pages = {267}, abstract = {Correctly defining and grouping electrical feeders is of great importance for electrical system operators. In this paper, we compare two different clustering techniques, K-means and hierarchical agglomerative clustering, applied to real data from the east region of Paraguay. The raw data were pre-processed, resulting in four data sets, namely, (i) a weekly feeder demand, (ii) a monthly feeder demand, (iii) a statistical feature set extracted from the original data and (iv) a seasonal and daily consumption feature set obtained considering the characteristics of the Paraguayan load curve. Considering the four data sets, two clustering algorithms, two distance metrics and five linkage criteria a total of 36 models with the Silhouette, Davies–Bouldin and Calinski–Harabasz index scores was assessed. The K-means algorithms with the seasonal feature data sets showed the best performance considering the Silhouette, Calinski–Harabasz and Davies–Bouldin validation index scores with a configuration of six clusters.}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {article} } Correctly defining and grouping electrical feeders is of great importance for electrical system operators. In this paper, we compare two different clustering techniques, K-means and hierarchical agglomerative clustering, applied to real data from the east region of Paraguay. The raw data were pre-processed, resulting in four data sets, namely, (i) a weekly feeder demand, (ii) a monthly feeder demand, (iii) a statistical feature set extracted from the original data and (iv) a seasonal and daily consumption feature set obtained considering the characteristics of the Paraguayan load curve. Considering the four data sets, two clustering algorithms, two distance metrics and five linkage criteria a total of 36 models with the Silhouette, Davies–Bouldin and Calinski–Harabasz index scores was assessed. The K-means algorithms with the seasonal feature data sets showed the best performance considering the Silhouette, Calinski–Harabasz and Davies–Bouldin validation index scores with a configuration of six clusters. |
E. T. Habtermariam and K. Kekeba and A. Troncoso and F. Martínez-Álvarez A Cluster-Based Deep Learning Model for Energy Consumption Forecasting in Ethiopia (Conference) SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications , 531 , Lecture Notes in Networks and Systems 2022. (Links | BibTeX | Tags: deep learning, energy, pattern recognition, time series) @conference{SOCO22_Ejigu, title = {A Cluster-Based Deep Learning Model for Energy Consumption Forecasting in Ethiopia}, author = {E. T. Habtermariam and K. Kekeba and A. Troncoso and F. Martínez-Álvarez}, url = {https://link.springer.com/chapter/10.1007/978-3-031-18050-7_41}, year = {2022}, date = {2022-01-01}, booktitle = {SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications }, journal = {SOCO 17th International Conference on Soft Computing Models in Industrial and Environmental Applications, Lecture Notes in Networks Systems, Vol. 531.}, volume = {531}, pages = {423-432}, series = {Lecture Notes in Networks and Systems}, keywords = {deep learning, energy, pattern recognition, time series}, pubstate = {published}, tppubtype = {conference} } |
L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso Nearest neighbors with incremental learning for real-time forecasting of electricity demand (Conference) IEEE International Conference on Data Mining Workshops, 2022. (Links | BibTeX | Tags: energy, IoT, time series) @conference{MelgarICDM2022, title = {Nearest neighbors with incremental learning for real-time forecasting of electricity demand}, author = {L. Melgar-García and D. Gutiérrez-Avilés and C. Rubio-Escudero and A. Troncoso}, url = {https://ieeexplore.ieee.org/document/10031211}, year = {2022}, date = {2022-01-01}, booktitle = {IEEE International Conference on Data Mining Workshops}, keywords = {energy, IoT, time series}, pubstate = {published}, tppubtype = {conference} } |
2021 |
A. Melara and J. F. Torres and A. Troncoso and F. Martínez-Álvarez Electricity Generation Forecasting in Concentrating Solar-Thermal Power Plants with Ensemble Learning (Conference) SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications, 1401 , Advances in Intelligent Systems and Computing 2021. (Links | BibTeX | Tags: deep learning, energy, time series) @conference{MELARA21, title = {Electricity Generation Forecasting in Concentrating Solar-Thermal Power Plants with Ensemble Learning}, author = {A. Melara and J. F. Torres and A. Troncoso and F. Martínez-Álvarez}, doi = {https://doi.org/10.1007/978-3-030-87869-6_63}, year = {2021}, date = {2021-09-01}, booktitle = {SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications}, volume = {1401}, pages = {665-674}, series = {Advances in Intelligent Systems and Computing}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
D. Hadjout and J. F. Torres and A. Sebaa and F. Martínez-Álvarez SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications, 1401 , Advances in Intelligent Systems and Computing 2021. (Links | BibTeX | Tags: deep learning, energy, time series) @conference{HADJOUT21, title = {Medium-Term Electricity Consumption Forecasting in Algeria Based on Clustering, Deep Learning and Bayesian Optimization Methods}, author = {D. Hadjout and J. F. Torres and A. Sebaa and F. Martínez-Álvarez}, doi = {https://doi.org/10.1007/978-3-030-87869-6_70}, year = {2021}, date = {2021-09-01}, booktitle = {SOCO International Conference on Soft Computing Models in Industrial and Environmental Applications}, volume = {1401}, pages = {739-748}, series = {Advances in Intelligent Systems and Computing}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
F. Divina and F. Gómez-Vela and M. García-Torres Advanced Optimization Methods and Big Data Applications in Energy Demand Forecast (Journal Article) Applied Sciences, 11 (3), pp. 1261, 2021. (Links | BibTeX | Tags: energy) @article{divina2021advanced, title = {Advanced Optimization Methods and Big Data Applications in Energy Demand Forecast}, author = {F. Divina and F. Gómez-Vela and M. García-Torres}, url = {https://www.mdpi.com/2076-3417/11/3/1261/htm}, doi = {10.3390/app11031261}, year = {2021}, date = {2021-01-01}, journal = {Applied Sciences}, volume = {11}, number = {3}, pages = {1261}, publisher = {Multidisciplinary Digital Publishing Institute}, keywords = {energy}, pubstate = {published}, tppubtype = {article} } |
J. A. Gallardo and M. García-Torres and F. Gómez-Vela and F. Morales and F. Divina and D. Becerra-Alonso and G. Velázquez and F. Daumas-Ladouce and J. L. Vázquez Noguera and C. Ayala Sauer Forecasting Electricity Consumption Data from Paraguay Using a Machine Learning Approach (Conference) SOCO 16th International Conference on Soft Computing Models in Industrial and Environmental Applications, 1401 , Advances in Intelligent Systems and Computing 2021. (Links | BibTeX | Tags: big data, energy, time series) @conference{gallardo2022forecasting, title = {Forecasting Electricity Consumption Data from Paraguay Using a Machine Learning Approach}, author = {J. A. Gallardo and M. García-Torres and F. Gómez-Vela and F. Morales and F. Divina and D. Becerra-Alonso and G. Velázquez and F. Daumas-Ladouce and J. L. Vázquez Noguera and C. Ayala Sauer}, url = {https://link.springer.com/chapter/10.1007/978-3-030-87869-6_65}, year = {2021}, date = {2021-01-01}, booktitle = {SOCO 16th International Conference on Soft Computing Models in Industrial and Environmental Applications}, volume = {1401}, pages = {685-694}, series = {Advances in Intelligent Systems and Computing}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
2020 |
P. Jiménez-Herrera and L. Melgar-García and G. Asencio-Cortés and A. Troncoso A New Forecasting Algorithm Based on Neighbors for Streaming Electricity Time Series (Conference) HAIS 15th International Conference on Hybrid Artificial Intelligence Systems, Lecture Notes in Computer Science 2020. (Links | BibTeX | Tags: big data, energy, IoT, time series) @conference{HAIS2020, title = {A New Forecasting Algorithm Based on Neighbors for Streaming Electricity Time Series}, author = {P. Jiménez-Herrera and L. Melgar-García and G. Asencio-Cortés and A. Troncoso}, url = {https://link.springer.com/chapter/10.1007/978-3-030-61705-9_43}, year = {2020}, date = {2020-11-04}, booktitle = {HAIS 15th International Conference on Hybrid Artificial Intelligence Systems}, pages = {522-533}, series = {Lecture Notes in Computer Science}, keywords = {big data, energy, IoT, time series}, pubstate = {published}, tppubtype = {conference} } |
Y. Lin and I. Koprinska and M. Rana and A. Troncoso Solar Power Forecasting Based on Pattern Sequence Similarity and Meta-learning (Conference) ICANN 29th International Conference on Artificial Neural Networks, Lecture Notes in Computer Science 2020. (Links | BibTeX | Tags: energy, time series) @conference{ICANN20, title = {Solar Power Forecasting Based on Pattern Sequence Similarity and Meta-learning}, author = {Y. Lin and I. Koprinska and M. Rana and A. Troncoso}, url = {https://link.springer.com/chapter/10.1007/978-3-030-61609-0_22}, year = {2020}, date = {2020-10-14}, booktitle = {ICANN 29th International Conference on Artificial Neural Networks}, pages = {271-283}, series = {Lecture Notes in Computer Science }, keywords = {energy, time series}, pubstate = {published}, tppubtype = {conference} } |
F. Divina and J. F. Torres and M. García-Torres and F. Martínez-Álvarez and A. Troncoso Hybridizing deep learning and neuroevolution: Application to the Spanish short-term electric energy consumption forecasting (Journal Article) Applied Sciences, 10 (16), pp. 5487, 2020. (Abstract | Links | BibTeX | Tags: big data, deep learning, energy, time series) @article{DIVINA2020, title = {Hybridizing deep learning and neuroevolution: Application to the Spanish short-term electric energy consumption forecasting}, author = {F. Divina and J. F. Torres and M. García-Torres and F. Martínez-Álvarez and A. Troncoso}, url = {https://www.mdpi.com/2076-3417/10/16/5487}, doi = {https://doi.org/10.3390/app10165487}, year = {2020}, date = {2020-07-30}, journal = {Applied Sciences}, volume = {10}, number = {16}, pages = {5487}, abstract = {The electric energy production would be much more efficient if accurate estimations of the future demand were available, since these would allow allocating only the resources needed for the production of the right amount of energy required. With this motivation in mind, we propose a strategy, based on neuroevolution, that can be used to this aim. Our proposal uses a genetic algorithm in order to find a sub-optimal set of hyper-parameters for configuring a deep neural network, which can then be used for obtaining the forecasting. Such a strategy is justified by the observation that the performances achieved by deep neural networks are strongly dependent on the right setting of the hyper-parameters, and genetic algorithms have shown excellent search capabilities in huge search spaces. Moreover, we base our proposal on a distributed computing platform, which allows its use on a large time-series. In order to assess the performances of our approach, we have applied it to a large dataset, related to the electric energy consumption registered in Spain over almost 10 years. Experimental results confirm the validity of our proposal since it outperforms all other forecasting techniques to which it has been compared.}, keywords = {big data, deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } The electric energy production would be much more efficient if accurate estimations of the future demand were available, since these would allow allocating only the resources needed for the production of the right amount of energy required. With this motivation in mind, we propose a strategy, based on neuroevolution, that can be used to this aim. Our proposal uses a genetic algorithm in order to find a sub-optimal set of hyper-parameters for configuring a deep neural network, which can then be used for obtaining the forecasting. Such a strategy is justified by the observation that the performances achieved by deep neural networks are strongly dependent on the right setting of the hyper-parameters, and genetic algorithms have shown excellent search capabilities in huge search spaces. Moreover, we base our proposal on a distributed computing platform, which allows its use on a large time-series. In order to assess the performances of our approach, we have applied it to a large dataset, related to the electric energy consumption registered in Spain over almost 10 years. Experimental results confirm the validity of our proposal since it outperforms all other forecasting techniques to which it has been compared. |
F. Martínez-Álvarez and G. Asencio-Cortés and J. F. Torres and D. Gutiérrez-Avilés and L. Melgar-García and R. Pérez-Chacón and C. Rubio-Escudero and A. Troncoso and J. C. Riquelme Coronavirus Optimization Algorithm: A bioinspired metaheuristic based on the COVID-19 propagation model (Journal Article) Big Data, 8 (4), pp. 308-322, 2020. (Abstract | Links | BibTeX | Tags: big data, deep learning, energy, time series) @article{MARTINEZ-ALVAREZ20, title = {Coronavirus Optimization Algorithm: A bioinspired metaheuristic based on the COVID-19 propagation model}, author = {F. Martínez-Álvarez and G. Asencio-Cortés and J. F. Torres and D. Gutiérrez-Avilés and L. Melgar-García and R. Pérez-Chacón and C. Rubio-Escudero and A. Troncoso and J. C. Riquelme}, url = {https://www.liebertpub.com/doi/full/10.1089/big.2020.0051}, doi = {10.1089/big.2020.0051}, year = {2020}, date = {2020-07-22}, journal = {Big Data}, volume = {8}, number = {4}, pages = {308-322}, abstract = {This work proposes a novel bioinspired metaheuristic, simulating how the coronavirus spreads and infects healthy people. From a primary infected individual (patient zero), the coronavirus rapidly infects new victims, creating large populations of infected people who will either die or spread infection. Relevant terms such as reinfection probability, super-spreading rate, social distancing measures or traveling rate are introduced into the model in order to simulate the coronavirus activity as accurately as possible. The infected population initially grows exponentially over time, but taking into consideration social isolation measures, the mortality rate and number of recoveries, the infected population gradually decreases. The Coronavirus Optimization Algorithm has two major advantages when compared to other similar strategies. Firstly, the input parameters are already set according to the disease statistics, preventing researchers from initializing them with arbitrary values. Secondly, the approach has the ability to end after several iterations, without setting this value either. Furthermore, a parallel multi-virus version is proposed, where several coronavirus strains evolve over time and explore wider search space areas in less iterations. Finally, the metaheuristic has been combined with deep learning models, in order to find optimal hyperparameters during the training phase. As application case, the problem of electricity load time series forecasting has been addressed, showing quite remarkable performance.}, keywords = {big data, deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } This work proposes a novel bioinspired metaheuristic, simulating how the coronavirus spreads and infects healthy people. From a primary infected individual (patient zero), the coronavirus rapidly infects new victims, creating large populations of infected people who will either die or spread infection. Relevant terms such as reinfection probability, super-spreading rate, social distancing measures or traveling rate are introduced into the model in order to simulate the coronavirus activity as accurately as possible. The infected population initially grows exponentially over time, but taking into consideration social isolation measures, the mortality rate and number of recoveries, the infected population gradually decreases. The Coronavirus Optimization Algorithm has two major advantages when compared to other similar strategies. Firstly, the input parameters are already set according to the disease statistics, preventing researchers from initializing them with arbitrary values. Secondly, the approach has the ability to end after several iterations, without setting this value either. Furthermore, a parallel multi-virus version is proposed, where several coronavirus strains evolve over time and explore wider search space areas in less iterations. Finally, the metaheuristic has been combined with deep learning models, in order to find optimal hyperparameters during the training phase. As application case, the problem of electricity load time series forecasting has been addressed, showing quite remarkable performance. |
R. Pérez-Chacón and G. Asencio-Cortés and F. Martínez-Álvarez and A. Troncoso Big data time series forecasting based on pattern sequence similarity and its application to the electricity demand (Journal Article) Information Sciences, 540 , pp. 160-174, 2020. (Abstract | Links | BibTeX | Tags: big data, energy, time series) @article{PEREZ20, title = {Big data time series forecasting based on pattern sequence similarity and its application to the electricity demand}, author = {R. Pérez-Chacón and G. Asencio-Cortés and F. Martínez-Álvarez and A. Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S0020025520306010}, doi = {10.1016/j.ins.2020.06.014}, year = {2020}, date = {2020-06-06}, journal = {Information Sciences}, volume = {540}, pages = {160-174}, abstract = {This work proposes a novel algorithm to forecast big data time series. Based on the well-established Pattern Sequence Forecasting algorithm, this new approach has two major contributions to the literature. First, the improvement of the aforementioned algorithm with respect to the accuracy of predictions, and second, its transformation into the big data context, having reached meaningful results in terms of scalability. The algorithm uses the Apache Spark distributed computation framework and it is a ready-to-use application with few parameters to adjust. Physical and cloud clusters have been used to carry out the experimentation, which consisted in applying the algorithm to real-world data from Uruguay electricity demand.}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {article} } This work proposes a novel algorithm to forecast big data time series. Based on the well-established Pattern Sequence Forecasting algorithm, this new approach has two major contributions to the literature. First, the improvement of the aforementioned algorithm with respect to the accuracy of predictions, and second, its transformation into the big data context, having reached meaningful results in terms of scalability. The algorithm uses the Apache Spark distributed computation framework and it is a ready-to-use application with few parameters to adjust. Physical and cloud clusters have been used to carry out the experimentation, which consisted in applying the algorithm to real-world data from Uruguay electricity demand. |
M. Nazeriye and A. Haeri and F. Martínez-Álvarez Analysis of the Impact of Residential Property and Equipment on Building Energy Efficiency and Consumption - A Data Mining Approach (Journal Article) Applied Sciences, 10 (10), pp. 3589, 2020. (Abstract | Links | BibTeX | Tags: energy, time series) @article{NAZERIYE20, title = {Analysis of the Impact of Residential Property and Equipment on Building Energy Efficiency and Consumption - A Data Mining Approach}, author = {M. Nazeriye and A. Haeri and F. Martínez-Álvarez}, url = {https://www.mdpi.com/2076-3417/10/10/3589/}, doi = {https://doi.org/10.3390/app10103589}, year = {2020}, date = {2020-05-22}, journal = {Applied Sciences}, volume = {10}, number = {10}, pages = {3589}, abstract = {Human living could become very difficult due to a lack of energy. The household sector plays a significant role in energy consumption. Trying to optimize and achieve efficient energy consumption can lead to large-scale energy savings. The aim of this paper is to identify the equipment and property affecting energy efficiency and consumption in residential homes. For this purpose, a hybrid data-mining approach based on K-means algorithms and decision trees is presented. To analyze the approach, data is modeled once using the approach and then without it. A data set of residential homes of England and Wales is arranged in low, medium and high consumption clusters. The C5.0 algorithm is run on each cluster to extract factors affecting energy efficiency. The comparison of the modeling results, and also their accuracy, prove that the approach employed has the ability to extract the findings with greater accuracy and detail than in other cases. The installation of boilers, using cavity walls, and installing insulation could improve energy efficiency. Old homes and the usage of economy 7 electricity have an unfavorable effect on energy efficiency, but the approach shows that each cluster behaved differently in these factors related to energy efficiency and has unique results}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } Human living could become very difficult due to a lack of energy. The household sector plays a significant role in energy consumption. Trying to optimize and achieve efficient energy consumption can lead to large-scale energy savings. The aim of this paper is to identify the equipment and property affecting energy efficiency and consumption in residential homes. For this purpose, a hybrid data-mining approach based on K-means algorithms and decision trees is presented. To analyze the approach, data is modeled once using the approach and then without it. A data set of residential homes of England and Wales is arranged in low, medium and high consumption clusters. The C5.0 algorithm is run on each cluster to extract factors affecting energy efficiency. The comparison of the modeling results, and also their accuracy, prove that the approach employed has the ability to extract the findings with greater accuracy and detail than in other cases. The installation of boilers, using cavity walls, and installing insulation could improve energy efficiency. Old homes and the usage of economy 7 electricity have an unfavorable effect on energy efficiency, but the approach shows that each cluster behaved differently in these factors related to energy efficiency and has unique results |
Ó. Trull and J.C. García-Díaz and A. Troncoso Initialization methods for multiple seasonal Holt–Winters forecasting models (Journal Article) Mathematics, 8 (2), pp. 268, 2020. (Links | BibTeX | Tags: energy, time series) @article{TRULL20a, title = {Initialization methods for multiple seasonal Holt–Winters forecasting models}, author = {Ó. Trull and J.C. García-Díaz and A. Troncoso}, doi = {10.3390/math8020268 }, year = {2020}, date = {2020-01-01}, journal = {Mathematics}, volume = {8}, number = {2}, pages = {268}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } |
Óscar Trull and J. Carlos García-Díaz and A. Troncoso Stability of Multiple Seasonal Holt-Winters Models Applied to Hourly Electricity Demand in Spain (Journal Article) Applied Sciences, 10 (7), pp. 2630, 2020. (Links | BibTeX | Tags: energy, time series) @article{Trull20b, title = {Stability of Multiple Seasonal Holt-Winters Models Applied to Hourly Electricity Demand in Spain}, author = {Óscar Trull and J. Carlos García-Díaz and A. Troncoso}, doi = {10.3390/app10072630}, year = {2020}, date = {2020-01-01}, journal = {Applied Sciences}, volume = {10}, number = {7}, pages = {2630}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } |
2019 |
C. Gómez-Quiles and G. Asencio-Cortés and A. Gastalver-Rubio and F. Martínez-Álvarez and A. Troncoso and J. Manresa and J. C. Riquelme and J. M. Riquelme A novel ensemble method for electric vehicle power consumption forecasting: application to the Spanish system (Journal Article) IEEE Access, 7 , pp. 120840-120856, 2019. (Links | BibTeX | Tags: energy, time series) @article{GOMEZ19, title = {A novel ensemble method for electric vehicle power consumption forecasting: application to the Spanish system}, author = {C. Gómez-Quiles and G. Asencio-Cortés and A. Gastalver-Rubio and F. Martínez-Álvarez and A. Troncoso and J. Manresa and J. C. Riquelme and J. M. Riquelme}, url = {https://ieeexplore.ieee.org/document/8807120}, doi = {https://doi.org/10.1109/ACCESS.2019.2936478}, year = {2019}, date = {2019-08-01}, journal = {IEEE Access}, volume = {7}, pages = {120840-120856}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } |
J. F. Torres and D. Gutiérrez-Avilés and A. Troncoso and F. Martínez-Álvarez Random Hyper-Parameter Search-Based Deep Neural Network for Power Consumption Forecasting (Conference) IWANN 15th International Work-Conference on Artificial Neural Networks, 11506 , Lecture Notes in Computer Science 2019. (Links | BibTeX | Tags: deep learning, energy, time series) @conference{TORRES19-2, title = {Random Hyper-Parameter Search-Based Deep Neural Network for Power Consumption Forecasting}, author = {J. F. Torres and D. Gutiérrez-Avilés and A. Troncoso and F. Martínez-Álvarez}, url = {https://link.springer.com/chapter/10.1007/978-3-030-20521-8_22}, doi = {https://doi.org/10.1007/978-3-030-20521-8_22}, year = {2019}, date = {2019-05-16}, booktitle = {IWANN 15th International Work-Conference on Artificial Neural Networks}, volume = {11506}, pages = {259-269}, series = {Lecture Notes in Computer Science}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
J. F. Torres and A. Troncoso and I. Koprinska and Z. Wang and F. Martínez-Álvarez Big data solar power forecasting based on deep learning and multiple data sources (Journal Article) Expert Systems, 36 , pp. id12394, 2019. (Links | BibTeX | Tags: deep learning, energy, time series) @article{TORRES19-1, title = {Big data solar power forecasting based on deep learning and multiple data sources}, author = {J. F. Torres and A. Troncoso and I. Koprinska and Z. Wang and F. Martínez-Álvarez}, url = {https://onlinelibrary.wiley.com/doi/abs/10.1111/exsy.12394}, doi = {https://doi.org/10.1111/exsy.12394}, year = {2019}, date = {2019-03-01}, journal = {Expert Systems}, volume = {36}, pages = {id12394}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } |
R. Talavera-Llames and R. Pérez-Chacón and A. Troncoso and F. Martínez-Álvarez MV-kWNN: A novel multivariate and multi-output weighted nearest neighbors algorithm for big data time series forecasting (Journal Article) Neurocomputing, 353 , pp. 56-73, 2019. (Abstract | Links | BibTeX | Tags: big data, energy, time series) @article{NEUCOM2019, title = {MV-kWNN: A novel multivariate and multi-output weighted nearest neighbors algorithm for big data time series forecasting}, author = {R. Talavera-Llames and R. Pérez-Chacón and A. Troncoso and F. Martínez-Álvarez}, url = {https://www.sciencedirect.com/science/article/pii/S0925231219303236?via%3Dihub}, doi = {10.1016/j.neucom.2018.07.092}, year = {2019}, date = {2019-01-01}, journal = {Neurocomputing}, volume = {353}, pages = {56-73}, abstract = {This paper introduces a novel algorithm for big data time series forecasting. Its main novelty lies in its ability to deal with multivariate data, i.e. to consider multiple time series simultaneously, in order to make multi-output predictions. Real-world processes are typically characterised by several interrelated variables, and the future occurrence of certain time series cannot be explained without understanding the influence that other time series might have on the target time series. One key issue in the context of the multivariate analysis is to determine a priori whether exogenous variables must be included in the model or not. To deal with this, a correlation analysis is used to find a minimum correlation threshold that an exogenous time series must exhibit, in order to be beneficial. Furthermore, the proposed approach has been specifically designed to be used in the context of big data, thus making it possible to efficiently process very large time series. To evaluate the performance of the proposed approach we use data from Spanish electricity prices. Results have been compared to other multivariate approaches showing remarkable improvements both in terms of accuracy and execution time.}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {article} } This paper introduces a novel algorithm for big data time series forecasting. Its main novelty lies in its ability to deal with multivariate data, i.e. to consider multiple time series simultaneously, in order to make multi-output predictions. Real-world processes are typically characterised by several interrelated variables, and the future occurrence of certain time series cannot be explained without understanding the influence that other time series might have on the target time series. One key issue in the context of the multivariate analysis is to determine a priori whether exogenous variables must be included in the model or not. To deal with this, a correlation analysis is used to find a minimum correlation threshold that an exogenous time series must exhibit, in order to be beneficial. Furthermore, the proposed approach has been specifically designed to be used in the context of big data, thus making it possible to efficiently process very large time series. To evaluate the performance of the proposed approach we use data from Spanish electricity prices. Results have been compared to other multivariate approaches showing remarkable improvements both in terms of accuracy and execution time. |
F. Martinez-Alvarez and A. Schmutz and G. Asencio-Cortes and J. Jacques A Novel Hybrid Algorithm to Forecast Functional Time Series Based on Pattern Sequence Similarity with Application to Electricity Demand (Journal Article) Energies, 12 (94), pp. 1-18, 2019, ISSN: 1996-1073. (Abstract | Links | BibTeX | Tags: energy, time series) @article{en12010094b, title = {A Novel Hybrid Algorithm to Forecast Functional Time Series Based on Pattern Sequence Similarity with Application to Electricity Demand}, author = {F. Martinez-Alvarez and A. Schmutz and G. Asencio-Cortes and J. Jacques}, url = {http://www.mdpi.com/1996-1073/12/1/94}, doi = {10.3390/en12010094}, issn = {1996-1073}, year = {2019}, date = {2019-01-01}, journal = {Energies}, volume = {12}, number = {94}, pages = {1-18}, abstract = {The forecasting of future values is a very challenging task. In almost all scientific disciplines, the analysis of time series provides useful information and even economic benefits. In this context, this paper proposes a novel hybrid algorithm to forecast functional time series with arbitrary prediction horizons. It integrates a well-known clustering functional data algorithm into a forecasting strategy based on pattern sequence similarity, which was originally developed for discrete time series. The new approach assumes that some patterns are repeated over time, and it attempts to discover them and evaluate their immediate future. Hence, the algorithm first applies a clustering functional time series algorithm, i.e., it assigns labels to every data unit (it may represent either one hour, or one day, or any arbitrary length). As a result, the time series is transformed into a sequence of labels. Later, it retrieves the sequence of labels occurring just after the sample that we want to be forecasted. This sequence is searched for within the historical data, and every time it is found, the sample immediately after is stored. Once the searching process is terminated, the output is generated by weighting all stored data. The performance of the approach has been tested on real-world datasets related to electricity demand and compared to other existing methods, reporting very promising results. Finally, a statistical significance test has been carried out to confirm the suitability of the election of the compared methods. In conclusion, a novel algorithm to forecast functional time series is proposed with very satisfactory results when assessed in the context of electricity demand.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } The forecasting of future values is a very challenging task. In almost all scientific disciplines, the analysis of time series provides useful information and even economic benefits. In this context, this paper proposes a novel hybrid algorithm to forecast functional time series with arbitrary prediction horizons. It integrates a well-known clustering functional data algorithm into a forecasting strategy based on pattern sequence similarity, which was originally developed for discrete time series. The new approach assumes that some patterns are repeated over time, and it attempts to discover them and evaluate their immediate future. Hence, the algorithm first applies a clustering functional time series algorithm, i.e., it assigns labels to every data unit (it may represent either one hour, or one day, or any arbitrary length). As a result, the time series is transformed into a sequence of labels. Later, it retrieves the sequence of labels occurring just after the sample that we want to be forecasted. This sequence is searched for within the historical data, and every time it is found, the sample immediately after is stored. Once the searching process is terminated, the output is generated by weighting all stored data. The performance of the approach has been tested on real-world datasets related to electricity demand and compared to other existing methods, reporting very promising results. Finally, a statistical significance test has been carried out to confirm the suitability of the election of the compared methods. In conclusion, a novel algorithm to forecast functional time series is proposed with very satisfactory results when assessed in the context of electricity demand. |
Y. Lin and I. Koprinska and M. Rana and A. Troncoso Pattern Sequence Neural Network for Solar Power Forecasting (Conference) ICONIP 26th International Conference on Neural Information Processing, 2019. (BibTeX | Tags: energy, time series) @conference{ICONIP19, title = {Pattern Sequence Neural Network for Solar Power Forecasting}, author = {Y. Lin and I. Koprinska and M. Rana and A. Troncoso}, year = {2019}, date = {2019-01-01}, booktitle = {ICONIP 26th International Conference on Neural Information Processing}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {conference} } |
Ó. Trull and J. C. García-Díaz and A. Troncoso Application of Discrete-Interval Moving Seasonalities to Spanish Electricity Demand Forecasting during Easter (Journal Article) Energies, 12 (6), pp. 1083, 2019. (Abstract | Links | BibTeX | Tags: energy, time series) @article{Energies2019, title = {Application of Discrete-Interval Moving Seasonalities to Spanish Electricity Demand Forecasting during Easter}, author = {Ó. Trull and J. C. García-Díaz and A. Troncoso }, url = {https://www.mdpi.com/1996-1073/12/6/1083}, doi = {10.3390/en12061083}, year = {2019}, date = {2019-01-01}, journal = {Energies}, volume = {12}, number = {6}, pages = {1083}, abstract = {Forecasting electricity demand through time series is a tool used by transmission system operators to establish future operating conditions. The accuracy of these forecasts is essential for the precise development of activity. However, the accuracy of the forecasts is enormously subject to the calendar effect. The multiple seasonal Holt–Winters models are widely used due to the great precision and simplicity that they offer. Usually, these models relate this calendar effect to external variables that contribute to modification of their forecasts a posteriori. In this work, a new point of view is presented, where the calendar effect constitutes a built-in part of the Holt–Winters model. In particular, the proposed model incorporates discrete-interval moving seasonalities. Moreover, a clear example of the application of this methodology to situations that are difficult to treat, such as the days of Easter, is presented. The results show that the proposed model performs well, outperforming the regular Holt–Winters model and other methods such as artificial neural networks and Exponential Smoothing State Space Model with Box-Cox Transformation, ARMA Errors, Trend and Seasonal Components (TBATS) methods.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } Forecasting electricity demand through time series is a tool used by transmission system operators to establish future operating conditions. The accuracy of these forecasts is essential for the precise development of activity. However, the accuracy of the forecasts is enormously subject to the calendar effect. The multiple seasonal Holt–Winters models are widely used due to the great precision and simplicity that they offer. Usually, these models relate this calendar effect to external variables that contribute to modification of their forecasts a posteriori. In this work, a new point of view is presented, where the calendar effect constitutes a built-in part of the Holt–Winters model. In particular, the proposed model incorporates discrete-interval moving seasonalities. Moreover, a clear example of the application of this methodology to situations that are difficult to treat, such as the days of Easter, is presented. The results show that the proposed model performs well, outperforming the regular Holt–Winters model and other methods such as artificial neural networks and Exponential Smoothing State Space Model with Box-Cox Transformation, ARMA Errors, Trend and Seasonal Components (TBATS) methods. |
F. Divina and M. García-Torres and F. Goméz-Vela and J.L. Vázquez Noguera A Comparative Study of Time Series Forecasting Methods for Short Term Electric Energy Consumption Prediction in Smart Buildings (Journal Article) Applied Sciences, 12 (10), pp. 1934, 2019. (Abstract | Links | BibTeX | Tags: energy, time series) @article{Energies2019b, title = {A Comparative Study of Time Series Forecasting Methods for Short Term Electric Energy Consumption Prediction in Smart Buildings}, author = {F. Divina and M. García-Torres and F. Goméz-Vela and J.L. Vázquez Noguera}, url = {https://www.mdpi.com/1996-1073/12/10/1934}, doi = {https://doi.org/10.3390/en12101934}, year = {2019}, date = {2019-01-01}, journal = {Applied Sciences}, volume = {12}, number = {10}, pages = {1934}, abstract = {Smart buildings are equipped with sensors that allow monitoring a range of building systems including heating and air conditioning, lighting and the general electric energy consumption. Thees data can then be stored and analyzed. The ability to use historical data regarding electric energy consumption could allow improving the energy efficiency of such buildings, as well as help to spot problems related to wasting of energy. This problem is even more important when considering that buildings are some of the largest consumers of energy. In this paper, we are interested in forecasting the energy consumption of smart buildings, and, to this aim, we propose a comparative study of different forecasting strategies that can be used to this aim. To do this, we used the data regarding the electric consumption registered by thirteen buildings located in a university campus in the south of Spain. The empirical comparison of the selected methods on the different data showed that some methods are more suitable than others for this kind of problem. In particular, we show that strategies based on Machine Learning approaches seem to be more suitable for this task.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } Smart buildings are equipped with sensors that allow monitoring a range of building systems including heating and air conditioning, lighting and the general electric energy consumption. Thees data can then be stored and analyzed. The ability to use historical data regarding electric energy consumption could allow improving the energy efficiency of such buildings, as well as help to spot problems related to wasting of energy. This problem is even more important when considering that buildings are some of the largest consumers of energy. In this paper, we are interested in forecasting the energy consumption of smart buildings, and, to this aim, we propose a comparative study of different forecasting strategies that can be used to this aim. To do this, we used the data regarding the electric consumption registered by thirteen buildings located in a university campus in the south of Spain. The empirical comparison of the selected methods on the different data showed that some methods are more suitable than others for this kind of problem. In particular, we show that strategies based on Machine Learning approaches seem to be more suitable for this task. |
2018 |
R. Pérez-Chacón and J. M. Luna and A. Troncoso and F. Martínez-Álvarez and J. C. Riquelme Big data analytics for discovering electricity consumption patterns in smart cities (Journal Article) Energies, 11 (3), pp. 683, 2018. (Abstract | Links | BibTeX | Tags: big data, energy, time series) @article{Energies2018, title = {Big data analytics for discovering electricity consumption patterns in smart cities}, author = {R. Pérez-Chacón and J. M. Luna and A. Troncoso and F. Martínez-Álvarez and J. C. Riquelme}, url = {http://www.mdpi.com/1996-1073/11/3/683 }, doi = {10.3390/en11030683 }, year = {2018}, date = {2018-01-01}, journal = {Energies}, volume = {11}, number = {3}, pages = {683}, abstract = {New technologies such as sensor networks have been incorporated into the management of buildings for organizations and cities. Sensor networks have led to an exponential increase in the volume of data available in recent years, which can be used to extract consumption patterns for the purposes of energy and monetary savings. For this reason, new approaches and strategies are needed to analyze information in big data environments. This paper proposes a methodology to extract electric energy consumption patterns in big data time series, so that very valuable conclusions can be made for managers and governments. The methodology is based on the study of four clustering validity indices in their parallelized versions along with the application of a clustering technique. In particular, this work uses a voting system to choose an optimal number of clusters from the results of the indices, as well as the application of the distributed version of the k-means algorithm included in Apache Spark’s Machine Learning Library. The results, using electricity consumption for the years 2011–2017 for eight buildings of a public university, are presented and discussed. In addition, the performance of the proposed methodology is evaluated using synthetic big data, which cab represent thousands of buildings in a smart city. Finally, policies derived from the patterns discovered are proposed to optimize energy usage across the university campus.}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {article} } New technologies such as sensor networks have been incorporated into the management of buildings for organizations and cities. Sensor networks have led to an exponential increase in the volume of data available in recent years, which can be used to extract consumption patterns for the purposes of energy and monetary savings. For this reason, new approaches and strategies are needed to analyze information in big data environments. This paper proposes a methodology to extract electric energy consumption patterns in big data time series, so that very valuable conclusions can be made for managers and governments. The methodology is based on the study of four clustering validity indices in their parallelized versions along with the application of a clustering technique. In particular, this work uses a voting system to choose an optimal number of clusters from the results of the indices, as well as the application of the distributed version of the k-means algorithm included in Apache Spark’s Machine Learning Library. The results, using electricity consumption for the years 2011–2017 for eight buildings of a public university, are presented and discussed. In addition, the performance of the proposed methodology is evaluated using synthetic big data, which cab represent thousands of buildings in a smart city. Finally, policies derived from the patterns discovered are proposed to optimize energy usage across the university campus. |
A. Galicia and J. F. Torres and F. Martínez-Álvarez and A. Troncoso A novel Spark-based multi-step forecasting algorithm for big data time series (Journal Article) Information Sciences, 467 , pp. 800-818, 2018. (Abstract | Links | BibTeX | Tags: big data, energy, time series) @article{INFSCI2018, title = {A novel Spark-based multi-step forecasting algorithm for big data time series}, author = {A. Galicia and J. F. Torres and F. Martínez-Álvarez and A. Troncoso}, url = {https://www.sciencedirect.com/science/article/pii/S0020025518304493}, doi = {10.1016/j.ins.2018.06.010}, year = {2018}, date = {2018-01-01}, journal = {Information Sciences}, volume = {467}, pages = {800-818}, abstract = {This paper presents different scalable methods for predicting big time series, namely time series with a high frequency measurement. Methods are also developed to deal with arbitrary prediction horizons. The Apache Spark framework is proposed for distributed computing in order to achieve the scalability of the methods. Prediction methods have been developed using Spark’s MLlib library for machine learning. Since the library does not support multivariate regression, the prediction problem is formulated as h prediction sub-problems, where h is the number of future values to predict, that is, the prediction horizon. Furthermore, different kinds of representative methods have been chosen, such as decision trees, two tree-based ensemble techniques (Gradient-Boosted and Random Forest) and a linear regression method as a reference method for comparisons. Finally, the methodology has been tested in a real time series of electrical demand in Spain, with a time interval of ten minutes between measurements.}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {article} } This paper presents different scalable methods for predicting big time series, namely time series with a high frequency measurement. Methods are also developed to deal with arbitrary prediction horizons. The Apache Spark framework is proposed for distributed computing in order to achieve the scalability of the methods. Prediction methods have been developed using Spark’s MLlib library for machine learning. Since the library does not support multivariate regression, the prediction problem is formulated as h prediction sub-problems, where h is the number of future values to predict, that is, the prediction horizon. Furthermore, different kinds of representative methods have been chosen, such as decision trees, two tree-based ensemble techniques (Gradient-Boosted and Random Forest) and a linear regression method as a reference method for comparisons. Finally, the methodology has been tested in a real time series of electrical demand in Spain, with a time interval of ten minutes between measurements. |
R. Talavera-Llames and R. Pérez-Chacón and A. Troncoso and F. Martínez-Álvarez Big data time series forecasting based on nearest neighbors distributed computing with Spark (Journal Article) Knowledge-Based Systems, 161 (1), pp. 12-25, 2018. (Abstract | Links | BibTeX | Tags: big data, energy, time series) @article{KNOSYS2018b, title = {Big data time series forecasting based on nearest neighbors distributed computing with Spark}, author = {R. Talavera-Llames and R. Pérez-Chacón and A. Troncoso and F. Martínez-Álvarez}, url = {https://www.sciencedirect.com/science/article/pii/S0950705118303770}, doi = {10.1016/j.knosys.2018.07.026}, year = {2018}, date = {2018-01-01}, journal = {Knowledge-Based Systems}, volume = {161}, number = {1}, pages = {12-25}, abstract = {A new approach for big data forecasting based on the k-weighted nearest neighbours algorithm is introduced in this work. Such an algorithm has been developed for distributed computing under the Apache Spark framework. Every phase of the algorithm is explained in this work, along with how the optimal values of the input parameters required for the algorithm are obtained. In order to test the developed algorithm, a Spanish energy consumption big data time series has been used. The accuracy of the prediction has been assessed showing remarkable results. Additionally, the optimal configuration of a Spark cluster has been discussed. Finally, a scalability analysis of the algorithm has been conducted leading to the conclusion that the proposed algorithm is highly suitable for big data environments.}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {article} } A new approach for big data forecasting based on the k-weighted nearest neighbours algorithm is introduced in this work. Such an algorithm has been developed for distributed computing under the Apache Spark framework. Every phase of the algorithm is explained in this work, along with how the optimal values of the input parameters required for the algorithm are obtained. In order to test the developed algorithm, a Spanish energy consumption big data time series has been used. The accuracy of the prediction has been assessed showing remarkable results. Additionally, the optimal configuration of a Spark cluster has been discussed. Finally, a scalability analysis of the algorithm has been conducted leading to the conclusion that the proposed algorithm is highly suitable for big data environments. |
J. F. Torres and A. Galicia and A. Troncoso and F. Martínez-Álvarez A scalable approach based on deep learning for big data time series forecasting (Journal Article) Integrated Computer-Aided Engineering, 25 (4), pp. 335-348, 2018. (Abstract | Links | BibTeX | Tags: deep learning, energy, time series) @article{ICAE2018, title = {A scalable approach based on deep learning for big data time series forecasting}, author = {J. F. Torres and A. Galicia and A. Troncoso and F. Martínez-Álvarez}, url = {https://content.iospress.com/articles/integrated-computer-aided-engineering/ica580}, doi = {10.3233/ICA-180580}, year = {2018}, date = {2018-01-01}, journal = {Integrated Computer-Aided Engineering}, volume = {25}, number = {4}, pages = {335-348}, abstract = {This paper presents a method based on deep learning to deal with big data times series forecasting. The deep feed forward neural network provided by the H2O big data analysis framework has been used along with the Apache Spark platform for distributed computing. Since H2O does not allow the conduction of multi-step regression, a general-purpose methodology that can be used for prediction horizons with arbitrary length is proposed here, being the prediction horizon, h, the number of future values to be predicted. The solution consists in splitting the problem into h forecasting subproblems, being h the number of samples to be simultaneously predicted. Thus, the best prediction model for each subproblem can be obtained, making easier its parallelization and adaptation to the big data context. Moreover, a grid search is carried out to obtain the optimal hyperparameters of the deep learning-based approach. Results from a real-world dataset composed of electricity consumption in Spain, with a ten-minute frequency sampling rate, from 2007 to 2016 are reported. In particular, the accuracy and runtimes versus computing resources and size of the dataset are analyzed. Finally, the performance and the scalability of the proposed method is compared to other recently published techniques, showing to be a suitable method to process big data time series.}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {article} } This paper presents a method based on deep learning to deal with big data times series forecasting. The deep feed forward neural network provided by the H2O big data analysis framework has been used along with the Apache Spark platform for distributed computing. Since H2O does not allow the conduction of multi-step regression, a general-purpose methodology that can be used for prediction horizons with arbitrary length is proposed here, being the prediction horizon, h, the number of future values to be predicted. The solution consists in splitting the problem into h forecasting subproblems, being h the number of samples to be simultaneously predicted. Thus, the best prediction model for each subproblem can be obtained, making easier its parallelization and adaptation to the big data context. Moreover, a grid search is carried out to obtain the optimal hyperparameters of the deep learning-based approach. Results from a real-world dataset composed of electricity consumption in Spain, with a ten-minute frequency sampling rate, from 2007 to 2016 are reported. In particular, the accuracy and runtimes versus computing resources and size of the dataset are analyzed. Finally, the performance and the scalability of the proposed method is compared to other recently published techniques, showing to be a suitable method to process big data time series. |
D. Gutiérrez-Avilés and J. A. Fábregas and J. Tejedor and F. Martínez-Álvarez and A. Troncoso and J. C. Riquelme SmartFD: A real big data application for electrical fraud detection (Conference) HAIS 13th International Conference on Hybrid Artificial Intelligence Systems, Lecture Notes in Computer Science 2018. (Links | BibTeX | Tags: big data, energy) @conference{HAIS2018, title = {SmartFD: A real big data application for electrical fraud detection}, author = {D. Gutiérrez-Avilés and J. A. Fábregas and J. Tejedor and F. Martínez-Álvarez and A. Troncoso and J. C. Riquelme}, url = {https://link.springer.com/chapter/10.1007/978-3-319-92639-1_11}, year = {2018}, date = {2018-01-01}, booktitle = {HAIS 13th International Conference on Hybrid Artificial Intelligence Systems}, series = {Lecture Notes in Computer Science}, keywords = {big data, energy}, pubstate = {published}, tppubtype = {conference} } |
J. F. Torres and A. Troncoso and I. Koprinska and Z. Wang and F. Martínez-Álvarez Deep learning for big data time series forecasting applied to solar power (Conference) SOCO 13th International Conference on Soft Computing Models in Industrial and Environmental Applications, Advances in Intelligent Systems and Computing 2018. (Links | BibTeX | Tags: deep learning, energy, time series) @conference{SOCO2018, title = {Deep learning for big data time series forecasting applied to solar power}, author = {J. F. Torres and A. Troncoso and I. Koprinska and Z. Wang and F. Martínez-Álvarez}, url = {https://link.springer.com/chapter/10.1007/978-3-319-94120-2_12}, year = {2018}, date = {2018-01-01}, booktitle = {SOCO 13th International Conference on Soft Computing Models in Industrial and Environmental Applications}, series = {Advances in Intelligent Systems and Computing}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
Z. Wang and I. Koprinska and A. Troncoso and F. Martínez-Álvarez Static and dinamic ensembles of neural networks for power solar forecasting (Conference) IJCNN International Joint Conference on Neural Networks, 2018. (BibTeX | Tags: energy, time series) @conference{IJCNN2018, title = {Static and dinamic ensembles of neural networks for power solar forecasting}, author = {Z. Wang and I. Koprinska and A. Troncoso and F. Martínez-Álvarez}, year = {2018}, date = {2018-01-01}, booktitle = {IJCNN International Joint Conference on Neural Networks}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {conference} } |
F. Martínez-Álvarez and A. Troncoso and J. C. Riquelme Data Science and Big Data in Energy Forecasting (Journal Article) Energies, 11 (11), pp. 3224, 2018. (Links | BibTeX | Tags: big data, energy) @article{Martinez18, title = {Data Science and Big Data in Energy Forecasting}, author = {F. Martínez-Álvarez and A. Troncoso and J. C. Riquelme}, doi = {10.3390/en11113224}, year = {2018}, date = {2018-01-01}, journal = {Energies}, volume = {11}, number = {11}, pages = {3224}, keywords = {big data, energy}, pubstate = {published}, tppubtype = {article} } |
F. Divina and A. Gilson and F. Goméz-Vela and M. García-Torres and J. F. Torres Stacking ensemble learning for short-term electricity consumption forecasting (Journal Article) Energies, 11 (4), pp. 949, 2018. (Abstract | Links | BibTeX | Tags: energy, time series) @article{Energy2018, title = {Stacking ensemble learning for short-term electricity consumption forecasting}, author = {F. Divina and A. Gilson and F. Goméz-Vela and M. García-Torres and J. F. Torres}, url = {https://www.mdpi.com/1996-1073/11/4/949}, doi = {https://doi.org/10.3390/en11040949}, year = {2018}, date = {2018-01-01}, journal = {Energies}, volume = {11}, number = {4}, pages = {949}, abstract = {The ability to predict short-term electric energy demand would provide several benefits, both at the economic and environmental level. For example, it would allow for an efficient use of resources in order to face the actual demand, reducing the costs associated to the production as well as the emission of CO 2 . To this aim, in this paper we propose a strategy based on ensemble learning in order to tackle the short-term load forecasting problem. In particular, our approach is based on a stacking ensemble learning scheme, where the predictions produced by three base learning methods are used by a top level method in order to produce final predictions. We tested the proposed scheme on a dataset reporting the energy consumption in Spain over more than nine years. The obtained experimental results show that an approach for short-term electricity consumption forecasting based on ensemble learning can help in combining predictions produced by weaker learning methods in order to obtain superior results. In particular, the system produces a lower error with respect to the existing state-of-the art techniques used on the same dataset. More importantly, this case study has shown that using an ensemble scheme can achieve very accurate predictions, and thus that it is a suitable approach for addressing the short-term load forecasting problem.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } The ability to predict short-term electric energy demand would provide several benefits, both at the economic and environmental level. For example, it would allow for an efficient use of resources in order to face the actual demand, reducing the costs associated to the production as well as the emission of CO 2 . To this aim, in this paper we propose a strategy based on ensemble learning in order to tackle the short-term load forecasting problem. In particular, our approach is based on a stacking ensemble learning scheme, where the predictions produced by three base learning methods are used by a top level method in order to produce final predictions. We tested the proposed scheme on a dataset reporting the energy consumption in Spain over more than nine years. The obtained experimental results show that an approach for short-term electricity consumption forecasting based on ensemble learning can help in combining predictions produced by weaker learning methods in order to obtain superior results. In particular, the system produces a lower error with respect to the existing state-of-the art techniques used on the same dataset. More importantly, this case study has shown that using an ensemble scheme can achieve very accurate predictions, and thus that it is a suitable approach for addressing the short-term load forecasting problem. |
2017 |
J. F. Torres and A. M. Fernández and A. Troncoso and F. Martínez-Álvarez Deep Learning - Based Approach for Time Series Forecasting with Application to Electricity Load (Conference) IWINAC International Work-Conference on the Interplay Between Natural and Artificial Computation, Lecture Notes in computer Science 2017. (Abstract | Links | BibTeX | Tags: deep learning, energy, time series) @conference{IWINAC2017, title = {Deep Learning - Based Approach for Time Series Forecasting with Application to Electricity Load}, author = {J. F. Torres and A. M. Fernández and A. Troncoso and F. Martínez-Álvarez}, url = {https://link.springer.com/chapter/10.1007/978-3-319-59773-7_21}, year = {2017}, date = {2017-01-01}, booktitle = {IWINAC International Work-Conference on the Interplay Between Natural and Artificial Computation}, series = {Lecture Notes in computer Science}, abstract = {This paper presents a novel method to predict times series using deep learning. In particular, the method can be used for arbitrary time horizons, dividing each predicted sample into a single problem. This fact allows easy parallelization and adaptation to the big data context. Deep learning implementation in H2O library is used for each subproblem. However, H2O does not permit multi-step regression, therefore the solution proposed consists in splitting into h forecasting subproblems, being h the number of samples to be predicted, and, each of one has been separately studied, getting the best prediction model for each subproblem. Additionally, Apache Spark is used to load in memory large datasets and speed up the execution time. This methodology has been tested on a real-world dataset composed of electricity consumption in Spain, with a ten minute frequency sampling rate, from 2007 to 2016. Reported results exhibit errors less than 2%.}, keywords = {deep learning, energy, time series}, pubstate = {published}, tppubtype = {conference} } This paper presents a novel method to predict times series using deep learning. In particular, the method can be used for arbitrary time horizons, dividing each predicted sample into a single problem. This fact allows easy parallelization and adaptation to the big data context. Deep learning implementation in H2O library is used for each subproblem. However, H2O does not permit multi-step regression, therefore the solution proposed consists in splitting into h forecasting subproblems, being h the number of samples to be predicted, and, each of one has been separately studied, getting the best prediction model for each subproblem. Additionally, Apache Spark is used to load in memory large datasets and speed up the execution time. This methodology has been tested on a real-world dataset composed of electricity consumption in Spain, with a ten minute frequency sampling rate, from 2007 to 2016. Reported results exhibit errors less than 2%. |
A. Galicia and J. F. Torres and F. Martínez-Álvarez and A. Troncoso Scalable Forecasting Techniques Applied to Big Electricity Time Series (Conference) IWANN International Work-Conference on Artificial Neural Networks, Lecture Notes in Computer Science 2017. (Links | BibTeX | Tags: big data, energy, time series) @conference{IWANN2017, title = {Scalable Forecasting Techniques Applied to Big Electricity Time Series}, author = {A. Galicia and J. F. Torres and F. Martínez-Álvarez and A. Troncoso}, url = {https://link.springer.com/chapter/10.1007/978-3-319-59147-6_15}, year = {2017}, date = {2017-01-01}, booktitle = {IWANN International Work-Conference on Artificial Neural Networks}, series = {Lecture Notes in Computer Science}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
F. Martínez-Álvarez and A. Troncoso and J. C. Riquelme Recent Advances in energy Time Series Forecasting (Journal Article) Energies, 10 (6), pp. 809, 2017. (Abstract | Links | BibTeX | Tags: energy, time series) @article{Energies2017, title = {Recent Advances in energy Time Series Forecasting}, author = {F. Martínez-Álvarez and A. Troncoso and J. C. Riquelme}, url = {http://www.mdpi.com/1996-1073/10/6/809}, doi = {10.3390/en10060809}, year = {2017}, date = {2017-01-01}, journal = {Energies}, volume = {10}, number = {6}, pages = {809}, abstract = {This editorial summarizes the performance of the special issue entitled Energy Time Series Forecasting, which was published in MDPI’s Energies journal. The special issue took place in 2016 and accepted a total of 21 papers from twelve different countries. Electrical, solar, or wind energy forecasting were the most analyzed topics, introducing brand new methods with very sound results.}, keywords = {energy, time series}, pubstate = {published}, tppubtype = {article} } This editorial summarizes the performance of the special issue entitled Energy Time Series Forecasting, which was published in MDPI’s Energies journal. The special issue took place in 2016 and accepted a total of 21 papers from twelve different countries. Electrical, solar, or wind energy forecasting were the most analyzed topics, introducing brand new methods with very sound results. |
2016 |
R. Talavera-Llames and R. Pérez-Chacón and M. Martínez-Ballesteros and A. Troncoso and F. Martínez-Álvarez A Nearest Neighbours - Based Algorithm for Big Time Series Data Forecasting (Conference) HAIS 11th International Conference on Hybrid Artificial Intelligence Systems, Lecture Note in Computer Science 2016. (Links | BibTeX | Tags: big data, energy, time series) @conference{HAIS2016b, title = {A Nearest Neighbours - Based Algorithm for Big Time Series Data Forecasting}, author = {R. Talavera-Llames and R. Pérez-Chacón and M. Martínez-Ballesteros and A. Troncoso and F. Martínez-Álvarez}, url = {https://link.springer.com/chapter/10.1007/978-3-319-32034-2_15}, year = {2016}, date = {2016-01-01}, booktitle = {HAIS 11th International Conference on Hybrid Artificial Intelligence Systems}, series = {Lecture Note in Computer Science}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {conference} } |
R. Pérez-Chacón and R. Talavera-Llames and F. Martínez-Álvarez and A. Troncoso Finding Electric Energy Consumption Patterns in Big Time Series Data (Conference) DCAI 13th International Conference on Distributed Computing and Artificial Intelligence, Advances in Intelligent Systems and Computing 2016. (Links | BibTeX | Tags: big data, energy, time series) @conference{DCAI2016, title = {Finding Electric Energy Consumption Patterns in Big Time Series Data}, author = {R. Pérez-Chacón and R. Talavera-Llames and F. Martínez-Álvarez and A. Troncoso}, url = {https://link.springer.com/chapter/10.1007%2F978-3-319-40162-1_25}, year = {2016}, date = {2016-01-01}, booktitle = {DCAI 13th International Conference on Distributed Computing and Artificial Intelligence}, series = {Advances in Intelligent Systems and Computing}, keywords = {big data, energy, time series}, pubstate = {published}, tppubtype = {conference} } |