% Journal article on machine-learning prediction of the Kp index (Space Weather, vol. 17, no. 10, 2019).
% The abstract field is kept verbatim as supplied by the source record.
@article{ZhelayskayaVasileShpritsetal.2019,
  author    = {Zhelayskaya, Irina S. and Vasile, Ruggero and Shprits, Yuri Y. and Stolle, Claudia and Matzka, J{\"u}rgen},
  title     = {Systematic Analysis of Machine Learning and Feature Selection Techniques for Prediction of the {Kp} Index},
  journal   = {Space Weather: The International Journal of Research and Applications},
  volume    = {17},
  number    = {10},
  pages     = {1461--1486},
  year      = {2019},
  publisher = {American Geophysical Union},
  address   = {Washington},
  issn      = {1542-7390},
  doi       = {10.1029/2019SW002271},
  language  = {en},
  abstract  = {The Kp index is a measure of the midlatitude global geomagnetic activity and represents short-term magnetic variations driven by solar wind plasma and interplanetary magnetic field. The Kp index is one of the most widely used indicators for space weather alerts and serves as input to various models, such as for the thermosphere and the radiation belts. It is therefore crucial to predict the Kp index accurately. Previous work in this area has mostly employed artificial neural networks to nowcast Kp, based their inferences on the recent history of Kp and on solar wind measurements at L1. In this study, we systematically test how different machine learning techniques perform on the task of nowcasting and forecasting Kp for prediction horizons of up to 12 hr. Additionally, we investigate different methods of machine learning and information theory for selecting the optimal inputs to a predictive model. We illustrate how these methods can be applied to select the most important inputs to a predictive model of Kp and to significantly reduce input dimensionality. We compare our best performing models based on a reduced set of optimal inputs with the existing models of Kp, using different test intervals, and show how this selection can affect model performance.},
}