@techreport{b5a4fb30d7a54a2ea952ae65888e317f,
title = "Forecasting Bilateral Refugee Flows with High-dimensional Data and Machine Learning Techniques",
abstract = "We develop monthly refugee flow forecasting models for 150 origin countries to the EU27, using machine learning and high-dimensional data, including digital trace data from Google Trends. Comparing different models and forecasting horizons and validating them out-of-sample, we find that an ensemble forecast combining Random Forest and Extreme Gradient Boosting algorithms consistently outperforms for forecast horizons between 3 to 12 months. For large refugee flow corridors, this holds in a parsimonious model exclusively based on Google Trends variables, which has the advantage of close-to-real-time availability. We provide practical recommendations about how our approach can enable ahead-of-period refugee forecasting applications.",
author = "A. Groeger and Conghan Zheng and {Boss .}, Konstantin and Tobias Heidland and Finja Krueger",
year = "2023",
month = mar,
language = "English",
series = "BSE Working Paper",
publisher = "BSE Working Papers",
number = "1387",
address = "Spain",
type = "WorkingPaper",
institution = "BSE Working Papers",
}