% Conference paper in the IWBIS 2018 proceedings; the record originates from a database export.
% Cleanup applied to the exported record:
%   - author: both names use the "Last, First" form; the initials are left unbraced so
%     that each initial is parsed as its own name token.
%   - series: removed, it was a verbatim duplicate of booktitle.
%   - note: removed, it only held export boilerplate. The copyright line now lives in
%     the non-standard "copyright" field, and the conference dates (12 to 13 May 2018,
%     given day-first in the export) are stored as an ISO range in "eventdate".
%     Classic styles ignore both fields.
%   - keywords: dropped the "(key words)" template artifact after "Spark".
%   - address: kept as exported; it holds a country, the publisher city is not
%     available from this record (TODO confirm before relying on it).
% The abstract is reproduced unchanged because it appears to quote the published text.
@inproceedings{d31569e3558243b6a024b3273ba9ce7b,
author = "Sanabila, H. R. and Jatmiko, Wisnu",
title = "Ensemble Learning on Large Scale Financial Imbalanced Data",
booktitle = "2018 International Workshop on Big Data and Information Security, {IWBIS} 2018",
pages = "93--98",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
address = "United States",
year = "2018",
month = sep,
day = "24",
doi = "10.1109/IWBIS.2018.8471702",
language = "English",
keywords = "Big data, Ensemble learning, Imbalanced data, Spark",
abstract = "This study focused on evaluating the performance of ensemble learning on handling imbalanced data. Imbalanced data is a special problem in classification task where the class distribution is not uniformed. Resampling (SMOTE and ENN) is employed to improve the classifier performance. Four metrics is applied for performance evaluation i.e., precision, recall, specificity, and F-1 score. Based on the experiments, Bagging has a superior performance compared to baseline classifiers (Na{\"i}ve Bayes and Log Regression) and other ensemble learnings (Boosting and Random Forest). In addition, the combination of SMOTE and ENN successfully increase the classification performance and avoiding biased to the majority class.",
copyright = "{\textcopyright} 2018 IEEE",
eventdate = "2018-05-12/2018-05-13",
}