% Conference paper: Sheng and Ling, "Roulette Sampling for Cost-Sensitive
% Learning", presented at ECML 2007 (pages 724--731 of the proceedings).
%
% Notes for maintainers:
%  - The citation key looks like an exporter-generated hash; it is kept
%    unchanged so that existing citations continue to resolve.
%  - booktitle spells out the proceedings name so the reference is not
%    mistaken for an article in the journal "Machine Learning".
%  - The acronym ECML is brace-protected against style-driven recasing.
%  - Given names are left unbraced so each part (given name, middle initial)
%    is a separate token for the style's name formatting.
%  - The LNCS volume number is not recorded here; add a volume field once it
%    has been confirmed against the publisher's record.
@inproceedings{541464a935104feea80fcedaef6bb56d,
  author    = {Sheng, Victor S. and Ling, Charles X.},
  title     = {Roulette Sampling for Cost-Sensitive Learning},
  booktitle = {Machine Learning: {ECML} 2007, 18th European Conference on Machine Learning},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer-Verlag},
  year      = {2007},
  pages     = {724--731},
  isbn      = {9783540749578},
  doi       = {10.1007/978-3-540-74958-5_73},
  language  = {English},
  keywords  = {Classification, Cost-sensitive learning, Data mining, Decision trees, Machine learning, Meta-learning},
  abstract  = {In this paper, we propose a new and general preprocessor algorithm, called CSRoulette, which converts any cost-insensitive classification algorithms into cost-sensitive ones. CSRoulette is based on cost proportional roulette sampling technique (called CPRS in short). CSRoulette is closely related to Costing, another cost-sensitive meta-learning algorithm, which is based on rejection sampling. Unlike rejection sampling which produces smaller samples, CPRS can generate different size samples. To further improve its performance, we apply ensemble (bagging) on CPRS; the resulting algorithm is called CSRoulette. Our experiments show that CSRoulette outperforms Costing and other meta-learning methods in most datasets tested. In addition, we investigate the effect of various sample sizes and conclude that reduced sample sizes (as in rejection sampling) cannot be compensated by increasing the number of bagging iterations.},
  note      = {Conference dates: 17--21 September 2007},
}