@inproceedings{70fca85d9a5e4bb8842662c71b94343a,
title = "Phishing URL Detection Using URL Ranking",
abstract = "The openness of the Web exposes opportunities for criminals to upload malicious content. In fact, despite extensive research, email based spam filtering techniques are unable to protect other web services. Therefore, a counter measure must be taken that generalizes across web services to protect the user from phishing host URLs. This paper describes an approach that classifies URLs automatically based on their lexical and host-based features. Clustering is performed on the entire dataset and a cluster ID (or label) is derived for each URL, which in turn is used as a predictive feature by the classification system. Online URL reputation services are used in order to categorize URLs and the categories returned are used as a supplemental source of information that would enable the system to rank URLs. The classifier achieves 93-98% accuracy by detecting a large number of phishing hosts, while maintaining a modest false positive rate. URL clustering, URL classification, and URL categorization mechanisms work in conjunction to give URLs a rank.",
keywords = "Classification, Clustering, Feature Vector, URL Ranking, Web Categorization",
author = "Feroz, {Mohammed Nazim} and Susan Mengel",
note = "Publisher Copyright: {\textcopyright} 2015 IEEE.; 4th IEEE International Congress on Big Data, BigData Congress 2015 ; Conference date: 27-06-2015 Through 02-07-2015",
year = "2015",
month = aug,
day = "17",
doi = "10.1109/BigDataCongress.2015.97",
language = "English",
series = "Proceedings - 2015 IEEE International Congress on Big Data, BigData Congress 2015",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "635--638",
editor = "Latifur Khan and Carminati Barbara",
booktitle = "Proceedings - 2015 IEEE International Congress on Big Data, BigData Congress 2015",
}