% Conference paper (ISI 2006 proceedings, published by Springer-Verlag).
% Proper nouns and acronyms are brace-protected so sentence-casing styles keep
% their capitals; author names use the unambiguous "Last, First" form.
@inproceedings{b126861e09e6473d8f98a5f17cb76af5,
  author    = {Wang, G. Alan and Chen, Hsinchun and Atabakhsh, Homa},
  title     = {A multi-layer Na{\"i}ve {Bayes} model for approximate identity matching},
  booktitle = {Intelligence and Security Informatics - {IEEE} International Conference on Intelligence and Security Informatics, {ISI} 2006, Proceedings},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer-Verlag},
  year      = {2006},
  pages     = {479--484},
  doi       = {10.1007/11760146_44},
  isbn      = {3540344780},
  language  = {English (US)},
  note      = {IEEE International Conference on Intelligence and Security Informatics, ISI 2006 ; Conference date: 23-05-2006 Through 24-05-2006},
  abstract  = {Identity management is critical to various governmental practices ranging from providing citizens services to enforcing homeland security. The task of searching for a specific identity is difficult because multiple identity representations may exist due to issues related to unintentional errors and intentional deception. We propose a Na{\"i}ve Bayes identity matching model that improves existing techniques in terms of effectiveness. Experiments show that our proposed model performs significantly better than the exact-match based technique and achieves higher precision than the record comparison technique. In addition, our model greatly reduces the efforts of manually labeling training instances by employing a semi-supervised learning approach. This training method outperforms both fully supervised and unsupervised learning. With a training dataset that only contains 30\% labeled instances, our model achieves a performance comparable to that of a fully supervised learning.},
}