% Conference paper published in the PAKDD 2018 proceedings (LNCS vol. 10939, Springer).
@inproceedings{71865ad34a944e89a3ddf6a0bc159c0f,
  author    = {Neerbek, Jan and Assent, Ira and Dolog, Peter},
  title     = {Detecting Complex Sensitive Information via Phrase Structure in Recursive Neural Networks},
  booktitle = {{PAKDD} 2018},
  series    = {Lecture Notes in Computer Science},
  volume    = {10939},
  pages     = {373--385},
  publisher = {Springer},
  address   = {Cham},
  year      = {2018},
  isbn      = {978-3-319-93039-8},
  doi       = {10.1007/978-3-319-93040-4_30},
  language  = {English},
  abstract  = {State-of-the-art sensitive information detection in unstructured data relies on the frequency of co-occurrence of keywords with sensitive seed words. In practice, however, this may fail to detect more complex patterns of sensitive information. In this work, we propose learning phrase structures that separate sensitive from non-sensitive documents in recursive neural networks. Our evaluation on real data with human labeled sensitive content shows that our new approach outperforms existing keyword based strategies.},
  note      = {Conference date: 03-06-2018 Through 06-06-2018},
}