DOI Publisher Details Copy BibTeX Download .bib
{"key"=>"Campanile2022377", "type"=>"Conference paper", "bibtex"=>"@article{Campanile2022377,\n author = {Campanile, Lelio and de Biase, Maria Stella and Marrone, Stefano and Marulli, Fiammetta and Raimondo, Mariapia and Verde, Laura},\n title = {Sensitive Information Detection Adopting Named Entity Recognition: A Proposed Methodology},\n year = {2022},\n journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},\n volume = {13380 LNCS},\n pages = {377 – 388},\n doi = {10.1007/978-3-031-10542-5_26}\n}\n", "author"=>"Campanile, Lelio and de Biase, Maria Stella and Marrone, Stefano and Marulli, Fiammetta and Raimondo, Mariapia and Verde, Laura", "author_array"=>[{"first"=>"Lelio", "last"=>"Campanile", "prefix"=>"", "suffix"=>""}, {"first"=>"Maria Stella", "last"=>"Biase", "prefix"=>"de", "suffix"=>""}, {"first"=>"Stefano", "last"=>"Marrone", "prefix"=>"", "suffix"=>""}, {"first"=>"Fiammetta", "last"=>"Marulli", "prefix"=>"", "suffix"=>""}, {"first"=>"Mariapia", "last"=>"Raimondo", "prefix"=>"", "suffix"=>""}, {"first"=>"Laura", "last"=>"Verde", "prefix"=>"", "suffix"=>""}], "author_0_first"=>"Lelio", "author_0_last"=>"Campanile", "author_0_prefix"=>"", "author_0_suffix"=>"", "author_1_first"=>"Maria Stella", "author_1_last"=>"Biase", "author_1_prefix"=>"de", "author_1_suffix"=>"", "author_2_first"=>"Stefano", "author_2_last"=>"Marrone", "author_2_prefix"=>"", "author_2_suffix"=>"", "author_3_first"=>"Fiammetta", "author_3_last"=>"Marulli", "author_3_prefix"=>"", "author_3_suffix"=>"", "author_4_first"=>"Mariapia", "author_4_last"=>"Raimondo", "author_4_prefix"=>"", "author_4_suffix"=>"", "author_5_first"=>"Laura", "author_5_last"=>"Verde", "author_5_prefix"=>"", "author_5_suffix"=>"", "title"=>"Sensitive Information Detection Adopting Named Entity Recognition: A Proposed Methodology", "year"=>"2022", "journal"=>"Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)", "volume"=>"13380 LNCS", "pages"=>"377 – 388", "doi"=>"10.1007/978-3-031-10542-5_26", "url"=>"https://www.scopus.com/inward/record.uri?eid=2-s2.0-85135889610&doi=10.1007%2f978-3-031-10542-5_26&partnerID=40&md5=3f22e351a3b3a961fed6a8cbe9a61cba", "abstract"=>"Protecting and safeguarding privacy has become increasingly important, especially in recent years. The increasing possibilities of acquiring and sharing personal information and data through digital devices and platforms, such as apps or social networks, have increased the risks of privacy breaches. In order to effectively respect and guarantee the privacy and protection of sensitive information, it is necessary to develop mechanisms capable of providing such guarantees automatically and reliably. In this paper we propose a methodology able to automatically recognize sensitive data. A Named Entity Recognition was used to identify appropriate entities. An improvement in the recognition of these entities is achieved by evaluating the words contained in an appropriate context window by assessing their similarity to words in a domain taxonomy. This, in fact, makes it possible to refine the labels of the recognized categories using a generic Named Entity Recognition. A preliminary evaluation of the reliability of the proposed approach was performed. In detail, texts of juridical documents written in Italian were analyzed. © 2022, The Author(s), under exclusive license to Springer Nature Switzerland AG.", "author_keywords"=>"Anonymization; Data privacy; Information extraction; Named entity recognition; Sensitive information", "keywords"=>"Natural language processing systems; Sensitive data; Anonymization; Context window; Domain taxonomy; Information detection; Information extraction; Named entity recognition; Personal information; Privacy breaches; Sensitive datas; Sensitive informations; Digital devices", "publication_stage"=>"Final", "source"=>"Scopus", "note"=>"Cited by: 4"}