This dataset consists of 30 privacy policies of online platforms, annotated to assess how comprehensive the information they provide is. This work focuses on the categories of data being processed, classifying each clause as either fully informative or insufficiently informative.
If you use this repository, dataset, or code, please cite our work as:
@inproceedings{DBLP:conf/jurix/GrundlerVaguePrivacyPolicies,
  author    = {Giulia Grundler and
               Rūta Liepiņa and
               Mariaceleste Musicco and
               Francesca Lagioia and
               Andrea Galassi and
               Giovanni Sartor and
               Paolo Torroni},
  editor    = {Jaromir Savelka and
               Jakub Harasta and
               Tereza Novotna and
               Jakub Misek},
  title     = {Detecting Vague Clauses in Privacy Policies: the Analysis of Data Categories using {BERT} Models and {LLMs}},
  booktitle = {Legal Knowledge and Information Systems - {JURIX} 2024: The Thirty-seventh Annual Conference, Brno, Czech Republic, 11-13 December 2024},
  series    = {Frontiers in Artificial Intelligence and Applications},
  volume    = {395},
  pages     = {72--83},
  publisher = {{IOS} Press},
  year      = {2024},
  url       = {https://doi.org/10.3233/FAIA241235},
  doi       = {10.3233/FAIA241235}
}