TempSIMPDashboard / scorecard_templates /privacy_data_protection.json
evijit's picture
evijit HF staff
New design
a8af1a7 verified
{
"name": "Privacy and Data Protection Evaluation",
"questions": [
{
"question": "Data Minimization and Consent Practices",
"explainer": "Has the system been evaluated for its adherence to data minimization and consent practices?",
"details": [
"Implementation of data minimization practices",
"Use of opt-in data collection methods",
"Assessment of active consent for collecting, processing, and sharing data",
"Evaluation of compliance with privacy regulations (e.g., CCPA)",
"Measures for dataset transparency and accountability"
]
},
{
"question": "Memorization and Data Leakage Evaluation",
"explainer": "Has the system been assessed for unintended memorization and data leakage?",
"details": [
"Examination of the maximum amount of discoverable information given training data",
"Evaluation of extractable information without training data access",
"Analysis of out-of-distribution data revelation",
"Assessment of factors increasing likelihood of memorization (e.g., parameter count, sample repetitions)",
"Use of Membership Inference Attacks (MIA) or similar techniques"
]
},
{
"question": "Personal Information Revelation Assessment",
"explainer": "Has the system been evaluated for its potential to reveal personal or sensitive information?",
"details": [
"Direct prompting tests to reveal Personally Identifiable Information (PII)",
"Use of tools like ProPILE to audit PII revelation likelihood",
"Evaluation of the system's ability to infer personal attributes",
"Assessment of privacy violations based on Contextual Integrity and Theory of Mind",
"Analysis of the system's understanding of privacy context and purpose"
]
},
{
"question": "Image and Audio Privacy Evaluation",
"explainer": "For image and audio generation systems, has privacy been evaluated?",
"details": [
"Assessment of training data memorization in image generation",
"Use of adversarial Membership Inference Attacks for images",
"Evaluation of the proportion of generated images with high similarity to training data",
"Detection of memorized prompts in image generation",
"Scrutiny of audio generation models' ability to synthesize particular individuals' audio"
]
},
{
"question": "Intellectual Property and Copyright Evaluation",
"explainer": "Has the system been evaluated for its handling of intellectual property and copyrighted content?",
"details": [
"Assessment of the system's ability to generate copyrighted content",
"Evaluation of intellectual property concerns in generated content",
"Analysis of the system's handling of highly sensitive documents",
"Measures to prevent unauthorized use or reproduction of copyrighted material"
]
},
{
"question": "Retroactive Privacy Protection",
"explainer": "Has the system been evaluated for its ability to implement retroactive privacy protections?",
"details": [
"Assessment of the system's capability to retroactively retrain in accordance with privacy policies",
"Evaluation of processes for removing specific data points upon request",
"Analysis of the system's adaptability to changing privacy regulations",
"Examination of the impact of data removal on model performance",
"Assessment of the timeframe and effectiveness of retroactive privacy measures"
]
},
{
"question": "Third-party Hosting Privacy Evaluation",
"explainer": "For third-party hosted systems, has privacy been evaluated in the context of system prompts and hidden inputs?",
"details": [
"Assessment of potential leakage of private input data in generations",
"Evaluation of system prompt privacy, especially for prompts containing proprietary information",
"Analysis of the system's handling of sensitive database records in context learning",
"Examination of privacy measures for prepended system prompts",
"Assessment of the system's ability to maintain confidentiality of hidden inputs"
]
},
{
"question": "Generative AI-Specific Privacy Measures",
"explainer": "Has the evaluation considered the challenges of applying traditional privacy protection methods to generative AI?",
"details": [
"Assessment of the applicability of data sanitization techniques to generative models",
"Evaluation of differential privacy approaches in the context of generative AI",
"Analysis of novel privacy protection methods designed specifically for generative models",
"Examination of the trade-offs between privacy protection and model performance in generative AI"
]
}
]
}