PII Masking
Overview
Installation
pip install gllm-privacy-binary
poetry add gllm-privacy-binary
uv add gllm-privacy-binary
Running Your First Anonymization
1
import asyncio
from gllm_privacy.pii_detector import TextAnalyzer, TextAnonymizer
from gllm_privacy.pii_detector.constants import Entities
from gllm_privacy.pii_detector.anonymizer import Operation
async def main() -> None:
    """Anonymize a sample text containing PII, then restore the original values.

    Builds a ``TextAnalyzer`` and a ``TextAnonymizer`` wrapping it, runs the
    anonymizer over a sample sentence for the KTP, email address and phone
    number entities, and prints the result. It then feeds that output back
    through the same anonymizer with ``Operation.DEANONYMIZE`` and prints
    what comes back.
    """
    # 1. Initialize the Analyzer & Anonymizer
    text_analyzer = TextAnalyzer()
    text_anonymizer = TextAnonymizer(text_analyzer)

    # 2. Define input text containing mixed PII
    text = "Halo, nama saya Budi. Nomor KTP saya 3525011212941001. Hubungi budi@example.com atau +628123456789"

    # 3. Define target entities
    entities = [Entities.KTP, Entities.EMAIL_ADDRESS, Entities.PHONE_NUMBER]

    # 4. Run Anonymization
    print("--- Anonymizing ---")
    anonymized_text = await text_anonymizer.run(
        text=text,
        entities=entities,
        operation=Operation.ANONYMIZE,
    )
    print(anonymized_text)

    # 5. Run Deanonymization (Restore original values)
    # The same anonymizer instance is reused for the reverse operation.
    print("\n--- Deanonymizing ---")
    deanonymized_text = await text_anonymizer.run(
        text=anonymized_text,
        operation=Operation.DEANONYMIZE,
    )
    print(deanonymized_text)
if __name__ == "__main__":
    asyncio.run(main())
2
python privacy_quickstart.py
3
--- Anonymizing ---
Halo, nama saya Budi. Nomor KTP saya <ID_KTP_1>. Hubungi <EMAIL_ADDRESS_1> atau <PHONE_NUMBER_1>

--- Deanonymizing ---
Halo, nama saya Budi. Nomor KTP saya 3525011212941001. Hubungi budi@example.com atau +628123456789
Enhanced Anonymization with NER
1
2
3
4
Last updated
Was this helpful?