modifiers.pii_modifier#

Module Contents#

Classes#

Data#

API#

modifiers.pii_modifier.DEFAULT_BATCH_SIZE = 2000

class modifiers.pii_modifier.PiiModifier(
language: str = DEFAULT_LANGUAGE,
supported_entities: list[str] | None = None,
anonymize_action: str = 'redact',
batch_size: int = DEFAULT_BATCH_SIZE,
device: str = 'gpu',
**kwargs,
)#

Bases: nemo_curator.modifiers.DocumentModifier

Initialization

load_deidentifier() -> nemo_curator.pii.algorithm.PiiDeidentifier
modify_document(
text: pandas.Series,
partition_info: dict | None = None,
) -> pandas.Series