filters.bitext_filter

Module Contents

Classes

API

class filters.bitext_filter.BitextFilter(
src_field: str = 'src',
tgt_field: str = 'tgt',
metadata_fields: list[str] | str | None = None,
metadata_field_name_mapping: dict[str, str] | None = None,
score_field: str | None = None,
score_type: type | str | None = None,
invert: bool = False,
)

Bases: abc.ABC

Initialization

abstractmethod keep_bitext(**kwargs) -> bool
abstractmethod score_bitext(
src: pandas.Series,
tgt: pandas.Series,
**kwargs,
) -> pandas.Series