Skip to content

sex_gender

sex_gender

Classes:

Name Description
Gender

Match gender values (non-binary, transgender, intersex, male, female, and the abbreviations m/f).

Sex

Match sex values (male or female, and the abbreviations m/f).

Gender()

Bases: RegexPredictor

Match gender values (non-binary, transgender, intersex, male, female, and the abbreviations m/f).

Source code in src/nemo_safe_synthesizer/pii_replacer/ner/regexes/sex_gender.py
def __init__(self):
    """Register the regex patterns used to recognise gender values.

    Every pattern is anchored at both ends and compiled case-insensitively,
    so it only matches when the whole value is one of the listed terms.
    All patterns ignore the raw score and are tied to ``GENDER_HEADERS``
    via ``header_contexts``; spelled-out terms carry ``Score.MAX`` as
    their context score while the one-letter abbreviations carry
    ``Score.HIGH``.
    """
    # (regex source, context score), listed in registration order.
    # NOTE(review): presumably the single letters get the lower score because
    # they are more ambiguous than full words -- confirm with Score semantics.
    pattern_specs = (
        (r"^non[-_ ]?binary$", Score.MAX),
        (r"^trans[-_ ]?(gender)?$", Score.MAX),
        (r"^inter[-_ ]?sex$", Score.MAX),
        (r"^male$", Score.MAX),
        (r"^female$", Score.MAX),
        (r"^m$", Score.HIGH),
        (r"^f$", Score.HIGH),
    )

    gender_patterns = [
        Pattern(
            pattern=re.compile(expression, flags=re.IGNORECASE),
            ignore_raw_score=True,
            context_score=score,
            header_contexts=GENDER_HEADERS,
        )
        for expression, score in pattern_specs
    ]

    super().__init__(
        name="gender",
        entity=Entity.GENDER,
        patterns=gender_patterns,
    )

Sex()

Bases: RegexPredictor

Match sex values (male or female, and the abbreviations m/f).

Source code in src/nemo_safe_synthesizer/pii_replacer/ner/regexes/sex_gender.py
def __init__(self):
    """Register the regex patterns used to recognise sex values.

    The full words ``male`` / ``female`` are registered with a raw score of
    ``Score.HIGH`` and no header contexts. The one-letter forms ``m`` /
    ``f`` ignore the raw score and are tied to ``SEX_HEADERS`` via
    ``header_contexts``. All regexes are anchored at both ends and
    case-insensitive.
    """
    # Spelled-out values: scored directly through raw_score.
    word_patterns = [
        Pattern(
            pattern=re.compile(expression, flags=re.IGNORECASE),
            raw_score=Score.HIGH,
        )
        for expression in (r"^male$", r"^female$")
    ]

    # Single-letter values: raw score ignored, header contexts supplied.
    # NOTE(review): presumably these only count under a sex-like column
    # header -- confirm against Pattern's handling of header_contexts.
    letter_patterns = [
        Pattern(
            pattern=re.compile(expression, flags=re.IGNORECASE),
            ignore_raw_score=True,
            header_contexts=SEX_HEADERS,
        )
        for expression in (r"^m$", r"^f$")
    ]

    # Registration order is unchanged: male, female, m, f.
    super().__init__(
        name="sex",
        entity=Entity.SEX,
        patterns=word_patterns + letter_patterns,
    )