From 427f44c3d22604dd8224c1705d3cecde7ef410e6 Mon Sep 17 00:00:00 2001 From: loubnabnl Date: Tue, 28 Mar 2023 10:46:47 +0000 Subject: [PATCH] updates --- pii/ner/pii_redaction/run_pii_slurm.py | 5 ++--- pii/ner/pii_redaction/utils.py | 1 + 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/pii/ner/pii_redaction/run_pii_slurm.py b/pii/ner/pii_redaction/run_pii_slurm.py index 0427152..5aee4ab 100644 --- a/pii/ner/pii_redaction/run_pii_slurm.py +++ b/pii/ner/pii_redaction/run_pii_slurm.py @@ -193,14 +193,13 @@ def makejob(JOB_NAME="pii-redaction", LANG=None, TEXT_COLUMN="content"): "cmake", ] for i in range(args.start, args.end + 1): - #language = languages[i] - language="github-issues-filtered-structured" + language = languages[i] print(f"Submitting jobs for experiment on language {language}") job_name = f"{language}-pii-redaction-idx_{i}" job = makejob( JOB_NAME=job_name, LANG=language, - TEXT_COL=args.text_column, + TEXT_COLUMN=args.text_column, ) # submit the job print(f"Job for lang {language} ready and saved at jobs/{job_name}.sbatch") diff --git a/pii/ner/pii_redaction/utils.py b/pii/ner/pii_redaction/utils.py index 6ecdd27..bd4ed42 100644 --- a/pii/ner/pii_redaction/utils.py +++ b/pii/ner/pii_redaction/utils.py @@ -120,6 +120,7 @@ def redact_pii_text(text, secrets, replacements, add_references=False): step = 0 last_text = text for secret in secrets: + # some post-processing if secret["tag"] in IGNORE or not is_secret(secret["value"]): continue if secret["tag"] == "IP_ADDRESS":