diff --git a/tests/data/expected/dedupe-by-url.json.gz b/tests/data/expected/dedupe-by-url.json.gz index 50903087..295755dd 100644 Binary files a/tests/data/expected/dedupe-by-url.json.gz and b/tests/data/expected/dedupe-by-url.json.gz differ diff --git a/tests/data/expected/dedupe-paragraph-ngrams.json.gz b/tests/data/expected/dedupe-paragraph-ngrams.json.gz index beca9513..c22ba24c 100644 Binary files a/tests/data/expected/dedupe-paragraph-ngrams.json.gz and b/tests/data/expected/dedupe-paragraph-ngrams.json.gz differ diff --git a/tests/data/expected/dedupe-paragraphs.json.gz b/tests/data/expected/dedupe-paragraphs.json.gz index 182c84b4..ea7b6817 100644 Binary files a/tests/data/expected/dedupe-paragraphs.json.gz and b/tests/data/expected/dedupe-paragraphs.json.gz differ diff --git a/tests/data/expected/email-spans-jq.json.gz b/tests/data/expected/email-spans-jq.json.gz index 773e520d..cce52158 100644 Binary files a/tests/data/expected/email-spans-jq.json.gz and b/tests/data/expected/email-spans-jq.json.gz differ diff --git a/tests/data/expected/email-spans.json.gz b/tests/data/expected/email-spans.json.gz index 34a486cd..746bcb6d 100644 Binary files a/tests/data/expected/email-spans.json.gz and b/tests/data/expected/email-spans.json.gz differ diff --git a/tests/data/expected/mixer.json.gz b/tests/data/expected/mixer.json.gz index 3b1e643a..6996b9ac 100644 Binary files a/tests/data/expected/mixer.json.gz and b/tests/data/expected/mixer.json.gz differ diff --git a/tests/data/expected/remove-paragraphs.json.gz b/tests/data/expected/remove-paragraphs.json.gz index 617266d3..43c607d7 100644 Binary files a/tests/data/expected/remove-paragraphs.json.gz and b/tests/data/expected/remove-paragraphs.json.gz differ