From 5184c96f06f9f97d6af9b3d994e9b227cbb8b76c Mon Sep 17 00:00:00 2001
From: Neil Smith
Date: Fri, 21 Oct 2016 13:33:30 +0100
Subject: [PATCH] Added more special characters for unaccent

---
 language_models.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/language_models.py b/language_models.py
index 5a35b38..8824bca 100644
--- a/language_models.py
+++ b/language_models.py
@@ -7,7 +7,7 @@ import itertools
 from math import log10
 import os
 
-unaccent_specials = ''.maketrans({"’": "'"})
+unaccent_specials = ''.maketrans({"’": "'", '“': '"', '”': '"'})
 
 def letters(text):
     """Remove all non-alphabetic characters from a text
-- 
2.34.1