Trim leading and trailing whitespace in string normalization
This commit is contained in:
parent
88087c8628
commit
bb78725a05
@ -114,6 +114,15 @@ class TestTexts(unittest.TestCase):
|
||||
tools.normalize_string("avec ascenseur")
|
||||
)
|
||||
|
||||
def test_whitespace_trim(self):
|
||||
"""
|
||||
Checks that leading and trailing whitespace is trimmed.
|
||||
"""
|
||||
self.assertEqual(
|
||||
"rennes 35000",
|
||||
tools.normalize_string(" Rennes 35000 ")
|
||||
)
|
||||
|
||||
def test_accents(self):
|
||||
"""
|
||||
Checks accents are replaced.
|
||||
|
@ -225,6 +225,9 @@ def normalize_string(string, lowercase=True, convert_arabic_numerals=True):
|
||||
# Collapse multiple spaces, replace tabulations and newlines by space
|
||||
string = re.sub(r"\s+", " ", string)
|
||||
|
||||
# Trim leading and trailing whitespace
|
||||
string = string.strip()
|
||||
|
||||
return string
|
||||
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user