Mercurial > p > roundup > code

--- a/roundup/backends/indexer_dbm.py	Tue Oct 29 22:13:49 2019 -0400
+++ b/roundup/backends/indexer_dbm.py	Wed Oct 30 17:48:48 2019 -0400
@@ -132,11 +132,11 @@
         """Split text/plain string into a list of words
         """
         # case insensitive
-        text = str(text).upper()
+        text = text.upper()

         # Split the raw text
         return re.findall(r'\b\w{%d,%d}\b' % (self.minlength, self.maxlength),
-                          text)
+                          text, re.UNICODE)

     # we override this to ignore too short and too long words
     # and also to fix a bug - the (fail) case.
author	John Rouillard <rouilj@ieee.org>
date	Wed, 30 Oct 2019 17:48:48 -0400
parents	e2baa4e6ed6d
children	8e4c5db44fde