diff roundup/backends/indexer_rdbms.py @ 4091:09e79cbeb827

Force sqlite3 on Python 2.6+ to treat our stored text as UTF-8
author Richard Jones <richard@users.sourceforge.net>
date Thu, 12 Mar 2009 04:29:16 +0000
parents eddb82d0964c
children 2ff6f39aa391
line wrap: on
line diff
--- a/roundup/backends/indexer_rdbms.py	Thu Mar 12 03:04:10 2009 +0000
+++ b/roundup/backends/indexer_rdbms.py	Thu Mar 12 04:29:16 2009 +0000
@@ -65,8 +65,8 @@
 
         # ok, find all the unique words in the text
         text = unicode(text, "utf-8", "replace").upper()
-        wordlist = [w.encode("utf-8", "replace")
-                for w in re.findall(r'(?u)\b\w{2,25}\b', text)]
+        wordlist = [w.encode("utf-8")
+            for w in re.findall(r'(?u)\b\w{2,25}\b', text)]
         words = set()
         for word in wordlist:
             if self.is_stopword(word): continue

Roundup Issue Tracker: http://roundup-tracker.org/