Skip to content

Commit 7116c87

Browse files
committed
Handle words starting with Unicode characters
1 parent 0fb5e98 commit 7116c87

File tree

1 file changed

+7
-1
lines changed

1 file changed

+7
-1
lines changed

roundup/backends/indexer_dbm.py

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -189,7 +189,10 @@ def load_index(self, reload=0, wordlist=None):
189189
else:
190190
segments = ['-','#']
191191
for word in wordlist:
192-
segments.append(word[0].upper())
192+
initchar = word[0].upper()
193+
if initchar not in self.segments:
194+
initchar = '_'
195+
segments.append(initchar)
193196

194197
# Load the segments
195198
for segment in segments:
@@ -242,6 +245,9 @@ def save_index(self):
242245
segdicts[segment] = {}
243246
for word, entry in self.words.items(): # Split into segment dicts
244247
initchar = word[0].upper()
248+
if initchar not in letters:
249+
# any initial character not in `letters` (e.g. a non-ASCII/Unicode character) goes to the '_' segment
250+
initchar = '_'
245251
segdicts[initchar][word] = entry
246252

247253
# save

0 commit comments

Comments
 (0)