X-Git-Url: https://git.korewanetadesu.com/?p=python-collate.git;a=blobdiff_plain;f=collate%2Fstrings.py;fp=collate%2Fstrings.py;h=60685c57a3415e763a63d05545340429113ec222;hp=8d6af993cd72d5f0fcb4fc04eb6e1953f72904c9;hb=ee7317abef6e6c235c6344f3f173af134e52cf8c;hpb=e8b221311bf60883d3f14083bab63fd947d34509 diff --git a/collate/strings.py b/collate/strings.py index 8d6af99..60685c5 100644 --- a/collate/strings.py +++ b/collate/strings.py @@ -14,7 +14,8 @@ CONTINUE_ON = frozenset([ UNKNOWN, LETTER, NUMBER = range(3) -BREAKER = u"\u2029" # Paragraph break character +BREAKER = u"\u2028" # Line break character +HBREAKER = u"\u2029" # Paragraph break character INFINITY = float('inf') KEEP_IN_NUMBERS = u"'.," @@ -81,6 +82,8 @@ def sortemes(string, key=lambda s: s): elif category[0] == "N": digits.append(uchar) if letters: + if unicodedata.category(letters[-1])[0] == "L": + letters.append(HBREAKER) aletters(u"".join(letters)) letters = [] previous = LETTER