Collator.lstripwords: Strip words off the start and append to the end.

[python-collate.git] / collate / icu / __init__.py
diff --git a/collate/icu/__init__.py b/collate/icu/__init__.py

index 00a1538..6d27a6f 100644 (file)
--- a/collate/icu/__init__.py
+++ b/collate/icu/__init__.py
@@ -11,6 +11,8 @@ Avoid this backend if...
  
  """
  
+__all__ = ["Collator"]
+
  import collate._abcollator
  import collate._locale
  import collate.errors
@@ -21,6 +23,7 @@ class Collator(collate._abcollator.Collator):
      """ICU-based collation."""
  
      def __init__(self, locale, encoding=None):
+        super(Collator, self).__init__(locale, encoding)
          locale, encoding = collate._locale.getpair(locale, encoding)
          icu_locale = "root" if locale == "C" else locale
          self._collator = _icu.Collator(icu_locale)
@@ -37,9 +40,9 @@ class Collator(collate._abcollator.Collator):
              self._breaker = _icu.WordBreaker("root")
  
      def words(self, string):
-        if isinstance(string, str):
-            string = string.decode(self.encoding, 'replace')
-        return filter(lambda u: not u.isspace(), self._breaker.words(string))
+        """Split the string along word boundries."""
+        string = self.unicode(string)
+        return self._breaker.words(string)
  
      def key(self, string):
          """Sort key for a string.
@@ -48,18 +51,6 @@ class Collator(collate._abcollator.Collator):
          instance according to the 'encoding' attribute of the
          Collator.
          """
-        if isinstance(string, str):
-            string = string.decode(self.encoding, 'replace')
+        string = self.unicode(string)
          return self._collator.key(string)
  
-    def cmp(self, a, b):
-        """Return negative if a < b, zero if a == b, positive if a > b.
-
-        If strs rather than unicodes are passed in, they are first
-        decoded according to the 'encoding' attribute of the Collator.
-        """
-        if isinstance(a, str):
-            a = a.decode(self.encoding, 'replace')
-        if isinstance(b, str):
-            b = a.decode(self.encoding, 'replace')
-        return self._collator.cmp(a, b)