add unit_len()

2013-03-25 16:35:28 -07:00 · 2013-03-25 16:35:28 -07:00 · d4e3837c64
parent 656d3cb501
commit d4e3837c64
1 changed files with 57 additions and 39 deletions
--- a/boltons/strutils.py
+++ b/boltons/strutils.py
@ -9,7 +9,8 @@ from compat import unicode, bytes
 __all__ = ['camel2under', 'under2camel', 'StringBuffer',
-           'slugify', 'split_punct_ws', 'asciify']
+           'slugify', 'split_punct_ws', 'asciify', 'pluralize',
           'singularize', 'cardinalize']
 _punct_ws_str = string.punctuation + string.whitespace
@ -39,37 +40,6 @@ def under2camel(under_string):
    return ''.join(w.capitalize() or '_' for w in under_string.split('_'))
 class StringBuffer(object):
    """
    This is meant to be a better file-like string buffer.
    Faster than StringIO, better encoding handling than cStringIO.
    This one is for unicode text strings. Look for ByteBuffer if you
    want to handle byte strings.
    """
    def __init__(self, default_encoding=None, errors='strict'):
        self.data = collections.deque()
        self.default_encoding = default_encoding or 'utf-8'
        self.errors = errors
    def write(self, s):
        if not isinstance(s, unicode):
            enc = self.default_encoding
            errs = self.errors
            try:
                s = s.decode(enc, errs)
            except AttributeError:
                raise ValueError('write() expected a unicode or byte string')
        self.data.append(s)
    def truncate(self):
        self.data = collections.deque()
        self.write = self.data.append
    def getvalue(self):
        return unicode().join(self.data)
 def slugify(text, delim='_', lower=True, ascii=False):
    """
    A basic function that turns text full of scary characters
@ -105,16 +75,34 @@ def split_punct_ws(text):
    return [w for w in _punct_re.split(text) if w]
-def cardinalize(unit_noun, count):
+def unit_len(sized_iterable, unit_noun='item'):
-    """\
+    """
    Returns a plain-English description of an iterable's len(),
    conditionally pluralized with cardinalize() (below).
-    Conditionally pluralizes a singular word ``unit`` if ``count`` is
+    >>> print unit_len(range(10), 'number')
-    not one, preserving case when possible.
+    10 numbers
    >>> print unit_len('aeiou', 'vowel')
    5 vowels
    >>> print unit_len([], 'worry')
    No worries
    """
    count = len(sized_iterable)
    units = cardinalize(count, unit_noun)
    if count:
        return u'%s %s' % (count, units)
    return u'No %s' % (units,)
 def cardinalize(count, unit_noun):
    """\
    Conditionally pluralizes a singular word ``unit_noun`` if
    ``count`` is not one, preserving case when possible.
    >>> vowels = 'aeiou'
-    >>> print len(vowels), cardinalize('vowel', len(vowels))
+    >>> print len(vowels), cardinalize(len(vowels), 'vowel')
    5 vowels
-    >>> print 3, cardinalize('Wish', 3)
+    >>> print 3, cardinalize(3, 'Wish')
    3 Wishes
    """
    if count == 1:
@ -140,7 +128,6 @@ def singularize(word):
        singular = word[:-2]
    else:
        singular = word[:-1]
    # not singular enough?
    return _match_case(orig_word, singular)
@ -199,6 +186,37 @@ _IRR_S2P = {'alumnus': 'alumni', 'analysis': 'analyses', 'antenna': 'antennae',
 _IRR_P2S = dict([(v, k) for k, v in _IRR_S2P.items()])
 class StringBuffer(object):
    """
    This is meant to be a better file-like string buffer.
    Faster than StringIO, better encoding handling than cStringIO.
    This one is for unicode text strings. Look for ByteBuffer if you
    want to handle byte strings.
    """
    def __init__(self, default_encoding=None, errors='strict'):
        self.data = collections.deque()
        self.default_encoding = default_encoding or 'utf-8'
        self.errors = errors
    def write(self, s):
        if not isinstance(s, unicode):
            enc = self.default_encoding
            errs = self.errors
            try:
                s = s.decode(enc, errs)
            except AttributeError:
                raise ValueError('write() expected a unicode or byte string')
        self.data.append(s)
    def truncate(self):
        self.data = collections.deque()
        self.write = self.data.append
    def getvalue(self):
        return unicode().join(self.data)
 def asciify(text, ignore=False):
    """
    Converts a unicode or bytestring into a bytestring with