source: main/waeup.kofa/trunk/src/waeup/kofa/utils/helpers.py @ 8349

Last change on this file since 8349 was 8192, checked in by uli, 13 years ago

Let to_timezone ignore not-datetimes.

  • Property svn:keywords set to Id
File size: 18.1 KB
RevLine 
[7196]1## $Id: helpers.py 8192 2012-04-17 11:19:55Z uli $
2##
3## Copyright (C) 2011 Uli Fouquet & Henrik Bettermann
4## This program is free software; you can redistribute it and/or modify
5## it under the terms of the GNU General Public License as published by
6## the Free Software Foundation; either version 2 of the License, or
7## (at your option) any later version.
8##
9## This program is distributed in the hope that it will be useful,
10## but WITHOUT ANY WARRANTY; without even the implied warranty of
11## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12## GNU General Public License for more details.
13##
14## You should have received a copy of the GNU General Public License
15## along with this program; if not, write to the Free Software
16## Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17##
[7819]18"""General helper functions for Kofa.
[4188]19"""
[8185]20import datetime
[4188]21import os
[8185]22import pytz
[4375]23import re
[4188]24import shutil
[5731]25import grok
[5848]26from cStringIO import StringIO
27from docutils.core import publish_string
[7943]28from zope.component import getUtility
[5731]29from zope.component.interfaces import IFactory
[5734]30from zope.interface import implementedBy
[7941]31from zope.interface.interface import Method, Attribute
[6071]32from zope.schema import getFieldNames
33from zope.schema.fieldproperty import FieldProperty
[6372]34from zope.security.interfaces import NoInteraction
35from zope.security.management import getInteraction
[7175]36from zope.pluggableauth.interfaces import IAuthenticatorPlugin
[4188]37
[6503]38BUFSIZE = 8 * 1024
[6372]39
def remove_file_or_directory(filepath):
    """Remove a file, a symbolic link or a directory tree.

    Different to :func:`shutil.rmtree` we also accept not existing
    paths (returning silently) and if a dir turns out to be a regular
    file, we remove that.

    Symbolic links are removed themselves, their targets are left
    untouched. This includes dangling links and links pointing to
    directories.

    `filepath` may be a relative path; it is turned into an absolute
    one before anything is removed.
    """
    filepath = os.path.abspath(filepath)
    # `lexists` (unlike `exists`) is also true for dangling symlinks.
    if not os.path.lexists(filepath):
        return
    if os.path.isdir(filepath) and not os.path.islink(filepath):
        shutil.rmtree(filepath)
    else:
        # Regular files and any kind of symlink. `shutil.rmtree`
        # refuses to operate on symlinks, so links to directories
        # have to be unlinked as well.
        os.unlink(filepath)
    return
55
def copy_filesystem_tree(src, dst, overwrite=False, del_old=False):
    """Copy contents of directory src to directory dst.

    Both directories must exist. A :exc:`ValueError` is raised if one
    of the paths does not exist or is not a directory.

    If `overwrite` is true (any true value is accepted), any same
    named objects in `dst` will be removed and replaced. Otherwise
    these files will not be touched.

    If `del_old` is true, copied files and directories will be removed
    from the src directory.

    This function returns a list of names (relative to `src`) of
    non-copied files and directories.

    Unix hidden files and directories (starting with '.') are not
    processed by this function.
    """
    # Check existence of both paths first, then their type. This keeps
    # the order in which errors are reported.
    for label, path in (('source', src), ('destination', dst)):
        if not os.path.exists(path):
            raise ValueError('%s path does not exist: %s' % (label, path))
    for label, path in (('source', src), ('destination', dst)):
        if not os.path.isdir(path):
            raise ValueError(
                '%s path is not a directory: %s' % (label, path))
    not_copied = []
    for item in os.listdir(src):
        if item.startswith('.'):
            continue # We do not copy hidden stuff...
        itemsrc = os.path.join(src, item)
        itemdst = os.path.join(dst, item)

        if os.path.exists(itemdst):
            if not overwrite:
                not_copied.append(item)
                continue
            # Make room for the new copy.
            remove_file_or_directory(itemdst)

        if os.path.isdir(itemsrc):
            shutil.copytree(itemsrc, itemdst)
        else:
            shutil.copy2(itemsrc, itemdst)
        if del_old:
            remove_file_or_directory(itemsrc)
    return not_copied
[4375]101
102
def get_inner_HTML_part(html_code):
    """Return the 'inner' part of a complete HTML snippet.

    If there is a form part, get this (including the ``<form>`` tags).

    If there is no form part, try to return the body part contents
    (without the ``<body>`` tags).

    If there is no body, return as-is.

    Let's see how that works. If we deliver some doc with form, we
    will get that form only:

       >>> doc = '<html><form>My Form</form>Outside the form</html>'
       >>> get_inner_HTML_part(doc)
       '<form>My Form</form>'

    No form? Then seek for a body part and get the contents:

       >>> doc = '<html><body>My Body</body>Trailing Trash</html>'
       >>> get_inner_HTML_part(doc)
       'My Body'

    This also works if the document starts or ends with the
    respective tag:

       >>> get_inner_HTML_part('<body>My Body</body>')
       'My Body'

    If none of these is included, return what we got:

       >>> doc = '<html>without body nor form</html>'
       >>> get_inner_HTML_part(doc)
       '<html>without body nor form</html>'

    Tag names are matched case-sensitively (lowercase only).
    """
    # The greedy leading `.*` picks the last opening tag that is
    # followed by a closing tag; the match then extends to the last
    # closing tag. `re.DOTALL` lets `.` span line breaks.
    form = re.match(r'.*(<form[^>]*>.*</form>)', html_code, re.DOTALL)
    if form is not None:
        return form.group(1)
    # No <form> part included
    body = re.match(r'.*<body[^>]*>(.*)</body>', html_code, re.DOTALL)
    if body is not None:
        return body.group(1)
    # No <form> and no <body> tag...
    return html_code
147
class FactoryBase(grok.GlobalUtility):
    """A factory for things.

    This is a baseclass for easier creation of factories. Factories
    are utilities that are registered under a certain name and return
    instances of certain classes when called.

    In :mod:`waeup.kofa` we use factories extensively for
    batching. While processing a batch some processors look up a
    factory to create real-world instances that then get filled with
    data from imported CSV files.

    To get rid of reimplementing the same stuff over and over again,
    most notably the methods defined here, we offer this base class
    (which will *not* be registered as a factory itself).

    Real factories can then be created like this:

       >>> import grok
       >>> from waeup.kofa.utils.helpers import FactoryBase
       >>> class MyObject(object):
       ...   # Some class we want to get instances of.
       ...   pass
       >>> class MyObjectFactory(FactoryBase):
       ...   # This is the factory for MyObject instances
       ...   grok.name(u'waeup.kofa.factory.MyObject')
       ...   factory = MyObject

    That's it. It is essential to set the ``factory`` attribute, which
    will determine the class of which instances should be created when
    called. The given name must even be unique amongst all utilities
    registered during runtime. While you can pick any name you like
    you might want to prepend ``waeup.kofa.factory.`` to the name
    string to make sure it does not clash with names of other
    utilities one day.

    Before all this works we have to grok the baseclass once and our
    freshly defined factory. This executes all the component
    registration stuff we don't want to do ourselves. In daily use
    this is done automatically on startup of a :mod:`waeup.kofa`
    system.

       >>> grok.testing.grok('waeup.kofa.utils.helpers')
       >>> grok.testing.grok_component(
       ...    'MyObjectFactory', MyObjectFactory
       ...  )
       True

    After grokking we (and processors) can create objects without
    knowing about the location of the real class definition, just by
    the factory name:

       >>> from zope.component import createObject
       >>> obj = createObject('waeup.kofa.factory.MyObject')
       >>> isinstance(obj, MyObject)
       True

    We can also use the regular utility lookups to find our new
    factory:

       >>> from zope.component import getUtility
       >>> from zope.component.interfaces import IFactory
       >>> factory = getUtility(
       ...   IFactory, name='waeup.kofa.factory.MyObject'
       ...   )
       >>> isinstance(factory, MyObjectFactory)
       True

    And this factory generates `MyObject` instances:

       >>> obj = factory()
       >>> isinstance(obj, MyObject)
       True

    """
    grok.baseclass() # Do not grok this class, do not register us.
    grok.implements(IFactory)
    # You can override any of the following attributes in derived
    # classes. The `grok.name` setting *must* even be set to some
    # unique value.
    grok.name(u'waeup.Factory')
    # No trailing comma here: it would turn the title into a 1-tuple
    # instead of a unicode string.
    title = u"Create instances of ``factory``."
    description = u"This factory instantiates new applicant instances."
    # The class (or other callable) to create instances from. Derived
    # classes have to set this.
    factory = None

    def __call__(self, *args, **kw):
        """The main factory function.

        Returns an instance of the requested object.

        Positional and keyword arguments are accepted but not passed
        on; ``factory`` is always called without arguments.
        """
        return self.factory()

    def getInterfaces(self):
        """Return the interfaces implemented by ``factory`` instances.
        """
        # Required by IFactory
        return implementedBy(self.factory)
[5848]243
def ReST2HTML_w_warnings(source_string):
    """Render reStructuredText to HTML and collect docutils warnings.

    Returns a tuple ``(<HTML_CODE>, <WARNINGS>)``. ``<HTML_CODE>`` is
    the (unicode) HTML code generated from the source string with
    surrounding whitespace stripped, ``<WARNINGS>`` is a string
    containing any warning messages or ``None`` if there were none.

    Regular multi-line ReStructuredText strings will be returned as
    HTML code:

        >>> from waeup.kofa.utils.helpers import ReST2HTML_w_warnings
        >>> source = '''
        ... Headline
        ... ========
        ...
        ... - A list item
        ... - Another item
        ...
        ... Thanks for watching!
        ... '''
        >>> html, warnings = ReST2HTML_w_warnings(source)
        >>> print html
        <div class="document" id="headline">
        <h1 class="title">Headline</h1>
        <BLANKLINE>
        <ul class="simple">
        <li>A list item</li>
        <li>Another item</li>
        </ul>
        <p>Thanks for watching!</p>
        </div>

    Here no warnings happened, so the `warnings` are ``None``:

        >>> warnings is None
        True

    If warnings happen then they can be retrieved in the returned
    ``warnings``. We try to render an erroneous document:

        >>> source = '''
        ... Headline
        ... ======
        ...
        ... Thanks for watching!
        ... '''
        >>> html, warnings = ReST2HTML_w_warnings(source)
        >>> print html
        <div class="document" id="headline">
        <h1 class="title">Headline</h1>
        <BLANKLINE>
        <p>Thanks for watching!</p>
        </div>

        >>> print warnings
        <string>:3: (WARNING/2) Title underline too short.
        <BLANKLINE>
        Headline
        ======
        <BLANKLINE>

    As you can see, the warnings are not displayed inline the document
    but can be retrieved from the returned warnings, which is a string
    or ``None``.
    """
    warning_stream = StringIO()
    # First pass: report everything into our own stream.
    html_doc = publish_string(
        source_string, writer_name='html4css1',
        settings_overrides=dict(
            report_level=0, warning_stream=warning_stream))
    warning_stream.seek(0)
    messages = warning_stream.read()
    if messages:
        # Second pass: render again with report and halt levels raised
        # to 10000, so the messages do not show up inline.
        html_doc = publish_string(
            source_string, writer_name='html4css1',
            settings_overrides=dict(
                report_level=10000, halt_level=10000,
                warning_stream=warning_stream))
    else:
        messages = None
    html = get_inner_HTML_part(html_doc).strip()
    if isinstance(html, unicode):
        return html, messages
    return html.decode('utf-8'), messages
[5848]334
def ReST2HTML(source_string):
    """Turn a ReStructuredText string into HTML.

    This is :func:`ReST2HTML_w_warnings` with the warnings part of
    the result dropped. Use that function directly if you are
    interested in warnings about too short headings, etc.

    The returned string will be unicode.

    A regular document will be rendered like this:

        >>> source = '''
        ... Headline
        ... ========
        ...
        ... Thanks for watching!
        ... '''
        >>> html = ReST2HTML(source)
        >>> print html
        <div class="document" id="headline">
        <h1 class="title">Headline</h1>
        <BLANKLINE>
        <p>Thanks for watching!</p>
        </div>

    A document with markup problems (here: the underline is too short)
    will look similar:

        >>> source = '''
        ... Headline
        ... ======
        ...
        ... Thanks for watching!
        ... '''
        >>> html = ReST2HTML(source)
        >>> print html
        <div class="document" id="headline">
        <h1 class="title">Headline</h1>
        <BLANKLINE>
        <p>Thanks for watching!</p>
        </div>

    """
    # First item is the HTML code, second one the warnings.
    return ReST2HTML_w_warnings(source_string)[0]
[6071]380
def attrs_to_fields(cls):
    """Install a FieldProperty on `cls` for each schema field.

    Only the first interface yielded by ``implementedBy(cls)`` is
    examined. For every field name of that interface a
    :class:`FieldProperty` is set as class attribute of same name.

    Returns `cls`, so with Python >= 2.6 this function can also be
    used as a class decorator.
    """
    interfaces = list(implementedBy(cls))
    schema = interfaces[0]
    for name in getFieldNames(schema):
        field = schema[name]
        setattr(cls, name, FieldProperty(field))
    return cls
[6372]390
def get_current_principal():
    """Return the principal of the current interaction, if any.

    The principal is taken from the first participation of the
    current security interaction, so no request is needed. Examining
    a request is nevertheless the regular (and recommended) way to
    find the principal involved; use this function only if you really
    have no access to the current request.

    Returns ``None`` if there is no interaction or if the interaction
    has no participations (for instance during tests).
    """
    try:
        participations = getInteraction().participations
        return participations[0].principal
    except (NoInteraction, IndexError):
        # No interaction at all or no participations present.
        return None
[6503]411
def cmp_files(file_descr1, file_descr2):
    """Tell whether two file(-like) objects have equal contents.

    Both objects are rewound to their start and then read in chunks
    of `BUFSIZE`.

    Returns ``True`` if both are equal, ``False`` otherwise.
    """
    for stream in (file_descr1, file_descr2):
        stream.seek(0)
    chunk1 = file_descr1.read(BUFSIZE)
    chunk2 = file_descr2.read(BUFSIZE)
    while chunk1 == chunk2:
        if not chunk1:
            # Both streams are exhausted and no difference was found.
            return True
        chunk1 = file_descr1.read(BUFSIZE)
        chunk2 = file_descr2.read(BUFSIZE)
    return False
[7078]426
def string_from_bytes(number):
    """Turn a number of bytes into some textual representation.

    Values below 1024 are given in bytes, values below 1024**2 in
    (whole) KB. Anything bigger is given in MB or GB with two decimal
    places. Integers and floats are both accepted.

      Examples:

        >>> string_from_bytes(1)
        u'1 byte(s)'

        >>> string_from_bytes(1025)
        u'1 KB'

        >>> string_from_bytes(1.5 * 1024*1024)
        u'1.50 MB'

        >>> string_from_bytes(1536 * 1024)
        u'1.50 MB'

        >>> string_from_bytes(673.286 * 1024**3)
        u'673.29 GB'

    """
    if number < 1024:
        return u'%s byte(s)' % (str(number),)
    elif number < 1024**2:
        # Explicit floor division: KB are displayed as whole numbers,
        # regardless of the division semantics of the interpreter.
        return u'%d KB' % (number // 1024,)
    elif number < 1024**3:
        # Divide by a float, so integer input keeps its fraction.
        return u'%.2f MB' % (number / 1024.0**2,)
    return u'%.2f GB' % (number / 1024.0**3,)
[7079]452
def file_size(file_like_obj):
    """Determine file size in most effective manner.

    Returns the number of bytes in a file. This function works for
    both, real files as well as file-like objects like cStringIO based
    'files'.

    Example:

      >>> from cStringIO import StringIO
      >>> file_size(StringIO('my file content'))
      15

    If the object provides a usable file descriptor, the size is
    looked up via :func:`os.fstat` and the file pointer is left
    alone. Otherwise the object is sought to its end and the position
    reached is returned, so when finished the file pointer might be
    at end of file.
    """
    try:
        descriptor = file_like_obj.fileno()
    except (AttributeError, EnvironmentError, ValueError):
        # Either there is no `fileno` at all or it is not usable:
        # in-memory streams of the `io` module, for instance, provide
        # the method but raise an error when it is called.
        descriptor = None
    if descriptor is not None:
        return os.fstat(descriptor).st_size
    file_like_obj.seek(0, 2) # seek to last position in file
    return file_like_obj.tell()
[7175]474
def get_user_account(request):
    """Return the local user account of the request's principal.

    The account is looked up by principal id in the authenticator
    plugin registered under the name ``users``.
    """
    principal_id = request.principal.id
    users = getUtility(IAuthenticatorPlugin, name='users')
    return users.getAccount(principal_id)
[7941]482
def iface_names(iface, omit=[], exclude_attribs=True, exclude_methods=True):
    """Collect attribute names of an interface and its bases.

    The names of `iface` itself and of the interfaces returned by
    ``iface.getBases()`` are collected.

    Names of pure attributes (i.e. zope.interface.Attribute) and of
    methods are left out by default; set `exclude_attribs` or
    `exclude_methods` to ``False`` to get them as well.

    Names of typical fields derived from zope.schema are included.

    The `omit` parameter can give a list of names to exclude.

    Returns an unsorted list of strings.
    """
    sources = [iface]
    sources.extend(iface.getBases())
    candidates = []
    for source in sources:
        candidates.extend(source.names())
    selected = []
    for name in candidates:
        if name in omit:
            continue
        kind = iface.get(name).__class__
        # Exact class checks: only plain `Attribute` and `Method`
        # definitions are filtered out, not classes derived from them.
        is_unwanted = (
            (exclude_attribs and kind is Attribute) or
            (exclude_methods and kind is Method))
        if not is_unwanted:
            selected.append(name)
    return selected
[7968]512
def get_sorted_preferred(tuples_iterable, preferred_list):
    """Get a list of tuples (<TITLE>,<TOKEN>) with values in
    `preferred_list` put in front.

    The rest of the tuples iterable is returned in original order. This
    is useful for putting default entries on top of (already sorted)
    lists of choice values, for instance when sorting countries and
    their code.

    Sample:

    We have a list of tuples with uppercase 'titles' and lowercase
    'tokens'. This list is already sorted but we want certain values
    of this list to show up before other values. For instance we want
    to see the 'C' entry to come first.

      >>> get_sorted_preferred([('A','a'), ('B','b'), ('C','c')],
      ...                       ['c'])
      (('C', 'c'), ('A', 'a'), ('B', 'b'))

    i.e. the entry with 'c' as second value moved to head of result.

    We can also require multiple entries at head of list:

      >>> get_sorted_preferred([('A','a'), ('B','b'), ('C','c')],
      ...                       ['b', 'c'])
      (('B', 'b'), ('C', 'c'), ('A', 'a'))

    We required the 'b' entry to come before the 'c' entry and then
    the rest of the input list. That's what we got.

    Preferred values that do not occur in the input are ignored:

      >>> get_sorted_preferred([('A','a'), ('B','b')], ['z', 'b'])
      (('B', 'b'), ('A', 'a'))

    If several tuples carry the same preferred token, only the last
    one of them is kept.

    The result is returned as a tuple of tuples to keep order of values.
    """
    preferred = list(preferred_list)
    # One slot per preferred token; slots of tokens that never show up
    # stay `None` and are dropped at the end.
    head = [None] * len(preferred)
    tail = []
    for title, code in tuples_iterable:
        if code in preferred:
            head[preferred.index(code)] = (title, code)
        else:
            tail.append((title, code))
    return tuple([item for item in head if item is not None] + tail)
[8185]554
def now(tz=None):
    """Return the current datetime, shifted into timezone `tz`.

    The current UTC time is taken and handed to :func:`to_timezone`.

    If `tz`, a `tzinfo` instance, is None, UTC time is returned.

    `tz` should be a timezone as defined in pytz.
    """
    utc_now = datetime.datetime.utcnow()
    return to_timezone(utc_now, tz=tz)
563
def to_timezone(dt, tz=None):
    """Return datetime `dt` shifted into timezone `tz`.

    A 'naive' `dt` (one without `tzinfo`) is taken as UTC.

    Without `tz` the value is shifted to UTC.

    Values that are no `datetime.datetime` instances are handed back
    unchanged.
    """
    if not isinstance(dt, datetime.datetime):
        return dt
    target = pytz.utc if tz is None else tz
    aware = pytz.utc.localize(dt) if dt.tzinfo is None else dt
    # Normalize in the source timezone, convert, then normalize in the
    # target timezone.
    shifted = aware.tzinfo.normalize(aware).astimezone(target)
    return target.normalize(shifted)
Note: See TracBrowser for help on using the repository browser.