/usr/share/pyshared/mvpa2/base/dochelpers.py is in python-mvpa2 2.2.0-4ubuntu2.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 
528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 | # emacs: -*- mode: python; py-indent-offset: 4; indent-tabs-mode: nil -*-
# vi: set ft=python sts=4 ts=4 sw=4 et:
### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ##
#
# See COPYING file distributed along with the PyMVPA package for the
# copyright and license terms.
#
### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ### ##
"""Various helpers to improve docstrings and textual output"""
__docformat__ = 'restructuredtext'
import re, textwrap
# for table2string
import numpy as np
from math import ceil
from StringIO import StringIO
from mvpa2 import cfg
from mvpa2.base.externals import versions, exists
if __debug__:
from mvpa2.base import debug
# Figure out whether we are running inside IPython: ReST markup is produced
# only outside of it, and for old IPython releases the constructor
# documentation gets appended to the class documentation.
__in_ipython = exists('running ipython env')
if not __in_ipython:
    __add_init2doc = False
    __rst_mode = True
else:
    # either to do ReST links at all
    __rst_mode = False
    # if ran within (old) IPython -- might need to add doc to init
    if versions['ipython'] <= '0.8.1':
        __add_init2doc = True
    else:
        __add_init2doc = False
#
# Predefine some sugarings depending on syntax convention to be used
#
# XXX Might need to be removed or become proper cfg parameter
__rst_conventions = 'numpy'

# Refuse right away a convention we do not know how to render
if __rst_conventions not in ('epydoc', 'numpy'):
    raise ValueError("Unknown convention %s for RST" % __rst_conventions)

if __rst_conventions == 'numpy':
    _rst_sep = ""
    _rst_indentstr = ""

    def _rst_section(section_name):
        """Return `section_name` underlined with dashes (numpy convention)"""
        underline = '-' * len(section_name)
        return "%s\n%s" % (section_name, underline)
else:
    # epydoc convention
    _rst_sep = "`"
    _rst_indentstr = " "

    def _rst_section(section_name):
        """Return `section_name` wrapped in colons (epydoc convention)"""
        return ":%s:" % section_name
def _rst(s, snotrst=''):
    """Return `s` if ReST mode is active, `snotrst` otherwise"""
    if not __rst_mode:
        return snotrst
    return s
def _rst_underline(text, markup):
    """Return `text` with a second line of `markup` repeated len(text) times
    """
    underline = markup * len(text)
    return '\n'.join((text, underline))
def single_or_plural(single, plural, n):
    """Pick the `single` or the `plural` form of a word for the count `n`.

    `n` is converted with ``int()`` first.  Zero and everything above one
    select `plural` (1 forest, 2 forests, 0 forests); any other count
    selects `single`.
    """
    count = int(n)
    if count != 0 and count <= 1:
        return single
    return plural
def handle_docstring(text, polite=True):
    """Normalize a docstring: empty string for a missing one, dedented text
    otherwise.

    Parameters
    ----------
    text : str or None
      Docstring to process.
    polite : bool
      Currently without effect -- an empty string is returned for a missing
      docstring either way.

    Returns
    -------
    str
    """
    if text is None or len(text) == 0:
        # No documentation found -- same (empty) answer polite or not
        return ''
    if text.startswith(' '):
        return textwrap.dedent(text)
    # The first line often carries no offset, hence it must be kept out of
    # the dedent call and only the remainder gets dedented
    first_line, _, remainder = text.partition('\n')
    return first_line + "\n" + textwrap.dedent(remainder)
def _indent(text, istr=_rst_indentstr):
    """Prefix every line of `text` with `istr`
    """
    indented = [istr + line for line in text.split('\n')]
    return '\n'.join(indented)
# regexp to match :Parameter: and :Parameters: stand alone in a line
# or
#
#   Parameters
#   ----------
#
# in multiple lines.  The heading may follow a newline or sit at the very
# beginning of the string: inside of a character set "^" is a literal caret,
# not an anchor, thus "\A" is used to cover the start-of-string case.
# NOTE(review): the leading "(:?" of the underline group looks like it was
# meant to be "(?:"; left as is since only the span of the whole match is
# used by the code visible here.
__parameters_str_re = re.compile(
    r"(?:\A|\n)\s*:?Parameters?:?\s*\n(:?\s*-+\s*\n)?")
def _split_out_parameters(initdoc):
    """Split documentation into (header, parameters, suffix)

    Parameters
    ----------
    initdoc : string
      The documentation string

    Returns
    -------
    tuple of 3 strings
      Text preceding the parameters heading, the body of the parameters
      section (up to the first empty line) and whatever follows it.  If no
      parameters heading is found, `initdoc` is returned untouched as the
      header and the other two are empty.
    """
    # TODO: bind it to the only word in the line
    heading = __parameters_str_re.search(initdoc)
    if heading is None:
        return initdoc, "", ""

    header_end = heading.start()        # where parameters heading begins
    body_start = heading.end()          # where parameters body begins
    # parameters section lasts until the first empty line (or the very end)
    body_end = initdoc.find('\n\n', body_start)
    if body_end < 0:
        body_end = len(initdoc)

    # XXX a bit of duplication of effort since handle_docstring might
    # do splitting internally
    header = handle_docstring(initdoc[:header_end].rstrip('\n '),
                              polite=False)
    params = textwrap.dedent(initdoc[body_start:body_end])
    suffix = textwrap.dedent(initdoc[body_end:])
    return header.strip('\n'), params.strip('\n'), suffix.strip('\n')
# Trailing run of lines each of which starts with a non-whitespace character.
# NOTE(review): not referenced anywhere in the visible part of this file.
__re_params = re.compile('(?:\n\S.*?)+$')
# Boundary between entries: start of the string or a newline, in either case
# immediately followed by a non-whitespace character
__re_spliter1 = re.compile('(?:\n|\A)(?=\S)')
# A newline or a colon -- used to cut the leading name off an entry
__re_spliter2 = re.compile('[\n:]')
def _parse_parameters(paramdoc):
    """Parse parameters and return list of (name, full_doc_string)

    Having the names allows to remove multiple entries for the same
    parameter, like it could happen when parameters of the parent class get
    added.

    `paramdoc` is assumed to be unwrapped already, i.e. every entry starts
    at the beginning of a line, as it is after `_split_out_parameters`.
    """
    result = []
    for entry in __re_spliter1.split(paramdoc):
        if entry == '':
            continue
        # name is whatever precedes the first newline or colon
        name = __re_spliter2.split(entry)[0].strip()
        result.append((name, entry))
    if __debug__:
        debug('DOCH', 'parseParameters: Given "%s", we split into %s' %
              (paramdoc, result))
    return result
def get_docstring_split(f):
    """Given a function, break its docstring up into portions

    Parameters
    ----------
    f : function

    Returns
    -------
    (initial doc string, params (as list of tuples), suffix string)
      All three are None if `f` has no (or an empty) docstring.
    """
    if hasattr(f, '__doc__'):
        doc = f.__doc__
    else:
        doc = None
    if doc in (None, ""):
        return None, None, None
    initdoc, params, suffix = _split_out_parameters(doc)
    return initdoc, _parse_parameters(params), suffix
def enhanced_doc_string(item, *args, **kwargs):
    """Generate enhanced doc strings for various items.

    The docstring of ``__init__`` (if present among the locals) is rebuilt
    and assigned back to it: its parameters get complemented with
    ``_paramsdoc`` entries and, optionally, with the parameters documented
    in ``__init__`` of the given base classes.  The returned string is the
    class docstring, optionally extended with the constructor documentation
    and the list of conditional attributes (``_cadoc``).

    It is to be used from a collector, ie whenever class is already created

    Parameters
    ----------
    item : str or class
      What object requires enhancing of documentation
    *args : list
      Includes base classes to look for parameters, as well, first item
      must be a dictionary of locals if item is given by a string
    force_extend : bool
      Either to force looking for the documentation in the parents.
      By default force_extend = False, and lookup happens only if kwargs
      is one of the arguments to the respective function (e.g. item.__init__)
    skip_params : list of str
      List of parameters (in addition to [kwargs]) which should not
      be added to the documentation of the class.  The given list is not
      modified.

    Returns
    -------
    str
      Generated documentation, or the original ``__doc__`` if the
      ('doc', 'pimp docstrings') configuration setting is disabled.

    Raises
    ------
    ValueError
      If an unknown keyword argument is given, if `item` is a string but no
      dictionary of locals was provided, or if `item` is of an unsupported
      kind.
    NotImplementedError
      If `item` is a method.
    """
    # Handling of arguments
    unknown_kwargs = set(kwargs).difference(['force_extend', 'skip_params'])
    if unknown_kwargs:
        raise ValueError("Got unknown keyword arguments (smth among %s)"
                         " in enhanced_doc_string." % (kwargs,))
    force_extend = kwargs.get('force_extend', False)
    # work on a copy -- the list is extended below and must not leak back
    # into the caller
    skip_params = list(kwargs.get('skip_params', []))

    # XXX make it work also not only with classes but with methods as well
    if isinstance(item, basestring):
        if len(args) < 1 or not isinstance(args[0], dict):
            raise ValueError(
                "Please provide locals for enhanced_doc_string of %s" % item)
        name = item
        lcl = args[0]
        args = args[1:]
    elif hasattr(item, "im_class"):
        # bound method
        raise NotImplementedError(
            "enhanced_doc_string is not yet implemented for methods")
    elif hasattr(item, "__name__"):
        name = item.__name__
        lcl = item.__dict__
    else:
        raise ValueError("Don't know how to extend docstring for %s" % item)

    # check whether docstring magic is requested or not
    if not cfg.getboolean('doc', 'pimp docstrings', True):
        return lcl['__doc__']

    if __debug__:
        debug('DOCH', 'Processing docstrings of %s' % name)

    rst_lvlmarkup = ["=", "-", "_"]

    # would then be called for any child... ok - ad hoc for SVM???
    if hasattr(item, '_customize_doc') and name == 'SVM':
        item._customize_doc()

    initdoc = ""
    if '__init__' in lcl:
        func = lcl['__init__']
        initdoc = func.__doc__

        skip_params += lcl.get('__init__doc__exclude__', [])

        # either to extend arguments
        # do only if kwargs is one of the arguments
        # in python 2.5 args are no longer in co_names but in varnames
        extend_args = force_extend or \
                      'kwargs' in (func.func_code.co_names +
                                   func.func_code.co_varnames)

        if __debug__ and not extend_args:
            debug('DOCH',
                  'Not extending parameters for __init__ of %s',
                  (name,))

        if initdoc is None:
            initdoc = "Initialize instance of %s" % name

        initdoc, params, suffix = _split_out_parameters(initdoc)
        params_list = _parse_parameters(params)

        known_params = set([p[0] for p in params_list])

        # If there are additional ones:
        if '_paramsdoc' in lcl:
            params_list += [p for p in lcl['_paramsdoc']
                            if p[0] not in known_params]
            known_params = set([p[0] for p in params_list])

        # no need for placeholders
        skip_params = set(skip_params + ['kwargs', '**kwargs'])

        # XXX we do evil check here, refactor code to separate
        #     regressions out of the classifiers, and making
        #     retrainable flag not available for those classes which
        #     can't actually do retraining. Although it is not
        #     actually that obvious for Meta Classifiers
        if hasattr(item, '__tags__'):
            clf_internals = item.__tags__
            skip_params.update([p for p in ('retrainable',)
                                if p not in clf_internals])

        known_params.update(skip_params)
        if extend_args:
            # go through all the parents and obtain their init parameters
            parent_params_list = []
            for parent in args:
                if hasattr(parent, '__init__'):
                    # XXX just assign within a class to don't redo without need
                    parent_initdoc = parent.__init__.__doc__
                    if parent_initdoc is None:
                        continue
                    parent_params = _split_out_parameters(parent_initdoc)[1]
                    parent_params_list += \
                        _parse_parameters(parent_params.lstrip())

            # extend with ones which are not known to current init
            for pname, pdoc in parent_params_list:
                if pname not in known_params:
                    params_list += [(pname, pdoc)]
                    known_params.update([pname])

        # if there are parameters -- populate the list
        if len(params_list):
            params_ = '\n'.join([p[1].rstrip() for p in params_list
                                 if p[0] not in skip_params])
            initdoc += "\n\n%s\n" \
                       % _rst_section('Parameters') + _indent(params_)

        if suffix != "":
            initdoc += "\n\n" + suffix

        initdoc = handle_docstring(initdoc)

        # Finally assign generated doc to the constructor
        func.__doc__ = initdoc

    docs = [handle_docstring(lcl['__doc__'])]

    # Optionally populate the class documentation with it
    if __add_init2doc and initdoc != "":
        docs += [_rst_underline('Constructor information for `%s` class'
                                % name, rst_lvlmarkup[2]),
                 initdoc]

    # Add information about the ca if available
    if '_cadoc' in lcl and len(item._cadoc):
        # to don't conflict with Notes section if such was already
        # present
        lcldoc = lcl['__doc__'] or ''
        if 'Notes' not in lcldoc:
            section_name = _rst_section('Notes')
        else:
            section_name = '\n'         # just an additional newline
        # no indent is necessary since ca list must be already indented
        docs += ['%s\nAvailable conditional attributes:' % section_name,
                 handle_docstring(item._cadoc)]

    # Deprecated -- but actually we might like to have it in ipython
    # mode may be?
    if False: #len(args):
        bc_intro = _rst(' ') + 'Please refer to the documentation of the ' \
                   'base %s for more information:' \
                   % (single_or_plural('class', 'classes', len(args)))

        docs += ['\n' + _rst_section('See Also'),
                 bc_intro,
                 ' ' + ',\n '.join(['%s%s.%s%s%s' % (_rst(':class:`~'),
                                                      i.__module__,
                                                      i.__name__,
                                                      _rst('`'),
                                                      _rst_sep)
                                    for i in args])
                ]

    itemdoc = '\n\n'.join(docs)
    # remove some bogus new lines -- never 3 empty lines in doc are useful
    result = re.sub(r"\s*\n\s*\n\s*\n", "\n\n", itemdoc)

    return result
def table2string(table, out=None):
    """Given list of lists figure out their common widths and print to out

    Every cell is converted with ``str()``.  A cell might start with an
    alignment markup: ``@l`` (left), ``@r`` (right), ``@c`` (center) or
    ``@w`` (wide -- the cell is not considered while computing the width of
    its column).  Cells without markup are centered.  Short rows are padded
    with empty cells; the given `table` itself is not modified.

    Parameters
    ----------
    table : list of lists of strings
      What is aimed to be printed
    out : None or stream
      Where to print. If None -- will print and return string

    Returns
    -------
    string if out was None

    Raises
    ------
    ValueError
      If a cell starts with ``@`` which is not followed by one of the known
      alignment characters.
    """
    print2string = out is None
    if print2string:
        out = StringIO()

    # equalize number of elements in each row, while working on a
    # stringified copy, so the table of the caller stays as it was
    ncolumns = max([len(row) for row in table] or [0])
    rows = [[str(cell) for cell in row] + [''] * (ncolumns - len(row))
            for row in table]

    # figure out lengths within each column
    # eat whole entry while computing width for @w (for wide)
    markup_strip = re.compile('^@([lrc]|w.*)')
    col_width = [max([len(markup_strip.sub('', cell)) for cell in column])
                 for column in zip(*rows)]

    lines = []
    for row in rows:
        pieces = []
        for width, item in zip(col_width, row):
            if item.startswith('@'):
                # slicing (instead of indexing) copes with a bare '@'
                align, item = item[1:2], item[2:]
                if align not in ('l', 'r', 'c', 'w'):
                    raise ValueError(
                        'Unknown alignment %s. Known are l,r,c,w' % align)
            else:
                align = 'c'

            # centered split of the padding; wide items might exceed the
            # width of the column, hence never go below 0
            nspaces_l = max(int(ceil((width - len(item)) / 2.0)), 0)
            nspaces_r = max(width - nspaces_l - len(item), 0)

            if align == 'l':
                nspaces_l, nspaces_r = 0, nspaces_l + nspaces_r
            elif align == 'r':
                nspaces_l, nspaces_r = nspaces_l + nspaces_r, 0
            # 'c' and 'w' stick to the centered split

            # trailing space separates the columns
            pieces.append(' ' * nspaces_l + item + ' ' * nspaces_r + ' ')
        lines.append(''.join(pieces).rstrip() + '\n')

    out.write(''.join(lines))

    if print2string:
        value = out.getvalue()
        out.close()
        return value
def _repr_attrs(obj, attrs, default=None, error_value='ERROR'):
    """Helper to obtain a list of formatted attributes different from
    the default

    Each attribute named in `attrs` is fetched from `obj` (`error_value` is
    taken if it is missing) and reported as ``name=repr(value)``, unless the
    value is `default` itself or a string equal to it.
    """
    out = []
    for attr in attrs:
        value = getattr(obj, attr, error_value)
        if value is default:
            continue
        if isinstance(value, basestring) and value == default:
            continue
        out.append('%s=%r' % (attr, value))
    return out
def _repr(obj, *args, **kwargs):
    """Helper to get a structured __repr__ for all objects.

    The result is ``ClassName(items)``.  The list of items gets cut (and
    ``...`` appended) if it exceeds the length derived from the
    ('verbose', 'truncate repr') configuration setting; no truncation is
    done if that setting comes back as None.

    Parameters
    ----------
    obj : object
      This will typically be `self` of the to be documented object.
    *args, **kwargs : str
      An arbitrary number of additional items. All of them must be of type
      `str`. All items will be appended comma separated to the class name.
      Keyword arguments will be appended as `key`=`value`.

    Returns
    -------
    str
    """
    cls_name = obj.__class__.__name__
    truncate = cfg.get_as_dtype('verbose', 'truncate repr', int, default=200)
    auto_repr = ', '.join(list(args)
                          + ["%s=%s" % (k, v) for k, v in kwargs.items()])
    # check for None before doing any arithmetic with the setting
    if truncate is not None:
        # -5 to take (...) into account
        max_length = max(truncate - 5 - len(cls_name), 0)
        if len(auto_repr) > max_length:
            auto_repr = auto_repr[:max_length] + '...'
    # finally wrap in () and return
    return "%s(%s)" % (cls_name, auto_repr)
def _str(obj, *args, **kwargs):
    """Helper to get a structured __str__ for all objects.

    If an object has a `descr` attribute, its content will be used instead of
    an auto-generated description.

    Optional additional information might be added under certain debugging
    conditions (e.g. `id(obj)`).

    Parameters
    ----------
    obj : object
      This will typically be `self` of the to be documented object.
    *args, **kwargs : str
      An arbitrary number of additional items. All of them must be of type
      `str`. All items will be appended comma separated to the class name.
      Keyword arguments will be appended as `key`=`value`.

    Returns
    -------
    str
    """
    truncate = cfg.get_as_dtype('verbose', 'truncate str', int, default=200)

    s = None
    # don't do descriptions for dicts like our collections as they might contain
    # an actual item 'descr'
    if hasattr(obj, 'descr') and not isinstance(obj, dict):
        s = obj.descr
    if s is None:
        s = obj.__class__.__name__
        auto_descr = ', '.join(list(args)
                               + ["%s=%s" % (k, v)
                                  for k, v in kwargs.items()])
        if len(auto_descr):
            s = s + ': ' + auto_descr

    if truncate is not None:
        # -5 to take <...> into account; never go negative, since a negative
        # slice end would chop characters off the tail instead
        max_length = max(truncate - 5, 0)
        if len(s) > max_length:
            s = s[:max_length] + '...'

    if __debug__ and 'DS_ID' in debug.active:
        # separate from whatever description is there already
        if len(s):
            s += ', '
        s += 'id=%i' % id(obj)

    # finally wrap in <> and return
    # + instead of '%s' for bits of speedup
    return '<' + s + '>'
def borrowdoc(cls, methodname=None):
    """Return a decorator to borrow docstring from another `cls`.`methodname`

    It should not be used for __init__ methods of classes derived from
    ClassWithCollections since __doc__'s of those are handled by the
    AttributeCollector anyways.

    Common use is to borrow a docstring from the class's method for an
    adapter function (e.g. sphere_searchlight borrows from Searchlight)

    Examples
    --------
    To borrow `__repr__` docstring from parent class `Mapper`, do::

       @borrowdoc(Mapper)
       def __repr__(self):
           ...

    Parameters
    ----------
    cls
      Usually a parent class
    methodname : None or str
      Name of the method from which to borrow.  If None, would use
      the same name as of the decorated method
    """

    def _borrowdoc(method):
        """Decorator which assigns to the `method` docstring from another
        """
        source_name = method.__name__ if methodname is None else methodname
        donor = getattr(cls, source_name)
        if hasattr(donor, '__doc__'):
            method.__doc__ = donor.__doc__
        return method
    return _borrowdoc
def borrowkwargs(cls, methodname=None, exclude=None):
    """Return a decorator which would borrow docstring for ``**kwargs``

    Parameters documented by the decorated method are kept; those
    documented only by `cls`.`methodname` are appended to them.  Entries
    for ``kwargs`` itself and for whatever is listed in `exclude` are left
    out.

    Notes
    -----
    TODO: take care about ``*args`` in a clever way if those are also present

    Examples
    --------
    In the simplest scenario -- just grab all arguments from parent class::

       @borrowkwargs(A)
       def met1(self, bu, **kwargs):
           pass

    Parameters
    ----------
    cls
      Class which provides the method to borrow from
    methodname : None or str
      Name of the method from which to borrow.  If None, would use
      the same name as of the decorated method
    exclude : None or list of arguments to exclude
      If function does not pass all ``**kwargs``, you would need to list
      those here to be excluded from borrowed docstring
    """

    def _borrowkwargs(method):
        """Decorator which borrows docstrings for ``**kwargs`` for the `method`
        """
        if methodname is None:
            other_method = getattr(cls, method.__name__)
        else:
            other_method = getattr(cls, methodname)
        # TODO:
        # method.__doc__ = enhanced_from(other_method.__doc__)

        # either of the docstrings might be missing altogether
        mdoc = method.__doc__ or ''
        odoc = other_method.__doc__ or ''

        mpreamble, mparams, msuffix = _split_out_parameters(mdoc)
        oparams = _split_out_parameters(odoc)[1]
        mplist = _parse_parameters(mparams)
        oplist = _parse_parameters(oparams)
        known_params = set([p[0] for p in mplist])

        # !!! has to not rebind exclude variable
        # list() so that any sequence (or None) is fine for `exclude`
        skip_params = set(['kwargs', '**kwargs'] + list(exclude or []))
        skip_or_known = skip_params.union(known_params)

        # combine two and filter out items to skip
        aplist = [p for p in mplist if p[0] not in skip_params]
        aplist += [p for p in oplist if p[0] not in skip_or_known]

        docstring = mpreamble
        if len(aplist):
            params_ = '\n'.join([p[1].rstrip() for p in aplist])
            docstring += "\n\n%s\n" \
                         % _rst_section('Parameters') + _indent(params_)

        if msuffix != "":
            docstring += "\n\n" + msuffix

        docstring = handle_docstring(docstring)

        # Finally assign generated doc to the method
        method.__doc__ = docstring
        return method
    return _borrowkwargs
|