def tabulate()

in c3dm/tools/tabulate.py [0:0]
59 lines of code
24 McCabe index (conditional complexity)

def tabulate(tabular_data, headers=(), tablefmt="simple",
			 floatfmt=_DEFAULT_FLOATFMT, numalign="decimal", stralign="left",
			 missingval=_DEFAULT_MISSINGVAL, showindex="default", disable_numparse=False,
			 colalign=None):
	"""Format a fixed width table for pretty printing.

	>>> print(tabulate([[1, 2.34], [-56, "8.999"], ["2", "10001"]]))
	---  ---------
	  1      2.34
	-56      8.999
	  2  10001
	---  ---------

	The first required argument (`tabular_data`) can be a
	list-of-lists (or another iterable of iterables), a list of named
	tuples, a dictionary of iterables, an iterable of dictionaries,
	a two-dimensional NumPy array, NumPy record array, or a Pandas'
	dataframe.


	Table headers
	-------------

	To print nice column headers, supply the second argument (`headers`):

	  - `headers` can be an explicit list of column headers
	  - if `headers="firstrow"`, then the first row of data is used
	  - if `headers="keys"`, then dictionary keys or column indices are used

	Otherwise a headerless table is produced.

	If the number of headers is less than the number of columns, they
	are supposed to be names of the last columns. This is consistent
	with the plain-text format of R and Pandas' dataframes.

	>>> print(tabulate([["sex","age"],["Alice","F",24],["Bob","M",19]],
	...       headers="firstrow"))
	       sex      age
	-----  -----  -----
	Alice  F         24
	Bob    M         19

	By default, pandas.DataFrame data have an additional column called
	row index. To add a similar column to all other types of data,
	use `showindex="always"` or `showindex=True`. To suppress row indices
	for all types of data, pass `showindex="never"` or `showindex=False`.
	To add a custom row index column, pass `showindex=some_iterable`.

	>>> print(tabulate([["F",24],["M",19]], showindex="always"))
	-  -  --
	0  F  24
	1  M  19
	-  -  --


	Column alignment
	----------------

	`tabulate` tries to detect column types automatically, and aligns
	the values properly. By default it aligns decimal points of the
	numbers (or flushes integer numbers to the right), and flushes
	everything else to the left. Possible column alignments
	(`numalign`, `stralign`) are: "right", "center", "left", "decimal"
	(only for `numalign`), and None (to disable alignment).

	`colalign` optionally overrides the alignment of individual columns:
	it is an iterable of alignments applied to the columns in order.
	Entries beyond the last column are ignored.


	Table formats
	-------------

	`floatfmt` is a format specification used for columns which
	contain numeric data with a decimal point. This can also be
	a list or tuple of format strings, one per column.

	`None` values are replaced with a `missingval` string (like
	`floatfmt`, this can also be a list of values for different
	columns):

	>>> print(tabulate([["spam", 1, None],
	...                 ["eggs", 42, 3.14],
	...                 ["other", None, 2.7]], missingval="?"))
	-----  --  ----
	spam    1  ?
	eggs   42  3.14
	other   ?  2.7
	-----  --  ----

	Various plain-text table formats (`tablefmt`) are supported:
	'plain', 'simple', 'grid', 'pipe', 'orgtbl', 'rst', 'mediawiki',
	'latex', 'latex_raw' and 'latex_booktabs'. Variable `tabulate_formats`
	contains the list of currently supported formats.

	"plain" format doesn't use any pseudographics to draw tables,
	it separates columns with a double space:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]],
	...                 ["strings", "numbers"], "plain"))
	strings      numbers
	spam         41.9999
	eggs        451

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]], tablefmt="plain"))
	spam   41.9999
	eggs  451

	"simple" format is like Pandoc simple_tables:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]],
	...                 ["strings", "numbers"], "simple"))
	strings      numbers
	---------  ---------
	spam         41.9999
	eggs        451

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]], tablefmt="simple"))
	----  --------
	spam   41.9999
	eggs  451
	----  --------

	"grid" is similar to tables produced by Emacs table.el package or
	Pandoc grid_tables:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]],
	...                ["strings", "numbers"], "grid"))
	+-----------+-----------+
	| strings   |   numbers |
	+===========+===========+
	| spam      |   41.9999 |
	+-----------+-----------+
	| eggs      |  451      |
	+-----------+-----------+

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]], tablefmt="grid"))
	+------+----------+
	| spam |  41.9999 |
	+------+----------+
	| eggs | 451      |
	+------+----------+

	"fancy_grid" draws a grid using box-drawing characters:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]],
	...                ["strings", "numbers"], "fancy_grid"))
	╒═══════════╤═══════════╕
	│ strings   │   numbers │
	╞═══════════╪═══════════╡
	│ spam      │   41.9999 │
	├───────────┼───────────┤
	│ eggs      │  451      │
	╘═══════════╧═══════════╛

	"pipe" is like tables in PHP Markdown Extra extension or Pandoc
	pipe_tables:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]],
	...                ["strings", "numbers"], "pipe"))
	| strings   |   numbers |
	|:----------|----------:|
	| spam      |   41.9999 |
	| eggs      |  451      |

	"presto" is like tables produced by the Presto CLI:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]],
	...                ["strings", "numbers"], "presto"))
	 strings   |   numbers
	-----------+-----------
	 spam      |   41.9999
	 eggs      |  451

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]], tablefmt="pipe"))
	|:-----|---------:|
	| spam |  41.9999 |
	| eggs | 451      |

	"orgtbl" is like tables in Emacs org-mode and orgtbl-mode. They
	are slightly different from "pipe" format by not using colons to
	define column alignment, and using a "+" sign to indicate line
	intersections:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]],
	...                ["strings", "numbers"], "orgtbl"))
	| strings   |   numbers |
	|-----------+-----------|
	| spam      |   41.9999 |
	| eggs      |  451      |


	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]], tablefmt="orgtbl"))
	| spam |  41.9999 |
	| eggs | 451      |

	"rst" is like a simple table format from reStructuredText; please
	note that reStructuredText accepts also "grid" tables:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]],
	...                ["strings", "numbers"], "rst"))
	=========  =========
	strings      numbers
	=========  =========
	spam         41.9999
	eggs        451
	=========  =========

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]], tablefmt="rst"))
	====  ========
	spam   41.9999
	eggs  451
	====  ========

	"mediawiki" produces a table markup used in Wikipedia and on other
	MediaWiki-based sites:

	>>> print(tabulate([["strings", "numbers"], ["spam", 41.9999], ["eggs", "451.0"]],
	...                headers="firstrow", tablefmt="mediawiki"))
	{| class="wikitable" style="text-align: left;"
	|+ <!-- caption -->
	|-
	! strings   !! align="right"|   numbers
	|-
	| spam      || align="right"|   41.9999
	|-
	| eggs      || align="right"|  451
	|}

	"html" produces HTML markup:

	>>> print(tabulate([["strings", "numbers"], ["spam", 41.9999], ["eggs", "451.0"]],
	...                headers="firstrow", tablefmt="html"))
	<table>
	<thead>
	<tr><th>strings  </th><th style="text-align: right;">  numbers</th></tr>
	</thead>
	<tbody>
	<tr><td>spam     </td><td style="text-align: right;">  41.9999</td></tr>
	<tr><td>eggs     </td><td style="text-align: right;"> 451     </td></tr>
	</tbody>
	</table>

	"latex" produces a tabular environment of LaTeX document markup:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]], tablefmt="latex"))
	\\begin{tabular}{lr}
	\\hline
	 spam &  41.9999 \\\\
	 eggs & 451      \\\\
	\\hline
	\\end{tabular}

	"latex_raw" is similar to "latex", but doesn't escape special characters,
	such as backslash and underscore, so LaTeX commands may be embedded into
	cells' values:

	>>> print(tabulate([["spam$_9$", 41.9999], ["\\\\emph{eggs}", "451.0"]], tablefmt="latex_raw"))
	\\begin{tabular}{lr}
	\\hline
	 spam$_9$    &  41.9999 \\\\
	 \\emph{eggs} & 451      \\\\
	\\hline
	\\end{tabular}

	"latex_booktabs" produces a tabular environment of LaTeX document markup
	using the booktabs.sty package:

	>>> print(tabulate([["spam", 41.9999], ["eggs", "451.0"]], tablefmt="latex_booktabs"))
	\\begin{tabular}{lr}
	\\toprule
	 spam &  41.9999 \\\\
	 eggs & 451      \\\\
	\\bottomrule
	\\end{tabular}

	Number parsing
	--------------
	By default, anything which can be parsed as a number is a number.
	This ensures numbers represented as strings are aligned properly.
	This can lead to weird results for particular strings such as
	specific git SHAs e.g. "42992e1" will be parsed into the number
	429920 and aligned as such.

	To completely disable number parsing (and alignment), use
	`disable_numparse=True`. For more fine grained control, a list of column
	indices can be used to disable number parsing only on those columns
	e.g. `disable_numparse=[0, 2]` would disable number parsing only on the
	first and third columns.
	"""
	if tabular_data is None:
		tabular_data = []
	list_of_lists, headers = _normalize_tabular_data(
			tabular_data, headers, showindex=showindex)

	# empty values in the first column of RST tables should be escaped (issue #82)
	# "" should be escaped as "\\ " or ".."
	if tablefmt == 'rst':
		list_of_lists, headers = _rst_escape_first_column(list_of_lists, headers)

	# optimization: look for ANSI control codes once,
	# enable smart width functions only if a control code is found
	header_text = '\t'.join(map(_text_type, headers))
	row_texts = ['\t'.join(map(_text_type, row)) for row in list_of_lists]
	plain_text = '\t'.join([header_text] + row_texts)

	has_invisible = re.search(_invisible_codes, plain_text)
	enable_widechars = wcwidth is not None and WIDE_CHARS_MODE
	if tablefmt in multiline_formats and _is_multiline(plain_text):
		# switch to the multiline counterpart registered for this format
		tablefmt = multiline_formats.get(tablefmt, tablefmt)
		is_multiline = True
	else:
		is_multiline = False
	width_fn = _choose_width_fn(has_invisible, enable_widechars, is_multiline)

	# format rows and columns, convert numeric values to strings
	# (izip_longest transposes rows into columns, padding short rows)
	cols = list(izip_longest(*list_of_lists))
	numparses = _expand_numparse(disable_numparse, len(cols))
	coltypes = [_column_type(col, numparse=np) for col, np in zip(cols, numparses)]
	if isinstance(floatfmt, basestring): # old version
		float_formats = len(cols) * [floatfmt] # just duplicate the string to use in each column
	else: # if floatfmt is list, tuple etc we have one per column
		float_formats = list(floatfmt)
		if len(float_formats) < len(cols):
			# pad the missing trailing columns with the default format
			float_formats.extend( (len(cols)-len(float_formats)) * [_DEFAULT_FLOATFMT] )
	if isinstance(missingval, basestring):
		missing_vals = len(cols) * [missingval]
	else:
		missing_vals = list(missingval)
		if len(missing_vals) < len(cols):
			# pad the missing trailing columns with the default placeholder
			missing_vals.extend( (len(cols)-len(missing_vals)) * [_DEFAULT_MISSINGVAL] )
	cols = [[_format(v, ct, fl_fmt, miss_v, has_invisible) for v in c]
			 for c, ct, fl_fmt, miss_v in zip(cols, coltypes, float_formats, missing_vals)]

	# align columns
	aligns = [numalign if ct in [int,float] else stralign for ct in coltypes]
	if colalign is not None:
		assert isinstance(colalign, Iterable)
		# zip() stops at the shorter sequence, so colalign entries beyond the
		# last column are ignored instead of raising IndexError
		for idx, align in zip(range(len(aligns)), colalign):
			aligns[idx] = align
	minwidths = [width_fn(h) + MIN_PADDING for h in headers] if headers else [0]*len(cols)
	cols = [_align_column(c, a, minw, has_invisible, enable_widechars, is_multiline)
			for c, a, minw in zip(cols, aligns, minwidths)]

	if headers:
		# align headers and add headers; when there are no data rows fall back
		# to one empty cell per header so widths and alignments are still defined
		t_cols = cols or [['']] * len(headers)
		t_aligns = aligns or [stralign] * len(headers)
		minwidths = [max(minw, max(width_fn(cl) for cl in c)) for minw, c in zip(minwidths, t_cols)]
		headers = [_align_header(h, a, minw, width_fn(h), is_multiline, width_fn)
				   for h, a, minw in zip(headers, t_aligns, minwidths)]
	else:
		minwidths = [max(width_fn(cl) for cl in c) for c in cols]
	# transpose the aligned columns back into rows
	rows = list(zip(*cols))

	if not isinstance(tablefmt, TableFormat):
		# unknown format names fall back to "simple"
		tablefmt = _table_formats.get(tablefmt, _table_formats["simple"])

	return _format_table(tablefmt, headers, rows, minwidths, aligns, is_multiline)