Source code for soma.html

# -*- coding: utf-8 -*-

#  This software and supporting documentation are distributed by
#      Institut Federatif de Recherche 49
#      CEA/NeuroSpin, Batiment 145,
#      91191 Gif-sur-Yvette cedex
#      France
#
# This software is governed by the CeCILL-B license under
# French law and abiding by the rules of distribution of free software.
# You can  use, modify and/or redistribute the software under the
# terms of the CeCILL-B license as circulated by CEA, CNRS
# and INRIA at the following URL "http://www.cecill.info".
#
# As a counterpart to the access to the source code and  rights to copy,
# modify and redistribute granted by the license, users are provided only
# with a limited warranty  and the software's author,  the holder of the
# economic rights,  and the successive licensors  have only  limited
# liability.
#
# In this respect, the user's attention is drawn to the risks associated
# with loading,  using,  modifying and/or developing or reproducing the
# software by the user in light of its specific status of free software,
# that may mean  that it is complicated to manipulate,  and  that  also
# therefore means  that it is reserved for developers  and  experienced
# professionals having in-depth computer knowledge. Users are therefore
# encouraged to load and test the software's suitability as regards their
# requirements in conditions enabling the security of their systems and/or
# data to be ensured and,  more generally, to use and operate it in the
# same conditions as regards security.
#
# The fact that you are presently reading this means that you have had
# knowledge of the CeCILL-B license and that you accept its terms.

'''
Utility functions for HTML format.

* author: Yann Cointepas
* organization: NeuroSpin
* license: `CeCILL B <http://www.cecill.info/licences/Licence_CeCILL-B_V1-en.html>`_
'''
from __future__ import absolute_import
__docformat__ = "restructuredtext en"

import six
import sys

#------------------------------------------------------------------------------
#: mapping of characters to be escaped for HTML (code point -> '&name;');
#: starts as None and is built by htmlEscape() on its first call
_htmlEscape = None
#: reduced variant of the mapping above used by lesserHtmlEscape();
#: starts as None and is built on the first call of that function
_lesserHtmlEscape = None


# ylep 2020-03-24: now that UTF-8 is everywhere, shouldn't we just replace
# HTML-unsafe characters (&<>"') and leave the rest untouched? (i.e. what the
# standard library function html.escape does in Python 3.2 and later).

def htmlEscape(msg):
    """Replace special characters by their corresponding HTML entity.

    All characters that have a corresponding named HTML entity are replaced.

    - msg: text to escape. Byte strings are decoded by ``six.ensure_text``
      (UTF-8 unless six is told otherwise); any other non-string object
      (tuple, dict, ...) is first converted with ``str()``.
    - returns: *unicode*
    """
    global _htmlEscape
    if _htmlEscape is None:
        # Build the translation table only once, on first use.
        _htmlEscape = {
            codepoint: u'&' + name + u';'
            for codepoint, name
            in six.iteritems(six.moves.html_entities.codepoint2name)
        }
    # Test against text_type/binary_type rather than six.string_types: on
    # Python 3 string_types does not include bytes, so a byte string would be
    # sent through str() and come out as its "b'...'" repr instead of being
    # decoded below. On Python 2 both tests accept the same types.
    if not isinstance(msg, (six.text_type, six.binary_type)):
        # htmlEscape is sometimes used on non-string types (as print) like
        # tuples or dicts
        msg = str(msg)
    msg = six.ensure_text(msg)
    return msg.translate(_htmlEscape)
def lesserHtmlEscape(msg):
    """Replace special characters by their corresponding HTML entity.

    All characters that have a corresponding named HTML entity are replaced,
    except accented characters commonly used in French text (éàèâêôîûùö) and
    the double-quote character (").

    - msg: text to escape. Byte strings are decoded by ``six.ensure_text``
      (UTF-8 unless six is told otherwise); any other non-string object
      (tuple, dict, ...) is first converted with ``str()``.
    - returns: *unicode*
    """
    global _lesserHtmlEscape
    if _lesserHtmlEscape is None:
        # Characters deliberately left untouched by this "lesser" escaping.
        kept = (u'"', u'é', u'à', u'è', u'â', u'ê', u'ô', u'î', u'û', u'ù',
                u'ö',)
        # Build the translation table only once, on first use.
        _lesserHtmlEscape = {
            codepoint: u'&' + name + u';'
            for codepoint, name
            in six.iteritems(six.moves.html_entities.codepoint2name)
            if six.unichr(codepoint) not in kept
        }
    # Accept arbitrary objects (tuples, dicts, ...) by converting them with
    # str(); text and byte strings are excluded from that path so that
    # six.ensure_text can decode bytes instead of escaping their repr.
    if not isinstance(msg, (six.text_type, six.binary_type)):
        msg = str(msg)
    msg = six.ensure_text(msg)
    return msg.translate(_lesserHtmlEscape)