Source code for annotations.TextNorm.language

# -*- coding: UTF-8 -*-
"""
:filename: sppas.src.annotations.TextNorm.language.py
:author:   Brigitte Bigi
:contact:  develop@sppas.org
:summary:  Language name definition.

.. _This file is part of SPPAS: http://www.sppas.org/
..
    -------------------------------------------------------------------------

     ___   __    __    __    ___
    /     |  \  |  \  |  \  /              the automatic
    \__   |__/  |__/  |___| \__             annotation and
       \  |     |     |   |    \             analysis
    ___/  |     |     |   | ___/              of speech

    Copyright (C) 2011-2021  Brigitte Bigi
    Laboratoire Parole et Langage, Aix-en-Provence, France

    Use of this software is governed by the GNU Public License, version 3.

    SPPAS is free software: you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    SPPAS is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with SPPAS. If not, see <http://www.gnu.org/licenses/>.

    This banner notice must not be removed.

    -------------------------------------------------------------------------

"""


[docs]class sppasLangISO: """Language name definition. todo: parse a iso639-3 json file to load all language names. """ lang_list = ["cmn", "jpn", "yue", "zho", "cdo", "cjy", "cmo", "cpx", "czh", "czo", "czt", "gan", "hak", "hsn", "ltc", "lzh", "mnp", "och", "wuu", "ben"] # TODO: add languages # -----------------------------------------------------------------------
[docs] @staticmethod def without_whitespace(lang): """Return true if 'lang' is not using whitespace. Mandarin Chinese or Japanese languages return True, but English or French return False. :param lang: (str) iso639-3 language code or a string starting with such code, like "yue" or "yue-chars" for example. :returns: (bool) """ for l in sppasLangISO.lang_list: if l in lang: return True for l in sppasLangISO.lang_list: if lang.startswith(l): return True return False