Coverage for /usr/local/lib/python3.7/dist-packages/chardet/sbcsgroupprober.py: 58%

######################## BEGIN LICENSE BLOCK ########################

# The Original Code is Mozilla Universal charset detector code.

# The Initial Developer of the Original Code is

# Netscape Communications Corporation.

# Contributor(s):

# Mark Pilgrim - port to Python

# Shy Shalom - original C code

# This library is free software; you can redistribute it and/or

# modify it under the terms of the GNU Lesser General Public

# License as published by the Free Software Foundation; either

# version 2.1 of the License, or (at your option) any later version.

# This library is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU

# Lesser General Public License for more details.

# You should have received a copy of the GNU Lesser General Public

# License along with this library; if not, write to the Free Software

# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA

# 02110-1301 USA

######################### END LICENSE BLOCK #########################

from .charsetgroupprober import CharSetGroupProber

from .sbcharsetprober import SingleByteCharSetProber

from .langcyrillicmodel import (Win1251CyrillicModel, Koi8rModel,

Latin5CyrillicModel, MacCyrillicModel,

Ibm866Model, Ibm855Model)

from .langgreekmodel import Latin7GreekModel, Win1253GreekModel

from .langbulgarianmodel import Latin5BulgarianModel, Win1251BulgarianModel

# from .langhungarianmodel import Latin2HungarianModel, Win1250HungarianModel

from .langthaimodel import TIS620ThaiModel

from .langhebrewmodel import Win1255HebrewModel

from .hebrewprober import HebrewProber

from .langturkishmodel import Latin5TurkishModel

class SBCSGroupProber(CharSetGroupProber):

def __init__(self):

super(SBCSGroupProber, self).__init__()

self.probers = [

SingleByteCharSetProber(Win1251CyrillicModel),

SingleByteCharSetProber(Koi8rModel),

SingleByteCharSetProber(Latin5CyrillicModel),

SingleByteCharSetProber(MacCyrillicModel),

SingleByteCharSetProber(Ibm866Model),

SingleByteCharSetProber(Ibm855Model),

SingleByteCharSetProber(Latin7GreekModel),

SingleByteCharSetProber(Win1253GreekModel),

SingleByteCharSetProber(Latin5BulgarianModel),

SingleByteCharSetProber(Win1251BulgarianModel),

# TODO: Restore Hungarian encodings (iso-8859-2 and windows-1250)

# after we retrain model.

# SingleByteCharSetProber(Latin2HungarianModel),

# SingleByteCharSetProber(Win1250HungarianModel),

SingleByteCharSetProber(TIS620ThaiModel),

SingleByteCharSetProber(Latin5TurkishModel),

]

hebrew_prober = HebrewProber()

logical_hebrew_prober = SingleByteCharSetProber(Win1255HebrewModel,

False, hebrew_prober)

visual_hebrew_prober = SingleByteCharSetProber(Win1255HebrewModel, True,

hebrew_prober)

hebrew_prober.set_model_probers(logical_hebrew_prober, visual_hebrew_prober)

self.probers.extend([hebrew_prober, logical_hebrew_prober,

visual_hebrew_prober])

self.reset()

Coverage for /usr/local/lib/python3.7/dist-packages/chardet/sbcsgroupprober.py : 58%

19 statements 11 run 8 missing 0 excluded