Пример #1
0
 def __init__(self):
     """Create one coding state machine per model listed below, then reset."""
     CharSetProber.__init__(self)
     sm_models = (
         HZSMModel,
         ISO2022CNSMModel,
         ISO2022JPSMModel,
         ISO2022KRSMModel,
     )
     # The list keeps the same order as the tuple above.
     self._mCodingSM = [CodingStateMachine(sm_model) for sm_model in sm_models]
     self.reset()
Пример #2
0
 def __init__(self):
     """Build the list of coding state machines and reset the prober."""
     CharSetProber.__init__(self)
     # One CodingStateMachine per model, in this fixed order.
     model_order = (
         HZSMModel,
         ISO2022CNSMModel,
         ISO2022JPSMModel,
         ISO2022KRSMModel,
     )
     self._mCodingSM = [CodingStateMachine(entry) for entry in model_order]
     self.reset()
 def __init__(self):
     """Start with an empty prober list, a zero active count and no best guess."""
     CharSetProber.__init__(self)
     self._mBestGuessProber = None
     self._mProbers = []
     self._mActiveNum = 0
Пример #4
0
import constants, sys
from charsetprober import CharSetProber

# Module-level tuning constants for SingleByteCharSetProber.
# NOTE(review): only NUMBER_OF_SEQ_CAT is used in the code visible here; the
# roles of the other values are set by code outside this excerpt -- confirm
# against the full module before changing them.
SAMPLE_SIZE = 64
SB_ENOUGH_REL_THRESHOLD = 1024
POSITIVE_SHORTCUT_THRESHOLD = 0.95
NEGATIVE_SHORTCUT_THRESHOLD = 0.05
SYMBOL_CAT_ORDER = 250
NUMBER_OF_SEQ_CAT = 4  # sizes the _mSeqCounters list built in reset()
POSITIVE_CAT = NUMBER_OF_SEQ_CAT - 1  # highest valid index into that list
#NEGATIVE_CAT = 0
 
class SingleByteCharSetProber(CharSetProber):
    def __init__(self, model, reversed=False, nameProber=None):
        """Set up a single-byte prober around a language model.

        Args:
            model: The model object stored for later lookups.
            reversed: Truthy if every pair must be reversed in the model
                lookup. Defaults to the builtin ``False``.
            nameProber: Optional auxiliary prober used for the name decision.
        """
        CharSetProber.__init__(self)
        self._mModel = model
        # The default was previously spelled ``constants.False``; ``False`` is
        # a keyword on Python 3, so that spelling is a SyntaxError there. The
        # builtin is equally falsy, so callers see no difference.
        self._mReversed = reversed
        self._mNameProber = nameProber
        self.reset()

    def reset(self):
        """Reset the base prober state and zero every counter kept here."""
        CharSetProber.reset(self)
        # Char order of the last character seen; 255 is the starting value.
        self._mLastOrder = 255
        # One counter slot per sequence category.
        self._mSeqCounters = [0 for _ in range(NUMBER_OF_SEQ_CAT)]
        # Running totals; _mFreqChar counts characters that fall in the
        # sampling range.
        self._mTotalSeqs = self._mTotalChar = self._mFreqChar = 0

    def get_charset_name(self):
        if self._mNameProber:
Пример #5
0
 def __init__(self):
     """Run the base-class initialiser, then put the prober in its reset state."""
     CharSetProber.__init__(self)
     self.reset()
Пример #6
0
 def __init__(self):
     """Initialise with no probers, no active ones and no best-guess prober."""
     CharSetProber.__init__(self)
     self._mProbers = []
     self._mBestGuessProber = None
     self._mActiveNum = 0
Пример #7
0
 def __init__(self):
     """Initialise with no analyzer or state machine and a zeroed last-char pair."""
     CharSetProber.__init__(self)
     # Both helpers start unset; nothing in this method assigns them.
     self._mCodingSM = self._mDistributionAnalyzer = None
     # Two-slot buffer, each slot holding _bytechar(0).
     self._mLastChar = [_bytechar(0) for _ in range(2)]
Пример #8
0
 def __init__(self, model, reversed=False, nameProber=None):
     """Build a prober around ``model`` and reset it.

     ``reversed`` is true when every pair must be reversed in the model
     lookup; ``nameProber`` is an optional auxiliary prober used for the
     name decision.
     """
     CharSetProber.__init__(self)
     self._mNameProber = nameProber
     self._mReversed = reversed
     self._mModel = model
     self.reset()
Пример #9
0
 def __init__(self):
     """Attach a coding state machine built from UTF8SMModel, then reset."""
     CharSetProber.__init__(self)
     utf8_machine = CodingStateMachine(UTF8SMModel)
     self._mCodingSM = utf8_machine
     self.reset()
Пример #10
0
 def __init__(self):
     """Start with neither a logical nor a visual prober attached, then reset."""
     CharSetProber.__init__(self)
     # Both references start as None; this method never assigns real probers.
     self._mVisualProber = self._mLogicalProber = None
     self.reset()
Пример #11
0
 def __init__(self):
     """Create the UTF8SMModel-driven state machine and reset the prober."""
     CharSetProber.__init__(self)
     state_machine = CodingStateMachine(UTF8SMModel)
     self._mCodingSM = state_machine
     self.reset()
Пример #12
0
 def __init__(self):
     """Initialise with no analyzer or state machine and two NUL last chars."""
     CharSetProber.__init__(self)
     # Both helpers start unset; nothing in this method assigns them.
     self._mCodingSM = self._mDistributionAnalyzer = None
     # Two-slot buffer pre-filled with NUL characters.
     self._mLastChar = ['\x00'] * 2
Пример #13
0
 def __init__(self):
     """Leave analyzer and state machine unset; zero the two-slot last-char buffer."""
     CharSetProber.__init__(self)
     zero_pair = [_bytechar(0) for _ in range(2)]
     self._mLastChar = zero_pair
     self._mDistributionAnalyzer = None
     self._mCodingSM = None
Пример #14
0
	def __init__(self):
		"""Initialise with both helper probers unset and reset the state."""
		CharSetProber.__init__(self)
		# Logical and visual probers both begin as None.
		self._mVisualProber = self._mLogicalProber = None
		self.reset()
Пример #15
0
 def __init__(self):
     """Initialise the base class and immediately reset this prober."""
     CharSetProber.__init__(self)
     self.reset()
Пример #16
0
	def __init__(self):
		"""Leave analyzer and state machine unset; last chars start as two NULs."""
		CharSetProber.__init__(self)
		self._mLastChar = ['\x00'] * 2
		self._mCodingSM = None
		self._mDistributionAnalyzer = None
Пример #17
0
from charsetprober import CharSetProber

# Module-level tuning constants for SingleByteCharSetProber.
# NOTE(review): only NUMBER_OF_SEQ_CAT is used in the code visible here; the
# roles of the other values are set by code outside this excerpt -- confirm
# against the full module before changing them.
SAMPLE_SIZE = 64
SB_ENOUGH_REL_THRESHOLD = 1024
POSITIVE_SHORTCUT_THRESHOLD = 0.95
NEGATIVE_SHORTCUT_THRESHOLD = 0.05
SYMBOL_CAT_ORDER = 250
NUMBER_OF_SEQ_CAT = 4  # sizes the _mSeqCounters list built in reset()
POSITIVE_CAT = NUMBER_OF_SEQ_CAT - 1  # highest valid index into that list

#NEGATIVE_CAT = 0


class SingleByteCharSetProber(CharSetProber):
    def __init__(self, model, reversed=False, nameProber=None):
        """Set up a single-byte prober around a language model.

        Args:
            model: The model object stored for later lookups.
            reversed: Truthy if every pair must be reversed in the model
                lookup. Defaults to the builtin ``False``.
            nameProber: Optional auxiliary prober used for the name decision.
        """
        CharSetProber.__init__(self)
        self._mModel = model
        # The default was previously spelled ``constants. False``: a
        # SyntaxError on Python 3 (``False`` is a keyword), and this module
        # does not import ``constants``. The builtin is equally falsy.
        self._mReversed = reversed
        self._mNameProber = nameProber
        self.reset()

    def reset(self):
        """Reset the base prober, then clear the sequence and character counters."""
        CharSetProber.reset(self)
        # One zeroed counter per sequence category.
        self._mSeqCounters = [0 for _ in range(NUMBER_OF_SEQ_CAT)]
        # Char order of the last character; starts at 255.
        self._mLastOrder = 255
        # Totals start from zero; _mFreqChar tracks characters that fall in
        # the sampling range.
        self._mFreqChar = self._mTotalChar = self._mTotalSeqs = 0

    def get_charset_name(self):
        if self._mNameProber:
Пример #18
0
 def __init__(self, model, reversed=False, nameProber=None):
     """Store the model and lookup options, then reset the prober.

     ``reversed`` is true when every pair must be reversed in the model
     lookup. ``nameProber`` is an optional auxiliary prober used for the
     name decision.
     """
     CharSetProber.__init__(self)
     self._mModel = model
     self._mNameProber = nameProber
     self._mReversed = reversed
     self.reset()