$67 GRAYBYTE WORDPRESS FILE MANAGER $71

SERVER : vnpttt-amd7f72-h1.vietnix.vn #1 SMP Fri May 24 12:42:50 UTC 2024
SERVER IP : 103.200.23.149 | ADMIN IP 216.73.216.22
OPTIONS : CRL = ON | WGT = ON | SDO = OFF | PKEX = OFF
DEACTIVATED : NONE

/usr/lib/python3.6/site-packages/chardet/

HOME
Current File : /usr/lib/python3.6/site-packages/chardet//codingstatemachine.py
######################## BEGIN LICENSE BLOCK ########################
# The Original Code is mozilla.org code.
#
# The Initial Developer of the Original Code is
# Netscape Communications Corporation.
# Portions created by the Initial Developer are Copyright (C) 1998
# the Initial Developer. All Rights Reserved.
#
# Contributor(s):
#   Mark Pilgrim - port to Python
#
# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
#
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
# 02110-1301  USA
######################### END LICENSE BLOCK #########################

import logging

from .enums import MachineState


class CodingStateMachine(object):
    """
    A state machine to verify a byte sequence for a particular encoding. For
    each byte the detector receives, it will feed that byte to every active
    state machine available, one byte at a time. The state machine changes its
    state based on its previous state and the byte it receives. There are 3
    states in a state machine that are of interest to an auto-detector:

    START state: This is the state to start with, or a legal byte sequence
                 (i.e. a valid code point) for character has been identified.

    ME state:  This indicates that the state machine identified a byte sequence
               that is specific to the charset it is designed for and that
               there is no other possible encoding which can contain this byte
               sequence. This will to lead to an immediate positive answer for
               the detector.

    ERROR state: This indicates the state machine identified an illegal byte
                 sequence for that encoding. This will lead to an immediate
                 negative answer for this encoding. Detector will exclude this
                 encoding from consideration from here on.
    """
    def __init__(self, sm):
        self._model = sm
        self._curr_byte_pos = 0
        self._curr_char_len = 0
        self._curr_state = None
        self.logger = logging.getLogger(__name__)
        self.reset()

    def reset(self):
        self._curr_state = MachineState.START

    def next_state(self, c):
        # for each byte we get its class
        # if it is first byte, we also get byte length
        byte_class = self._model['class_table'][c]
        if self._curr_state == MachineState.START:
            self._curr_byte_pos = 0
            self._curr_char_len = self._model['char_len_table'][byte_class]
        # from byte's class and state_table, we get its next state
        curr_state = (self._curr_state * self._model['class_factor']
                      + byte_class)
        self._curr_state = self._model['state_table'][curr_state]
        self._curr_byte_pos += 1
        return self._curr_state

    def get_current_charlen(self):
        return self._curr_char_len

    def get_coding_state_machine(self):
        return self._model['name']

    @property
    def language(self):
        return self._model['language']

Current_dir [ NOT WRITEABLE ] Document_root [ WRITEABLE ]


[ Back ]
NAME
SIZE
LAST TOUCH
USER
CAN-I?
FUNCTIONS
..
--
16 Dec 2025 9.25 PM
root / root
0755
__pycache__
--
31 Aug 2024 3.39 AM
root / root
0755
cli
--
31 Aug 2024 3.39 AM
root / root
0755
__init__.py
1.522 KB
13 Apr 2017 1.41 AM
root / root
0644
big5freq.py
30.521 KB
12 Apr 2017 12.51 AM
root / root
0644
big5prober.py
1.716 KB
12 Apr 2017 12.51 AM
root / root
0644
chardistribution.py
9.19 KB
12 Apr 2017 2.52 AM
root / root
0644
charsetgroupprober.py
3.698 KB
12 Apr 2017 12.51 AM
root / root
0644
charsetprober.py
4.99 KB
8 Jun 2017 9.21 PM
root / root
0644
codingstatemachine.py
3.506 KB
12 Apr 2017 12.51 AM
root / root
0644
compat.py
1.107 KB
8 Jun 2017 9.32 PM
root / root
0644
cp949prober.py
1.812 KB
12 Apr 2017 12.51 AM
root / root
0644
enums.py
1.622 KB
12 Apr 2017 12.51 AM
root / root
0644
escprober.py
3.857 KB
12 Apr 2017 12.51 AM
root / root
0644
escsm.py
10.264 KB
12 Apr 2017 12.51 AM
root / root
0644
eucjpprober.py
3.661 KB
12 Apr 2017 12.51 AM
root / root
0644
euckrfreq.py
13.229 KB
12 Apr 2017 12.51 AM
root / root
0644
euckrprober.py
1.707 KB
12 Apr 2017 12.51 AM
root / root
0644
euctwfreq.py
30.88 KB
12 Apr 2017 3.48 AM
root / root
0644
euctwprober.py
1.706 KB
12 Apr 2017 12.51 AM
root / root
0644
gb2312freq.py
20.229 KB
12 Apr 2017 12.51 AM
root / root
0644
gb2312prober.py
1.713 KB
12 Apr 2017 12.51 AM
root / root
0644
hebrewprober.py
13.514 KB
8 Jun 2017 9.21 PM
root / root
0644
jisfreq.py
25.173 KB
12 Apr 2017 12.51 AM
root / root
0644
jpcntx.py
19.183 KB
12 Apr 2017 12.51 AM
root / root
0644
langbulgarianmodel.py
12.538 KB
8 Jun 2017 9.32 PM
root / root
0644
langcyrillicmodel.py
17.527 KB
8 Jun 2017 9.32 PM
root / root
0644
langgreekmodel.py
12.391 KB
8 Jun 2017 9.32 PM
root / root
0644
langhebrewmodel.py
11.079 KB
8 Jun 2017 9.32 PM
root / root
0644
langhungarianmodel.py
12.297 KB
8 Jun 2017 9.32 PM
root / root
0644
langthaimodel.py
11.025 KB
8 Jun 2017 9.32 PM
root / root
0644
langturkishmodel.py
10.842 KB
8 Jun 2017 9.32 PM
root / root
0644
latin1prober.py
5.244 KB
8 Jun 2017 9.21 PM
root / root
0644
mbcharsetprober.py
3.333 KB
12 Apr 2017 12.51 AM
root / root
0644
mbcsgroupprober.py
1.965 KB
12 Apr 2017 12.51 AM
root / root
0644
mbcssm.py
24.884 KB
12 Apr 2017 12.51 AM
root / root
0644
sbcharsetprober.py
5.524 KB
8 Jun 2017 9.32 PM
root / root
0644
sbcsgroupprober.py
3.463 KB
8 Jun 2017 9.32 PM
root / root
0644
sjisprober.py
3.686 KB
12 Apr 2017 12.51 AM
root / root
0644
universaldetector.py
12.192 KB
8 Jun 2017 9.32 PM
root / root
0644
utf8prober.py
2.701 KB
12 Apr 2017 12.51 AM
root / root
0644
version.py
0.236 KB
8 Jun 2017 9.32 PM
root / root
0644

GRAYBYTE WORDPRESS FILE MANAGER @ 2026 CONTACT ME
Static GIF