PHP 8.3.31
Preview: __init__.py Size: 3.62 KB
/opt/alt/python38/lib/python3.8/site-packages/pip/_vendor/chardet/__init__.py

######################## BEGIN LICENSE BLOCK ########################
# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
#
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
# 02110-1301  USA
######################### END LICENSE BLOCK #########################

from .enums import InputState
from .universaldetector import UniversalDetector
from .version import VERSION, __version__

# Public names of this package; this is what a star-import exposes.
__all__ = ["UniversalDetector", "detect", "detect_all", "__version__", "VERSION"]


def detect(byte_str):
    """
    Guess the character encoding of a byte sequence.

    The input is normalised to a ``bytearray``, fed in one piece to a fresh
    ``UniversalDetector``, and whatever ``close()`` returns is handed back.

    :param byte_str:     The byte sequence to examine.
    :type byte_str:      ``bytes`` or ``bytearray``
    :raises TypeError:   If ``byte_str`` is neither ``bytes`` nor
                         ``bytearray``.
    :returns:            The value returned by ``UniversalDetector.close()``.
    """
    # Guard clause: reject anything that is not a bytes-like type we accept.
    if not isinstance(byte_str, (bytes, bytearray)):
        raise TypeError(
            f"Expected object of type bytes or bytearray, got: {type(byte_str)}"
        )
    if not isinstance(byte_str, bytearray):
        # Plain ``bytes`` input: copy it into a bytearray before feeding.
        byte_str = bytearray(byte_str)

    charset_detector = UniversalDetector()
    charset_detector.feed(byte_str)
    return charset_detector.close()


def detect_all(byte_str, ignore_threshold=False):
    """
    Detect all the possible encodings of the given byte string.

    The input is fed to a fresh ``UniversalDetector``. If the detector ends
    in the ``InputState.HIGH_BYTE`` state, every individual prober (group
    probers are flattened into their members) is asked for its confidence
    and the qualifying ones are reported. Otherwise, or if no prober
    qualifies, the detector's single overall result is returned.

    :param byte_str:          The byte sequence to examine.
    :type byte_str:           ``bytes`` or ``bytearray``
    :param ignore_threshold:  Include encodings that are below
                              ``UniversalDetector.MINIMUM_THRESHOLD``
                              in results.
    :type ignore_threshold:   ``bool``
    :raises TypeError:        If ``byte_str`` is neither ``bytes`` nor
                              ``bytearray``.
    :returns:                 A list of dicts with the keys ``"encoding"``,
                              ``"confidence"`` and ``"language"``, sorted by
                              descending confidence; or ``[detector.result]``
                              when no per-prober results are available.
    """
    if not isinstance(byte_str, bytearray):
        if not isinstance(byte_str, bytes):
            raise TypeError(
                f"Expected object of type bytes or bytearray, got: {type(byte_str)}"
            )
        byte_str = bytearray(byte_str)

    detector = UniversalDetector()
    detector.feed(byte_str)
    detector.close()

    if detector.input_state == InputState.HIGH_BYTE:
        # Flatten group probers (those exposing ``probers``) into one list of
        # individual probers.
        probers = []
        for prober in detector.charset_probers:
            if hasattr(prober, "probers"):
                probers.extend(prober.probers)
            else:
                probers.append(prober)

        results = []
        for prober in probers:
            # Query the confidence once so the value used for filtering is
            # exactly the value that gets reported.
            confidence = prober.get_confidence()
            if not (ignore_threshold or confidence > detector.MINIMUM_THRESHOLD):
                continue
            charset_name = prober.charset_name or ""
            lower_charset_name = charset_name.lower()
            # Use Windows encoding name instead of ISO-8859 if we saw any
            # extra Windows-specific bytes
            if lower_charset_name.startswith("iso-8859") and detector.has_win_bytes:
                charset_name = detector.ISO_WIN_MAP.get(
                    lower_charset_name, charset_name
                )
            results.append(
                {
                    "encoding": charset_name,
                    "confidence": confidence,
                    "language": prober.language,
                }
            )
        if results:
            # Highest confidence first; ties keep prober order (stable sort).
            return sorted(results, key=lambda result: -result["confidence"])

    # No per-prober results: fall back to the detector's overall verdict.
    return [detector.result]

Directory Contents

Dirs: 3 × Files: 41

Name Size Perms Modified Actions
cli DIR
- drwxr-xr-x 2025-05-01 13:10:18
Edit Download
metadata DIR
- drwxr-xr-x 2025-05-01 13:10:18
Edit Download
- drwxr-xr-x 2025-05-01 13:10:18
Edit Download
30.54 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
1.70 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
9.38 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
3.73 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
4.69 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
3.48 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
1.79 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
1.58 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
3.77 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
11.74 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
3.59 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
13.25 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
1.69 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
36.05 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
1.69 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
20.25 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
1.70 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
13.59 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
25.19 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
41.50 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
1.69 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
26.17 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
102.11 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
96.18 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
95.89 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
98.99 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
125.03 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
100.37 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
93.14 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
5.14 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
3.29 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
2.01 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
29.36 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
6.05 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
4.03 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
3.66 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
12.98 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
2.65 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
8.09 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download
242 B lrw-r--r-- 2023-11-13 21:40:26
Edit Download
3.62 KB lrw-r--r-- 2023-11-13 21:40:26
Edit Download

If ZipArchive is unavailable, a .tar will be created (no compression).