"""
Charset-Normalizer
~~~~~~~~~~~~~~~~~~
The Real First Universal Charset Detector.
A library that helps you read text from an unknown charset encoding.
Motivated by chardet, this package tries to resolve the same issue by taking a new approach.
All IANA character set names for which the Python core library provides codecs are supported.

Basic usage:
>>> from charset_normalizer import from_bytes
>>> results = from_bytes('Bсеки човек има право на образование. Oбразованието!'.encode('utf_8'))
>>> best_guess = results.best()
>>> str(best_guess)
'Bсеки човек има право на образование. Oбразованието!'

Other methods and usages are available - see the full documentation
at <https://github.com/Ousret/charset_normalizer>.
:copyright: (c) 2021 by Ahmed TAHRI
:license: MIT, see LICENSE for more details.
"""
import logging

from .api import from_bytes, from_fp, from_path, is_binary
from .legacy import detect
from .models import CharsetMatch, CharsetMatches
from .utils import set_logging_handler
from .version import VERSION, __version__

# Public API of the package: the names bound by
# ``from charset_normalizer import *``. Every entry is imported at the top of
# this module from one of the package's submodules.
__all__ = (
    # From .api
    "from_fp",
    "from_path",
    "from_bytes",
    "is_binary",
    # From .legacy
    "detect",
    # From .models
    "CharsetMatch",
    "CharsetMatches",
    # From .version
    "__version__",
    "VERSION",
    # From .utils
    "set_logging_handler",
)

# A library should not configure logging output on behalf of the application.
# Attaching a no-op NullHandler to the package's top-level logger ensures that,
# when the application has not configured logging, records emitted under the
# "charset_normalizer" logger do not fall through to logging's last-resort
# stderr handler. Applications remain free to add their own handlers.
logging.getLogger("charset_normalizer").addHandler(logging.NullHandler())