first commit

2023-11-30 14:53:37 +01:00 · 2023-11-30 14:53:37 +01:00 · b3f136fc22
commit b3f136fc22
1535 changed files with 262586 additions and 0 deletions
--- a/check-gpt4.py
+++ b/check-gpt4.py
@ -0,0 +1,36 @@
 import os
 import sys
 import requests
 from dns import resolver, rdatatype
 # Checks, for every zone known to the DNS API, that the public NS set
 # contains the master and that the SOA MNAME names the master.
 #
 # The API key is read from the environment so that the secret is never
 # committed together with the script.
 __API_KEY = os.environ.get('PDNS_API_KEY', '')
 __API_URL = 'https://dns.it53.nl:8443/api/v1/servers/localhost/zones'
 __MASTER_DNS = 'ns1.it53.nl'  # fill in your actual master DNS
 __HTTP_TIMEOUT = 10  # seconds; requests waits indefinitely without one
 if not __API_KEY:
    sys.exit('🚨 Set the PDNS_API_KEY environment variable to your API key.')
 headers = {
    'X-API-Key': __API_KEY,
 }
 response = requests.get(__API_URL, headers=headers, timeout=__HTTP_TIMEOUT)
 # Fail loudly on 401/5xx instead of iterating over an error document.
 response.raise_for_status()
 data = response.json()
 # DNS names compare case-insensitively, so normalise once up front.
 master_name = __MASTER_DNS.rstrip('.').lower()
 for zone in data:
    zone_name = zone['name'].rstrip('.')
    try:
        answers = resolver.resolve(zone_name, 'NS')
    except Exception as e:
        print(f'🚨 Error resolving NS for {zone_name}: {e}')
        continue
    ns_records = [rdata.to_text().rstrip('.').lower() for rdata in answers]  # strip ending '.'
    if master_name not in ns_records:
        print(f'🚨 {zone_name} does not point to master DNS: {__MASTER_DNS}')
        continue
    try:
        soa_answer = resolver.resolve(zone_name, 'SOA')
    except Exception as e:
        print(f'🚨 Error resolving SOA for {zone_name}: {e}')
        continue
    # Compare the SOA MNAME field exactly; a substring test over the whole
    # record text would also match the RNAME or a longer host name.
    soa_primary = soa_answer[0].mname.to_text().rstrip('.').lower()
    if soa_primary != master_name:
        print(f'🚨 SOA record of {zone_name} is inconsistent with master DNS: {__MASTER_DNS}')
    else:
        print(f'✅ DNS consistency check passed for {zone_name}.')
--- a/check.py
+++ b/check.py
@ -0,0 +1,89 @@
 import os
 import socket
 import requests
 from dns import resolver, query, message, exception
 # Replace with your DNS master
 DNS_MASTER = "ns1.it53.nl"
 # The API key is read from the PDNS_API_KEY environment variable so that the
 # secret is never stored in the repository.
 API_KEY = os.environ.get("PDNS_API_KEY", "")
 def get_zones(api_key, timeout=10):
    """Fetch the list of zones known to the DNS API.

    Args:
        api_key: Value sent in the ``x-api-key`` request header.
        timeout: Seconds to wait for the server before giving up.

    Returns:
        The decoded JSON body of the response.

    Raises:
        requests.RequestException: On connection errors, timeouts, or a
            non-2xx HTTP status.
    """
    url = "https://dns.it53.nl:8443/api/v1/servers/localhost/zones"
    headers = {"x-api-key": api_key}
    # Without a timeout requests can block forever on an unresponsive server.
    response = requests.get(url, headers=headers, timeout=timeout)
    # Surface 401/5xx immediately instead of handing an error body to callers.
    response.raise_for_status()
    return response.json()
 def get_ns_records(zone_name):
    """Look up the NS records of ``zone_name`` with the default resolver.

    Args:
        zone_name: Name of the zone to query.

    Returns:
        A list with the text form of every NS record, or an empty list when
        the lookup fails (the failure is reported on stdout).
    """
    try:
        ns_records = resolver.resolve(zone_name, 'NS')
        return [str(record) for record in ns_records]
    except resolver.NXDOMAIN:
        print(f"❌ Error: Zone '{zone_name}' does not exist.")
        return []
    except resolver.NoAnswer:
        print(f"❌ Error: No NS records found for zone '{zone_name}'.")
        return []
    except (resolver.NoNameservers, exception.Timeout) as e:
        # A resolver outage for one zone must not abort the whole run.
        print(f"❌ Error: Could not resolve NS records for zone '{zone_name}': {e}")
        return []
 def check_soa_consistency(zone_name, ns_records, master_ip, timeout=5.0):
    """Compare the SOA serial served by each nameserver with the master's.

    Args:
        zone_name: Zone whose SOA record is queried.
        ns_records: Nameservers to check, as host names or IP addresses.
        master_ip: IP address of the master nameserver.
        timeout: Seconds to wait for each TCP query.

    Returns:
        None. The result for every nameserver is reported on stdout.
    """
    master_soa_query = message.make_query(zone_name, 'SOA')
    try:
        master_soa_response = query.tcp(master_soa_query, where=master_ip, timeout=timeout)
        print(f"Master SOA response for {zone_name}: {master_soa_response}")
        # answer[0] is the SOA RRset; its first rdata carries the serial.
        master_serial = master_soa_response.answer[0][0].serial
    except exception.SyntaxError:
        print(f"❌ Malformed text input for master NS in zone '{zone_name}'.")
        return
    except IndexError:
        print(f"❌ No SOA record found on master for zone '{zone_name}'.")
        return
    except (exception.DNSException, OSError) as e:
        print(f"❌ Error checking SOA on master for zone '{zone_name}': {str(e)}")
        return
    for ns_record in ns_records:
        try:
            # NS records are host names, but query.tcp only accepts an IP
            # address; getaddrinfo resolves names and passes IPs through.
            ns_host = str(ns_record).rstrip('.')
            ns_ip = socket.getaddrinfo(ns_host, 53, proto=socket.IPPROTO_TCP)[0][4][0]
            ns_soa_query = message.make_query(zone_name, 'SOA')
            ns_soa_response = query.tcp(ns_soa_query, where=ns_ip, timeout=timeout)
            print(f"NS '{ns_record}' SOA response for {zone_name}: {ns_soa_response}")
            if not ns_soa_response.answer:
                print(f"❌ No SOA record found for NS '{ns_record}' in zone '{zone_name}'.")
                continue
            # Extract serial from SOA records
            ns_serial = ns_soa_response.answer[0][0].serial
            print(f"NS serial {ns_serial}")
            # Compare serial values
            if ns_serial != master_serial:
                print(f"❌ Inconsistency: Serial for NS '{ns_record}' in zone '{zone_name}'.")
            else:
                print(f"✅ Consistency: Serial for NS '{ns_record}' in zone '{zone_name}'.")
        except exception.SyntaxError:
            print(f"❌ Malformed text input for NS '{ns_record}' in zone '{zone_name}'.")
        except exception.Timeout:
            print(f"❌ Timeout while checking SOA for NS '{ns_record}' in zone '{zone_name}'.")
        except Exception as e:
            # Boundary per nameserver: one broken server must not stop the rest.
            print(f"❌ Error checking SOA for NS '{ns_record}' in zone '{zone_name}': {str(e)}")
 def main():
    """Check SOA consistency for every zone returned by the API."""
    zones = get_zones(API_KEY)
    # The master's address does not depend on the zone, so resolve it once.
    try:
        master_ip = socket.gethostbyname(DNS_MASTER)
    except socket.error as e:
        print(f"❌ Error resolving IP address for '{DNS_MASTER}': {str(e)}")
        return
    for zone in zones:
        zone_name = zone["name"]
        print(f"Checking zone: {zone_name}")
        ns_records = get_ns_records(zone_name)
        if ns_records:
            try:
                check_soa_consistency(zone_name, ns_records, master_ip)
            except socket.error as e:
                # Keep going with the remaining zones on a network failure.
                print(f"❌ Network error while checking zone '{zone_name}': {str(e)}")
        print("\n" + "=" * 40 + "\n")
 if __name__ == "__main__":
    main()
--- a/check2.py
+++ b/check2.py
@ -0,0 +1,71 @@
 import dns.resolver
 import requests
 BASE_API_URL = "https://dns.it53.nl:8443"
 def fetch_zones(api_key, timeout=10):
    """Fetch the zone list from the DNS API.

    Args:
        api_key: Value sent in the ``X-API-Key`` request header.
        timeout: Seconds to wait for the server before giving up.

    Returns:
        The decoded JSON body on success, or an empty list when the request
        fails, the status is not 200, or the body is not valid JSON.
    """
    headers = {'X-API-Key': api_key}
    try:
        # Without a timeout requests can block forever on a dead server.
        response = requests.get(
            f"{BASE_API_URL}/api/v1/servers/localhost/zones",
            headers=headers,
            timeout=timeout,
        )
    except requests.RequestException as e:
        print(f"Error fetching zones: {e}")
        return []
    if response.status_code != 200:
        print(f"Error fetching zones: {response.status_code}")
        return []
    try:
        return response.json()
    except ValueError:
        print("Error parsing JSON for zones")
        print(response.text)
        return []
 def fetch_ns_records(zone_name):
    """Return the NS records of ``zone_name`` as strings.

    A missing zone or a zone without NS records is reported on stdout and
    yields an empty list.
    """
    try:
        answer = dns.resolver.resolve(zone_name, 'NS')
    except dns.resolver.NXDOMAIN:
        print(f"Error: Zone {zone_name} not found.")
        return []
    except dns.resolver.NoAnswer:
        print(f"Error: No NS records found for zone {zone_name}")
        return []
    return list(map(str, answer))
 def _fetch_soa_serial(zone_name, nameserver):
    """Return the SOA serial ``nameserver`` serves for ``zone_name``, or None on failure."""
    import dns.exception
    try:
        # A resolver only accepts IP addresses as nameservers, so look the
        # host name up first and then query that server directly.
        addresses = [str(record) for record in dns.resolver.resolve(nameserver, 'A')]
        direct = dns.resolver.Resolver(configure=False)
        direct.nameservers = addresses
        answer = direct.resolve(zone_name, 'SOA')
        return answer.rrset[0].serial
    except dns.exception.DNSException as e:
        print(f"Error: Could not fetch SOA for zone {zone_name} from {nameserver}: {e}")
        return None
 def check_dns_consistency(master_dns, zones, api_key):
    """Compare the SOA serial on every nameserver of each zone with the master's.

    Args:
        master_dns: Host name of the master nameserver.
        zones: Iterable of zone dicts as returned by the API; only the
            ``name`` key is read.
        api_key: Unused; kept so existing callers keep working.

    Returns:
        None. Results are reported on stdout.
    """
    # NS records come back fully qualified ("host."), so normalise both sides
    # before comparing; DNS names are also case-insensitive.
    master_name = master_dns.rstrip('.').lower()
    for zone in zones:
        zone_name = zone['name']
        print(f"Checking DNS consistency for zone: {zone_name}")
        # Fetch NS records from the internet
        master_ns_records = fetch_ns_records(zone_name)
        if not master_ns_records:
            continue
        master_soa_record = _fetch_soa_serial(zone_name, master_dns)
        if master_soa_record is None:
            print(f"❌ Could not determine master SOA for zone {zone_name}")
            print()
            continue
        for ns_record in master_ns_records:
            # The master is the reference; only the other nameservers are checked.
            if ns_record.rstrip('.').lower() == master_name:
                continue
            soa_record = _fetch_soa_serial(zone_name, ns_record)
            print(f"Debug: {zone_name} - NS: {ns_record}, Master SOA: {master_dns} - {master_soa_record}, Current SOA: {ns_record} - {soa_record}")
            if soa_record is None:
                print(f"❌ Could not fetch SOA from NS {ns_record} in zone {zone_name}")
            elif soa_record != master_soa_record:
                print(f"❌ Inconsistency detected for NS {ns_record} in zone {zone_name}")
                print(f"   Master SOA: {master_dns} - {master_soa_record}")
                print(f"   Current SOA: {ns_record} - {soa_record}")
            else:
                print(f"✅ Consistency verified for NS {ns_record} in zone {zone_name}")
        print()
 if __name__ == "__main__":
    import os
    # Configure the DNS master; the API key comes from the PDNS_API_KEY
    # environment variable so the secret is not stored in the repository.
    CONFIG = {
        "master_dns": "ns1.it53.nl",
        "api_key": os.environ.get("PDNS_API_KEY", ""),
    }
    if not CONFIG["api_key"]:
        raise SystemExit("Set the PDNS_API_KEY environment variable to your API key.")
    # Fetch zones
    zones = fetch_zones(CONFIG["api_key"])
    # Check DNS consistency
    check_dns_consistency(CONFIG["master_dns"], zones, CONFIG["api_key"])
--- a/generate-zone-list.py
+++ b/generate-zone-list.py
@ -0,0 +1,24 @@
 import os
 import sys
 import requests
 import yaml
 # Prints the zones known to the DNS API as a YAML document of the form
 # {zones: [{name: ..., type: ...}, ...]}.
 #
 # The API key is read from the environment so that the secret is never
 # committed together with the script.
 __API_KEY = os.environ.get('PDNS_API_KEY', '')
 __API_URL = 'https://dns.it53.nl:8443/api/v1/servers/localhost/zones'
 __MASTER_DNS = 'ns1.it53.nl'
 __HTTP_TIMEOUT = 10  # seconds; requests waits indefinitely without one
 if not __API_KEY:
    sys.exit('Set the PDNS_API_KEY environment variable to your API key.')
 headers = {
    'X-API-Key': __API_KEY,
 }
 response = requests.get(__API_URL, headers=headers, timeout=__HTTP_TIMEOUT)
 # Fail loudly on 401/5xx instead of formatting an error document.
 response.raise_for_status()
 data = response.json()
 # Format zones
 zones = [{'name': d['name'].rstrip('.'), 'type': d['kind'].lower()} for d in data]
 # Dump to YAML
 output = yaml.dump({'zones': zones})
 print(output)
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1,2 @@
 dnspython
 PyYAML
 requests
--- a/serial.py
+++ b/serial.py
@ -0,0 +1,27 @@
 import dns.query
 import dns.zone
 def get_dns_serial(zone_name, nameserver, timeout=5.0):
    """Return the SOA serial that ``nameserver`` serves for ``zone_name``.

    Args:
        zone_name: Zone whose SOA record is queried.
        nameserver: Host name or IP address of the server to ask.
        timeout: Seconds to wait for the TCP query.

    Returns:
        The serial as an int, or None when the lookup fails (the error is
        reported on stdout).
    """
    # Imported here so the function does not depend on these submodules being
    # pulled in as a side effect of other dns imports.
    import socket
    import dns.message
    import dns.rdatatype
    try:
        # dns.query.tcp only accepts an IP address; getaddrinfo resolves host
        # names and passes IP literals through.
        address = socket.getaddrinfo(nameserver, 53, proto=socket.IPPROTO_TCP)[0][4][0]
        # Query the nameserver for the zone
        request = dns.message.make_query(zone_name, dns.rdatatype.SOA)
        response = dns.query.tcp(request, address, timeout=timeout)
        if not response.answer:
            print(f"Error: {nameserver} returned no SOA record for {zone_name}")
            return None
        # answer[0] is the SOA RRset; its first rdata carries the serial.
        return response.answer[0][0].serial
    except Exception as e:
        print(f"Error: {e}")
        return None
 # Example usage
 zone_name = "0x5e.eu"
 nameserver = "ns1.it53.nl"  # nameserver to ask; handed to get_dns_serial as-is
 serial = get_dns_serial(zone_name, nameserver)
 # None signals failure; a serial of 0 is a valid value and must not be
 # reported as an error.
 if serial is not None:
    print(f"The DNS serial for {zone_name} is {serial}")
 else:
    print(f"Failed to fetch DNS serial for {zone_name}")
--- a/venv/bin/Activate.ps1
+++ b/venv/bin/Activate.ps1
@ -0,0 +1,247 @@
 <#
 .Synopsis
 Activate a Python virtual environment for the current PowerShell session.
 .Description
 Pushes the python executable for a virtual environment to the front of the
 $Env:PATH environment variable and sets the prompt to signify that you are
 in a Python virtual environment. Makes use of the command line switches as
 well as the `pyvenv.cfg` file values present in the virtual environment.
 .Parameter VenvDir
 Path to the directory that contains the virtual environment to activate. The
 default value for this is the parent of the directory that the Activate.ps1
 script is located within.
 .Parameter Prompt
 The prompt prefix to display when this virtual environment is activated. By
 default, this prompt is the name of the virtual environment folder (VenvDir)
 surrounded by parentheses and followed by a single space (ie. '(.venv) ').
 .Example
 Activate.ps1
 Activates the Python virtual environment that contains the Activate.ps1 script.
 .Example
 Activate.ps1 -Verbose
 Activates the Python virtual environment that contains the Activate.ps1 script,
 and shows extra information about the activation as it executes.
 .Example
 Activate.ps1 -VenvDir C:\Users\MyUser\Common\.venv
 Activates the Python virtual environment located in the specified location.
 .Example
 Activate.ps1 -Prompt "MyPython"
 Activates the Python virtual environment that contains the Activate.ps1 script,
 and prefixes the current prompt with the specified string (surrounded in
 parentheses) while the virtual environment is active.
 .Notes
 On Windows, it may be required to enable this Activate.ps1 script by setting the
 execution policy for the user. You can do this by issuing the following PowerShell
 command:
 PS C:\> Set-ExecutionPolicy -ExecutionPolicy RemoteSigned -Scope CurrentUser
 For more information on Execution Policies: 
 https://go.microsoft.com/fwlink/?LinkID=135170
 #>
 Param(
    [Parameter(Mandatory = $false)]
    [String]
    $VenvDir,
    [Parameter(Mandatory = $false)]
    [String]
    $Prompt
 )
 <# Function declarations --------------------------------------------------- #>
 <#
 .Synopsis
 Remove all shell session elements added by the Activate script, including the
 addition of the virtual environment's Python executable from the beginning of
 the PATH variable.
 .Parameter NonDestructive
 If present, do not remove this function from the global namespace for the
 session.
 #>
 function global:deactivate ([switch]$NonDestructive) {
    # Every restore step below is guarded by an existence check, so calling
    # this function when nothing was saved leaves that item untouched.
    # Revert to original values
    # The prior prompt:
    if (Test-Path -Path Function:_OLD_VIRTUAL_PROMPT) {
        Copy-Item -Path Function:_OLD_VIRTUAL_PROMPT -Destination Function:prompt
        Remove-Item -Path Function:_OLD_VIRTUAL_PROMPT
    }
    # The prior PYTHONHOME:
    if (Test-Path -Path Env:_OLD_VIRTUAL_PYTHONHOME) {
        Copy-Item -Path Env:_OLD_VIRTUAL_PYTHONHOME -Destination Env:PYTHONHOME
        Remove-Item -Path Env:_OLD_VIRTUAL_PYTHONHOME
    }
    # The prior PATH:
    if (Test-Path -Path Env:_OLD_VIRTUAL_PATH) {
        Copy-Item -Path Env:_OLD_VIRTUAL_PATH -Destination Env:PATH
        Remove-Item -Path Env:_OLD_VIRTUAL_PATH
    }
    # Just remove the VIRTUAL_ENV altogether:
    if (Test-Path -Path Env:VIRTUAL_ENV) {
        Remove-Item -Path env:VIRTUAL_ENV
    }
    # Just remove VIRTUAL_ENV_PROMPT altogether.
    if (Test-Path -Path Env:VIRTUAL_ENV_PROMPT) {
        Remove-Item -Path env:VIRTUAL_ENV_PROMPT
    }
    # Just remove the _PYTHON_VENV_PROMPT_PREFIX altogether:
    # (-Force is passed to Remove-Variable here.)
    if (Get-Variable -Name "_PYTHON_VENV_PROMPT_PREFIX" -ErrorAction SilentlyContinue) {
        Remove-Variable -Name _PYTHON_VENV_PROMPT_PREFIX -Scope Global -Force
    }
    # Leave deactivate function in the global namespace if requested:
    if (-not $NonDestructive) {
        Remove-Item -Path function:deactivate
    }
 }
 <#
 .Description
 Get-PyVenvConfig parses the values from the pyvenv.cfg file located in the
 given folder, and returns them in a map.
 For each line in the pyvenv.cfg file, if that line can be parsed into exactly
 two strings separated by `=` (with any amount of whitespace surrounding the =)
 then it is considered a `key = value` line. The left hand string is the key,
 the right hand is the value.
 If the value starts with a `'` or a `"` then the first and last character is
 stripped from the value before being captured.
 .Parameter ConfigDir
 Path to the directory that contains the `pyvenv.cfg` file.
 #>
 function Get-PyVenvConfig(
    [String]
    $ConfigDir
 ) {
    Write-Verbose "Given ConfigDir=$ConfigDir, obtain values in pyvenv.cfg"
    # Ensure the file exists, and issue a warning if it doesn't (but still allow the function to continue).
    $pyvenvConfigPath = Join-Path -Resolve -Path $ConfigDir -ChildPath 'pyvenv.cfg' -ErrorAction Continue
    # An empty map will be returned if no config file is found.
    $pyvenvConfig = @{ }
    if ($pyvenvConfigPath) {
        Write-Verbose "File exists, parse `key = value` lines"
        $pyvenvConfigContent = Get-Content -Path $pyvenvConfigPath
        $pyvenvConfigContent | ForEach-Object {
            # The split limit of 2 cuts only at the first '=', so a value may
            # itself contain '=' characters.
            $keyval = $PSItem -split "\s*=\s*", 2
            # Lines with an empty key or an empty value are skipped.
            if ($keyval[0] -and $keyval[1]) {
                $val = $keyval[1]
                # Remove extraneous quotations around a string value.
                # Only the first character is tested; the last character is
                # dropped without checking that it is a matching quote.
                if ("'""".Contains($val.Substring(0, 1))) {
                    $val = $val.Substring(1, $val.Length - 2)
                }
                $pyvenvConfig[$keyval[0]] = $val
                Write-Verbose "Adding Key: '$($keyval[0])'='$val'"
            }
        }
    }
    return $pyvenvConfig
 }
 <# Begin Activate script --------------------------------------------------- #>
 # Determine the containing directory of this script
 $VenvExecPath = Split-Path -Parent $MyInvocation.MyCommand.Definition
 $VenvExecDir = Get-Item -Path $VenvExecPath
 # Values are wrapped in balanced single quotes so that leading or trailing
 # whitespace in a path is visible in the verbose output.
 Write-Verbose "Activation script is located in path: '$VenvExecPath'"
 Write-Verbose "VenvExecDir Fullname: '$($VenvExecDir.FullName)'"
 Write-Verbose "VenvExecDir Name: '$($VenvExecDir.Name)'"
 # Set values required in priority: CmdLine, ConfigFile, Default
 # First, get the location of the virtual environment, it might not be
 # VenvExecDir if specified on the command line.
 if ($VenvDir) {
    Write-Verbose "VenvDir given as parameter, using '$VenvDir' to determine values"
 }
 else {
    Write-Verbose "VenvDir not given as a parameter, using parent directory name as VenvDir."
    $VenvDir = $VenvExecDir.Parent.FullName.TrimEnd("\\/")
    Write-Verbose "VenvDir=$VenvDir"
 }
 # Next, read the `pyvenv.cfg` file to determine any required value such
 # as `prompt`.
 $pyvenvCfg = Get-PyVenvConfig -ConfigDir $VenvDir
 # Next, set the prompt from the command line, or the config file, or
 # just use the name of the virtual environment folder.
 if ($Prompt) {
    Write-Verbose "Prompt specified as argument, using '$Prompt'"
 }
 else {
    Write-Verbose "Prompt not specified as argument to script, checking pyvenv.cfg value"
    if ($pyvenvCfg -and $pyvenvCfg['prompt']) {
        Write-Verbose "  Setting based on value in pyvenv.cfg='$($pyvenvCfg['prompt'])'"
        $Prompt = $pyvenvCfg['prompt'];
    }
    else {
        Write-Verbose "  Setting prompt based on parent's directory's name. (Is the directory name passed to venv module when creating the virtual environment)"
        Write-Verbose "  Got leaf-name of $VenvDir='$(Split-Path -Path $venvDir -Leaf)'"
        $Prompt = Split-Path -Path $venvDir -Leaf
    }
 }
 Write-Verbose "Prompt = '$Prompt'"
 Write-Verbose "VenvDir='$VenvDir'"
 # Deactivate any currently active virtual environment, but leave the
 # deactivate function in place.
 deactivate -nondestructive
 # Now set the environment variable VIRTUAL_ENV, used by many tools to determine
 # that there is an activated venv.
 $env:VIRTUAL_ENV = $VenvDir
 # The prompt is left untouched when VIRTUAL_ENV_DISABLE_PROMPT is set.
 if (-not $Env:VIRTUAL_ENV_DISABLE_PROMPT) {
    Write-Verbose "Setting prompt to '$Prompt'"
    # Set the prompt to include the env name
    # Make sure _OLD_VIRTUAL_PROMPT is global
    function global:_OLD_VIRTUAL_PROMPT { "" }
    Copy-Item -Path function:prompt -Destination function:_OLD_VIRTUAL_PROMPT
    # Created read-only; deactivate removes it again with -Force.
    New-Variable -Name _PYTHON_VENV_PROMPT_PREFIX -Description "Python virtual environment prompt prefix" -Scope Global -Option ReadOnly -Visibility Public -Value $Prompt
    function global:prompt {
        Write-Host -NoNewline -ForegroundColor Green "($_PYTHON_VENV_PROMPT_PREFIX) "
        _OLD_VIRTUAL_PROMPT
    }
    $env:VIRTUAL_ENV_PROMPT = $Prompt
 }
 # Clear PYTHONHOME
 # The old value is saved first so that deactivate can put it back.
 if (Test-Path -Path Env:PYTHONHOME) {
    Copy-Item -Path Env:PYTHONHOME -Destination Env:_OLD_VIRTUAL_PYTHONHOME
    Remove-Item -Path Env:PYTHONHOME
 }
 # Add the venv to the PATH
 # The previous PATH is saved in _OLD_VIRTUAL_PATH, which deactivate restores.
 Copy-Item -Path Env:PATH -Destination Env:_OLD_VIRTUAL_PATH
 $Env:PATH = "$VenvExecDir$([System.IO.Path]::PathSeparator)$Env:PATH"
--- a/venv/bin/activate
+++ b/venv/bin/activate
@ -0,0 +1,76 @@
 # This file must be used with "source bin/activate" *from bash*
 # You cannot run it directly
 # Undo the activation: restore PATH, PYTHONHOME and PS1 from their saved
 # copies and unset the VIRTUAL_ENV variables. When the first argument is
 # "nondestructive" the function itself stays defined.
 deactivate () {
    # reset old environment variables
    if [ -n "${_OLD_VIRTUAL_PATH:-}" ] ; then
        PATH="${_OLD_VIRTUAL_PATH:-}"
        export PATH
        unset _OLD_VIRTUAL_PATH
    fi
    if [ -n "${_OLD_VIRTUAL_PYTHONHOME:-}" ] ; then
        PYTHONHOME="${_OLD_VIRTUAL_PYTHONHOME:-}"
        export PYTHONHOME
        unset _OLD_VIRTUAL_PYTHONHOME
    fi
    # This should detect bash and zsh, which have a hash command that must
    # be called to get it to forget past commands.  Without forgetting
    # past commands the $PATH changes we made may not be respected
    if [ -n "${BASH:-}" -o -n "${ZSH_VERSION:-}" ] ; then
        hash -r 2> /dev/null
    fi
    if [ -n "${_OLD_VIRTUAL_PS1:-}" ] ; then
        PS1="${_OLD_VIRTUAL_PS1:-}"
        export PS1
        unset _OLD_VIRTUAL_PS1
    fi
    unset VIRTUAL_ENV
    unset VIRTUAL_ENV_PROMPT
    if [ ! "${1:-}" = "nondestructive" ] ; then
    # Self destruct!
        unset -f deactivate
    fi
 }
 # unset irrelevant variables
 deactivate nondestructive
 # NOTE(review): the virtual environment path below is an absolute path on the
 # machine that created it, so this script only works from that location.
 # on Windows, a path can contain colons and backslashes and has to be converted:
 if [ "$OSTYPE" = "cygwin" ] || [ "$OSTYPE" = "msys" ] ; then
    # transform D:\path\to\venv to /d/path/to/venv on MSYS
    # and to /cygdrive/d/path/to/venv on Cygwin
    export VIRTUAL_ENV=$(cygpath "/home/nick/git/dns-check-py/venv")
 else
    # use the path as-is
    export VIRTUAL_ENV="/home/nick/git/dns-check-py/venv"
 fi
 # Save the current PATH so that deactivate can restore it, then put the
 # environment's bin directory first.
 _OLD_VIRTUAL_PATH="$PATH"
 PATH="$VIRTUAL_ENV/bin:$PATH"
 export PATH
 # unset PYTHONHOME if set
 # this will fail if PYTHONHOME is set to the empty string (which is bad anyway)
 # could use `if (set -u; : $PYTHONHOME) ;` in bash
 if [ -n "${PYTHONHOME:-}" ] ; then
    _OLD_VIRTUAL_PYTHONHOME="${PYTHONHOME:-}"
    unset PYTHONHOME
 fi
 # The prompt is only changed when VIRTUAL_ENV_DISABLE_PROMPT is empty or unset.
 if [ -z "${VIRTUAL_ENV_DISABLE_PROMPT:-}" ] ; then
    _OLD_VIRTUAL_PS1="${PS1:-}"
    PS1="(venv) ${PS1:-}"
    export PS1
    VIRTUAL_ENV_PROMPT="(venv) "
    export VIRTUAL_ENV_PROMPT
 fi
 # This should detect bash and zsh, which have a hash command that must
 # be called to get it to forget past commands.  Without forgetting
 # past commands the $PATH changes we made may not be respected
 if [ -n "${BASH:-}" -o -n "${ZSH_VERSION:-}" ] ; then
    hash -r 2> /dev/null
 fi
--- a/venv/bin/activate.csh
+++ b/venv/bin/activate.csh
@ -0,0 +1,27 @@
 # This file must be used with "source bin/activate.csh" *from csh*.
 # You cannot run it directly.
 # Created by Davide Di Blasi <davidedb@gmail.com>.
 # Ported to Python 3.3 venv by Andrew Svetlov <andrew.svetlov@gmail.com>
 # "deactivate" restores PATH and prompt from their saved copies, unsets the
 # VIRTUAL_ENV variables and, unless called with "nondestructive", removes
 # its own alias.
 alias deactivate 'test $?_OLD_VIRTUAL_PATH != 0 && setenv PATH "$_OLD_VIRTUAL_PATH" && unset _OLD_VIRTUAL_PATH; rehash; test $?_OLD_VIRTUAL_PROMPT != 0 && set prompt="$_OLD_VIRTUAL_PROMPT" && unset _OLD_VIRTUAL_PROMPT; unsetenv VIRTUAL_ENV; unsetenv VIRTUAL_ENV_PROMPT; test "\!:*" != "nondestructive" && unalias deactivate'
 # Unset irrelevant variables.
 deactivate nondestructive
 # NOTE(review): absolute path of the machine that created the environment.
 setenv VIRTUAL_ENV "/home/nick/git/dns-check-py/venv"
 # Save PATH for deactivate, then put the environment's bin directory first.
 set _OLD_VIRTUAL_PATH="$PATH"
 setenv PATH "$VIRTUAL_ENV/bin:$PATH"
 set _OLD_VIRTUAL_PROMPT="$prompt"
 # The prompt is only changed when VIRTUAL_ENV_DISABLE_PROMPT is not set.
 if (! "$?VIRTUAL_ENV_DISABLE_PROMPT") then
    set prompt = "(venv) $prompt"
    setenv VIRTUAL_ENV_PROMPT "(venv) "
 endif
 alias pydoc python -m pydoc
 rehash
--- a/venv/bin/activate.fish
+++ b/venv/bin/activate.fish
@ -0,0 +1,69 @@
 # This file must be used with "source <venv>/bin/activate.fish" *from fish*
 # (https://fishshell.com/). You cannot run it directly.
 # Restores PATH, PYTHONHOME and the fish_prompt function from their saved
 # copies and erases the VIRTUAL_ENV variables. When the first argument is
 # "nondestructive" the function itself stays defined.
 function deactivate  -d "Exit virtual environment and return to normal shell environment"
    # reset old environment variables
    if test -n "$_OLD_VIRTUAL_PATH"
        set -gx PATH $_OLD_VIRTUAL_PATH
        set -e _OLD_VIRTUAL_PATH
    end
    if test -n "$_OLD_VIRTUAL_PYTHONHOME"
        set -gx PYTHONHOME $_OLD_VIRTUAL_PYTHONHOME
        set -e _OLD_VIRTUAL_PYTHONHOME
    end
    if test -n "$_OLD_FISH_PROMPT_OVERRIDE"
        set -e _OLD_FISH_PROMPT_OVERRIDE
        # prevents error when using nested fish instances (Issue #93858)
        if functions -q _old_fish_prompt
            functions -e fish_prompt
            functions -c _old_fish_prompt fish_prompt
            functions -e _old_fish_prompt
        end
    end
    set -e VIRTUAL_ENV
    set -e VIRTUAL_ENV_PROMPT
    if test "$argv[1]" != "nondestructive"
        # Self-destruct!
        functions -e deactivate
    end
 end
 # Unset irrelevant variables.
 deactivate nondestructive
 # NOTE(review): absolute path of the machine that created the environment.
 set -gx VIRTUAL_ENV "/home/nick/git/dns-check-py/venv"
 # Save PATH for deactivate, then put the environment's bin directory first.
 set -gx _OLD_VIRTUAL_PATH $PATH
 set -gx PATH "$VIRTUAL_ENV/bin" $PATH
 # Unset PYTHONHOME if set.
 if set -q PYTHONHOME
    set -gx _OLD_VIRTUAL_PYTHONHOME $PYTHONHOME
    set -e PYTHONHOME
 end
 # The prompt is only overridden when VIRTUAL_ENV_DISABLE_PROMPT is empty or unset.
 if test -z "$VIRTUAL_ENV_DISABLE_PROMPT"
    # fish uses a function instead of an env var to generate the prompt.
    # Save the current fish_prompt function as the function _old_fish_prompt.
    functions -c fish_prompt _old_fish_prompt
    # With the original prompt function renamed, we can override with our own.
    function fish_prompt
        # Save the return status of the last command.
        set -l old_status $status
        # Output the venv prompt; color taken from the blue of the Python logo.
        printf "%s%s%s" (set_color 4B8BBE) "(venv) " (set_color normal)
        # Restore the return status of the previous command.
        echo "exit $old_status" | .
        # Output the original/"old" prompt.
        _old_fish_prompt
    end
    # Marker that deactivate checks before restoring the saved prompt function.
    set -gx _OLD_FISH_PROMPT_OVERRIDE "$VIRTUAL_ENV"
    set -gx VIRTUAL_ENV_PROMPT "(venv) "
 end
--- a/venv/bin/normalizer
+++ b/venv/bin/normalizer
@ -0,0 +1,8 @@
 #!/home/nick/git/dns-check-py/venv/bin/python3
 # -*- coding: utf-8 -*-
 import re
 import sys
 from charset_normalizer.cli import cli_detect
 if __name__ == '__main__':
    # Strip a trailing "-script.pyw" or ".exe" from the program name before
    # handing control to the command-line entry point.
    launcher_suffix = re.compile(r'(-script\.pyw|\.exe)?$')
    sys.argv[0] = launcher_suffix.sub('', sys.argv[0])
    exit_code = cli_detect()
    sys.exit(exit_code)
--- a/venv/bin/pip
+++ b/venv/bin/pip
@ -0,0 +1,8 @@
 #!/home/nick/git/dns-check-py/venv/bin/python3
 # -*- coding: utf-8 -*-
 import re
 import sys
 from pip._internal.cli.main import main
 if __name__ == '__main__':
    # Strip a trailing "-script.pyw" or ".exe" from the program name before
    # handing control to the command-line entry point.
    launcher_suffix = re.compile(r'(-script\.pyw|\.exe)?$')
    sys.argv[0] = launcher_suffix.sub('', sys.argv[0])
    exit_code = main()
    sys.exit(exit_code)
--- a/venv/bin/pip3
+++ b/venv/bin/pip3
@ -0,0 +1,8 @@
 #!/home/nick/git/dns-check-py/venv/bin/python3
 # -*- coding: utf-8 -*-
 import re
 import sys
 from pip._internal.cli.main import main
 if __name__ == '__main__':
    # Strip a trailing "-script.pyw" or ".exe" from the program name before
    # handing control to the command-line entry point.
    launcher_suffix = re.compile(r'(-script\.pyw|\.exe)?$')
    sys.argv[0] = launcher_suffix.sub('', sys.argv[0])
    exit_code = main()
    sys.exit(exit_code)
--- a/venv/bin/pip3.12
+++ b/venv/bin/pip3.12
@ -0,0 +1,8 @@
 #!/home/nick/git/dns-check-py/venv/bin/python3
 # -*- coding: utf-8 -*-
 import re
 import sys
 from pip._internal.cli.main import main
 if __name__ == '__main__':
    # Strip a trailing "-script.pyw" or ".exe" from the program name before
    # handing control to the command-line entry point.
    launcher_suffix = re.compile(r'(-script\.pyw|\.exe)?$')
    sys.argv[0] = launcher_suffix.sub('', sys.argv[0])
    exit_code = main()
    sys.exit(exit_code)
--- a/venv/bin/python
+++ b/venv/bin/python
@ -0,0 +1 @@
 python3
--- a/venv/bin/python3
+++ b/venv/bin/python3
@ -0,0 +1 @@
 /usr/bin/python3
--- a/venv/bin/python3.12
+++ b/venv/bin/python3.12
@ -0,0 +1 @@
 python3
--- a/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/INSTALLER
+++ b/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/INSTALLER
@ -0,0 +1 @@
 pip
--- a/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/LICENSE
+++ b/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/LICENSE
@ -0,0 +1,20 @@
 Copyright (c) 2017-2021 Ingy döt Net
 Copyright (c) 2006-2016 Kirill Simonov
 Permission is hereby granted, free of charge, to any person obtaining a copy of
 this software and associated documentation files (the "Software"), to deal in
 the Software without restriction, including without limitation the rights to
 use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
 of the Software, and to permit persons to whom the Software is furnished to do
 so, subject to the following conditions:
 The above copyright notice and this permission notice shall be included in all
 copies or substantial portions of the Software.
 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 SOFTWARE.
--- a/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/METADATA
+++ b/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/METADATA
@ -0,0 +1,46 @@
 Metadata-Version: 2.1
 Name: PyYAML
 Version: 6.0.1
 Summary: YAML parser and emitter for Python
 Home-page: https://pyyaml.org/
 Download-URL: https://pypi.org/project/PyYAML/
 Author: Kirill Simonov
 Author-email: xi@resolvent.net
 License: MIT
 Project-URL: Bug Tracker, https://github.com/yaml/pyyaml/issues
 Project-URL: CI, https://github.com/yaml/pyyaml/actions
 Project-URL: Documentation, https://pyyaml.org/wiki/PyYAMLDocumentation
 Project-URL: Mailing lists, http://lists.sourceforge.net/lists/listinfo/yaml-core
 Project-URL: Source Code, https://github.com/yaml/pyyaml
 Platform: Any
 Classifier: Development Status :: 5 - Production/Stable
 Classifier: Intended Audience :: Developers
 Classifier: License :: OSI Approved :: MIT License
 Classifier: Operating System :: OS Independent
 Classifier: Programming Language :: Cython
 Classifier: Programming Language :: Python
 Classifier: Programming Language :: Python :: 3
 Classifier: Programming Language :: Python :: 3.6
 Classifier: Programming Language :: Python :: 3.7
 Classifier: Programming Language :: Python :: 3.8
 Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: Implementation :: CPython
 Classifier: Programming Language :: Python :: Implementation :: PyPy
 Classifier: Topic :: Software Development :: Libraries :: Python Modules
 Classifier: Topic :: Text Processing :: Markup
 Requires-Python: >=3.6
 License-File: LICENSE
 YAML is a data serialization format designed for human readability
 and interaction with scripting languages.  PyYAML is a YAML parser
 and emitter for Python.
 PyYAML features a complete YAML 1.1 parser, Unicode support, pickle
 support, capable extension API, and sensible error messages.  PyYAML
 supports standard YAML tags and provides Python-specific tags that
 allow to represent an arbitrary Python object.
 PyYAML is applicable for a broad range of tasks from complex
 configuration files to object serialization and persistence.
--- a/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/RECORD
+++ b/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/RECORD
@ -0,0 +1,44 @@
 PyYAML-6.0.1.dist-info/INSTALLER,sha256=zuuue4knoyJ-UwPPXg8fezS7VCrXJQrAP7zeNuwvFQg,4
 PyYAML-6.0.1.dist-info/LICENSE,sha256=jTko-dxEkP1jVwfLiOsmvXZBAqcoKVQwfT5RZ6V36KQ,1101
 PyYAML-6.0.1.dist-info/METADATA,sha256=UNNF8-SzzwOKXVo-kV5lXUGH2_wDWMBmGxqISpp5HQk,2058
 PyYAML-6.0.1.dist-info/RECORD,,
 PyYAML-6.0.1.dist-info/REQUESTED,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 PyYAML-6.0.1.dist-info/WHEEL,sha256=4ZiCdXIWMxJyEClivrQv1QAHZpQh8kVYU92_ZAVwaok,152
 PyYAML-6.0.1.dist-info/top_level.txt,sha256=rpj0IVMTisAjh_1vG3Ccf9v5jpCQwAz6cD1IVU5ZdhQ,11
 _yaml/__init__.py,sha256=04Ae_5osxahpJHa3XBZUAf4wi6XX32gR8D6X6p64GEA,1402
 _yaml/__pycache__/__init__.cpython-312.pyc,,
 yaml/__init__.py,sha256=bhl05qSeO-1ZxlSRjGrvl2m9nrXb1n9-GQatTN0Mrqc,12311
 yaml/__pycache__/__init__.cpython-312.pyc,,
 yaml/__pycache__/composer.cpython-312.pyc,,
 yaml/__pycache__/constructor.cpython-312.pyc,,
 yaml/__pycache__/cyaml.cpython-312.pyc,,
 yaml/__pycache__/dumper.cpython-312.pyc,,
 yaml/__pycache__/emitter.cpython-312.pyc,,
 yaml/__pycache__/error.cpython-312.pyc,,
 yaml/__pycache__/events.cpython-312.pyc,,
 yaml/__pycache__/loader.cpython-312.pyc,,
 yaml/__pycache__/nodes.cpython-312.pyc,,
 yaml/__pycache__/parser.cpython-312.pyc,,
 yaml/__pycache__/reader.cpython-312.pyc,,
 yaml/__pycache__/representer.cpython-312.pyc,,
 yaml/__pycache__/resolver.cpython-312.pyc,,
 yaml/__pycache__/scanner.cpython-312.pyc,,
 yaml/__pycache__/serializer.cpython-312.pyc,,
 yaml/__pycache__/tokens.cpython-312.pyc,,
 yaml/_yaml.cpython-312-x86_64-linux-gnu.so,sha256=FDFeHFHmIrXrKTyUeQkvzmAVJ8FABnf58koZWEivTLo,2367192
 yaml/composer.py,sha256=_Ko30Wr6eDWUeUpauUGT3Lcg9QPBnOPVlTnIMRGJ9FM,4883
 yaml/constructor.py,sha256=kNgkfaeLUkwQYY_Q6Ff1Tz2XVw_pG1xVE9Ak7z-viLA,28639
 yaml/cyaml.py,sha256=6ZrAG9fAYvdVe2FK_w0hmXoG7ZYsoYUwapG8CiC72H0,3851
 yaml/dumper.py,sha256=PLctZlYwZLp7XmeUdwRuv4nYOZ2UBnDIUy8-lKfLF-o,2837
 yaml/emitter.py,sha256=jghtaU7eFwg31bG0B7RZea_29Adi9CKmXq_QjgQpCkQ,43006
 yaml/error.py,sha256=Ah9z-toHJUbE9j-M8YpxgSRM5CgLCcwVzJgLLRF2Fxo,2533
 yaml/events.py,sha256=50_TksgQiE4up-lKo_V-nBy-tAIxkIPQxY5qDhKCeHw,2445
 yaml/loader.py,sha256=UVa-zIqmkFSCIYq_PgSGm4NSJttHY2Rf_zQ4_b1fHN0,2061
 yaml/nodes.py,sha256=gPKNj8pKCdh2d4gr3gIYINnPOaOxGhJAUiYhGRnPE84,1440
 yaml/parser.py,sha256=ilWp5vvgoHFGzvOZDItFoGjD6D42nhlZrZyjAwa0oJo,25495
 yaml/reader.py,sha256=0dmzirOiDG4Xo41RnuQS7K9rkY3xjHiVasfDMNTqCNw,6794
 yaml/representer.py,sha256=IuWP-cAW9sHKEnS0gCqSa894k1Bg4cgTxaDwIcbRQ-Y,14190
 yaml/resolver.py,sha256=9L-VYfm4mWHxUD1Vg4X7rjDRK_7VZd6b92wzq7Y2IKY,9004
 yaml/scanner.py,sha256=YEM3iLZSaQwXcQRg2l2R4MdT0zGP2F9eHkKGKnHyWQY,51279
 yaml/serializer.py,sha256=ChuFgmhU01hj4xgI8GaKv6vfM2Bujwa9i7d2FAHj7cA,4165
 yaml/tokens.py,sha256=lTQIzSVw8Mg9wv459-TjiOQe6wVziqaRlqX2_89rp54,2573
--- a/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/REQUESTED
+++ b/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/REQUESTED
--- a/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/WHEEL
+++ b/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/WHEEL
@ -0,0 +1,6 @@
 Wheel-Version: 1.0
 Generator: bdist_wheel (0.41.2)
 Root-Is-Purelib: false
 Tag: cp312-cp312-manylinux_2_17_x86_64
 Tag: cp312-cp312-manylinux2014_x86_64
--- a/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/top_level.txt
+++ b/venv/lib/python3.12/site-packages/PyYAML-6.0.1.dist-info/top_level.txt
@ -0,0 +1,2 @@
 _yaml
 yaml
--- a/venv/lib/python3.12/site-packages/_yaml/init.py
+++ b/venv/lib/python3.12/site-packages/_yaml/init.py
@ -0,0 +1,33 @@
 # This is a stub package designed to roughly emulate the _yaml
 # extension module, which previously existed as a standalone module
 # and has been moved into the `yaml` package namespace.
 # It does not perfectly mimic its old counterpart, but should get
 # close enough for anyone who's relying on it even when they shouldn't.
 import yaml
 # In some circumstances, the yaml module we imported may be from a different version, so we need
 # to tread carefully when poking at it here (it may not have the attributes we expect).
 if not getattr(yaml, '__with_libyaml__', False):
    from sys import version_info
    # Use ModuleNotFoundError on Python 3.6+ and plain ImportError on older
    # interpreters, with the same message a missing module would produce.
    exc = ModuleNotFoundError if version_info >= (3, 6) else ImportError
    raise exc("No module named '_yaml'")
 else:
    # Re-export the names of the relocated extension module from this stub.
    from yaml._yaml import *
    import warnings
    warnings.warn(
        'The _yaml extension module is now located at yaml._yaml'
        ' and its location is subject to change.  To use the'
        ' LibYAML-based parser and emitter, import from `yaml`:'
        ' `from yaml import CLoader as Loader, CDumper as Dumper`.',
        DeprecationWarning
    )
    # Drop the helper import so `warnings` does not linger in this namespace.
    del warnings
    # Don't `del yaml` here because yaml is actually an existing
    # namespace member of _yaml.
 # Present this stub under the name of the module it stands in for.
 __name__ = '_yaml'
 # If the module is top-level (i.e. not a part of any specific package)
 # then the attribute should be set to ''.
 # https://docs.python.org/3.8/library/types.html
 __package__ = ''
--- a/venv/lib/python3.12/site-packages/_yaml/pycache/init.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/_yaml/pycache/init.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/INSTALLER
+++ b/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/INSTALLER
@ -0,0 +1 @@
 pip
--- a/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/LICENSE
+++ b/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/LICENSE
@ -0,0 +1,20 @@
 This package contains a modified version of ca-bundle.crt:
 ca-bundle.crt -- Bundle of CA Root Certificates
 This is a bundle of X.509 certificates of public Certificate Authorities
 (CA). These were automatically extracted from Mozilla's root certificates
 file (certdata.txt).  This file can be found in the mozilla source tree:
 https://hg.mozilla.org/mozilla-central/file/tip/security/nss/lib/ckfw/builtins/certdata.txt
 It contains the certificates in PEM format and therefore
 can be directly used with curl / libcurl / php_curl, or with
 an Apache+mod_ssl webserver for SSL client authentication.
 Just configure this file as the SSLCACertificateFile.#
 ***** BEGIN LICENSE BLOCK *****
 This Source Code Form is subject to the terms of the Mozilla Public License,
 v. 2.0. If a copy of the MPL was not distributed with this file, You can obtain
 one at http://mozilla.org/MPL/2.0/.
 ***** END LICENSE BLOCK *****
@(#) $RCSfile: certdata.txt,v $ $Revision: 1.80 $ $Date: 2011/11/03 15:11:58 $
--- a/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/METADATA
+++ b/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/METADATA
@ -0,0 +1,66 @@
 Metadata-Version: 2.1
 Name: certifi
 Version: 2023.11.17
 Summary: Python package for providing Mozilla's CA Bundle.
 Home-page: https://github.com/certifi/python-certifi
 Author: Kenneth Reitz
 Author-email: me@kennethreitz.com
 License: MPL-2.0
 Project-URL: Source, https://github.com/certifi/python-certifi
 Classifier: Development Status :: 5 - Production/Stable
 Classifier: Intended Audience :: Developers
 Classifier: License :: OSI Approved :: Mozilla Public License 2.0 (MPL 2.0)
 Classifier: Natural Language :: English
 Classifier: Programming Language :: Python
 Classifier: Programming Language :: Python :: 3
 Classifier: Programming Language :: Python :: 3 :: Only
 Classifier: Programming Language :: Python :: 3.6
 Classifier: Programming Language :: Python :: 3.7
 Classifier: Programming Language :: Python :: 3.8
 Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Requires-Python: >=3.6
 License-File: LICENSE
 Certifi: Python SSL Certificates
 ================================
 Certifi provides Mozilla's carefully curated collection of Root Certificates for
 validating the trustworthiness of SSL certificates while verifying the identity
 of TLS hosts. It has been extracted from the `Requests`_ project.
 Installation
 ------------
 ``certifi`` is available on PyPI. Simply install it with ``pip``::
    $ pip install certifi
 Usage
 -----
 To reference the installed certificate authority (CA) bundle, you can use the
 built-in function::
    >>> import certifi
    >>> certifi.where()
    '/usr/local/lib/python3.7/site-packages/certifi/cacert.pem'
 Or from the command line::
    $ python -m certifi
    /usr/local/lib/python3.7/site-packages/certifi/cacert.pem
 Enjoy!
 .. _`Requests`: https://requests.readthedocs.io/en/master/
 Addition/Removal of Certificates
 --------------------------------
 Certifi does not support any addition/removal or other modification of the
 CA trust store content. This project is intended to provide a reliable and
 highly portable root of trust to python deployments. Look to upstream projects
 for methods to use alternate trust.
--- a/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/RECORD
+++ b/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/RECORD
@ -0,0 +1,14 @@
 certifi-2023.11.17.dist-info/INSTALLER,sha256=zuuue4knoyJ-UwPPXg8fezS7VCrXJQrAP7zeNuwvFQg,4
 certifi-2023.11.17.dist-info/LICENSE,sha256=6TcW2mucDVpKHfYP5pWzcPBpVgPSH2-D8FPkLPwQyvc,989
 certifi-2023.11.17.dist-info/METADATA,sha256=P7BMxvbKUZTP20mLy_wc2atkEPFNVqElEzV6Mhaj3Zc,2172
 certifi-2023.11.17.dist-info/RECORD,,
 certifi-2023.11.17.dist-info/WHEEL,sha256=Xo9-1PvkuimrydujYJAjF7pCkriuXBpUPEjma1nZyJ0,92
 certifi-2023.11.17.dist-info/top_level.txt,sha256=KMu4vUCfsjLrkPbSNdgdekS-pVJzBAJFO__nI8NF6-U,8
 certifi/__init__.py,sha256=oYZVbNEJ66LQQamFRyuICe6FoYDmkY4j4fKEyO9D96c,94
 certifi/__main__.py,sha256=xBBoj905TUWBLRGANOcf7oi6e-3dMP4cEoG9OyMs11g,243
 certifi/__pycache__/__init__.cpython-312.pyc,,
 certifi/__pycache__/__main__.cpython-312.pyc,,
 certifi/__pycache__/core.cpython-312.pyc,,
 certifi/cacert.pem,sha256=z503-oFAev4R3MDXD-YCVhQiqiNEcIwyTkUE24xsV0g,290282
 certifi/core.py,sha256=lhewz0zFb2b4ULsQurElmloYwQoecjWzPqY67P8T7iM,4219
 certifi/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
--- a/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/WHEEL
+++ b/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/WHEEL
@ -0,0 +1,5 @@
 Wheel-Version: 1.0
 Generator: bdist_wheel (0.41.3)
 Root-Is-Purelib: true
 Tag: py3-none-any
--- a/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/top_level.txt
+++ b/venv/lib/python3.12/site-packages/certifi-2023.11.17.dist-info/top_level.txt
@ -0,0 +1 @@
 certifi
--- a/venv/lib/python3.12/site-packages/certifi/init.py
+++ b/venv/lib/python3.12/site-packages/certifi/init.py
@ -0,0 +1,4 @@
 from .core import contents, where
 __all__ = ["contents", "where"]
 __version__ = "2023.11.17"
--- a/venv/lib/python3.12/site-packages/certifi/main.py
+++ b/venv/lib/python3.12/site-packages/certifi/main.py
@ -0,0 +1,12 @@
 import argparse
 from certifi import contents, where
 # Command-line entry point: print the CA bundle's location, or its full
 # contents when -c/--contents is given.
 parser = argparse.ArgumentParser()
 parser.add_argument("-c", "--contents", action="store_true")
 args = parser.parse_args()
 print(contents() if args.contents else where())
--- a/venv/lib/python3.12/site-packages/certifi/pycache/init.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/certifi/pycache/init.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/certifi/pycache/main.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/certifi/pycache/main.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/certifi/pycache/core.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/certifi/pycache/core.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/certifi/cacert.pem
+++ b/venv/lib/python3.12/site-packages/certifi/cacert.pem
--- a/venv/lib/python3.12/site-packages/certifi/core.py
+++ b/venv/lib/python3.12/site-packages/certifi/core.py
@ -0,0 +1,108 @@
 """
 certifi.py
 ~~~~~~~~~~
 This module returns the installation location of cacert.pem or its contents.
 """
 import sys
 if sys.version_info >= (3, 11):
    from importlib.resources import as_file, files
    _CACERT_CTX = None
    _CACERT_PATH = None
    def where() -> str:
        """Return the filesystem path of the bundled ``cacert.pem``.

        The path is resolved lazily on the first call and cached in the
        module-level ``_CACERT_PATH`` so the resource is materialized at
        most once (this matters when the package is imported from a zip
        and the file has to be extracted).
        """
        global _CACERT_CTX, _CACERT_PATH
        if _CACERT_PATH is not None:
            # Already resolved by an earlier call; reuse the cached path.
            return _CACERT_PATH
        # importlib.resources hands back a context manager rather than a
        # path: entering it yields the path and leaving it performs any
        # cleanup. When no temporary file is needed it simply yields the
        # on-disk location and its __exit__() does nothing.
        bundle = files("certifi").joinpath("cacert.pem")
        # Keep the context manager alive at module level as well, because
        # it would run its cleanup as soon as it got garbage collected.
        _CACERT_CTX = as_file(bundle)
        _CACERT_PATH = str(_CACERT_CTX.__enter__())
        return _CACERT_PATH
    def contents() -> str:
        """Return the text of the bundled ``cacert.pem``, decoded as ASCII."""
        bundle = files("certifi").joinpath("cacert.pem")
        return bundle.read_text(encoding="ascii")
 elif sys.version_info >= (3, 7):
    from importlib.resources import path as get_path, read_text
    _CACERT_CTX = None
    _CACERT_PATH = None
    def where() -> str:
        """Return the filesystem path of the bundled ``cacert.pem``.

        The path is resolved lazily on the first call and cached in the
        module-level ``_CACERT_PATH`` so the resource is materialized at
        most once (this matters when the package is imported from a zip
        and the file has to be extracted).
        """
        global _CACERT_CTX, _CACERT_PATH
        if _CACERT_PATH is not None:
            # Already resolved by an earlier call; reuse the cached path.
            return _CACERT_PATH
        # importlib.resources hands back a context manager rather than a
        # path: entering it yields the path and leaving it performs any
        # cleanup. When no temporary file is needed it simply yields the
        # on-disk location and its __exit__() does nothing.
        #
        # Keep the context manager alive at module level as well, because
        # it would run its cleanup as soon as it got garbage collected.
        _CACERT_CTX = get_path("certifi", "cacert.pem")
        _CACERT_PATH = str(_CACERT_CTX.__enter__())
        return _CACERT_PATH
    def contents() -> str:
        """Return the text of the bundled ``cacert.pem``, decoded as ASCII."""
        pem_text = read_text("certifi", "cacert.pem", encoding="ascii")
        return pem_text
 else:
    import os
    import types
    from typing import Union
    Package = Union[types.ModuleType, str]
    Resource = Union[str, "os.PathLike"]
    # This fallback will work for Python versions prior to 3.7 that lack the
    # importlib.resources module but relies on the existing `where` function
    # so won't address issues with environments like PyOxidizer that don't set
    # __file__ on modules.
    def read_text(
        package: Package,
        resource: Resource,
        encoding: str = 'utf-8',
        errors: str = 'strict'
    ) -> str:
        """Minimal stand-in for ``importlib.resources.read_text``.

        ``package`` and ``resource`` are accepted only for signature
        compatibility and are ignored: the file that gets read is always
        the one returned by ``where()``.

        :param package: Ignored.
        :param resource: Ignored.
        :param encoding: Text encoding used to decode the file.
        :param errors: Decoding error handler, forwarded to ``open()``.
        :return: The decoded contents of the file.
        """
        # Forward ``errors`` too; previously it was accepted but silently
        # dropped, so a caller's error-handling choice had no effect.
        with open(where(), encoding=encoding, errors=errors) as data:
            return data.read()
    # If we don't have importlib.resources, then we will just do the old logic
    # of assuming we're on the filesystem and munge the path directly.
    def where() -> str:
        """Return the path of ``cacert.pem`` next to this module's file."""
        return os.path.join(os.path.dirname(__file__), "cacert.pem")
    def contents() -> str:
        """Return the text of the bundled ``cacert.pem``, decoded as ASCII."""
        pem_text = read_text("certifi", "cacert.pem", encoding="ascii")
        return pem_text
--- a/venv/lib/python3.12/site-packages/certifi/py.typed
+++ b/venv/lib/python3.12/site-packages/certifi/py.typed
--- a/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/INSTALLER
+++ b/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/INSTALLER
@ -0,0 +1 @@
 pip
--- a/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/LICENSE
+++ b/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/LICENSE
@ -0,0 +1,21 @@
 MIT License
 Copyright (c) 2019 TAHRI Ahmed R.
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
 in the Software without restriction, including without limitation the rights
 to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 copies of the Software, and to permit persons to whom the Software is
 furnished to do so, subject to the following conditions:
 The above copyright notice and this permission notice shall be included in all
 copies or substantial portions of the Software.
 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 SOFTWARE.
--- a/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/METADATA
+++ b/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/METADATA
@ -0,0 +1,683 @@
 Metadata-Version: 2.1
 Name: charset-normalizer
 Version: 3.3.2
 Summary: The Real First Universal Charset Detector. Open, modern and actively maintained alternative to Chardet.
 Home-page: https://github.com/Ousret/charset_normalizer
 Author: Ahmed TAHRI
 Author-email: ahmed.tahri@cloudnursery.dev
 License: MIT
 Project-URL: Bug Reports, https://github.com/Ousret/charset_normalizer/issues
 Project-URL: Documentation, https://charset-normalizer.readthedocs.io/en/latest
 Keywords: encoding,charset,charset-detector,detector,normalization,unicode,chardet,detect
 Classifier: Development Status :: 5 - Production/Stable
 Classifier: License :: OSI Approved :: MIT License
 Classifier: Intended Audience :: Developers
 Classifier: Topic :: Software Development :: Libraries :: Python Modules
 Classifier: Operating System :: OS Independent
 Classifier: Programming Language :: Python
 Classifier: Programming Language :: Python :: 3
 Classifier: Programming Language :: Python :: 3.7
 Classifier: Programming Language :: Python :: 3.8
 Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
 Classifier: Programming Language :: Python :: Implementation :: PyPy
 Classifier: Topic :: Text Processing :: Linguistic
 Classifier: Topic :: Utilities
 Classifier: Typing :: Typed
 Requires-Python: >=3.7.0
 Description-Content-Type: text/markdown
 License-File: LICENSE
 Provides-Extra: unicode_backport
 <h1 align="center">Charset Detection, for Everyone 👋</h1>
 <p align="center">
  <sup>The Real First Universal Charset Detector</sup><br>
  <a href="https://pypi.org/project/charset-normalizer">
    <img src="https://img.shields.io/pypi/pyversions/charset_normalizer.svg?orange=blue" />
  </a>
  <a href="https://pepy.tech/project/charset-normalizer/">
    <img alt="Download Count Total" src="https://static.pepy.tech/badge/charset-normalizer/month" />
  </a>
  <a href="https://bestpractices.coreinfrastructure.org/projects/7297">
    <img src="https://bestpractices.coreinfrastructure.org/projects/7297/badge">
  </a>
 </p>
 <p align="center">
  <sup><i>Featured Packages</i></sup><br>
  <a href="https://github.com/jawah/niquests">
   <img alt="Static Badge" src="https://img.shields.io/badge/Niquests-HTTP_1.1%2C%202%2C_and_3_Client-cyan">
  </a>
  <a href="https://github.com/jawah/wassima">
   <img alt="Static Badge" src="https://img.shields.io/badge/Wassima-Certifi_Killer-cyan">
  </a>
 </p>
 <p align="center">
  <sup><i>In other language (unofficial port - by the community)</i></sup><br>
  <a href="https://github.com/nickspring/charset-normalizer-rs">
   <img alt="Static Badge" src="https://img.shields.io/badge/Rust-red">
  </a>
 </p>
 > A library that helps you read text from an unknown charset encoding.<br /> Motivated by `chardet`,
 > I'm trying to resolve the issue by taking a new approach.
 > All IANA character set names for which the Python core library provides codecs are supported.
 <p align="center">
  >>>>> <a href="https://charsetnormalizerweb.ousret.now.sh" target="_blank">👉 Try Me Online Now, Then Adopt Me 👈 </a> <<<<<
 </p>
 This project offers you an alternative to **Universal Charset Encoding Detector**, also known as **Chardet**.
 | Feature                                          | [Chardet](https://github.com/chardet/chardet) |                                         Charset Normalizer                                         | [cChardet](https://github.com/PyYoshi/cChardet) |
 |--------------------------------------------------|:---------------------------------------------:|:--------------------------------------------------------------------------------------------------:|:-----------------------------------------------:|
 | `Fast`                                           |                       ❌                       |                                                 ✅                                                  |                        ✅                        |
 | `Universal**`                                    |                       ❌                       |                                                 ✅                                                  |                        ❌                        |
 | `Reliable` **without** distinguishable standards |                       ❌                       |                                                 ✅                                                  |                        ✅                        |
 | `Reliable` **with** distinguishable standards    |                       ✅                       |                                                 ✅                                                  |                        ✅                        |
 | `License`                                        |           LGPL-2.1<br>_restrictive_           |                                                MIT                                                 |            MPL-1.1<br>_restrictive_             |
 | `Native Python`                                  |                       ✅                       |                                                 ✅                                                  |                        ❌                        |
 | `Detect spoken language`                         |                       ❌                       |                                                 ✅                                                  |                       N/A                       |
 | `UnicodeDecodeError Safety`                      |                       ❌                       |                                                 ✅                                                  |                        ❌                        |
 | `Whl Size (min)`                                 |                   193.6 kB                    |                                               42 kB                                                |                     ~200 kB                     |
 | `Supported Encoding`                             |                      33                       | 🎉 [99](https://charset-normalizer.readthedocs.io/en/latest/user/support.html#supported-encodings) |                       40                        |
 <p align="center">
 <img src="https://i.imgflip.com/373iay.gif" alt="Reading Normalized Text" width="226"/><img src="https://media.tenor.com/images/c0180f70732a18b4965448d33adba3d0/tenor.gif" alt="Cat Reading Text" width="200"/>
 </p>
 *\*\* : They are clearly using specific code for a specific encoding even if covering most of used one*<br> 
 Did you get here because of the logs? See [https://charset-normalizer.readthedocs.io/en/latest/user/miscellaneous.html](https://charset-normalizer.readthedocs.io/en/latest/user/miscellaneous.html)
 ## ⚡ Performance
 This package offers better performance than its counterpart Chardet. Here are some numbers.
 | Package                                       | Accuracy | Mean per file (ms) | File per sec (est) |
 |-----------------------------------------------|:--------:|:------------------:|:------------------:|
 | [chardet](https://github.com/chardet/chardet) |   86 %   |       200 ms       |     5 file/sec     |
 | charset-normalizer                            | **98 %** |     **10 ms**      |    100 file/sec    |
 | Package                                       | 99th percentile | 95th percentile | 50th percentile |
 |-----------------------------------------------|:---------------:|:---------------:|:---------------:|
 | [chardet](https://github.com/chardet/chardet) |     1200 ms     |     287 ms      |      23 ms      |
 | charset-normalizer                            |     100 ms      |      50 ms      |      5 ms       |
 Chardet's performance on larger files (1MB+) is very poor. Expect a huge difference on large payloads.
 > Stats are generated using 400+ files using default parameters. More details on used files, see GHA workflows.
 > And yes, these results might change at any time. The dataset can be updated to include more files.
 > The actual delays heavily depend on your CPU capabilities. The factors should remain the same.
 > Keep in mind that the stats are generous and that Chardet accuracy vs our is measured using Chardet initial capability
 > (eg. Supported Encoding) Challenge-them if you want.
 ## ✨ Installation
 Using pip:
 ```sh
 pip install charset-normalizer -U
 ```
 ## 🚀 Basic Usage
 ### CLI
 This package comes with a CLI.
 ```
 usage: normalizer [-h] [-v] [-a] [-n] [-m] [-r] [-f] [-t THRESHOLD]
                  file [file ...]
 The Real First Universal Charset Detector. Discover originating encoding used
 on text file. Normalize text to unicode.
 positional arguments:
  files                 File(s) to be analysed
 optional arguments:
  -h, --help            show this help message and exit
  -v, --verbose         Display complementary information about file if any.
                        Stdout will contain logs about the detection process.
  -a, --with-alternative
                        Output complementary possibilities if any. Top-level
                        JSON WILL be a list.
  -n, --normalize       Permit to normalize input file. If not set, program
                        does not write anything.
  -m, --minimal         Only output the charset detected to STDOUT. Disabling
                        JSON output.
  -r, --replace         Replace file when trying to normalize it instead of
                        creating a new one.
  -f, --force           Replace file without asking if you are sure, use this
                        flag with caution.
  -t THRESHOLD, --threshold THRESHOLD
                        Define a custom maximum amount of chaos allowed in
                        decoded content. 0. <= chaos <= 1.
  --version             Show version information and exit.
 ```
 ```bash
 normalizer ./data/sample.1.fr.srt
 ```
 or
 ```bash
 python -m charset_normalizer ./data/sample.1.fr.srt
 ```
 🎉 Since version 1.4.0 the CLI produces easily usable stdout results in JSON format.
 ```json
 {
    "path": "/home/default/projects/charset_normalizer/data/sample.1.fr.srt",
    "encoding": "cp1252",
    "encoding_aliases": [
        "1252",
        "windows_1252"
    ],
    "alternative_encodings": [
        "cp1254",
        "cp1256",
        "cp1258",
        "iso8859_14",
        "iso8859_15",
        "iso8859_16",
        "iso8859_3",
        "iso8859_9",
        "latin_1",
        "mbcs"
    ],
    "language": "French",
    "alphabets": [
        "Basic Latin",
        "Latin-1 Supplement"
    ],
    "has_sig_or_bom": false,
    "chaos": 0.149,
    "coherence": 97.152,
    "unicode_path": null,
    "is_preferred": true
 }
 ```
 ### Python
 *Just print out normalized text*
 ```python
 from charset_normalizer import from_path
 results = from_path('./my_subtitle.srt')
 print(str(results.best()))
 ```
 *Upgrade your code without effort*
 ```python
 from charset_normalizer import detect
 ```
 The above code will behave the same as **chardet**. We ensure that we offer the best (reasonable) BC result possible.
 See the docs for advanced usage : [readthedocs.io](https://charset-normalizer.readthedocs.io/en/latest/)
 ## 😇 Why
 When I started using Chardet, I noticed that it was not suited to my expectations, and I wanted to propose a
 reliable alternative using a completely different method. Also! I never back down on a good challenge!
 I **don't care** about the **originating charset** encoding, because **two different tables** can
 produce **two identical rendered string.**
 What I want is to get readable text, the best I can. 
 In a way, **I'm brute forcing text decoding.** How cool is that ? 😎
 Don't confuse the **ftfy** package with charset-normalizer or chardet. ftfy's goal is to repair Unicode strings, whereas charset-normalizer's goal is to convert a raw file in an unknown encoding to Unicode.
 ## 🍰 How
  - Discard all charset encoding table that could not fit the binary content.
  - Measure noise, or the mess once opened (by chunks) with a corresponding charset encoding.
  - Extract matches with the lowest mess detected.
  - Additionally, we measure coherence / probe for a language.
 **Wait a minute**, what is noise/mess and coherence according to **YOU ?**
 *Noise :* I opened hundreds of text files, **written by humans**, with the wrong encoding table. **I observed**, then
 **I established** some ground rules about **what is obvious** when **it seems like** a mess.
 I know that my interpretation of what is noise is probably incomplete, feel free to contribute in order to
 improve or rewrite it.
 *Coherence :* For each language there is on earth, we have computed ranked letter appearance occurrences (the best we can). So I thought
 that intel is worth something here. So I use those records against decoded text to check if I can detect intelligent design.
 ## ⚡ Known limitations
  - Language detection is unreliable when text contains two or more languages sharing identical letters. (eg. HTML (english tags) + Turkish content (Sharing Latin characters))
  - Every charset detector heavily depends on sufficient content. In common cases, do not bother running detection on very tiny content.
 ## ⚠️ About Python EOLs
 **If you are running:**
 - Python >=2.7,<3.5: Unsupported
 - Python 3.5: charset-normalizer < 2.1
 - Python 3.6: charset-normalizer < 3.1
 - Python 3.7: charset-normalizer < 4.0
 Upgrade your Python interpreter as soon as possible.
 ## 👤 Contributing
 Contributions, issues and feature requests are very much welcome.<br />
 Feel free to check [issues page](https://github.com/ousret/charset_normalizer/issues) if you want to contribute.
 ## 📝 License
 Copyright © [Ahmed TAHRI @Ousret](https://github.com/Ousret).<br />
 This project is [MIT](https://github.com/Ousret/charset_normalizer/blob/master/LICENSE) licensed.
 Characters frequencies used in this project © 2012 [Denny Vrandečić](http://simia.net/letters/)
 ## 💼 For Enterprise
 Professional support for charset-normalizer is available as part of the [Tidelift
 Subscription][1]. Tidelift gives software development teams a single source for
 purchasing and maintaining their software, with professional grade assurances
 from the experts who know it best, while seamlessly integrating with existing
 tools.
 [1]: https://tidelift.com/subscription/pkg/pypi-charset-normalizer?utm_source=pypi-charset-normalizer&utm_medium=readme
 # Changelog
 All notable changes to charset-normalizer will be documented in this file. This project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/).
 ## [3.3.2](https://github.com/Ousret/charset_normalizer/compare/3.3.1...3.3.2) (2023-10-31)
 ### Fixed
 - Unintentional memory usage regression when using large payload that match several encoding (#376)
 - Regression on some detection case showcased in the documentation (#371)
 ### Added
 - Noise (md) probe that identify malformed arabic representation due to the presence of letters in isolated form (credit to my wife)
 ## [3.3.1](https://github.com/Ousret/charset_normalizer/compare/3.3.0...3.3.1) (2023-10-22)
 ### Changed
 - Optional mypyc compilation upgraded to version 1.6.1 for Python >= 3.8
 - Improved the general detection reliability based on reports from the community
 ## [3.3.0](https://github.com/Ousret/charset_normalizer/compare/3.2.0...3.3.0) (2023-09-30)
 ### Added
 - Allow to execute the CLI (e.g. normalizer) through `python -m charset_normalizer.cli` or `python -m charset_normalizer`
 - Support for 9 forgotten encoding that are supported by Python but unlisted in `encoding.aliases` as they have no alias (#323)
 ### Removed
 - (internal) Redundant utils.is_ascii function and unused function is_private_use_only
 - (internal) charset_normalizer.assets is moved inside charset_normalizer.constant
 ### Changed
 - (internal) Unicode code blocks in constants are updated using the latest v15.0.0 definition to improve detection
 - Optional mypyc compilation upgraded to version 1.5.1 for Python >= 3.8
 ### Fixed
 - Unable to properly sort CharsetMatch when both chaos/noise and coherence were close due to an unreachable condition in \_\_lt\_\_ (#350)
 ## [3.2.0](https://github.com/Ousret/charset_normalizer/compare/3.1.0...3.2.0) (2023-06-07)
 ### Changed
 - Typehint for function `from_path` no longer enforce `PathLike` as its first argument
 - Minor improvement over the global detection reliability
 ### Added
 - Introduce function `is_binary` that relies on main capabilities, and optimized to detect binaries
 - Propagate `enable_fallback` argument throughout `from_bytes`, `from_path`, and `from_fp` that allow a deeper control over the detection (default True)
 - Explicit support for Python 3.12
 ### Fixed
 - Edge case detection failure where a file would contain 'very-long' camel cased word (Issue #289)
 ## [3.1.0](https://github.com/Ousret/charset_normalizer/compare/3.0.1...3.1.0) (2023-03-06)
 ### Added
 - Argument `should_rename_legacy` for legacy function `detect` and disregard any new arguments without errors (PR #262)
 ### Removed
 - Support for Python 3.6 (PR #260)
 ### Changed
 - Optional speedup provided by mypy/c 1.0.1
 ## [3.0.1](https://github.com/Ousret/charset_normalizer/compare/3.0.0...3.0.1) (2022-11-18)
 ### Fixed
 - Multi-bytes cutter/chunk generator did not always cut correctly (PR #233)
 ### Changed
 - Speedup provided by mypy/c 0.990 on Python >= 3.7
 ## [3.0.0](https://github.com/Ousret/charset_normalizer/compare/2.1.1...3.0.0) (2022-10-20)
 ### Added
 - Extend the capability of explain=True: when cp_isolation contains at most two entries (min one), it will log the details of the Mess-detector results
 - Support for alternative language frequency set in charset_normalizer.assets.FREQUENCIES
 - Add parameter `language_threshold` in `from_bytes`, `from_path` and `from_fp` to adjust the minimum expected coherence ratio
 - `normalizer --version` now specifies whether the current version provides the extra speedup (meaning the mypyc-compiled whl)
 ### Changed
 - Build with static metadata using 'build' frontend
 - Make the language detection stricter
 - Optional: Module `md.py` can be compiled using Mypyc to provide an extra speedup up to 4x faster than v2.1
 ### Fixed
 - CLI with opt --normalize fails when using a full path for files
 - TooManyAccentuatedPlugin induces false positives on the mess detection when too few alpha characters have been fed to it
 - Sphinx warnings when generating the documentation
 ### Removed
 - Coherence detector no longer returns 'Simple English'; it returns 'English' instead
 - Coherence detector no longer returns 'Classical Chinese'; it returns 'Chinese' instead
 - Breaking: Method `first()` and `best()` from CharsetMatch
 - UTF-7 will no longer appear as "detected" without a recognized SIG/mark (is unreliable/conflict with ASCII)
 - Breaking: Class aliases CharsetDetector, CharsetDoctor, CharsetNormalizerMatch and CharsetNormalizerMatches
 - Breaking: Top-level function `normalize`
 - Breaking: Properties `chaos_secondary_pass`, `coherence_non_latin` and `w_counter` from CharsetMatch
 - Support for the backport `unicodedata2`
 ## [3.0.0rc1](https://github.com/Ousret/charset_normalizer/compare/3.0.0b2...3.0.0rc1) (2022-10-18)
 ### Added
 - Extend the capability of explain=True: when cp_isolation contains at most two entries (min one), it will log the details of the Mess-detector results
 - Support for alternative language frequency set in charset_normalizer.assets.FREQUENCIES
 - Add parameter `language_threshold` in `from_bytes`, `from_path` and `from_fp` to adjust the minimum expected coherence ratio
 ### Changed
 - Build with static metadata using 'build' frontend
 - Make the language detection stricter
 ### Fixed
 - CLI with opt --normalize fails when using a full path for files
 - TooManyAccentuatedPlugin induces false positives on the mess detection when too few alpha characters have been fed to it
 ### Removed
 - Coherence detector no longer returns 'Simple English'; it returns 'English' instead
 - Coherence detector no longer returns 'Classical Chinese'; it returns 'Chinese' instead
 ## [3.0.0b2](https://github.com/Ousret/charset_normalizer/compare/3.0.0b1...3.0.0b2) (2022-08-21)
 ### Added
 - `normalizer --version` now specifies whether the current version provides the extra speedup (meaning the mypyc-compiled whl)
 ### Removed
 - Breaking: Method `first()` and `best()` from CharsetMatch
 - UTF-7 will no longer appear as "detected" without a recognized SIG/mark (is unreliable/conflict with ASCII)
 ### Fixed
 - Sphinx warnings when generating the documentation
 ## [3.0.0b1](https://github.com/Ousret/charset_normalizer/compare/2.1.0...3.0.0b1) (2022-08-15)
 ### Changed
 - Optional: Module `md.py` can be compiled using Mypyc to provide an extra speedup up to 4x faster than v2.1
 ### Removed
 - Breaking: Class aliases CharsetDetector, CharsetDoctor, CharsetNormalizerMatch and CharsetNormalizerMatches
 - Breaking: Top-level function `normalize`
 - Breaking: Properties `chaos_secondary_pass`, `coherence_non_latin` and `w_counter` from CharsetMatch
 - Support for the backport `unicodedata2`
 ## [2.1.1](https://github.com/Ousret/charset_normalizer/compare/2.1.0...2.1.1) (2022-08-19)
 ### Deprecated
 - Function `normalize` scheduled for removal in 3.0
 ### Changed
 - Removed useless call to decode in fn is_unprintable (#206)
 ### Fixed
 - Third-party library (i18n xgettext) crashing not recognizing utf_8 (PEP 263) with underscore from [@aleksandernovikov](https://github.com/aleksandernovikov) (#204)
 ## [2.1.0](https://github.com/Ousret/charset_normalizer/compare/2.0.12...2.1.0) (2022-06-19)
 ### Added
 - Output the Unicode table version when running the CLI with `--version` (PR #194)
 ### Changed
 - Re-use decoded buffer for single byte character sets from [@nijel](https://github.com/nijel) (PR #175)
 - Fixing some performance bottlenecks from [@deedy5](https://github.com/deedy5) (PR #183)
 ### Fixed
 - Workaround potential bug in cpython with Zero Width No-Break Space located in Arabic Presentation Forms-B, Unicode 1.1 not acknowledged as space (PR #175)
 - CLI default threshold aligned with the API threshold from [@oleksandr-kuzmenko](https://github.com/oleksandr-kuzmenko) (PR #181)
 ### Removed
 - Support for Python 3.5 (PR #192)
 ### Deprecated
 - Use of backport unicodedata from `unicodedata2` as Python is quickly catching up, scheduled for removal in 3.0 (PR #194)
 ## [2.0.12](https://github.com/Ousret/charset_normalizer/compare/2.0.11...2.0.12) (2022-02-12)
 ### Fixed
 - ASCII misdetection in rare cases (PR #170)
 ## [2.0.11](https://github.com/Ousret/charset_normalizer/compare/2.0.10...2.0.11) (2022-01-30)
 ### Added
 - Explicit support for Python 3.11 (PR #164)
 ### Changed
 - The logging behavior has been completely reviewed, now using only TRACE and DEBUG levels (PR #163 #165)
 ## [2.0.10](https://github.com/Ousret/charset_normalizer/compare/2.0.9...2.0.10) (2022-01-04)
 ### Fixed
 - Fallback match entries might lead to UnicodeDecodeError for large bytes sequence (PR #154)
 ### Changed
 - Skipping the language-detection (CD) on ASCII (PR #155)
 ## [2.0.9](https://github.com/Ousret/charset_normalizer/compare/2.0.8...2.0.9) (2021-12-03)
 ### Changed
 - Moderating the logging impact (since 2.0.8) for specific environments (PR #147)
 ### Fixed
 - Wrong logging level applied when setting kwarg `explain` to True (PR #146)
 ## [2.0.8](https://github.com/Ousret/charset_normalizer/compare/2.0.7...2.0.8) (2021-11-24)
 ### Changed
 - Improvement over Vietnamese detection (PR #126)
 - MD improvement on trailing data and long foreign (non-pure latin) data (PR #124)
 - Efficiency improvements in cd/alphabet_languages from [@adbar](https://github.com/adbar) (PR #122)
 - call sum() without an intermediary list following PEP 289 recommendations from [@adbar](https://github.com/adbar) (PR #129)
 - Code style as refactored by Sourcery-AI (PR #131) 
 - Minor adjustment on the MD around european words (PR #133)
 - Remove and replace SRTs from assets / tests (PR #139)
 - Initialize the library logger with a `NullHandler` by default from [@nmaynes](https://github.com/nmaynes) (PR #135)
 - Setting kwarg `explain` to True will add provisionally (bounded to function lifespan) a specific stream handler (PR #135)
 ### Fixed
 - Fix large (misleading) sequence giving UnicodeDecodeError (PR #137)
 - Avoid using too insignificant chunk (PR #137)
 ### Added
 - Add and expose function `set_logging_handler` to configure a specific StreamHandler from [@nmaynes](https://github.com/nmaynes) (PR #135)
 - Add `CHANGELOG.md` entries, format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/) (PR #141)
 ## [2.0.7](https://github.com/Ousret/charset_normalizer/compare/2.0.6...2.0.7) (2021-10-11)
 ### Added
 - Add support for Kazakh (Cyrillic) language detection (PR #109)
 ### Changed
 - Further, improve inferring the language from a given single-byte code page (PR #112)
 - Vainly trying to leverage PEP263 when PEP3120 is not supported (PR #116)
 - Refactoring for potential performance improvements in loops from [@adbar](https://github.com/adbar) (PR #113)
 - Various detection improvement (MD+CD) (PR #117)
 ### Removed
 - Remove redundant logging entry about detected language(s) (PR #115)
 ### Fixed
 - Fix a minor inconsistency between Python 3.5 and other versions regarding language detection (PR #117 #102)
 ## [2.0.6](https://github.com/Ousret/charset_normalizer/compare/2.0.5...2.0.6) (2021-09-18)
 ### Fixed
 - Unforeseen regression with the loss of backward compatibility with some older minor versions of Python 3.5.x (PR #100)
 - Fix CLI crash when using --minimal output in certain cases (PR #103)
 ### Changed
 - Minor improvement to the detection efficiency (less than 1%) (PR #106 #101)
 ## [2.0.5](https://github.com/Ousret/charset_normalizer/compare/2.0.4...2.0.5) (2021-09-14)
 ### Changed
 - The project now complies with flake8, mypy, isort and black to ensure a better overall quality (PR #81)
 - The BC-support with v1.x was improved, the old staticmethods are restored (PR #82)
 - The Unicode detection is slightly improved (PR #93)
 - Add syntax sugar \_\_bool\_\_ for results CharsetMatches list-container (PR #91)
 ### Removed
 - The project no longer raises a warning on tiny content given for detection; it is simply logged as a warning instead (PR #92)
 ### Fixed
 - In some rare case, the chunks extractor could cut in the middle of a multi-byte character and could mislead the mess detection (PR #95)
 - Some rare 'space' characters could trip up the UnprintablePlugin/Mess detection (PR #96)
 - The MANIFEST.in was not exhaustive (PR #78)
 ## [2.0.4](https://github.com/Ousret/charset_normalizer/compare/2.0.3...2.0.4) (2021-07-30)
 ### Fixed
 - The CLI no longer raises an unexpected exception when no encoding has been found (PR #70)
 - Fix accessing the 'alphabets' property when the payload contains surrogate characters (PR #68)
 - The logger could mislead (explain=True) on detected languages and the impact of one MBCS match (PR #72)
 - Submatch factoring could be wrong in rare edge cases (PR #72)
 - Multiple files given to the CLI were ignored when publishing results to STDOUT. (After the first path) (PR #72)
 - Fix line endings from CRLF to LF for certain project files (PR #67)
 ### Changed
 - Adjust the MD to lower the sensitivity, thus improving the global detection reliability (PR #69 #76)
 - Allow fallback on specified encoding if any (PR #71)
 ## [2.0.3](https://github.com/Ousret/charset_normalizer/compare/2.0.2...2.0.3) (2021-07-16)
 ### Changed
 - Part of the detection mechanism has been improved to be less sensitive, resulting in more accurate detection results. Especially ASCII. (PR #63)
 - According to the community wishes, the detection will fall back on ASCII or UTF-8 in a last-resort case. (PR #64)
 ## [2.0.2](https://github.com/Ousret/charset_normalizer/compare/2.0.1...2.0.2) (2021-07-15)
 ### Fixed
 - Empty/too small JSON payload misdetection fixed. Report from [@tseaver](https://github.com/tseaver) (PR #59)
 ### Changed
 - Don't inject unicodedata2 into sys.modules from [@akx](https://github.com/akx) (PR #57)
 ## [2.0.1](https://github.com/Ousret/charset_normalizer/compare/2.0.0...2.0.1) (2021-07-13)
 ### Fixed
 - Make it work where there isn't a filesystem available, dropping assets frequencies.json. Report from [@sethmlarson](https://github.com/sethmlarson). (PR #55)
 - Using explain=False permanently disable the verbose output in the current runtime (PR #47)
 - One log entry (language target preemptive) was not shown in logs when using explain=True (PR #47)
 - Fix undesired exception (ValueError) on getitem of instance CharsetMatches (PR #52)
 ### Changed
 - Public function normalize default args values were not aligned with from_bytes (PR #53)
 ### Added
 - You may now use charset aliases in cp_isolation and cp_exclusion arguments (PR #47)
 ## [2.0.0](https://github.com/Ousret/charset_normalizer/compare/1.4.1...2.0.0) (2021-07-02)
 ### Changed
 - 4 to 5 times faster than the previous 1.4.0 release. At least 2x faster than Chardet.
 - Emphasis has been placed on UTF-8 detection, which should be nearly instantaneous.
 - The backward compatibility with Chardet has been greatly improved. The legacy detect function returns an identical charset name whenever possible.
 - The detection mechanism has been slightly improved, now Turkish content is detected correctly (most of the time)
 - The program has been rewritten to ease readability and maintainability (and now uses static typing).
 - utf_7 detection has been reinstated.
 ### Removed
 - This package no longer requires anything when used with Python 3.5 (Dropped cached_property)
 - Removed support for these languages: Catalan, Esperanto, Kazakh, Basque, Volapük, Azeri, Galician, Nynorsk, Macedonian, and Serbo-Croatian.
 - The exception hook on UnicodeDecodeError has been removed.
 ### Deprecated
 - Methods coherence_non_latin, w_counter, chaos_secondary_pass of the class CharsetMatch are now deprecated and scheduled for removal in v3.0
 ### Fixed
 - The CLI output used the relative path of the file(s). Should be absolute.
 ## [1.4.1](https://github.com/Ousret/charset_normalizer/compare/1.4.0...1.4.1) (2021-05-28)
 ### Fixed
 - Logger configuration/usage no longer conflict with others (PR #44)
 ## [1.4.0](https://github.com/Ousret/charset_normalizer/compare/1.3.9...1.4.0) (2021-05-21)
 ### Removed
 - Using standard logging instead of using the package loguru.
 - Dropping nose test framework in favor of the maintained pytest.
 - Choose to not use dragonmapper package to help with gibberish Chinese/CJK text.
 - Require cached_property only for Python 3.5 due to constraint. Dropping for every other interpreter version.
 - Stop support for UTF-7 that does not contain a SIG.
 - Dropping PrettyTable, replaced with pure JSON output in CLI.
 ### Fixed
 - BOM marker in a CharsetNormalizerMatch instance could be False in rare cases even if obviously present. Due to the sub-match factoring process.
 - Not searching properly for the BOM when trying utf32/16 parent codec.
 ### Changed
 - Improving the package final size by compressing frequencies.json.
 - Huge improvement on the largest payloads.
 ### Added
 - CLI now produces JSON consumable output.
 - Return ASCII if given sequences fit. Given reasonable confidence.
 ## [1.3.9](https://github.com/Ousret/charset_normalizer/compare/1.3.8...1.3.9) (2021-05-13)
 ### Fixed
 - In some very rare cases, you may end up getting encode/decode errors due to a bad bytes payload (PR #40)
 ## [1.3.8](https://github.com/Ousret/charset_normalizer/compare/1.3.7...1.3.8) (2021-05-12)
 ### Fixed
 - Empty given payload for detection may cause an exception if trying to access the `alphabets` property. (PR #39)
 ## [1.3.7](https://github.com/Ousret/charset_normalizer/compare/1.3.6...1.3.7) (2021-05-12)
 ### Fixed
 - The legacy detect function should return UTF-8-SIG if sig is present in the payload. (PR #38)
 ## [1.3.6](https://github.com/Ousret/charset_normalizer/compare/1.3.5...1.3.6) (2021-02-09)
 ### Changed
 - Amend the previous release to allow prettytable 2.0 (PR #35)
 ## [1.3.5](https://github.com/Ousret/charset_normalizer/compare/1.3.4...1.3.5) (2021-02-08)
 ### Fixed
 - Fix error while using the package with a python pre-release interpreter (PR #33)
 ### Changed
 - Dependencies refactoring, constraints revised.
 ### Added
 - Add python 3.9 and 3.10 to the supported interpreters
 MIT License
 Copyright (c) 2019 TAHRI Ahmed R.
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
 in the Software without restriction, including without limitation the rights
 to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 copies of the Software, and to permit persons to whom the Software is
 furnished to do so, subject to the following conditions:
 The above copyright notice and this permission notice shall be included in all
 copies or substantial portions of the Software.
 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 SOFTWARE.
--- a/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/RECORD
+++ b/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/RECORD
@ -0,0 +1,35 @@
 ../../../bin/normalizer,sha256=WJyZVNKmQ1Om0a-_THzeHGe8oZSK8RtdNnEgy8nhuJU,261
 charset_normalizer-3.3.2.dist-info/INSTALLER,sha256=zuuue4knoyJ-UwPPXg8fezS7VCrXJQrAP7zeNuwvFQg,4
 charset_normalizer-3.3.2.dist-info/LICENSE,sha256=6zGgxaT7Cbik4yBV0lweX5w1iidS_vPNcgIT0cz-4kE,1070
 charset_normalizer-3.3.2.dist-info/METADATA,sha256=cfLhl5A6SI-F0oclm8w8ux9wshL1nipdeCdVnYb4AaA,33550
 charset_normalizer-3.3.2.dist-info/RECORD,,
 charset_normalizer-3.3.2.dist-info/WHEEL,sha256=4ZiCdXIWMxJyEClivrQv1QAHZpQh8kVYU92_ZAVwaok,152
 charset_normalizer-3.3.2.dist-info/entry_points.txt,sha256=ADSTKrkXZ3hhdOVFi6DcUEHQRS0xfxDIE_pEz4wLIXA,65
 charset_normalizer-3.3.2.dist-info/top_level.txt,sha256=7ASyzePr8_xuZWJsnqJjIBtyV8vhEo0wBCv1MPRRi3Q,19
 charset_normalizer/__init__.py,sha256=UzI3xC8PhmcLRMzSgPb6minTmRq0kWznnCBJ8ZCc2XI,1577
 charset_normalizer/__main__.py,sha256=JxY8bleaENOFlLRb9HfoeZCzAMnn2A1oGR5Xm2eyqg0,73
 charset_normalizer/__pycache__/__init__.cpython-312.pyc,,
 charset_normalizer/__pycache__/__main__.cpython-312.pyc,,
 charset_normalizer/__pycache__/api.cpython-312.pyc,,
 charset_normalizer/__pycache__/cd.cpython-312.pyc,,
 charset_normalizer/__pycache__/constant.cpython-312.pyc,,
 charset_normalizer/__pycache__/legacy.cpython-312.pyc,,
 charset_normalizer/__pycache__/md.cpython-312.pyc,,
 charset_normalizer/__pycache__/models.cpython-312.pyc,,
 charset_normalizer/__pycache__/utils.cpython-312.pyc,,
 charset_normalizer/__pycache__/version.cpython-312.pyc,,
 charset_normalizer/api.py,sha256=WOlWjy6wT8SeMYFpaGbXZFN1TMXa-s8vZYfkL4G29iQ,21097
 charset_normalizer/cd.py,sha256=xwZliZcTQFA3jU0c00PRiu9MNxXTFxQkFLWmMW24ZzI,12560
 charset_normalizer/cli/__init__.py,sha256=D5ERp8P62llm2FuoMzydZ7d9rs8cvvLXqE-1_6oViPc,100
 charset_normalizer/cli/__main__.py,sha256=2F-xURZJzo063Ye-2RLJ2wcmURpbKeAzKwpiws65dAs,9744
 charset_normalizer/cli/__pycache__/__init__.cpython-312.pyc,,
 charset_normalizer/cli/__pycache__/__main__.cpython-312.pyc,,
 charset_normalizer/constant.py,sha256=p0IsOVcEbPWYPOdWhnhRbjK1YVBy6fs05C5vKC-zoxU,40481
 charset_normalizer/legacy.py,sha256=T-QuVMsMeDiQEk8WSszMrzVJg_14AMeSkmHdRYhdl1k,2071
 charset_normalizer/md.cpython-312-x86_64-linux-gnu.so,sha256=W654QTU3QZI6eWJ0fanScAr0_O6sL0I61fyRSdC-39Y,16064
 charset_normalizer/md.py,sha256=NkSuVLK13_a8c7BxZ4cGIQ5vOtGIWOdh22WZEvjp-7U,19624
 charset_normalizer/md__mypyc.cpython-312-x86_64-linux-gnu.so,sha256=IlObIV4dmRhFV8V7H-zK4rTxPzTSi9JmrWZD26JQfxI,272640
 charset_normalizer/models.py,sha256=I5i0s4aKCCgLPY2tUY3pwkgFA-BUbbNxQ7hVkVTt62s,11624
 charset_normalizer/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 charset_normalizer/utils.py,sha256=teiosMqzKjXyAHXnGdjSBOgnBZwx-SkBbCLrx0UXy8M,11894
 charset_normalizer/version.py,sha256=iHKUfHD3kDRSyrh_BN2ojh43TA5-UZQjvbVIEFfpHDs,79
--- a/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/WHEEL
+++ b/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/WHEEL
@ -0,0 +1,6 @@
 Wheel-Version: 1.0
 Generator: bdist_wheel (0.41.2)
 Root-Is-Purelib: false
 Tag: cp312-cp312-manylinux_2_17_x86_64
 Tag: cp312-cp312-manylinux2014_x86_64
--- a/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/entry_points.txt
+++ b/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/entry_points.txt
@ -0,0 +1,2 @@
 [console_scripts]
 normalizer = charset_normalizer.cli:cli_detect
--- a/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/top_level.txt
+++ b/venv/lib/python3.12/site-packages/charset_normalizer-3.3.2.dist-info/top_level.txt
@ -0,0 +1 @@
 charset_normalizer
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__init__.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__init__.py
@ -0,0 +1,46 @@
 # -*- coding: utf-8 -*-
 """
 Charset-Normalizer
 ~~~~~~~~~~~~~~
 The Real First Universal Charset Detector.
 A library that helps you read text from an unknown charset encoding.
 Motivated by chardet, this package tries to resolve the issue by taking a new approach.
 All IANA character set names for which the Python core library provides codecs are supported.
 Basic usage:
   >>> from charset_normalizer import from_bytes
   >>> results = from_bytes('Bсеки човек има право на образование. Oбразованието!'.encode('utf_8'))
   >>> best_guess = results.best()
   >>> str(best_guess)
   'Bсеки човек има право на образование. Oбразованието!'
 Other methods and usages are available - see the full documentation
 at <https://github.com/Ousret/charset_normalizer>.
 :copyright: (c) 2021 by Ahmed TAHRI
 :license: MIT, see LICENSE for more details.
 """
 import logging
 from .api import from_bytes, from_fp, from_path, is_binary
 from .legacy import detect
 from .models import CharsetMatch, CharsetMatches
 from .utils import set_logging_handler
 from .version import VERSION, __version__
 # Public API of the package: the names exported by
 # `from charset_normalizer import *`. Each entry is bound by one of the
 # imports at the top of this module.
 __all__ = (
    "from_fp",
    "from_path",
    "from_bytes",
    "is_binary",
    "detect",
    "CharsetMatch",
    "CharsetMatches",
    "__version__",
    "VERSION",
    "set_logging_handler",
 )
 # Attach a NullHandler to the top level logger by default
 # https://docs.python.org/3.3/howto/logging.html#configuring-logging-for-a-library
 # This runs at import time, so the "charset_normalizer" logger always has at
 # least one handler even when the host application configures no logging.
 logging.getLogger("charset_normalizer").addHandler(logging.NullHandler())
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__main__.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__main__.py
@ -0,0 +1,4 @@
 from .cli import cli_detect
 # Invoke the command-line detector only when this module is executed as a
 # script; importing the module has no side effect beyond the import above.
 if __name__ == "__main__":
    cli_detect()
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/__init__.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/__init__.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/__main__.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/__main__.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/api.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/api.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/cd.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/cd.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/constant.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/constant.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/legacy.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/legacy.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/md.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/md.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/models.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/models.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/utils.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/utils.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/version.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/__pycache__/version.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/api.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/api.py
@ -0,0 +1,626 @@
 import logging
 from os import PathLike
 from typing import BinaryIO, List, Optional, Set, Union
 from .cd import (
    coherence_ratio,
    encoding_languages,
    mb_encoding_languages,
    merge_coherence_ratios,
 )
 from .constant import IANA_SUPPORTED, TOO_BIG_SEQUENCE, TOO_SMALL_SEQUENCE, TRACE
 from .md import mess_ratio
 from .models import CharsetMatch, CharsetMatches
 from .utils import (
    any_specified_encoding,
    cut_sequence_chunks,
    iana_name,
    identify_sig_or_bom,
    is_cp_similar,
    is_multi_byte_encoding,
    should_strip_sig_or_bom,
 )
 # Will most likely be controversial
 # logging.addLevelName(TRACE, "TRACE")
 # Logger for the "charset_normalizer" name; from_bytes() emits its TRACE and
 # DEBUG records through it.
 logger = logging.getLogger("charset_normalizer")
 # Stream handler that from_bytes() adds to `logger` when called with
 # explain=True and removes again before returning.
 explain_handler = logging.StreamHandler()
 # Record layout: timestamp | level name | message.
 explain_handler.setFormatter(
    logging.Formatter("%(asctime)s | %(levelname)s | %(message)s")
 )
 def from_bytes(
    sequences: Union[bytes, bytearray],
    steps: int = 5,
    chunk_size: int = 512,
    threshold: float = 0.2,
    cp_isolation: Optional[List[str]] = None,
    cp_exclusion: Optional[List[str]] = None,
    preemptive_behaviour: bool = True,
    explain: bool = False,
    language_threshold: float = 0.1,
    enable_fallback: bool = True,
 ) -> CharsetMatches:
    """
    Given a raw bytes sequence, return the best possibles charset usable to render str objects.
    If there is no results, it is a strong indicator that the source is binary/not text.
    By default, the process will extract 5 blocks of 512o each to assess the mess and coherence of a given sequence.
    And will give up a particular code page after 20% of measured mess. Those criteria are customizable at will.
    The preemptive behavior DOES NOT replace the traditional detection workflow, it prioritize a particular code page
    but never take it for granted. Can improve the performance.
    You may want to focus your attention to some code page or/and not others, use cp_isolation and cp_exclusion for that
    purpose.
    This function will strip the SIG in the payload/sequence every time except on UTF-16, UTF-32.
    By default the library does not setup any handler other than the NullHandler, if you choose to set the 'explain'
    toggle to True it will alter the logger configuration to add a StreamHandler that is suitable for debugging.
    Custom logging format and handler can be set manually.
    """
    if not isinstance(sequences, (bytearray, bytes)):
        raise TypeError(
            "Expected object of type bytes or bytearray, got: {0}".format(
                type(sequences)
            )
        )
    if explain:
        previous_logger_level: int = logger.level
        logger.addHandler(explain_handler)
        logger.setLevel(TRACE)
    length: int = len(sequences)
    if length == 0:
        logger.debug("Encoding detection on empty bytes, assuming utf_8 intention.")
        if explain:
            logger.removeHandler(explain_handler)
            logger.setLevel(previous_logger_level or logging.WARNING)
        return CharsetMatches([CharsetMatch(sequences, "utf_8", 0.0, False, [], "")])
    if cp_isolation is not None:
        logger.log(
            TRACE,
            "cp_isolation is set. use this flag for debugging purpose. "
            "limited list of encoding allowed : %s.",
            ", ".join(cp_isolation),
        )
        cp_isolation = [iana_name(cp, False) for cp in cp_isolation]
    else:
        cp_isolation = []
    if cp_exclusion is not None:
        logger.log(
            TRACE,
            "cp_exclusion is set. use this flag for debugging purpose. "
            "limited list of encoding excluded : %s.",
            ", ".join(cp_exclusion),
        )
        cp_exclusion = [iana_name(cp, False) for cp in cp_exclusion]
    else:
        cp_exclusion = []
    if length <= (chunk_size * steps):
        logger.log(
            TRACE,
            "override steps (%i) and chunk_size (%i) as content does not fit (%i byte(s) given) parameters.",
            steps,
            chunk_size,
            length,
        )
        steps = 1
        chunk_size = length
    if steps > 1 and length / steps < chunk_size:
        chunk_size = int(length / steps)
    is_too_small_sequence: bool = len(sequences) < TOO_SMALL_SEQUENCE
    is_too_large_sequence: bool = len(sequences) >= TOO_BIG_SEQUENCE
    if is_too_small_sequence:
        logger.log(
            TRACE,
            "Trying to detect encoding from a tiny portion of ({}) byte(s).".format(
                length
            ),
        )
    elif is_too_large_sequence:
        logger.log(
            TRACE,
            "Using lazy str decoding because the payload is quite large, ({}) byte(s).".format(
                length
            ),
        )
    prioritized_encodings: List[str] = []
    specified_encoding: Optional[str] = (
        any_specified_encoding(sequences) if preemptive_behaviour else None
    )
    if specified_encoding is not None:
        prioritized_encodings.append(specified_encoding)
        logger.log(
            TRACE,
            "Detected declarative mark in sequence. Priority +1 given for %s.",
            specified_encoding,
        )
    tested: Set[str] = set()
    tested_but_hard_failure: List[str] = []
    tested_but_soft_failure: List[str] = []
    fallback_ascii: Optional[CharsetMatch] = None
    fallback_u8: Optional[CharsetMatch] = None
    fallback_specified: Optional[CharsetMatch] = None
    results: CharsetMatches = CharsetMatches()
    sig_encoding, sig_payload = identify_sig_or_bom(sequences)
    if sig_encoding is not None:
        prioritized_encodings.append(sig_encoding)
        logger.log(
            TRACE,
            "Detected a SIG or BOM mark on first %i byte(s). Priority +1 given for %s.",
            len(sig_payload),
            sig_encoding,
        )
    prioritized_encodings.append("ascii")
    if "utf_8" not in prioritized_encodings:
        prioritized_encodings.append("utf_8")
    for encoding_iana in prioritized_encodings + IANA_SUPPORTED:
        if cp_isolation and encoding_iana not in cp_isolation:
            continue
        if cp_exclusion and encoding_iana in cp_exclusion:
            continue
        if encoding_iana in tested:
            continue
        tested.add(encoding_iana)
        decoded_payload: Optional[str] = None
        bom_or_sig_available: bool = sig_encoding == encoding_iana
        strip_sig_or_bom: bool = bom_or_sig_available and should_strip_sig_or_bom(
            encoding_iana
        )
        if encoding_iana in {"utf_16", "utf_32"} and not bom_or_sig_available:
            logger.log(
                TRACE,
                "Encoding %s won't be tested as-is because it require a BOM. Will try some sub-encoder LE/BE.",
                encoding_iana,
            )
            continue
        if encoding_iana in {"utf_7"} and not bom_or_sig_available:
            logger.log(
                TRACE,
                "Encoding %s won't be tested as-is because detection is unreliable without BOM/SIG.",
                encoding_iana,
            )
            continue
        try:
            is_multi_byte_decoder: bool = is_multi_byte_encoding(encoding_iana)
        except (ModuleNotFoundError, ImportError):
            logger.log(
                TRACE,
                "Encoding %s does not provide an IncrementalDecoder",
                encoding_iana,
            )
            continue
        try:
            if is_too_large_sequence and is_multi_byte_decoder is False:
                str(
                    sequences[: int(50e4)]
                    if strip_sig_or_bom is False
                    else sequences[len(sig_payload) : int(50e4)],
                    encoding=encoding_iana,
                )
            else:
                decoded_payload = str(
                    sequences
                    if strip_sig_or_bom is False
                    else sequences[len(sig_payload) :],
                    encoding=encoding_iana,
                )
        except (UnicodeDecodeError, LookupError) as e:
            if not isinstance(e, LookupError):
                logger.log(
                    TRACE,
                    "Code page %s does not fit given bytes sequence at ALL. %s",
                    encoding_iana,
                    str(e),
                )
            tested_but_hard_failure.append(encoding_iana)
            continue
        similar_soft_failure_test: bool = False
        for encoding_soft_failed in tested_but_soft_failure:
            if is_cp_similar(encoding_iana, encoding_soft_failed):
                similar_soft_failure_test = True
                break
        if similar_soft_failure_test:
            logger.log(
                TRACE,
                "%s is deemed too similar to code page %s and was consider unsuited already. Continuing!",
                encoding_iana,
                encoding_soft_failed,
            )
            continue
        r_ = range(
            0 if not bom_or_sig_available else len(sig_payload),
            length,
            int(length / steps),
        )
        multi_byte_bonus: bool = (
            is_multi_byte_decoder
            and decoded_payload is not None
            and len(decoded_payload) < length
        )
        if multi_byte_bonus:
            logger.log(
                TRACE,
                "Code page %s is a multi byte encoding table and it appear that at least one character "
                "was encoded using n-bytes.",
                encoding_iana,
            )
        max_chunk_gave_up: int = int(len(r_) / 4)
        max_chunk_gave_up = max(max_chunk_gave_up, 2)
        early_stop_count: int = 0
        lazy_str_hard_failure = False
        md_chunks: List[str] = []
        md_ratios = []
        try:
            for chunk in cut_sequence_chunks(
                sequences,
                encoding_iana,
                r_,
                chunk_size,
                bom_or_sig_available,
                strip_sig_or_bom,
                sig_payload,
                is_multi_byte_decoder,
                decoded_payload,
            ):
                md_chunks.append(chunk)
                md_ratios.append(
                    mess_ratio(
                        chunk,
                        threshold,
                        explain is True and 1 <= len(cp_isolation) <= 2,
                    )
                )
                if md_ratios[-1] >= threshold:
                    early_stop_count += 1
                if (early_stop_count >= max_chunk_gave_up) or (
                    bom_or_sig_available and strip_sig_or_bom is False
                ):
                    break
        except (
            UnicodeDecodeError
        ) as e:  # Lazy str loading may have missed something there
            logger.log(
                TRACE,
                "LazyStr Loading: After MD chunk decode, code page %s does not fit given bytes sequence at ALL. %s",
                encoding_iana,
                str(e),
            )
            early_stop_count = max_chunk_gave_up
            lazy_str_hard_failure = True
        # We might want to check the sequence again with the whole content
        # Only if initial MD tests passes
        if (
            not lazy_str_hard_failure
            and is_too_large_sequence
            and not is_multi_byte_decoder
        ):
            try:
                sequences[int(50e3) :].decode(encoding_iana, errors="strict")
            except UnicodeDecodeError as e:
                logger.log(
                    TRACE,
                    "LazyStr Loading: After final lookup, code page %s does not fit given bytes sequence at ALL. %s",
                    encoding_iana,
                    str(e),
                )
                tested_but_hard_failure.append(encoding_iana)
                continue
        mean_mess_ratio: float = sum(md_ratios) / len(md_ratios) if md_ratios else 0.0
        if mean_mess_ratio >= threshold or early_stop_count >= max_chunk_gave_up:
            tested_but_soft_failure.append(encoding_iana)
            logger.log(
                TRACE,
                "%s was excluded because of initial chaos probing. Gave up %i time(s). "
                "Computed mean chaos is %f %%.",
                encoding_iana,
                early_stop_count,
                round(mean_mess_ratio * 100, ndigits=3),
            )
            # Preparing those fallbacks in case we got nothing.
            if (
                enable_fallback
                and encoding_iana in ["ascii", "utf_8", specified_encoding]
                and not lazy_str_hard_failure
            ):
                fallback_entry = CharsetMatch(
                    sequences, encoding_iana, threshold, False, [], decoded_payload
                )
                if encoding_iana == specified_encoding:
                    fallback_specified = fallback_entry
                elif encoding_iana == "ascii":
                    fallback_ascii = fallback_entry
                else:
                    fallback_u8 = fallback_entry
            continue
        logger.log(
            TRACE,
            "%s passed initial chaos probing. Mean measured chaos is %f %%",
            encoding_iana,
            round(mean_mess_ratio * 100, ndigits=3),
        )
        if not is_multi_byte_decoder:
            target_languages: List[str] = encoding_languages(encoding_iana)
        else:
            target_languages = mb_encoding_languages(encoding_iana)
        if target_languages:
            logger.log(
                TRACE,
                "{} should target any language(s) of {}".format(
                    encoding_iana, str(target_languages)
                ),
            )
        cd_ratios = []
        # We shall skip the CD when its about ASCII
        # Most of the time its not relevant to run "language-detection" on it.
        if encoding_iana != "ascii":
            for chunk in md_chunks:
                chunk_languages = coherence_ratio(
                    chunk,
                    language_threshold,
                    ",".join(target_languages) if target_languages else None,
                )
                cd_ratios.append(chunk_languages)
        cd_ratios_merged = merge_coherence_ratios(cd_ratios)
        if cd_ratios_merged:
            logger.log(
                TRACE,
                "We detected language {} using {}".format(
                    cd_ratios_merged, encoding_iana
                ),
            )
        results.append(
            CharsetMatch(
                sequences,
                encoding_iana,
                mean_mess_ratio,
                bom_or_sig_available,
                cd_ratios_merged,
                decoded_payload,
            )
        )
        if (
            encoding_iana in [specified_encoding, "ascii", "utf_8"]
            and mean_mess_ratio < 0.1
        ):
            logger.debug(
                "Encoding detection: %s is most likely the one.", encoding_iana
            )
            if explain:
                logger.removeHandler(explain_handler)
                logger.setLevel(previous_logger_level)
            return CharsetMatches([results[encoding_iana]])
        if encoding_iana == sig_encoding:
            logger.debug(
                "Encoding detection: %s is most likely the one as we detected a BOM or SIG within "
                "the beginning of the sequence.",
                encoding_iana,
            )
            if explain:
                logger.removeHandler(explain_handler)
                logger.setLevel(previous_logger_level)
            return CharsetMatches([results[encoding_iana]])
    if len(results) == 0:
        if fallback_u8 or fallback_ascii or fallback_specified:
            logger.log(
                TRACE,
                "Nothing got out of the detection process. Using ASCII/UTF-8/Specified fallback.",
            )
        if fallback_specified:
            logger.debug(
                "Encoding detection: %s will be used as a fallback match",
                fallback_specified.encoding,
            )
            results.append(fallback_specified)
        elif (
            (fallback_u8 and fallback_ascii is None)
            or (
                fallback_u8
                and fallback_ascii
                and fallback_u8.fingerprint != fallback_ascii.fingerprint
            )
            or (fallback_u8 is not None)
        ):
            logger.debug("Encoding detection: utf_8 will be used as a fallback match")
            results.append(fallback_u8)
        elif fallback_ascii:
            logger.debug("Encoding detection: ascii will be used as a fallback match")
            results.append(fallback_ascii)
    if results:
        logger.debug(
            "Encoding detection: Found %s as plausible (best-candidate) for content. With %i alternatives.",
            results.best().encoding,  # type: ignore
            len(results) - 1,
        )
    else:
        logger.debug("Encoding detection: Unable to determine any suitable charset.")
    if explain:
        logger.removeHandler(explain_handler)
        logger.setLevel(previous_logger_level)
    return results
 def from_fp(
    fp: BinaryIO,
    steps: int = 5,
    chunk_size: int = 512,
    threshold: float = 0.20,
    cp_isolation: Optional[List[str]] = None,
    cp_exclusion: Optional[List[str]] = None,
    preemptive_behaviour: bool = True,
    explain: bool = False,
    language_threshold: float = 0.1,
    enable_fallback: bool = True,
 ) -> CharsetMatches:
    """
    Run the detection on the content of an already opened binary file pointer.

    Whatever fp.read() returns is handed to from_bytes together with the
    detection settings, which are forwarded untouched.
    The file pointer is not closed here; that stays the caller's job.
    """
    payload = fp.read()
    return from_bytes(
        payload,
        steps=steps,
        chunk_size=chunk_size,
        threshold=threshold,
        cp_isolation=cp_isolation,
        cp_exclusion=cp_exclusion,
        preemptive_behaviour=preemptive_behaviour,
        explain=explain,
        language_threshold=language_threshold,
        enable_fallback=enable_fallback,
    )
 def from_path(
    path: Union[str, bytes, PathLike],  # type: ignore[type-arg]
    steps: int = 5,
    chunk_size: int = 512,
    threshold: float = 0.20,
    cp_isolation: Optional[List[str]] = None,
    cp_exclusion: Optional[List[str]] = None,
    preemptive_behaviour: bool = True,
    explain: bool = False,
    language_threshold: float = 0.1,
    enable_fallback: bool = True,
 ) -> CharsetMatches:
    """
    Open the file located at the given path in binary mode and run the detection on it.

    This is from_fp with one extra step: the file is opened here and closed
    again once the detection is done. Every setting is forwarded untouched.
    Can raise IOError when the file cannot be opened or read.
    """
    with open(path, "rb") as binary_stream:
        matches = from_fp(
            binary_stream,
            steps=steps,
            chunk_size=chunk_size,
            threshold=threshold,
            cp_isolation=cp_isolation,
            cp_exclusion=cp_exclusion,
            preemptive_behaviour=preemptive_behaviour,
            explain=explain,
            language_threshold=language_threshold,
            enable_fallback=enable_fallback,
        )
    return matches
 def is_binary(
    fp_or_path_or_payload: Union[PathLike, str, BinaryIO, bytes],  # type: ignore[type-arg]
    steps: int = 5,
    chunk_size: int = 512,
    threshold: float = 0.20,
    cp_isolation: Optional[List[str]] = None,
    cp_exclusion: Optional[List[str]] = None,
    preemptive_behaviour: bool = True,
    explain: bool = False,
    language_threshold: float = 0.1,
    enable_fallback: bool = False,
 ) -> bool:
    """
    Tell whether the given input (a path, raw bytes or an opened binary file) is binary, aka. not a string.

    The input is routed to from_path, from_bytes or from_fp depending on its type and the answer is
    True when that detection yields no guess. Settings and defaults mirror those functions, at the
    sole exception of enable_fallback which defaults to False here, to be stricter around content
    that is ASCII-compatible but unlikely to be a string.
    """
    # Select the entry point that matches the kind of input we were handed.
    if isinstance(fp_or_path_or_payload, (str, PathLike)):
        detect = from_path
    elif isinstance(fp_or_path_or_payload, (bytes, bytearray)):
        detect = from_bytes
    else:
        detect = from_fp

    guesses = detect(
        fp_or_path_or_payload,
        steps=steps,
        chunk_size=chunk_size,
        threshold=threshold,
        cp_isolation=cp_isolation,
        cp_exclusion=cp_exclusion,
        preemptive_behaviour=preemptive_behaviour,
        explain=explain,
        language_threshold=language_threshold,
        enable_fallback=enable_fallback,
    )

    # An empty set of guesses means the content is considered binary.
    return not guesses
--- a/venv/lib/python3.12/site-packages/charset_normalizer/cd.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/cd.py
@ -0,0 +1,395 @@
 import importlib
 from codecs import IncrementalDecoder
 from collections import Counter
 from functools import lru_cache
 from typing import Counter as TypeCounter, Dict, List, Optional, Tuple
 from .constant import (
    FREQUENCIES,
    KO_NAMES,
    LANGUAGE_SUPPORTED_COUNT,
    TOO_SMALL_SEQUENCE,
    ZH_NAMES,
 )
 from .md import is_suspiciously_successive_range
 from .models import CoherenceMatches
 from .utils import (
    is_accentuated,
    is_latin,
    is_multi_byte_encoding,
    is_unicode_range_secondary,
    unicode_range,
 )
 def encoding_unicode_range(iana_name: str) -> List[str]:
    """
    List the unicode ranges a single byte code page mostly maps to.

    Every byte value from 0x40 up to 0xFE is decoded on its own with the codec's
    IncrementalDecoder (errors ignored). Ranges flagged as secondary are left out,
    and only the ranges holding at least 15% of the counted characters are
    returned, sorted by name.
    Raises IOError when the code page is a multi-byte one.
    """
    if is_multi_byte_encoding(iana_name):
        raise IOError("Function not supported on multi-byte code page")

    codec_module = importlib.import_module("encodings.{}".format(iana_name))
    byte_decoder: IncrementalDecoder = codec_module.IncrementalDecoder(
        errors="ignore"
    )

    range_hits: Dict[str, int] = {}
    counted_characters: int = 0

    for byte_value in range(0x40, 0xFF):
        decoded: str = byte_decoder.decode(bytes([byte_value]))
        if not decoded:
            continue

        detected_range: Optional[str] = unicode_range(decoded)
        if detected_range is None:
            continue
        if is_unicode_range_secondary(detected_range) is not False:
            continue

        range_hits[detected_range] = range_hits.get(detected_range, 0) + 1
        counted_characters += 1

    dominant_ranges = [
        range_name
        for range_name, hits in range_hits.items()
        if hits / counted_characters >= 0.15
    ]
    dominant_ranges.sort()
    return dominant_ranges
 def unicode_range_languages(primary_range: str) -> List[str]:
    """
    List the languages that can be inferred from a unicode range.

    A language is kept as soon as one character of its FREQUENCIES entry
    belongs to the given range. Languages come out in FREQUENCIES order.
    """
    return [
        language
        for language, characters in FREQUENCIES.items()
        if any(unicode_range(character) == primary_range for character in characters)
    ]
@lru_cache()
def encoding_languages(iana_name: str) -> List[str]:
    """
    Associate a single-byte code page with the language(s) it is heavily linked to.

    The first unicode range of the code page whose name does not contain "Latin"
    decides which languages are returned. When every range is a Latin one
    (or there is none), the generic ["Latin Based"] marker is returned instead.
    """
    for candidate_range in encoding_unicode_range(iana_name):
        if "Latin" not in candidate_range:
            return unicode_range_languages(candidate_range)

    return ["Latin Based"]
@lru_cache()
def mb_encoding_languages(iana_name: str) -> List[str]:
    """
    Associate a multi-byte code page with the language it is heavily linked to.

    The decision is made on the code page name only: known prefixes / names map to
    Japanese, Chinese or Korean. An empty list is returned for any other code page.
    """
    japanese_prefixes = ("shift_", "iso2022_jp", "euc_j")

    if iana_name.startswith(japanese_prefixes) or iana_name == "cp932":
        return ["Japanese"]

    if iana_name.startswith("gb") or iana_name in ZH_NAMES:
        return ["Chinese"]

    if iana_name.startswith("iso2022_kr") or iana_name in KO_NAMES:
        return ["Korean"]

    return []
@lru_cache(maxsize=LANGUAGE_SUPPORTED_COUNT)
def get_target_features(language: str) -> Tuple[bool, bool]:
    """
    Summarize a supported language with two flags computed over its FREQUENCIES entry:
    whether at least one character is accentuated, and whether no character at all
    is reported as non-latin.
    """
    alphabet = FREQUENCIES[language]

    target_have_accents: bool = any(is_accentuated(letter) for letter in alphabet)
    target_pure_latin: bool = not any(is_latin(letter) is False for letter in alphabet)

    return target_have_accents, target_pure_latin
 def alphabet_languages(
    characters: List[str], ignore_non_latin: bool = False
 ) -> List[str]:
    """
    List the languages compatible with the given characters, best match first.

    A language is discarded when it is not pure Latin while ignore_non_latin is set,
    or when it has no accentuated character while the given characters do.
    It is kept when at least 20% of its FREQUENCIES characters appear in the input.
    """
    scored: List[Tuple[str, float]] = []
    source_have_accents = any(is_accentuated(character) for character in characters)

    for language, language_characters in FREQUENCIES.items():
        target_have_accents, target_pure_latin = get_target_features(language)

        latin_mismatch = ignore_non_latin and target_pure_latin is False
        accent_mismatch = target_have_accents is False and source_have_accents
        if latin_mismatch or accent_mismatch:
            continue

        matched: int = sum(1 for c in language_characters if c in characters)
        ratio: float = matched / len(language_characters)

        if ratio >= 0.2:
            scored.append((language, ratio))

    scored.sort(key=lambda entry: entry[1], reverse=True)
    return [language for language, _ in scored]
 def characters_popularity_compare(
    language: str, ordered_characters: List[str]
 ) -> float:
    """
    Determine if an ordered characters list (by occurrence, from most frequent to rarest) matches a particular language.

    The result is a ratio between 0. (absolutely no correspondence) and 1. (near perfect fit).
    Beware that this function is not strict on the match in order to ease the detection. (Meaning close match is 1.)

    :param language: A key of FREQUENCIES.
    :param ordered_characters: Characters sorted from the most to the least frequent.
    :return: Approved characters divided by the number of given characters; 0. for an empty list.
    :raises ValueError: When the language is not available in FREQUENCIES.
    """
    if language not in FREQUENCIES:
        raise ValueError("{} not available".format(language))

    ordered_characters_count: int = len(ordered_characters)

    # Nothing to compare: answer "no correspondence" instead of dividing by zero below.
    if ordered_characters_count == 0:
        return 0.0

    language_characters: List[str] = FREQUENCIES[language]
    target_language_characters_count: int = len(language_characters)
    large_alphabet: bool = target_language_characters_count > 26

    # Rank of the first occurrence of each character, i.e. what list.index() would
    # answer, computed once instead of rescanning the list for every character.
    rank_in_language: Dict[str, int] = {}
    for language_rank, language_character in enumerate(language_characters):
        rank_in_language.setdefault(language_character, language_rank)

    # Scale factor projecting a rank in the source onto the language alphabet (loop invariant).
    expected_projection_ratio: float = (
        target_language_characters_count / ordered_characters_count
    )

    character_approved_count: int = 0

    for character_rank, character in enumerate(ordered_characters):
        character_rank_in_language = rank_in_language.get(character)
        if character_rank_in_language is None:
            continue

        character_rank_projection: int = int(character_rank * expected_projection_ratio)
        rank_distance: int = abs(character_rank_projection - character_rank_in_language)

        # Small alphabets: a character too far away from its expected rank is rejected.
        if not large_alphabet and rank_distance > 4:
            continue

        # Large alphabets: being within a third of the alphabet is good enough.
        if large_alphabet and rank_distance < target_language_characters_count / 3:
            character_approved_count += 1
            continue

        characters_before_source: List[str] = language_characters[
            0:character_rank_in_language
        ]
        characters_after_source: List[str] = language_characters[
            character_rank_in_language:
        ]
        characters_before: List[str] = ordered_characters[0:character_rank]
        characters_after: List[str] = ordered_characters[character_rank:]

        before_match_count: int = len(
            set(characters_before) & set(characters_before_source)
        )
        after_match_count: int = len(
            set(characters_after) & set(characters_after_source)
        )

        # The two guards below also keep the divisions that follow away from a zero length.
        if len(characters_before_source) == 0 and before_match_count <= 4:
            character_approved_count += 1
            continue

        if len(characters_after_source) == 0 and after_match_count <= 4:
            character_approved_count += 1
            continue

        if (
            before_match_count / len(characters_before_source) >= 0.4
            or after_match_count / len(characters_after_source) >= 0.4
        ):
            character_approved_count += 1

    return character_approved_count / ordered_characters_count
 def alpha_unicode_split(decoded_sequence: str) -> List[str]:
    """
    Split a decoded text into one lower-cased string per alphabet / unicode range.
    Ex. English/Latin text holding a bit of Hebrew yields two items in the resulting list;
    one made of the latin letters and the other one of the hebrew letters.

    Non alphabetic characters and characters without a known unicode range are dropped.
    A character joins the first existing layer whose range is not suspiciously
    successive to its own range; otherwise it goes to the layer of its own range.
    """
    layer_buffers: Dict[str, List[str]] = {}

    for character in decoded_sequence:
        if character.isalpha() is False:
            continue

        character_range: Optional[str] = unicode_range(character)
        if character_range is None:
            continue

        # First compatible layer already discovered, falling back on the character's own range.
        target_range: str = next(
            (
                known_range
                for known_range in layer_buffers
                if is_suspiciously_successive_range(known_range, character_range)
                is False
            ),
            character_range,
        )

        layer_buffers.setdefault(target_range, []).append(character.lower())

    return ["".join(pieces) for pieces in layer_buffers.values()]
 def merge_coherence_ratios(results: List[CoherenceMatches]) -> CoherenceMatches:
    """
    Merge several outputs of the function coherence_ratio into a single one.
    Each language gets the mean of all its ratios, rounded to 4 digits, and the
    merged list is ordered from the highest to the lowest ratio.
    The return type is the same as coherence_ratio.
    """
    ratios_by_language: Dict[str, List[float]] = {}

    for chunk_matches in results:
        for language, ratio in chunk_matches:
            ratios_by_language.setdefault(language, []).append(ratio)

    averaged = [
        (language, round(sum(ratios) / len(ratios), 4))
        for language, ratios in ratios_by_language.items()
    ]
    averaged.sort(key=lambda entry: entry[1], reverse=True)

    return averaged
 def filter_alt_coherence_matches(results: CoherenceMatches) -> CoherenceMatches:
    """
    We shall NOT return "English—" in CoherenceMatches because it is an alternative
    of "English". This function only keeps the best match per language and removes
    the em-dash from its name.

    The em-dash is stripped from every entry, including an alternative that shows up
    without its canonical counterpart, so that no "Name—" ever leaves this function.
    Languages keep the order of their first appearance in the given results.

    :param results: (language, ratio) pairs, alternatives included.
    :return: A new list with one (language, best ratio) pair per canonical language.
    """
    best_ratio_by_language: Dict[str, float] = {}

    for language, ratio in results:
        canonical_name: str = language.replace("—", "")

        known_ratio = best_ratio_by_language.get(canonical_name)
        if known_ratio is None or ratio > known_ratio:
            best_ratio_by_language[canonical_name] = ratio

    return list(best_ratio_by_language.items())
@lru_cache(maxsize=2048)
def coherence_ratio(
    decoded_sequence: str, threshold: float = 0.1, lg_inclusion: Optional[str] = None
) -> CoherenceMatches:
    """
    Detect ANY language that can be identified in the given sequence, analysed layer by layer.
    A layer = the characters extracted for one alphabet / unicode range.

    lg_inclusion is an optional comma separated list of languages to test. The special
    entry "Latin Based" is not tested as a language; it restricts the automatic language
    lookup to pure Latin ones. Matches below the threshold are dropped and the result is
    ordered from the highest to the lowest ratio.
    """
    matches: List[Tuple[str, float]] = []
    strong_match_count: int = 0

    requested_languages = [] if lg_inclusion is None else lg_inclusion.split(",")

    ignore_non_latin: bool = "Latin Based" in requested_languages
    if ignore_non_latin:
        requested_languages.remove("Latin Based")

    for layer in alpha_unicode_split(decoded_sequence):
        ranked_characters = Counter(layer).most_common()

        layer_size: int = sum(occurrences for _, occurrences in ranked_characters)
        if layer_size <= TOO_SMALL_SEQUENCE:
            continue

        characters_by_popularity: List[str] = [
            character for character, _ in ranked_characters
        ]

        # Explicitly requested languages win over the ones guessed from the alphabet.
        candidate_languages = requested_languages or alphabet_languages(
            characters_by_popularity, ignore_non_latin
        )

        for language in candidate_languages:
            ratio: float = characters_popularity_compare(
                language, characters_by_popularity
            )

            if ratio < threshold:
                continue
            if ratio >= 0.8:
                strong_match_count += 1

            matches.append((language, round(ratio, 4)))

            # Three very good matches are enough for this layer.
            if strong_match_count >= 3:
                break

    return sorted(
        filter_alt_coherence_matches(matches),
        key=lambda entry: entry[1],
        reverse=True,
    )
--- a/venv/lib/python3.12/site-packages/charset_normalizer/cli/__init__.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/cli/__init__.py
@ -0,0 +1,6 @@
 # Re-export the command line helpers defined in the sibling __main__ module.
 from .__main__ import cli_detect, query_yes_no
 # Names made available by a star-import of this package.
 __all__ = (
    "cli_detect",
    "query_yes_no",
 )
--- a/venv/lib/python3.12/site-packages/charset_normalizer/cli/__main__.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/cli/__main__.py
@ -0,0 +1,296 @@
 import argparse
 import sys
 from json import dumps
 from os.path import abspath, basename, dirname, join, realpath
 from platform import python_version
 from typing import List, Optional
 from unicodedata import unidata_version
 import charset_normalizer.md as md_module
 from charset_normalizer import from_fp
 from charset_normalizer.models import CliDetectionResult
 from charset_normalizer.version import __version__
 def query_yes_no(question: str, default: str = "yes") -> bool:
    """Write a yes/no question on stdout, read the reply via input() and return it as a bool.

    "question" is the text presented to the user.
    "default" is the answer assumed when the user just hits <Enter>.
        It must be "yes" (the default), "no" or None (in which case
        the user has to type an explicit answer).

    Returns True for a "yes" answer and False for a "no" answer; the question is
    asked again until the reply is understood.
    Raises ValueError when "default" is none of the accepted values.

    Credit goes to (c) https://stackoverflow.com/questions/3041986/apt-command-line-interface-like-yes-no-input
    """
    answers = {"yes": True, "y": True, "ye": True, "no": False, "n": False}

    if default is None:
        hint = " [y/n] "
    else:
        for accepted_default, accepted_hint in (("yes", " [Y/n] "), ("no", " [y/N] ")):
            if default == accepted_default:
                hint = accepted_hint
                break
        else:
            raise ValueError("invalid default answer: '%s'" % default)

    retry_notice = "Please respond with 'yes' or 'no' (or 'y' or 'n').\n"

    while True:
        sys.stdout.write(question + hint)
        reply = input().lower()

        # An empty reply falls back on the default, when there is one.
        if reply == "" and default is not None:
            return answers[default]
        if reply in answers:
            return answers[reply]

        sys.stdout.write(retry_notice)
 def cli_detect(argv: Optional[List[str]] = None) -> int:
    """
    CLI assistant using ARGV and ArgumentParser
    :param argv:
    :return: 0 if everything is fine, anything else equal trouble
    """
    parser = argparse.ArgumentParser(
        description="The Real First Universal Charset Detector. "
        "Discover originating encoding used on text file. "
        "Normalize text to unicode."
    )
    parser.add_argument(
        "files", type=argparse.FileType("rb"), nargs="+", help="File(s) to be analysed"
    )
    parser.add_argument(
        "-v",
        "--verbose",
        action="store_true",
        default=False,
        dest="verbose",
        help="Display complementary information about file if any. "
        "Stdout will contain logs about the detection process.",
    )
    parser.add_argument(
        "-a",
        "--with-alternative",
        action="store_true",
        default=False,
        dest="alternatives",
        help="Output complementary possibilities if any. Top-level JSON WILL be a list.",
    )
    parser.add_argument(
        "-n",
        "--normalize",
        action="store_true",
        default=False,
        dest="normalize",
        help="Permit to normalize input file. If not set, program does not write anything.",
    )
    parser.add_argument(
        "-m",
        "--minimal",
        action="store_true",
        default=False,
        dest="minimal",
        help="Only output the charset detected to STDOUT. Disabling JSON output.",
    )
    parser.add_argument(
        "-r",
        "--replace",
        action="store_true",
        default=False,
        dest="replace",
        help="Replace file when trying to normalize it instead of creating a new one.",
    )
    parser.add_argument(
        "-f",
        "--force",
        action="store_true",
        default=False,
        dest="force",
        help="Replace file without asking if you are sure, use this flag with caution.",
    )
    parser.add_argument(
        "-t",
        "--threshold",
        action="store",
        default=0.2,
        type=float,
        dest="threshold",
        help="Define a custom maximum amount of chaos allowed in decoded content. 0. <= chaos <= 1.",
    )
    parser.add_argument(
        "--version",
        action="version",
        version="Charset-Normalizer {} - Python {} - Unicode {} - SpeedUp {}".format(
            __version__,
            python_version(),
            unidata_version,
            "OFF" if md_module.__file__.lower().endswith(".py") else "ON",
        ),
        help="Show version information and exit.",
    )
    args = parser.parse_args(argv)
    if args.replace is True and args.normalize is False:
        print("Use --replace in addition of --normalize only.", file=sys.stderr)
        return 1
    if args.force is True and args.replace is False:
        print("Use --force in addition of --replace only.", file=sys.stderr)
        return 1
    if args.threshold < 0.0 or args.threshold > 1.0:
        print("--threshold VALUE should be between 0. AND 1.", file=sys.stderr)
        return 1
    x_ = []
    for my_file in args.files:
        matches = from_fp(my_file, threshold=args.threshold, explain=args.verbose)
        best_guess = matches.best()
        if best_guess is None:
            print(
                'Unable to identify originating encoding for "{}". {}'.format(
                    my_file.name,
                    "Maybe try increasing maximum amount of chaos."
                    if args.threshold < 1.0
                    else "",
                ),
                file=sys.stderr,
            )
            x_.append(
                CliDetectionResult(
                    abspath(my_file.name),
                    None,
                    [],
                    [],
                    "Unknown",
                    [],
                    False,
                    1.0,
                    0.0,
                    None,
                    True,
                )
            )
        else:
            x_.append(
                CliDetectionResult(
                    abspath(my_file.name),
                    best_guess.encoding,
                    best_guess.encoding_aliases,
                    [
                        cp
                        for cp in best_guess.could_be_from_charset
                        if cp != best_guess.encoding
                    ],
                    best_guess.language,
                    best_guess.alphabets,
                    best_guess.bom,
                    best_guess.percent_chaos,
                    best_guess.percent_coherence,
                    None,
                    True,
                )
            )
            if len(matches) > 1 and args.alternatives:
                for el in matches:
                    if el != best_guess:
                        x_.append(
                            CliDetectionResult(
                                abspath(my_file.name),
                                el.encoding,
                                el.encoding_aliases,
                                [
                                    cp
                                    for cp in el.could_be_from_charset
                                    if cp != el.encoding
                                ],
                                el.language,
                                el.alphabets,
                                el.bom,
                                el.percent_chaos,
                                el.percent_coherence,
                                None,
                                False,
                            )
                        )
            if args.normalize is True:
                if best_guess.encoding.startswith("utf") is True:
                    print(
                        '"{}" file does not need to be normalized, as it already came from unicode.'.format(
                            my_file.name
                        ),
                        file=sys.stderr,
                    )
                    if my_file.closed is False:
                        my_file.close()
                    continue
                dir_path = dirname(realpath(my_file.name))
                file_name = basename(realpath(my_file.name))
                o_: List[str] = file_name.split(".")
                if args.replace is False:
                    o_.insert(-1, best_guess.encoding)
                    if my_file.closed is False:
                        my_file.close()
                elif (
                    args.force is False
                    and query_yes_no(
                        'Are you sure to normalize "{}" by replacing it ?'.format(
                            my_file.name
                        ),
                        "no",
                    )
                    is False
                ):
                    if my_file.closed is False:
                        my_file.close()
                    continue
                try:
                    x_[0].unicode_path = join(dir_path, ".".join(o_))
                    with open(x_[0].unicode_path, "w", encoding="utf-8") as fp:
                        fp.write(str(best_guess))
                except IOError as e:
                    print(str(e), file=sys.stderr)
                    if my_file.closed is False:
                        my_file.close()
                    return 2
        if my_file.closed is False:
            my_file.close()
    if args.minimal is False:
        print(
            dumps(
                [el.__dict__ for el in x_] if len(x_) > 1 else x_[0].__dict__,
                ensure_ascii=True,
                indent=4,
            )
        )
    else:
        for my_file in args.files:
            print(
                ", ".join(
                    [
                        el.encoding or "undefined"
                        for el in x_
                        if el.path == abspath(my_file.name)
                    ]
                )
            )
    return 0
 if __name__ == "__main__":
    # cli_detect() returns the process exit status (0 on success, non-zero on
    # failure). Hand it to the interpreter instead of silently discarding it,
    # so that shell callers can detect failures.
    raise SystemExit(cli_detect())
--- a/venv/lib/python3.12/site-packages/charset_normalizer/cli/pycache/init.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/cli/pycache/init.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/cli/pycache/main.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/cli/pycache/main.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/charset_normalizer/constant.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/constant.py
--- a/venv/lib/python3.12/site-packages/charset_normalizer/legacy.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/legacy.py
@ -0,0 +1,54 @@
 from typing import Any, Dict, Optional, Union
 from warnings import warn
 from .api import from_bytes
 from .constant import CHARDET_CORRESPONDENCE
 def detect(
    byte_str: bytes, should_rename_legacy: bool = False, **kwargs: Any
 ) -> Dict[str, Optional[Union[str, float]]]:
    """
    chardet-compatible entry point (legacy API).

    Guess the encoding of ``byte_str`` and report it in the dictionary layout
    used by chardet: ``encoding``, ``language`` and ``confidence``.
    Any extra keyword argument is ignored, with a warning.

    :param byte_str:     The byte sequence to examine (bytes or bytearray).
    :param should_rename_legacy:  When False, an encoding name present in
                                  CHARDET_CORRESPONDENCE is replaced by the
                                  value mapped there.
    :return: ``encoding`` is None and ``confidence`` is None when nothing could
             be detected; ``language`` is an empty string when unknown.
    :raises TypeError: If ``byte_str`` is neither bytes nor bytearray.
    """
    if kwargs:
        ignored_arguments = ",".join(kwargs)
        warn(
            f"charset-normalizer disregard arguments '{ignored_arguments}' in legacy function detect()"
        )

    if not isinstance(byte_str, (bytearray, bytes)):
        raise TypeError(  # pragma: nocover
            "Expected object of type bytes or bytearray, got: "
            "{0}".format(type(byte_str))
        )

    payload = bytes(byte_str) if isinstance(byte_str, bytearray) else byte_str
    best_match = from_bytes(payload).best()

    if best_match is None:
        encoding, language, confidence = None, "", None
    else:
        encoding = best_match.encoding
        language = "" if best_match.language == "Unknown" else best_match.language
        confidence = 1.0 - best_match.chaos
        # The signature is stripped during detection, so 'utf_8' never carries
        # the '_sig' suffix on its own; chardet reports it, hence re-add it.
        if encoding == "utf_8" and best_match.bom:
            encoding += "_sig"

    if should_rename_legacy is False and encoding in CHARDET_CORRESPONDENCE:
        encoding = CHARDET_CORRESPONDENCE[encoding]

    return {
        "encoding": encoding,
        "language": language,
        "confidence": confidence,
    }
--- a/venv/lib/python3.12/site-packages/charset_normalizer/md.cpython-312-x86_64-linux-gnu.so
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/md.cpython-312-x86_64-linux-gnu.so
--- a/venv/lib/python3.12/site-packages/charset_normalizer/md.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/md.py
@ -0,0 +1,615 @@
 from functools import lru_cache
 from logging import getLogger
 from typing import List, Optional
 from .constant import (
    COMMON_SAFE_ASCII_CHARACTERS,
    TRACE,
    UNICODE_SECONDARY_RANGE_KEYWORD,
 )
 from .utils import (
    is_accentuated,
    is_arabic,
    is_arabic_isolated_form,
    is_case_variable,
    is_cjk,
    is_emoticon,
    is_hangul,
    is_hiragana,
    is_katakana,
    is_latin,
    is_punctuation,
    is_separator,
    is_symbol,
    is_thai,
    is_unprintable,
    remove_accent,
    unicode_range,
 )
 class MessDetectorPlugin:
    """
    Base abstract class used for mess detection plugins.
    All detectors MUST extend and implement the methods below.

    mess_ratio() instantiates every direct subclass (through __subclasses__()),
    passes each character to feed() whenever eligible() accepts it, and sums the
    ratio of all plugins.
    """
    def eligible(self, character: str) -> bool:
        """
        Determine if the given character should be fed in.

        :param character: A single decoded character.
        :return: True when feed() must be called with this character.
        """
        raise NotImplementedError  # pragma: nocover
    def feed(self, character: str) -> None:
        """
        The main routine to be executed upon a character.
        Insert the logic in which the text would be considered chaotic.

        :param character: A single decoded character accepted by eligible().
        """
        raise NotImplementedError  # pragma: nocover
    def reset(self) -> None:  # pragma: no cover
        """
        Reset the plugin to its initial state.
        """
        raise NotImplementedError
    @property
    def ratio(self) -> float:
        """
        Compute the chaos ratio based on what feed() has seen so far.
        Must NOT be lower than 0.; there is no upper bound.
        """
        raise NotImplementedError  # pragma: nocover
 class TooManySymbolOrPunctuationPlugin(MessDetectorPlugin):
    """
    Report text in which punctuation and symbols represent a large share of the
    printable characters.
    """

    def __init__(self) -> None:
        self._punctuation_count: int = 0
        self._symbol_count: int = 0
        self._character_count: int = 0
        self._last_printable_char: Optional[str] = None
        self._frenzy_symbol_in_word: bool = False

    def eligible(self, character: str) -> bool:
        """Only printable characters are taken into account."""
        return character.isprintable()

    def feed(self, character: str) -> None:
        """
        Count the character and, when relevant, weigh it as punctuation/symbol.

        A character identical to the previous one, or listed in
        COMMON_SAFE_ASCII_CHARACTERS, is counted but never weighed.
        """
        self._character_count += 1

        if (
            character != self._last_printable_char
            and character not in COMMON_SAFE_ASCII_CHARACTERS
        ):
            if is_punctuation(character):
                self._punctuation_count += 1
            elif (
                character.isdigit() is False
                and is_symbol(character)
                and is_emoticon(character) is False
            ):
                # Symbols weigh twice as much as punctuation.
                self._symbol_count += 2

        self._last_printable_char = character

    def reset(self) -> None:  # pragma: no cover
        """Restore every attribute to the value set by __init__."""
        self._punctuation_count = 0
        self._character_count = 0
        self._symbol_count = 0
        # These two were previously left untouched: a stale last character made
        # the first character fed after a reset look like a repetition.
        self._last_printable_char = None
        self._frenzy_symbol_in_word = False

    @property
    def ratio(self) -> float:
        """
        Weighted share of punctuation and symbols among counted characters.
        Anything below 0.3 is reported as 0.0.
        """
        if self._character_count == 0:
            return 0.0

        ratio_of_punctuation: float = (
            self._punctuation_count + self._symbol_count
        ) / self._character_count

        return ratio_of_punctuation if ratio_of_punctuation >= 0.3 else 0.0
 class TooManyAccentuatedPlugin(MessDetectorPlugin):
    """
    Report text whose alphabetic characters are accentuated to an unusual extent.
    """

    def __init__(self) -> None:
        self._character_count: int = 0
        self._accentuated_count: int = 0

    def eligible(self, character: str) -> bool:
        """Only alphabetic characters are inspected."""
        return character.isalpha()

    def feed(self, character: str) -> None:
        """Count the letter, and count it again separately when accentuated."""
        accentuated = is_accentuated(character)
        self._character_count += 1
        if accentuated:
            self._accentuated_count += 1

    def reset(self) -> None:  # pragma: no cover
        """Put both counters back to zero."""
        self._accentuated_count = 0
        self._character_count = 0

    @property
    def ratio(self) -> float:
        """
        Share of accentuated letters; 0.0 when fewer than 8 letters were seen
        or when the share is below 0.35.
        """
        seen = self._character_count
        if seen < 8:
            return 0.0

        accentuated_share: float = self._accentuated_count / seen
        if accentuated_share >= 0.35:
            return accentuated_share
        return 0.0
 class UnprintablePlugin(MessDetectorPlugin):
    """
    Report the presence of unprintable characters; each one weighs eight times
    in the resulting ratio.
    """

    def __init__(self) -> None:
        self._unprintable_count: int = 0
        self._character_count: int = 0

    def eligible(self, character: str) -> bool:
        """Every character is inspected."""
        return True

    def feed(self, character: str) -> None:
        """Count the character, and separately count it when unprintable."""
        if is_unprintable(character):
            self._unprintable_count += 1
        self._character_count += 1

    def reset(self) -> None:  # pragma: no cover
        """Restore both counters to zero."""
        self._unprintable_count = 0
        # Previously left untouched, which kept a stale denominator for the
        # ratio computed after a reset.
        self._character_count = 0

    @property
    def ratio(self) -> float:
        """Eight times the unprintable count over the number of characters seen."""
        if self._character_count == 0:
            return 0.0

        return (self._unprintable_count * 8) / self._character_count
 class SuspiciousDuplicateAccentPlugin(MessDetectorPlugin):
    """
    Report accentuated Latin letters that directly follow another accentuated
    Latin letter.
    """

    def __init__(self) -> None:
        self._successive_count: int = 0
        self._character_count: int = 0
        self._last_latin_character: Optional[str] = None

    def eligible(self, character: str) -> bool:
        """Only alphabetic Latin characters are inspected."""
        return character.isalpha() and is_latin(character)

    def feed(self, character: str) -> None:
        """
        Compare the letter with the previously fed one.

        A pair of accentuated letters scores one point when both are upper
        case, and one more when both share the same unaccented base letter.
        """
        self._character_count += 1
        previous = self._last_latin_character

        both_accentuated = (
            previous is not None
            and is_accentuated(character)
            and is_accentuated(previous)
        )
        if both_accentuated:
            if character.isupper() and previous.isupper():
                self._successive_count += 1
            # Worse if it is the same letter repeated with a different accent.
            if remove_accent(character) == remove_accent(previous):
                self._successive_count += 1

        self._last_latin_character = character

    def reset(self) -> None:  # pragma: no cover
        """Forget the previous letter and zero the counters."""
        self._last_latin_character = None
        self._character_count = 0
        self._successive_count = 0

    @property
    def ratio(self) -> float:
        """Twice the accumulated score over the number of letters seen."""
        seen = self._character_count
        if seen == 0:
            return 0.0
        return (self._successive_count * 2) / seen
 class SuspiciousRange(MessDetectorPlugin):
    """
    Report adjacent printable characters whose Unicode ranges are judged
    suspicious by is_suspiciously_successive_range().
    """

    def __init__(self) -> None:
        self._suspicious_successive_range_count: int = 0
        self._character_count: int = 0
        self._last_printable_seen: Optional[str] = None

    def eligible(self, character: str) -> bool:
        """Only printable characters are inspected."""
        return character.isprintable()

    def feed(self, character: str) -> None:
        """
        Count the character and compare its range with the previous one.

        Whitespace, punctuation and COMMON_SAFE_ASCII_CHARACTERS break the
        chain: the next character has no predecessor to be compared with.
        """
        self._character_count += 1

        breaks_chain = (
            character.isspace()
            or is_punctuation(character)
            or character in COMMON_SAFE_ASCII_CHARACTERS
        )
        if breaks_chain:
            self._last_printable_seen = None
            return

        previous = self._last_printable_seen
        if previous is not None and is_suspiciously_successive_range(
            unicode_range(previous), unicode_range(character)
        ):
            self._suspicious_successive_range_count += 1

        self._last_printable_seen = character

    def reset(self) -> None:  # pragma: no cover
        """Forget the previous character and zero the counters."""
        self._last_printable_seen = None
        self._suspicious_successive_range_count = 0
        self._character_count = 0

    @property
    def ratio(self) -> float:
        """
        Twice the suspicious pair count over the characters seen; 0.0 until
        more than 24 characters were fed.
        """
        seen = self._character_count
        if seen <= 24:
            return 0.0
        return (self._suspicious_successive_range_count * 2) / seen
 class SuperWeirdWordPlugin(MessDetectorPlugin):
    """
    Accumulate characters into words and report the share of characters that
    belong to words judged "bad" (too many accents, symbols inside the word,
    very long foreign-looking words, ...).
    """

    def __init__(self) -> None:
        self._word_count: int = 0
        self._bad_word_count: int = 0
        self._foreign_long_count: int = 0

        self._is_current_word_bad: bool = False
        self._foreign_long_watch: bool = False

        self._character_count: int = 0
        self._bad_character_count: int = 0

        self._buffer: str = ""
        self._buffer_accent_count: int = 0

    def eligible(self, character: str) -> bool:
        """Every character is inspected."""
        return True

    def feed(self, character: str) -> None:
        """
        Grow the current word with letters, close it on a space, punctuation or
        separator, and taint it when a symbol shows up inside it.
        """
        if character.isalpha():
            self._buffer += character
            if is_accentuated(character):
                self._buffer_accent_count += 1
            if (
                self._foreign_long_watch is False
                and (is_latin(character) is False or is_accentuated(character))
                and is_cjk(character) is False
                and is_hangul(character) is False
                and is_katakana(character) is False
                and is_hiragana(character) is False
                and is_thai(character) is False
            ):
                self._foreign_long_watch = True
            return

        # Nothing buffered: a non-letter cannot close or taint a word.
        if not self._buffer:
            return

        if character.isspace() or is_punctuation(character) or is_separator(character):
            self._word_count += 1
            buffer_length: int = len(self._buffer)

            self._character_count += buffer_length

            if buffer_length >= 4:
                if self._buffer_accent_count / buffer_length > 0.34:
                    self._is_current_word_bad = True
                # Word/Buffer ending with an upper case accentuated letter are so rare,
                # that we will consider them all as suspicious. Same weight as foreign_long suspicious.
                if (
                    is_accentuated(self._buffer[-1])
                    and self._buffer[-1].isupper()
                    and not all(letter.isupper() for letter in self._buffer)
                ):
                    self._foreign_long_count += 1
                    self._is_current_word_bad = True

            if buffer_length >= 24 and self._foreign_long_watch:
                # A long word with a few (at most 30%) upper case letters is
                # probably camelCased rather than garbage.
                uppercase_count = sum(1 for letter in self._buffer if letter.isupper())
                probable_camel_cased: bool = (
                    uppercase_count > 0 and uppercase_count / buffer_length <= 0.3
                )

                if not probable_camel_cased:
                    self._foreign_long_count += 1
                    self._is_current_word_bad = True

            if self._is_current_word_bad:
                self._bad_word_count += 1
                self._bad_character_count += buffer_length
                self._is_current_word_bad = False

            self._foreign_long_watch = False
            self._buffer = ""
            self._buffer_accent_count = 0
        elif (
            character not in {"<", ">", "-", "=", "~", "|", "_"}
            and character.isdigit() is False
            and is_symbol(character)
        ):
            self._is_current_word_bad = True
            self._buffer += character

    def reset(self) -> None:  # pragma: no cover
        """Restore every attribute to the value set by __init__."""
        self._buffer = ""
        # Previously left untouched: accents of an unfinished word leaked into
        # the first word fed after a reset.
        self._buffer_accent_count = 0
        self._is_current_word_bad = False
        self._foreign_long_watch = False
        self._bad_word_count = 0
        self._word_count = 0
        self._character_count = 0
        self._bad_character_count = 0
        self._foreign_long_count = 0

    @property
    def ratio(self) -> float:
        """
        Share of characters belonging to bad words. Returns 0.0 while at most
        10 words were seen and no foreign/long suspicious word was recorded.
        """
        if self._word_count <= 10 and self._foreign_long_count == 0:
            return 0.0

        return self._bad_character_count / self._character_count
 class CjkInvalidStopPlugin(MessDetectorPlugin):
    """
    GB (Chinese) based encodings often render the stop incorrectly when the content
    does not fit, which is easy to spot: look for an overuse of '丅' and '丄'.
    """

    def __init__(self) -> None:
        self._wrong_stop_count: int = 0
        self._cjk_character_count: int = 0

    def eligible(self, character: str) -> bool:
        """Every character is inspected."""
        return True

    def feed(self, character: str) -> None:
        """Count wrong stops and, separately, any other CJK character."""
        if character in {"丅", "丄"}:
            self._wrong_stop_count += 1
        elif is_cjk(character):
            self._cjk_character_count += 1

    def reset(self) -> None:  # pragma: no cover
        """Zero both counters."""
        self._cjk_character_count = 0
        self._wrong_stop_count = 0

    @property
    def ratio(self) -> float:
        """
        Wrong stops over CJK characters; 0.0 until at least 16 CJK characters
        were seen.
        """
        cjk_seen = self._cjk_character_count
        if cjk_seen < 16:
            return 0.0
        return self._wrong_stop_count / cjk_seen
 class ArchaicUpperLowerPlugin(MessDetectorPlugin):
    """
    Report chunks of case-variable letters in which upper and lower case keep
    alternating from one letter to the next.
    """
    def __init__(self) -> None:
        # True when the previous letter already flipped case; a second
        # consecutive flip is what gets scored.
        self._buf: bool = False
        # Number of characters accumulated in the chunk currently open.
        self._character_count_since_last_sep: int = 0
        # Score of the chunk currently open.
        self._successive_upper_lower_count: int = 0
        # Sum of the scores of the chunks that were retained.
        self._successive_upper_lower_count_final: int = 0
        # Every character fed, separators included.
        self._character_count: int = 0
        self._last_alpha_seen: Optional[str] = None
        # Stays True as long as the open chunk holds ASCII characters only.
        self._current_ascii_only: bool = True
    def eligible(self, character: str) -> bool:
        """Every character is inspected."""
        return True
    def feed(self, character: str) -> None:
        """
        Extend the open chunk with the character, or close the chunk when the
        character is not a case-variable letter.
        """
        is_concerned = character.isalpha() and is_case_variable(character)
        chunk_sep = is_concerned is False
        if chunk_sep and self._character_count_since_last_sep > 0:
            # Closing a chunk: its score is retained only when the chunk is at
            # most 64 characters long, is not closed by a digit and contains at
            # least one non-ASCII character.
            if (
                self._character_count_since_last_sep <= 64
                and character.isdigit() is False
                and self._current_ascii_only is False
            ):
                self._successive_upper_lower_count_final += (
                    self._successive_upper_lower_count
                )
            # Start over for the next chunk.
            self._successive_upper_lower_count = 0
            self._character_count_since_last_sep = 0
            self._last_alpha_seen = None
            self._buf = False
            self._character_count += 1
            self._current_ascii_only = True
            return
        # NOTE(review): a separator arriving while no chunk is open
        # (_character_count_since_last_sep == 0) reaches this point and is
        # handled as the first character of a new chunk - confirm this is intended.
        if self._current_ascii_only is True and character.isascii() is False:
            self._current_ascii_only = False
        if self._last_alpha_seen is not None:
            if (character.isupper() and self._last_alpha_seen.islower()) or (
                character.islower() and self._last_alpha_seen.isupper()
            ):
                # Case flipped. The first flip only arms _buf; a flip that
                # immediately follows another one scores 2 and disarms it.
                if self._buf is True:
                    self._successive_upper_lower_count += 2
                    self._buf = False
                else:
                    self._buf = True
            else:
                self._buf = False
        self._character_count += 1
        self._character_count_since_last_sep += 1
        self._last_alpha_seen = character
    def reset(self) -> None:  # pragma: no cover
        """Restore every attribute to the value set by __init__."""
        self._character_count = 0
        self._character_count_since_last_sep = 0
        self._successive_upper_lower_count = 0
        self._successive_upper_lower_count_final = 0
        self._last_alpha_seen = None
        self._buf = False
        self._current_ascii_only = True
    @property
    def ratio(self) -> float:
        """Retained score over the number of characters fed (0.0 when none)."""
        if self._character_count == 0:
            return 0.0
        return self._successive_upper_lower_count_final / self._character_count
 class ArabicIsolatedFormPlugin(MessDetectorPlugin):
    """
    Report Arabic text in which characters in isolated form are frequent.
    """

    def __init__(self) -> None:
        self._character_count: int = 0
        self._isolated_form_count: int = 0

    def eligible(self, character: str) -> bool:
        """Only Arabic characters are inspected."""
        return is_arabic(character)

    def feed(self, character: str) -> None:
        """Count the character, and count it separately when in isolated form."""
        self._character_count += 1
        if not is_arabic_isolated_form(character):
            return
        self._isolated_form_count += 1

    def reset(self) -> None:  # pragma: no cover
        """Zero both counters."""
        self._isolated_form_count = 0
        self._character_count = 0

    @property
    def ratio(self) -> float:
        """
        Isolated forms over Arabic characters seen; 0.0 until at least 8
        characters were fed.
        """
        seen = self._character_count
        if seen < 8:
            return 0.0
        return self._isolated_form_count / seen
@lru_cache(maxsize=1024)
def is_suspiciously_successive_range(
    unicode_range_a: Optional[str], unicode_range_b: Optional[str]
) -> bool:
    """
    Tell whether seeing these two Unicode ranges side by side is suspicious.

    An unknown (None) range is always suspicious. Otherwise a list of known
    harmless combinations is checked and anything left is suspicious.
    """
    if unicode_range_a is None or unicode_range_b is None:
        return True

    both = (unicode_range_a, unicode_range_b)

    def either_mentions(keyword: str) -> bool:
        return keyword in unicode_range_a or keyword in unicode_range_b

    if unicode_range_a == unicode_range_b:
        return False

    if all("Latin" in name for name in both):
        return False

    if either_mentions("Emoticons"):
        return False

    # Latin characters can be accompanied with a combining diacritical mark
    # eg. Vietnamese.
    if either_mentions("Latin") and either_mentions("Combining"):
        return False

    # Two ranges sharing a significant keyword are considered related.
    words_of_b = unicode_range_b.split(" ")
    for word in unicode_range_a.split(" "):
        if word not in UNICODE_SECONDARY_RANGE_KEYWORD and word in words_of_b:
            return False

    # Japanese Exception
    kana_ranges = ("Hiragana", "Katakana")
    a_is_kana = unicode_range_a in kana_ranges
    b_is_kana = unicode_range_b in kana_ranges
    cjk_involved = either_mentions("CJK")
    basic_latin_involved = "Basic Latin" in both

    if cjk_involved and (a_is_kana or b_is_kana):
        return False
    if a_is_kana and b_is_kana:
        return False

    if either_mentions("Hangul") and (cjk_involved or basic_latin_involved):
        return False

    # Chinese/Japanese use dedicated range for punctuation and/or separators.
    if cjk_involved or (a_is_kana and b_is_kana):
        if (
            either_mentions("Punctuation")
            or either_mentions("Forms")
            or basic_latin_involved
        ):
            return False

    return True
@lru_cache(maxsize=2048)
def mess_ratio(
    decoded_sequence: str, maximum_threshold: float = 0.2, debug: bool = False
) -> float:
    """
    Compute the mess ratio of an already decoded sequence.

    Every MessDetectorPlugin subclass is instantiated and fed character by
    character (a trailing line feed is appended). The plugin ratios are summed
    at regular intervals and the scan stops as soon as the sum reaches
    maximum_threshold. The result is rounded to three decimals.
    """
    detectors: List[MessDetectorPlugin] = [
        plugin_class() for plugin_class in MessDetectorPlugin.__subclasses__()
    ]

    length: int = len(decoded_sequence) + 1
    last_index: int = length - 1
    mean_mess_ratio: float = 0.0

    # How often (in characters) the intermediate sum is evaluated.
    checkpoint_step: int
    if length < 512:
        checkpoint_step = 32
    elif length <= 1024:
        checkpoint_step = 64
    else:
        checkpoint_step = 128

    for index, character in enumerate(decoded_sequence + "\n"):
        for detector in detectors:
            if detector.eligible(character):
                detector.feed(character)

        at_checkpoint = index > 0 and index % checkpoint_step == 0
        if not (at_checkpoint or index == last_index):
            continue

        mean_mess_ratio = sum(dt.ratio for dt in detectors)
        if mean_mess_ratio >= maximum_threshold:
            break

    if debug:
        logger = getLogger("charset_normalizer")

        logger.log(
            TRACE,
            "Mess-detector extended-analysis start. "
            f"intermediary_mean_mess_ratio_calc={checkpoint_step} mean_mess_ratio={mean_mess_ratio} "
            f"maximum_threshold={maximum_threshold}",
        )

        if len(decoded_sequence) > 16:
            logger.log(TRACE, f"Starting with: {decoded_sequence[:16]}")
            logger.log(TRACE, f"Ending with: {decoded_sequence[-16::]}")

        for dt in detectors:  # pragma: nocover
            logger.log(TRACE, f"{dt.__class__}: {dt.ratio}")

    return round(mean_mess_ratio, 3)
--- a/venv/lib/python3.12/site-packages/charset_normalizer/md__mypyc.cpython-312-x86_64-linux-gnu.so
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/md__mypyc.cpython-312-x86_64-linux-gnu.so
--- a/venv/lib/python3.12/site-packages/charset_normalizer/models.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/models.py
@ -0,0 +1,340 @@
 from encodings.aliases import aliases
 from hashlib import sha256
 from json import dumps
 from typing import Any, Dict, Iterator, List, Optional, Tuple, Union
 from .constant import TOO_BIG_SEQUENCE
 from .utils import iana_name, is_multi_byte_encoding, unicode_range
 class CharsetMatch:
    """
    One candidate decoding of a bytes payload.

    Stores the raw payload, the guessed encoding, its mess ("chaos") ratio, the
    detected languages with their scores, and the sub-matches registered through
    add_submatch().
    """

    def __init__(
        self,
        payload: bytes,
        guessed_encoding: str,
        mean_mess_ratio: float,
        has_sig_or_bom: bool,
        languages: "CoherenceMatches",
        decoded_payload: Optional[str] = None,
    ):
        """
        :param payload: Original bytes, kept untouched.
        :param guessed_encoding: Encoding name used to decode the payload.
        :param mean_mess_ratio: Mess ratio, exposed through the 'chaos' property.
        :param has_sig_or_bom: Whether a SIG/BOM was found, exposed through 'bom'.
        :param languages: (language, ratio) pairs; the first one is the most probable.
        :param decoded_payload: Already decoded text, if available (otherwise decoded lazily).
        """
        self._payload: bytes = payload
        self._encoding: str = guessed_encoding
        self._mean_mess_ratio: float = mean_mess_ratio
        self._languages: CoherenceMatches = languages
        self._has_sig_or_bom: bool = has_sig_or_bom
        self._unicode_ranges: Optional[List[str]] = None
        self._leaves: List[CharsetMatch] = []
        self._mean_coherence_ratio: float = 0.0
        self._output_payload: Optional[bytes] = None
        self._output_encoding: Optional[str] = None
        self._string: Optional[str] = decoded_payload

    def __eq__(self, other: object) -> bool:
        """
        Two matches are equal when they share the same encoding and fingerprint.
        Raise TypeError when compared with anything that is not a CharsetMatch.
        """
        if not isinstance(other, CharsetMatch):
            raise TypeError(
                "__eq__ cannot be invoked on {} and {}.".format(
                    str(other.__class__), str(self.__class__)
                )
            )
        return self.encoding == other.encoding and self.fingerprint == other.fingerprint

    def __lt__(self, other: object) -> bool:
        """
        Implemented to make sorted available upon CharsetMatches items.
        Raise ValueError when compared with anything that is not a CharsetMatch.
        """
        if not isinstance(other, CharsetMatch):
            raise ValueError
        chaos_difference: float = abs(self.chaos - other.chaos)
        coherence_difference: float = abs(self.coherence - other.coherence)
        # Below 1% difference --> Use Coherence
        if chaos_difference < 0.01 and coherence_difference > 0.02:
            return self.coherence > other.coherence
        elif chaos_difference < 0.01 and coherence_difference <= 0.02:
            # When having a difficult decision, use the result that decoded as many multi-byte as possible.
            # preserve RAM usage!
            if len(self._payload) >= TOO_BIG_SEQUENCE:
                return self.chaos < other.chaos
            return self.multi_byte_usage > other.multi_byte_usage
        return self.chaos < other.chaos

    @property
    def multi_byte_usage(self) -> float:
        """
        1.0 minus the ratio of decoded characters to raw bytes.
        An empty payload yields 0.0 instead of dividing by zero.
        """
        raw_length: int = len(self.raw)
        if raw_length == 0:
            return 0.0
        return 1.0 - (len(str(self)) / raw_length)

    def __str__(self) -> str:
        # Lazy Str Loading
        if self._string is None:
            self._string = str(self._payload, self._encoding, "strict")
        return self._string

    def __repr__(self) -> str:
        return "<CharsetMatch '{}' bytes({})>".format(self.encoding, self.fingerprint)

    def add_submatch(self, other: "CharsetMatch") -> None:
        """
        Register another match as a leaf of this one.
        Raise ValueError if it is not a CharsetMatch or if it equals this match.
        """
        if not isinstance(other, CharsetMatch) or other == self:
            raise ValueError(
                "Unable to add instance <{}> as a submatch of a CharsetMatch".format(
                    other.__class__
                )
            )
        other._string = None  # Unload RAM usage; dirty trick.
        self._leaves.append(other)

    @property
    def encoding(self) -> str:
        return self._encoding

    @property
    def encoding_aliases(self) -> List[str]:
        """
        Encoding name are known by many name, using this could help when searching for IBM855 when it's listed as CP855.
        """
        also_known_as: List[str] = []
        for u, p in aliases.items():
            if self.encoding == u:
                also_known_as.append(p)
            elif self.encoding == p:
                also_known_as.append(u)
        return also_known_as

    @property
    def bom(self) -> bool:
        return self._has_sig_or_bom

    @property
    def byte_order_mark(self) -> bool:
        return self._has_sig_or_bom

    @property
    def languages(self) -> List[str]:
        """
        Return the complete list of possible languages found in decoded sequence.
        Usually not really useful. Returned list may be empty even if 'language' property return something != 'Unknown'.
        """
        return [e[0] for e in self._languages]

    @property
    def language(self) -> str:
        """
        Most probable language found in decoded sequence. If none were detected or inferred, the property will return
        "Unknown".
        """
        if not self._languages:
            # Trying to infer the language based on the given encoding
            # Its either English or we should not pronounce ourselves in certain cases.
            if "ascii" in self.could_be_from_charset:
                return "English"
            # doing it there to avoid circular import
            from charset_normalizer.cd import encoding_languages, mb_encoding_languages

            languages = (
                mb_encoding_languages(self.encoding)
                if is_multi_byte_encoding(self.encoding)
                else encoding_languages(self.encoding)
            )
            if len(languages) == 0 or "Latin Based" in languages:
                return "Unknown"
            return languages[0]
        return self._languages[0][0]

    @property
    def chaos(self) -> float:
        return self._mean_mess_ratio

    @property
    def coherence(self) -> float:
        """Ratio of the first (most probable) language, or 0.0 when none was detected."""
        if not self._languages:
            return 0.0
        return self._languages[0][1]

    @property
    def percent_chaos(self) -> float:
        return round(self.chaos * 100, ndigits=3)

    @property
    def percent_coherence(self) -> float:
        return round(self.coherence * 100, ndigits=3)

    @property
    def raw(self) -> bytes:
        """
        Original untouched bytes.
        """
        return self._payload

    @property
    def submatch(self) -> List["CharsetMatch"]:
        return self._leaves

    @property
    def has_submatch(self) -> bool:
        return len(self._leaves) > 0

    @property
    def alphabets(self) -> List[str]:
        """Sorted, de-duplicated Unicode range names of the decoded text (cached after first use)."""
        if self._unicode_ranges is not None:
            return self._unicode_ranges
        # list detected ranges
        detected_ranges: List[Optional[str]] = [
            unicode_range(char) for char in str(self)
        ]
        # filter and sort
        self._unicode_ranges = sorted({r for r in detected_ranges if r})
        return self._unicode_ranges

    @property
    def could_be_from_charset(self) -> List[str]:
        """
        The complete list of encoding that output the exact SAME str result and therefore could be the originating
        encoding.
        This list does include the encoding available in property 'encoding'.
        """
        return [self._encoding] + [m.encoding for m in self._leaves]

    def output(self, encoding: str = "utf_8") -> bytes:
        """
        Method to get re-encoded bytes payload using given target encoding. Default to UTF-8.
        Characters the target encoding cannot represent are REPLACED by the encoder
        (error handler "replace"), they are not silently dropped.
        The last result is cached and reused while the same target encoding is requested.
        """
        if self._output_encoding is None or self._output_encoding != encoding:
            self._output_encoding = encoding
            self._output_payload = str(self).encode(encoding, "replace")
        return self._output_payload  # type: ignore

    @property
    def fingerprint(self) -> str:
        """
        Retrieve the unique SHA256 computed using the transformed (re-encoded) payload. Not the original one.
        """
        return sha256(self.output()).hexdigest()
 class CharsetMatches:
    """
    Sorted collection of CharsetMatch items, most probable first.
    Behaves like a read-mostly list but only implements a subset of the list protocol.
    """

    def __init__(self, results: Optional[List[CharsetMatch]] = None):
        self._results: List[CharsetMatch] = [] if not results else sorted(results)

    def __iter__(self) -> Iterator[CharsetMatch]:
        for match in self._results:
            yield match

    def __getitem__(self, item: Union[int, str]) -> CharsetMatch:
        """
        Fetch one match by position or by encoding name (aliases accepted).
        An out-of-range position raises IndexError; an encoding absent from the
        results, or any other kind of key, raises KeyError.
        """
        if isinstance(item, int):
            return self._results[item]
        if isinstance(item, str):
            wanted = iana_name(item, False)
            for candidate in self._results:
                if wanted in candidate.could_be_from_charset:
                    return candidate
        raise KeyError

    def __len__(self) -> int:
        return len(self._results)

    def __bool__(self) -> bool:
        return len(self._results) > 0

    def append(self, item: CharsetMatch) -> None:
        """
        Add one match, keeping the collection sorted.
        When an existing match has the same fingerprint and chaos, the new item is
        attached to it as a submatch instead of being stored on its own.
        """
        if not isinstance(item, CharsetMatch):
            raise ValueError(
                "Cannot append instance '{}' to CharsetMatches".format(
                    str(item.__class__)
                )
            )
        # Submatch factoring is skipped for heavy inputs to conserve RAM.
        if len(item.raw) <= TOO_BIG_SEQUENCE:
            twin = next(
                (
                    known
                    for known in self._results
                    if known.fingerprint == item.fingerprint
                    and known.chaos == item.chaos
                ),
                None,
            )
            if twin is not None:
                twin.add_submatch(item)
                return
        self._results.append(item)
        self._results = sorted(self._results)

    def best(self) -> Optional["CharsetMatch"]:
        """
        Return the first (most probable) match, or None when there is none.
        """
        return self._results[0] if self._results else None

    def first(self) -> Optional["CharsetMatch"]:
        """
        Alias of best(), kept for backward compatibility.
        """
        return self.best()
 # One detected language paired with a float score; CharsetMatch reads index 0 as the
 # language name and index 1 as the coherence ratio.
 CoherenceMatch = Tuple[str, float]
 # A list of such pairs; CharsetMatch treats the first entry as the most probable one.
 CoherenceMatches = List[CoherenceMatch]
 class CliDetectionResult:
    """
    Plain record of one detection result, serializable to JSON through to_json().
    """

    def __init__(
        self,
        path: str,
        encoding: Optional[str],
        encoding_aliases: List[str],
        alternative_encodings: List[str],
        language: str,
        alphabets: List[str],
        has_sig_or_bom: bool,
        chaos: float,
        coherence: float,
        unicode_path: Optional[str],
        is_preferred: bool,
    ):
        self.path: str = path
        self.unicode_path: Optional[str] = unicode_path
        self.encoding: Optional[str] = encoding
        self.encoding_aliases: List[str] = encoding_aliases
        self.alternative_encodings: List[str] = alternative_encodings
        self.language: str = language
        self.alphabets: List[str] = alphabets
        self.has_sig_or_bom: bool = has_sig_or_bom
        self.chaos: float = chaos
        self.coherence: float = coherence
        self.is_preferred: bool = is_preferred

    @property
    def __dict__(self) -> Dict[str, Any]:  # type: ignore
        """Mapping of every field, in the fixed order used for the JSON output."""
        exported_fields = (
            "path",
            "encoding",
            "encoding_aliases",
            "alternative_encodings",
            "language",
            "alphabets",
            "has_sig_or_bom",
            "chaos",
            "coherence",
            "unicode_path",
            "is_preferred",
        )
        return {field: getattr(self, field) for field in exported_fields}

    def to_json(self) -> str:
        """Serialize the field mapping as ASCII-only JSON indented by 4 spaces."""
        snapshot = self.__dict__
        return dumps(snapshot, ensure_ascii=True, indent=4)
--- a/venv/lib/python3.12/site-packages/charset_normalizer/py.typed
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/py.typed
--- a/venv/lib/python3.12/site-packages/charset_normalizer/utils.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/utils.py
@ -0,0 +1,421 @@
 import importlib
 import logging
 import unicodedata
 from codecs import IncrementalDecoder
 from encodings.aliases import aliases
 from functools import lru_cache
 from re import findall
 from typing import Generator, List, Optional, Set, Tuple, Union
 from _multibytecodec import MultibyteIncrementalDecoder
 from .constant import (
    ENCODING_MARKS,
    IANA_SUPPORTED_SIMILAR,
    RE_POSSIBLE_ENCODING_INDICATION,
    UNICODE_RANGES_COMBINED,
    UNICODE_SECONDARY_RANGE_KEYWORD,
    UTF8_MAXIMAL_ALLOCATION,
 )
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_accentuated(character: str) -> bool:
    """
    Tell whether the Unicode name of the character mentions one of the known accent markers.
    Characters without a Unicode name are never accentuated.
    """
    description: str = unicodedata.name(character, "")
    accent_markers = (
        "WITH GRAVE",
        "WITH ACUTE",
        "WITH CEDILLA",
        "WITH DIAERESIS",
        "WITH CIRCUMFLEX",
        "WITH TILDE",
        "WITH MACRON",
        "WITH RING ABOVE",
    )
    return any(marker in description for marker in accent_markers)
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def remove_accent(character: str) -> str:
    """
    Return the first code point of the character's Unicode decomposition, or the
    character itself when it has no decomposition.

    A decomposition may start with a formatting tag such as "<compat>" or "<super>";
    the tag is skipped so it is never parsed as a hexadecimal code point.
    """
    decomposed: str = unicodedata.decomposition(character)
    codes: List[str] = [
        code for code in decomposed.split(" ") if code and not code.startswith("<")
    ]
    if not codes:
        return character
    return chr(int(codes[0], 16))
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def unicode_range(character: str) -> Optional[str]:
    """
    Look up the name of the first range in UNICODE_RANGES_COMBINED that contains the
    character's code point. Return None when no range contains it.
    """
    code_point: int = ord(character)
    return next(
        (
            name
            for name, span in UNICODE_RANGES_COMBINED.items()
            if code_point in span
        ),
        None,
    )
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_latin(character: str) -> bool:
    """True when the character has a Unicode name that contains "LATIN"."""
    # An empty default stands in for characters that have no Unicode name.
    return "LATIN" in unicodedata.name(character, "")
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_punctuation(character: str) -> bool:
    """
    True when the general category contains "P", or when the name of the character's
    Unicode range contains "Punctuation".
    """
    if "P" in unicodedata.category(character):
        return True
    block_name: Optional[str] = unicode_range(character)
    return block_name is not None and "Punctuation" in block_name
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_symbol(character: str) -> bool:
    """
    True when the general category contains "S" or "N", or when the character's
    Unicode range name contains "Forms" and its category is not "Lo".
    """
    category: str = unicodedata.category(character)
    if "S" in category or "N" in category:
        return True
    block_name: Optional[str] = unicode_range(character)
    return block_name is not None and "Forms" in block_name and category != "Lo"
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_emoticon(character: str) -> bool:
    """True when the character's Unicode range name contains "Emoticons" or "Pictographs"."""
    block_name: Optional[str] = unicode_range(character)
    if block_name is None:
        return False
    if "Emoticons" in block_name:
        return True
    return "Pictographs" in block_name
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_separator(character: str) -> bool:
    """
    True for whitespace, for a few hard-coded delimiter characters, and for characters
    whose general category contains "Z" or is one of "Po", "Pd", "Pc".
    """
    if character.isspace():
        return True
    if character in {"｜", "+", "<", ">"}:
        return True
    category: str = unicodedata.category(character)
    if "Z" in category:
        return True
    return category in {"Po", "Pd", "Pc"}
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_case_variable(character: str) -> bool:
    """True when exactly one of islower() / isupper() holds for the character."""
    lower: bool = character.islower()
    upper: bool = character.isupper()
    return lower is not upper
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_cjk(character: str) -> bool:
    """True when the character has a Unicode name that contains "CJK"."""
    # An empty default stands in for characters that have no Unicode name.
    return "CJK" in unicodedata.name(character, "")
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_hiragana(character: str) -> bool:
    """True when the character has a Unicode name that contains "HIRAGANA"."""
    # An empty default stands in for characters that have no Unicode name.
    return "HIRAGANA" in unicodedata.name(character, "")
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_katakana(character: str) -> bool:
    """True when the character has a Unicode name that contains "KATAKANA"."""
    # An empty default stands in for characters that have no Unicode name.
    return "KATAKANA" in unicodedata.name(character, "")
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_hangul(character: str) -> bool:
    """True when the character has a Unicode name that contains "HANGUL"."""
    # An empty default stands in for characters that have no Unicode name.
    return "HANGUL" in unicodedata.name(character, "")
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_thai(character: str) -> bool:
    """True when the character has a Unicode name that contains "THAI"."""
    # An empty default stands in for characters that have no Unicode name.
    return "THAI" in unicodedata.name(character, "")
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_arabic(character: str) -> bool:
    """True when the character has a Unicode name that contains "ARABIC"."""
    # An empty default stands in for characters that have no Unicode name.
    return "ARABIC" in unicodedata.name(character, "")
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_arabic_isolated_form(character: str) -> bool:
    """True when the character's Unicode name contains both "ARABIC" and "ISOLATED FORM"."""
    # An empty default stands in for characters that have no Unicode name.
    description = unicodedata.name(character, "")
    if "ARABIC" not in description:
        return False
    return "ISOLATED FORM" in description
@lru_cache(maxsize=len(UNICODE_RANGES_COMBINED))
def is_unicode_range_secondary(range_name: str) -> bool:
    """True when the range name contains any keyword of UNICODE_SECONDARY_RANGE_KEYWORD."""
    for keyword in UNICODE_SECONDARY_RANGE_KEYWORD:
        if keyword in range_name:
            return True
    return False
@lru_cache(maxsize=UTF8_MAXIMAL_ALLOCATION)
def is_unprintable(character: str) -> bool:
    """
    True when the character is neither whitespace nor printable, except for the two
    characters deliberately excluded below.
    """
    # Whitespace (includes \n \t \r \v) and printable characters are never flagged.
    if character.isspace() or character.isprintable():
        return False
    # "\x1A" is the ASCII substitute character; "\ufeff" (Zero Width No-Break Space)
    # is not acknowledged as a space by Python, so both are excluded explicitly.
    return character != "\x1A" and character != "\ufeff"
 def any_specified_encoding(sequence: bytes, search_zone: int = 8192) -> Optional[str]:
    """
    Search the first bytes of the sequence, decoded as ASCII with undecodable bytes
    dropped, for an encoding declaration, and return the matching entry of the
    standard alias table.

    Return None when nothing is declared or when no declaration is a known encoding.
    Raise TypeError if the sequence is not a bytes instance.
    """
    if not isinstance(sequence, bytes):
        raise TypeError
    head: str = sequence[: min(len(sequence), search_zone)].decode(
        "ascii", errors="ignore"
    )
    declared: List[str] = findall(RE_POSSIBLE_ENCODING_INDICATION, head)
    if not declared:
        return None
    for candidate in declared:
        candidate = candidate.lower().replace("-", "_")
        for alias, canonical in aliases.items():
            if candidate == alias or candidate == canonical:
                return canonical
    return None
@lru_cache(maxsize=128)
def is_multi_byte_encoding(name: str) -> bool:
    """
    Tell whether an encoding is multi-byte.

    The UTF family is listed explicitly; any other name is resolved to its
    'encodings.<name>' module and considered multi-byte when that module's
    IncrementalDecoder derives from MultibyteIncrementalDecoder.
    """
    unicode_transformation_formats = {
        "utf_8",
        "utf_8_sig",
        "utf_16",
        "utf_16_be",
        "utf_16_le",
        "utf_32",
        "utf_32_le",
        "utf_32_be",
        "utf_7",
    }
    if name in unicode_transformation_formats:
        return True
    codec_module = importlib.import_module("encodings.{}".format(name))
    return issubclass(codec_module.IncrementalDecoder, MultibyteIncrementalDecoder)
 def identify_sig_or_bom(sequence: bytes) -> Tuple[Optional[str], bytes]:
    """
    Find which entry of ENCODING_MARKS the sequence starts with.
    Return (encoding name, matched mark), or (None, b"") when no mark matches.
    """
    for iana_encoding, marks in ENCODING_MARKS.items():
        # An entry holds either a single mark or a list of marks.
        candidates: List[bytes] = [marks] if isinstance(marks, bytes) else marks
        for mark in candidates:
            if sequence.startswith(mark):
                return iana_encoding, mark
    return None, b""
 def should_strip_sig_or_bom(iana_encoding: str) -> bool:
    """Return False for "utf_16" and "utf_32", True for every other encoding name."""
    if iana_encoding in {"utf_16", "utf_32"}:
        return False
    return True
 def iana_name(cp_name: str, strict: bool = True) -> str:
    """
    Resolve an encoding name or alias to the name used by the standard alias table.

    The input is lower-cased and dashes become underscores before the lookup.
    When nothing matches, raise ValueError if strict, otherwise return the
    normalized input unchanged.
    """
    normalized: str = cp_name.lower().replace("-", "_")
    for alias, canonical in aliases.items():
        if normalized == alias or normalized == canonical:
            return canonical
    if not strict:
        return normalized
    raise ValueError("Unable to retrieve IANA for '{}'".format(normalized))
 def range_scan(decoded_sequence: str) -> List[str]:
    """
    Collect the distinct Unicode range names of the characters in the sequence.
    Characters for which no range is known are ignored.
    """
    found: Set[str] = {
        range_name
        for range_name in map(unicode_range, decoded_sequence)
        if range_name is not None
    }
    return list(found)
 def cp_similarity(iana_name_a: str, iana_name_b: str) -> float:
    """
    Ratio (0.0 to 1.0) of single byte values that both code pages decode identically.

    Return 0.0 as soon as either encoding is multi-byte. Every one of the 256 byte
    values is compared and the count is divided by 256, so two identical code pages
    score exactly 1.0.
    """
    if is_multi_byte_encoding(iana_name_a) or is_multi_byte_encoding(iana_name_b):
        return 0.0
    decoder_a = importlib.import_module(
        "encodings.{}".format(iana_name_a)
    ).IncrementalDecoder
    decoder_b = importlib.import_module(
        "encodings.{}".format(iana_name_b)
    ).IncrementalDecoder
    # Undecodable bytes yield an empty string on both sides instead of raising.
    id_a: IncrementalDecoder = decoder_a(errors="ignore")
    id_b: IncrementalDecoder = decoder_b(errors="ignore")
    byte_values: int = 256
    character_match_count: int = 0
    for i in range(byte_values):
        to_be_decoded: bytes = bytes([i])
        if id_a.decode(to_be_decoded) == id_b.decode(to_be_decoded):
            character_match_count += 1
    return character_match_count / byte_values
 def is_cp_similar(iana_name_a: str, iana_name_b: str) -> bool:
    """
    Tell whether the second code page is listed as similar to the first one in
    IANA_SUPPORTED_SIMILAR (at least 80% similar; that table was generated using
    the function cp_similarity).
    """
    if iana_name_a not in IANA_SUPPORTED_SIMILAR:
        return False
    return iana_name_b in IANA_SUPPORTED_SIMILAR[iana_name_a]
 def set_logging_handler(
    name: str = "charset_normalizer",
    level: int = logging.INFO,
    format_string: str = "%(asctime)s | %(levelname)s | %(message)s",
 ) -> None:
    """
    Set the level of the named logger and attach a new StreamHandler that uses the
    given format string. Each call adds one more handler to the logger.
    """
    stream_handler = logging.StreamHandler()
    stream_handler.setFormatter(logging.Formatter(format_string))
    target = logging.getLogger(name)
    target.setLevel(level)
    target.addHandler(stream_handler)
 def cut_sequence_chunks(
    sequences: bytes,
    encoding_iana: str,
    offsets: range,
    chunk_size: int,
    bom_or_sig_available: bool,
    strip_sig_or_bom: bool,
    sig_payload: bytes,
    is_multi_byte_decoder: bool,
    decoded_payload: Optional[str] = None,
 ) -> Generator[str, None, None]:
    """
    Yield decoded text chunks taken at the given offsets.

    :param sequences: Raw bytes to cut and decode.
    :param encoding_iana: Encoding name used to decode each cut.
    :param offsets: Start positions of the chunks.
    :param chunk_size: Length of each chunk (characters when slicing decoded_payload,
        bytes when slicing sequences).
    :param bom_or_sig_available: Whether a SIG/BOM is available for the payload.
    :param strip_sig_or_bom: When False (and a SIG/BOM is available), sig_payload is
        prepended to every byte cut before decoding.
    :param sig_payload: The SIG/BOM bytes to prepend.
    :param is_multi_byte_decoder: Selects the byte-cutting path and lenient decoding.
    :param decoded_payload: Already decoded text, if any.
    :return: Generator of decoded chunks.
    """
    if decoded_payload and is_multi_byte_decoder is False:
        # Fast path: the text is already decoded, so slice it directly.
        for i in offsets:
            chunk = decoded_payload[i : i + chunk_size]
            if not chunk:
                # Offsets past the end of the text produce nothing more.
                break
            yield chunk
    else:
        for i in offsets:
            chunk_end = i + chunk_size
            # Skip chunks that would end more than 8 bytes past the end of the input.
            if chunk_end > len(sequences) + 8:
                continue
            cut_sequence = sequences[i : i + chunk_size]
            if bom_or_sig_available and strip_sig_or_bom is False:
                cut_sequence = sig_payload + cut_sequence
            # Multi-byte decoders drop undecodable bytes; others fail on them.
            chunk = cut_sequence.decode(
                encoding_iana,
                errors="ignore" if is_multi_byte_decoder else "strict",
            )
            # multi-byte bad cutting detector and adjustment
            # not the cleanest way to perform that fix but clever enough for now.
            if is_multi_byte_decoder and i > 0:
                chunk_partial_size_chk: int = min(chunk_size, 16)
                # The start of the chunk should appear verbatim in the full decoded text;
                # if not, the cut presumably fell in the middle of a character.
                if (
                    decoded_payload
                    and chunk[:chunk_partial_size_chk] not in decoded_payload
                ):
                    # Retry with the cut starting at i, i-1, i-2, i-3 until the start matches.
                    # NOTE(review): for i < 3, j becomes negative and the slice counts from
                    # the end of the sequence -- confirm this is acceptable.
                    for j in range(i, i - 4, -1):
                        cut_sequence = sequences[j:chunk_end]
                        if bom_or_sig_available and strip_sig_or_bom is False:
                            cut_sequence = sig_payload + cut_sequence
                        chunk = cut_sequence.decode(encoding_iana, errors="ignore")
                        if chunk[:chunk_partial_size_chk] in decoded_payload:
                            break
            yield chunk
--- a/venv/lib/python3.12/site-packages/charset_normalizer/version.py
+++ b/venv/lib/python3.12/site-packages/charset_normalizer/version.py
@ -0,0 +1,6 @@
 """
 Expose version
 """
 # Version as a single dotted string.
 __version__ = "3.3.2"
 # The same version split on "." into a list of strings.
 VERSION = __version__.split(".")
--- a/venv/lib/python3.12/site-packages/dns/init.py
+++ b/venv/lib/python3.12/site-packages/dns/init.py
@ -0,0 +1,70 @@
 # Copyright (C) Dnspython Contributors, see LICENSE for text of ISC license
 # Copyright (C) 2003-2007, 2009, 2011 Nominum, Inc.
 #
 # Permission to use, copy, modify, and distribute this software and its
 # documentation for any purpose with or without fee is hereby granted,
 # provided that the above copyright notice and this permission notice
 # appear in all copies.
 #
 # THE SOFTWARE IS PROVIDED "AS IS" AND NOMINUM DISCLAIMS ALL WARRANTIES
 # WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 # MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL NOMINUM BE LIABLE FOR
 # ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 # ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
 # OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 """dnspython DNS toolkit"""
 # Names exported by a star-import of this module.
 # NOTE(review): these look like the package's submodule names -- confirm against the package contents.
 __all__ = [
    "asyncbackend",
    "asyncquery",
    "asyncresolver",
    "dnssec",
    "dnssecalgs",
    "dnssectypes",
    "e164",
    "edns",
    "entropy",
    "exception",
    "flags",
    "immutable",
    "inet",
    "ipv4",
    "ipv6",
    "message",
    "name",
    "namedict",
    "node",
    "opcode",
    "query",
    "quic",
    "rcode",
    "rdata",
    "rdataclass",
    "rdataset",
    "rdatatype",
    "renderer",
    "resolver",
    "reversename",
    "rrset",
    "serial",
    "set",
    "tokenizer",
    "transaction",
    "tsig",
    "tsigkeyring",
    "ttl",
    "rdtypes",
    "update",
    "version",
    "versioned",
    "wire",
    "xfr",
    "zone",
    "zonetypes",
    "zonefile",
 ]
 from dns.version import version as __version__  # noqa
--- a/venv/lib/python3.12/site-packages/dns/pycache/init.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/init.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/_asyncbackend.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/_asyncbackend.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/_asyncio_backend.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/_asyncio_backend.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/_ddr.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/_ddr.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/_immutable_ctx.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/_immutable_ctx.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/_trio_backend.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/_trio_backend.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/asyncbackend.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/asyncbackend.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/asyncquery.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/asyncquery.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/asyncresolver.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/asyncresolver.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/dnssec.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/dnssec.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/dnssectypes.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/dnssectypes.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/e164.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/e164.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/edns.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/edns.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/entropy.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/entropy.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/enum.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/enum.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/exception.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/exception.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/flags.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/flags.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/grange.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/grange.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/immutable.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/immutable.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/inet.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/inet.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/ipv4.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/ipv4.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/ipv6.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/ipv6.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/message.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/message.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/name.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/name.cpython-312.pyc
--- a/venv/lib/python3.12/site-packages/dns/pycache/namedict.cpython-312.pyc
+++ b/venv/lib/python3.12/site-packages/dns/pycache/namedict.cpython-312.pyc
--- a/Show More
+++ b/Show More
		`@ -0,0 +1,2 @@`
							`[console_scripts]`
							`normalizer = charset_normalizer.cli:cli_detect`