⚝
One Hat Cyber Team
⚝
Your IP:
216.73.216.118
Server IP:
84.32.84.50
Server:
Linux sg-nme-web1518.main-hosting.eu 5.14.0-611.16.1.el9_7.x86_64 #1 SMP PREEMPT_DYNAMIC Mon Dec 22 03:40:39 EST 2025 x86_64
Server Software:
LiteSpeed
PHP Version:
8.3.28
Buat File
|
Buat Folder
Eksekusi
Dir :
~
/
opt
/
gsutil
/
third_party
/
charset_normalizer
/
tests
/
View File Name :
test_edge_case.py
import platform

import pytest

from charset_normalizer import from_bytes


@pytest.mark.xfail(
    # python_version_tuple() yields strings, so compare against ("3", "7").
    platform.python_version_tuple()[:2] == ("3", "7"),
    reason="Unicode database is too old for this case (Python 3.7)",
)
def test_unicode_edge_case():
    """A UTF-8 BOM followed by one four-byte sequence must be detected as utf_8."""
    raw = b'\xef\xbb\xbf\xf0\x9f\xa9\xb3'

    match = from_bytes(raw).best()

    assert match is not None, "Payload should have given something, detection failure"
    assert match.encoding == "utf_8", "UTF-8 payload wrongly detected"


def test_issue_gh520():
    """Regression check for gh520.

    "Basic Latin" must still be listed among the detected alphabets for a
    mostly-ASCII payload that contains two non-ASCII bytes.
    """
    raw = b"/includes/webform.compon\xd2\xaants.inc/"

    match = from_bytes(raw).best()

    assert match is not None, "Payload should have given something, detection failure"
    assert "Basic Latin" in match.alphabets


def test_issue_gh509():
    """Regression check for gh509: two plain ASCII punctuation marks stay ascii."""
    raw = b");"

    match = from_bytes(raw).best()

    assert match is not None, "Payload should have given something, detection failure"
    assert match.encoding == "ascii"


def test_issue_gh498():
    """Regression check for gh498.

    This payload was once mistaken for utf-16-le; the best match must report
    the "Cyrillic" alphabet.
    """
    raw = b'\x84\xae\xaa\xe3\xac\xa5\xad\xe2 Microsoft Word.docx'

    match = from_bytes(raw).best()

    assert match is not None, "Payload should have given something, detection failure"
    assert "Cyrillic" in match.alphabets