Fix subtitle character encoding detection

Increase the size of the buffer used for character encoding detection from 8K to 32K
2025-03-02 17:45:39 +00:00 · 2020-03-25 22:04:04 +02:00 · 2020-03-25 22:04:04 +02:00 · 354454688d
commit 354454688d
parent c982e37024
1 changed files with 2 additions and 2 deletions
--- a/bazarr/list_subtitles.py
+++ b/bazarr/list_subtitles.py
@@ -378,8 +378,8 @@ def guess_external_subtitles(dest_folder, subtitles):
                    text = f.read()
                    
                try:
-                    # to improve performance, use only the first 8K to detect encoding
-                    if len(text) > 8192: guess = chardet.detect(text[:8192])
+                    # to improve performance, use only the first 32K to detect encoding
+                    if len(text) > 32768: guess = chardet.detect(text[:32768])
                    else: guess = chardet.detect(text)
                    if guess["confidence"] < 0.8:
                        raise UnicodeError