This commit is contained in:
Danila Fedorin 2025-02-23 13:19:35 -08:00
parent a8c2b1d05a
commit 8c4ede1216

View File

@ -16,6 +16,7 @@ def get_used_characters(files):
"""Collect the unique characters found across the given files.

Iterates over ``files`` (presumably paths to .html files; confirm against
the caller), announces each one on stdout, and passes it to
``extract_text_from_html``. Whatever that helper returns is merged into a
single set, so repeated characters are kept only once.

Returns the collected characters joined into one string in sorted order.
"""
char_set = set()
for file in files:
# Progress output: name each file before its text is extracted.
print("extracting from", file)
text = extract_text_from_html(file)
# NOTE(review): presumably `text` is a str, so update() adds it one
# character at a time; confirm against extract_text_from_html.
char_set.update(text)
return "".join(sorted(char_set))