mirror of
https://github.com/danielmiessler/SecLists.git
synced 2025-04-28 09:46:29 -04:00
[Github Action] Automated trickest wordlists update.
This commit is contained in:
parent
d68e46932f
commit
a78faef856
3 changed files with 78 additions and 5 deletions
|
@ -1,6 +1,6 @@
|
|||
{
|
||||
"Jwt secrets update": {
|
||||
"last_update": 1739818986
|
||||
"last_update": 1740206221
|
||||
},
|
||||
"Trickest wordlist update": {
|
||||
"last_update": 1739786646
|
||||
|
|
|
@ -174184,7 +174184,7 @@ zzz_systest
|
|||
~www_pa/
|
||||
Änderungsbestätigungs-Mail
|
||||
éditerbonachat
|
||||
为空时开放所有目录######
|
||||
ΪʱĿ¼######
|
||||
адреснаякнига
|
||||
английский-русский
|
||||
бумажник
|
||||
|
@ -174242,7 +174242,7 @@ zzz_systest
|
|||
プロフィール
|
||||
メールで変更を確認する
|
||||
メールを確認する
|
||||
鋒nliche-fahrzeuge/
|
||||
hnliche-fahrzeuge/
|
||||
个人信息
|
||||
中文-英语
|
||||
付款
|
||||
|
|
73
utf8fixer.py
Executable file
73
utf8fixer.py
Executable file
|
@ -0,0 +1,73 @@
|
|||
#!/usr/bin/python
|
||||
from __future__ import print_function
|
||||
from codecs import open as copen
|
||||
from os import listdir, path
|
||||
from sys import argv
|
||||
|
||||
import unicodedata
|
||||
|
||||
# usage: utf8-fix.py PATH [codec] [normalize]
|
||||
PATH = argv[1] if len(argv) > 1 else ""
|
||||
NORMALIZE = False
|
||||
ENCODING = None
|
||||
DEFAULT_ENCODING = "iso8859_2" # iso8859_2 a.k.a latin2
|
||||
|
||||
for arg in argv[2:]:
|
||||
if arg.lower() == "normalize":
|
||||
NORMALIZE = True
|
||||
else:
|
||||
ENCODING = arg
|
||||
|
||||
|
||||
|
||||
def convert_file(file_path):
|
||||
print("[*]", file_path, "fixed!")
|
||||
foriginal = copen(file_path, "r", "utf8", errors='ignore')
|
||||
content = foriginal.read()
|
||||
foriginal.close()
|
||||
|
||||
ccontent = fix_encoding(content, ENCODING, NORMALIZE, True)
|
||||
fconverted = copen(file_path, "w", "utf8")
|
||||
fconverted.write(ccontent)
|
||||
fconverted.close()
|
||||
|
||||
def normalize_str(text):
|
||||
return ''.join(
|
||||
c for c in unicodedata.normalize('NFKD', text)
|
||||
if unicodedata.category(c) != 'Mn'
|
||||
)
|
||||
|
||||
def fix_encoding(content, encoding=None, norm=False, verbose=False):
|
||||
encoding = encoding or DEFAULT_ENCODING
|
||||
|
||||
try:
|
||||
fixed = content.encode(encoding).decode("utf8")
|
||||
except:
|
||||
fixed = content
|
||||
if verbose:
|
||||
print("[*] error: can't fix the encoding. mixed encoding?")
|
||||
|
||||
if norm:
|
||||
return normalize_str(fixed)
|
||||
else:
|
||||
return fixed
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
if path.isfile(PATH):
|
||||
convert_file(PATH)
|
||||
|
||||
elif path.isdir(PATH):
|
||||
|
||||
for ffile in listdir(PATH):
|
||||
file_path = path.join(PATH, ffile)
|
||||
|
||||
if path.isfile(file_path):
|
||||
convert_file(file_path)
|
||||
else:
|
||||
print(
|
||||
"[*] error: "
|
||||
"usage: %s FILE_OR_DIR_PATH [codec] [normalize]"
|
||||
%
|
||||
argv[0]
|
||||
)
|
Loading…
Add table
Reference in a new issue