| import argparse |
| import re |
|
|
| def extract_ascii_strings(data, min_length=4): |
| ascii_strings = re.findall(rb'[\x20-\x7E]{%d,}' % min_length, data) |
| return [s.decode('ascii', errors='ignore') for s in ascii_strings] |
|
|
| def extract_unicode_strings(data, min_length=4): |
| unicode_strings = re.findall((rb'(?:[\x20-\x7E]\x00){%d,}' % min_length), data) |
| return [s.decode('utf-16le', errors='ignore') for s in unicode_strings] |
|
|
| def extract_strings_from_dll(dll_path): |
| with open(dll_path, 'rb') as f: |
| data = f.read() |
| |
| ascii_strings = extract_ascii_strings(data) |
| unicode_strings = extract_unicode_strings(data) |
|
|
| return ascii_strings + unicode_strings |
|
|
| if __name__ == "__main__": |
| parser = argparse.ArgumentParser(description="Extract text from a DLL file.") |
| parser.add_argument("dll_path", help="Path to the DLL file") |
| parser.add_argument("-o", "--output", help="Output file to save extracted text", default=None) |
|
|
| args = parser.parse_args() |
|
|
| extracted_text = extract_strings_from_dll(args.dll_path) |
|
|
| if args.output: |
| with open(args.output, "w", encoding="utf-8") as out_file: |
| out_file.write("\n".join(extracted_text)) |
| print(f"Extracted text saved to {args.output}") |
| else: |
| for line in extracted_text: |
| print(line) |
|
|