Refactored to class

This commit is contained in:
Kevin Veen-Birkenbach 2023-09-14 18:00:43 +02:00
parent ab609af3bd
commit 1fbf43bfeb

84
scan.py
View File

@ -3,33 +3,63 @@ import argparse
import re
import zlib
class CodeProcessor:
    """Static helpers that strip comments from source text and compress it."""

    # File extensions (including the leading dot) whose comment syntax is known.
    PYTHON = ".py"
    JS = ".js"
    C = ".c"
    CPP = ".cpp"
    H = ".h"

    # (pattern, regex flags) pairs for `#` comments and triple-quoted strings.
    # The `#` pattern needs MULTILINE so `^` anchors at every line start, and
    # must NOT get DOTALL, otherwise `.*` would run to the end of the file.
    _PYTHON_PATTERNS = (
        (r'^\s*#.*\n?', re.MULTILINE),
        (r'\"\"\"(.*?)\"\"\"', re.DOTALL),
        (r"\'\'\'(.*?)\'\'\'", re.DOTALL),
    )

    # (pattern, regex flags) pairs for `//` line comments and `/* */` blocks.
    # Only the block-comment pattern may span lines; with DOTALL the `//`
    # pattern would delete everything after the first `//` in the file.
    _C_STYLE_PATTERNS = (
        (r'\s*//.*', 0),
        (r'/\*.*?\*/', re.DOTALL),
    )

    @staticmethod
    def remove_comments(content, file_type):
        """Remove comments from ``content`` based on its file type.

        Args:
            content: Source text to clean.
            file_type: File extension including the dot (e.g. ``".py"``).
                Unknown extensions leave the text untouched apart from the
                final strip.

        Returns:
            The text with all matching comment patterns removed and leading
            and trailing whitespace stripped.
        """
        comment_patterns = {
            CodeProcessor.PYTHON: CodeProcessor._PYTHON_PATTERNS,
            CodeProcessor.JS: CodeProcessor._C_STYLE_PATTERNS,
            CodeProcessor.C: CodeProcessor._C_STYLE_PATTERNS,
            CodeProcessor.CPP: CodeProcessor._C_STYLE_PATTERNS,
            CodeProcessor.H: CodeProcessor._C_STYLE_PATTERNS,
        }
        # Each pattern carries its own flags; a single shared flag set cannot
        # serve both the line-anchored and the multi-line patterns.
        for pattern, flags in comment_patterns.get(file_type, ()):
            content = re.sub(pattern, '', content, flags=flags)
        return content.strip()

    @staticmethod
    def compress(content):
        """Compress code using zlib.

        Args:
            content: Text to compress; it is encoded with ``str.encode()``
                defaults before compression.

        Returns:
            The zlib-compressed bytes.
        """
        return zlib.compress(content.encode())
class DirectoryHandler:
@staticmethod
def filter_directories(dirs, ignore_strings, ignore_hidden):
    """Filter out directories based on ignore criteria.

    The list is modified in place (slice assignment) so that a caller which
    holds a reference to it, such as an ``os.walk`` loop, sees the pruned
    result.

    Args:
        dirs: List of directory names; mutated in place.
        ignore_strings: Substrings that exclude a directory when contained in
            its name. ``None`` is treated as "nothing to ignore".
        ignore_hidden: When true, names starting with ``.`` are removed.

    Returns:
        None.
    """
    # Tolerate None (e.g. an omitted command-line option) instead of raising.
    ignored = ignore_strings or ()
    dirs[:] = [
        name for name in dirs
        if not (ignore_hidden and name.startswith('.'))
        and not any(fragment in name for fragment in ignored)
    ]
@staticmethod
def should_print_file(file_path, file_filters, ignore_strings, ignore_hidden, include_strings):
"""Determine if a file should be printed based on filters."""
"""Determine if a file should be printed."""
if ignore_hidden and os.path.basename(file_path).startswith('.'):
return False
if file_filters and not any(file_path.endswith(file_type) for file_type in file_filters):
@ -40,6 +70,7 @@ def should_print_file(file_path, file_filters, ignore_strings, ignore_hidden, in
return False
return True
@staticmethod
def print_file_content(file_path, no_comments, compress):
"""Print the content of a file."""
try:
@ -47,10 +78,10 @@ def print_file_content(file_path, no_comments, compress):
content = f.read()
if no_comments:
file_type = os.path.splitext(file_path)[1]
content = remove_comments(content, file_type)
content = CodeProcessor.remove_comments(content, file_type)
print(f"======== File Path: {file_path} ========")
if compress:
compressed_content = compress_code(content)
compressed_content = CodeProcessor.compress(content)
print(f"======== Compressed Code ========")
print(compressed_content)
else:
@ -60,19 +91,22 @@ def print_file_content(file_path, no_comments, compress):
print(f"Warning: Could not read file due to encoding issues: {file_path}")
exit(1)
@staticmethod
def handle_directory(directory, **kwargs):
    """Walk ``directory`` and print every file that passes the filters.

    Args:
        directory: Root directory handed to ``os.walk``.
        **kwargs: Scan options, read by key: ``ignore_strings``,
            ``ignore_hidden``, ``file_filters``, ``strings``,
            ``no_comments``, ``compress`` and ``verbose``.

    Raises:
        KeyError: If an option that gets looked up is missing from ``kwargs``.
    """
    for root, dirs, files in os.walk(directory):
        # The directory list is filtered in place, which also controls which
        # subdirectories os.walk visits next.
        DirectoryHandler.filter_directories(dirs, kwargs['ignore_strings'], kwargs['ignore_hidden'])
        for file in files:
            full_path = os.path.join(root, file)
            wanted = DirectoryHandler.should_print_file(
                full_path,
                kwargs['file_filters'],
                kwargs['ignore_strings'],
                kwargs['ignore_hidden'],
                kwargs['strings'],
            )
            if wanted:
                DirectoryHandler.print_file_content(full_path, kwargs['no_comments'], kwargs['compress'])
                continue
            # Only the bare file name (not the full path) is reported.
            if kwargs['verbose']:
                print(f"Skipped file: {file}")
@staticmethod
def handle_file(file_path, **kwargs):
    """Print a single file, bypassing the directory filters.

    Args:
        file_path: Path of the file to print.
        **kwargs: Scan options; only ``no_comments`` and ``compress`` are
            read here, any other keys are accepted and ignored.

    Raises:
        KeyError: If ``no_comments`` or ``compress`` is missing.
    """
    strip_comments = kwargs['no_comments']
    use_compression = kwargs['compress']
    DirectoryHandler.print_file_content(file_path, strip_comments, use_compression)
def main():
parser = argparse.ArgumentParser(description="Scan directories and print/compile file contents.")
@ -88,9 +122,9 @@ def main():
for path in args.paths:
if os.path.isdir(path):
handle_directory(path, args.filetype, args.ignore, args.ignore_hidden, args.verbose, args.no_comments, args.compress, args.strings)
DirectoryHandler.handle_directory(path, file_filters=args.filetype, ignore_strings=args.ignore, ignore_hidden=args.ignore_hidden, verbose=args.verbose, no_comments=args.no_comments, compress=args.compress, strings=args.strings)
elif os.path.isfile(path):
handle_file(path, args.filetype, args.ignore, args.ignore_hidden, args.no_comments, args.compress)
DirectoryHandler.handle_file(path, file_filters=args.filetype, ignore_strings=args.ignore, ignore_hidden=args.ignore_hidden, no_comments=args.no_comments, compress=args.compress)
else:
print(f"Error: {path} is neither a valid file nor a directory.")
exit(1)