directory-content-scanner/scan.py

67 lines
2.9 KiB
Python
Raw Normal View History

2023-09-14 07:41:37 +02:00
import argparse
import os
import sys
2023-09-14 08:02:05 +02:00
def filter_directories(dirs, ignore_strings, ignore_hidden):
    """Prune ``dirs`` in place, dropping every directory that must be ignored.

    A directory name is dropped when ``ignore_hidden`` is true and the name
    starts with a dot, or when the name contains any of ``ignore_strings``
    as a substring.

    The list is rewritten through slice assignment rather than rebound, so
    a caller that holds the same list object (for example the ``dirs`` list
    yielded by ``os.walk`` in ``handle_directory``) observes the pruning.

    Args:
        dirs: Mutable list of directory names; modified in place.
        ignore_strings: Substrings that disqualify a directory name.
        ignore_hidden: Whether names beginning with ``.`` are dropped.
    """
    def is_kept(name):
        # Hidden entries are rejected only when the caller asked for it.
        if ignore_hidden and name.startswith('.'):
            return False
        return all(token not in name for token in ignore_strings)

    dirs[:] = [name for name in dirs if is_kept(name)]
2023-09-14 07:50:13 +02:00
def should_print_file(file, file_filters, ignore_strings, ignore_hidden):
    """Return True when ``file`` passes every filter and should be printed.

    A file is rejected when any of the following holds:

    * ``ignore_hidden`` is true and the name starts with a dot;
    * ``file_filters`` is non-empty and the name ends with none of them;
    * the name contains any of ``ignore_strings`` as a substring.

    Args:
        file: File name to test.
        file_filters: Accepted name suffixes; an empty collection accepts all.
        ignore_strings: Substrings that disqualify a file name.
        ignore_hidden: Whether names beginning with ``.`` are rejected.

    Returns:
        bool: True if the file should be printed, False otherwise.
    """
    if ignore_hidden and file.startswith('.'):
        return False

    # str.endswith accepts a tuple of candidate suffixes; the emptiness check
    # comes first because an empty filter list means "accept every suffix".
    suffix_ok = not file_filters or file.endswith(tuple(file_filters))
    return suffix_ok and not any(token in file for token in ignore_strings)
2023-09-14 07:41:37 +02:00
2023-09-14 08:02:05 +02:00
def print_file_content(file_path):
    """Print the content of a file framed by a header and a footer banner.

    The file is opened in text mode with the default encoding and read
    completely before anything is printed, so a decoding failure never
    leaves a partial banner on stdout.

    Args:
        file_path: Path of the file to print.

    Raises:
        SystemExit: With status 1 when the file cannot be decoded as text.
    """
    # Only the read can raise UnicodeDecodeError, so the try body is kept
    # to the open/read pair.
    try:
        with open(file_path, 'r') as f:
            content = f.read()
    except UnicodeDecodeError:
        # Diagnostics go to stderr so they never mix with the dumped file
        # contents on stdout.
        print(
            f"Warning: Could not read file due to encoding issues: {file_path}",
            file=sys.stderr,
        )
        # sys.exit instead of the site-provided exit(), which is intended
        # for the interactive shell and is missing under ``python -S``.
        sys.exit(1)

    print(f"======== File Path: {file_path} ========")
    print(content)
    print("==================================\n")
2023-09-14 07:41:37 +02:00
2023-09-14 08:02:05 +02:00
def handle_directory(directory, file_filters, ignore_strings, ignore_hidden, verbose):
    """Walk ``directory`` recursively and print every file that passes the filters.

    Sub-directories rejected by ``filter_directories`` are removed from the
    list yielded by ``os.walk`` before the walk descends, so their contents
    are never visited.

    Args:
        directory: Root directory to scan.
        file_filters: Accepted file-name suffixes; empty accepts all.
        ignore_strings: Substrings that disqualify files and directories.
        ignore_hidden: Whether dot-prefixed files and directories are skipped.
        verbose: When true, report each file that was filtered out.
    """
    for current_dir, subdirs, filenames in os.walk(directory):
        # Pruning must mutate the very list os.walk handed out.
        filter_directories(subdirs, ignore_strings, ignore_hidden)

        for name in filenames:
            wanted = should_print_file(name, file_filters, ignore_strings, ignore_hidden)
            if not wanted:
                if verbose:
                    print(f"Skipped file: {name}")
                continue
            print_file_content(os.path.join(current_dir, name))
2023-09-14 08:02:05 +02:00
def handle_file(file_path, file_filters, ignore_strings, ignore_hidden):
    """Print a single file if its base name passes the filters.

    Only the final path component is tested against the filters; the full
    ``file_path`` is what gets opened and shown in the banner.

    Args:
        file_path: Path of the file to consider.
        file_filters: Accepted file-name suffixes; empty accepts all.
        ignore_strings: Substrings that disqualify the file name.
        ignore_hidden: Whether a dot-prefixed file name is skipped.
    """
    base_name = os.path.basename(file_path)
    if not should_print_file(base_name, file_filters, ignore_strings, ignore_hidden):
        return
    print_file_content(file_path)
2023-09-14 07:41:37 +02:00
def main(argv=None):
    """Parse command-line arguments and print the contents of each given path.

    Paths are processed in the order given. Directories are walked
    recursively, regular files are printed directly, and anything else
    aborts the run.

    Args:
        argv: Optional list of argument strings. When None (the default),
            argparse reads the arguments from ``sys.argv[1:]``.

    Raises:
        SystemExit: With status 1 on the first path that is neither a file
            nor a directory; paths before it have already been processed.
            argparse itself also exits on invalid arguments or ``--help``.
    """
    parser = argparse.ArgumentParser(description="Scan directories and print file contents.")
    parser.add_argument("paths", nargs='+', help="List of files or directories to scan.")
    parser.add_argument("-f", "--filetype", nargs='+', default=[], help="Filter by file types (e.g., .txt .log).")
    parser.add_argument("-i", "--ignore", nargs='+', default=[], help="Ignore files and folders containing these strings.")
    parser.add_argument("--ignore-hidden", action='store_true', help="Ignore hidden directories and files.")
    parser.add_argument("-v", "--verbose", action='store_true', help="Enable verbose mode.")
    args = parser.parse_args(argv)

    for path in args.paths:
        if os.path.isdir(path):
            handle_directory(path, args.filetype, args.ignore, args.ignore_hidden, args.verbose)
        elif os.path.isfile(path):
            handle_file(path, args.filetype, args.ignore, args.ignore_hidden)
        else:
            # Errors go to stderr so they never mix with file contents on
            # stdout. sys.exit replaces the site-provided exit(), which is
            # intended for interactive use only.
            print(f"Error: {path} is neither a valid file nor a directory.", file=sys.stderr)
            sys.exit(1)


if __name__ == "__main__":
    main()