mirror of
https://github.com/Alexander-D-Karpov/scripts.git
synced 2024-11-21 19:46:38 +03:00
updated extract_folder
This commit is contained in:
parent
d7a5e8787d
commit
0dc45b8935
|
@ -1,5 +1,18 @@
|
||||||
import os
|
import os
|
||||||
import sys
|
import sys
|
||||||
|
import pathspec
|
||||||
|
|
||||||
|
|
||||||
|
def read_gitignore(input_dir):
|
||||||
|
"""
|
||||||
|
Reads the .gitignore file in the input directory and returns a pathspec object.
|
||||||
|
"""
|
||||||
|
gitignore_path = os.path.join(input_dir, ".gitignore")
|
||||||
|
if os.path.isfile(gitignore_path):
|
||||||
|
with open(gitignore_path, "r") as gitignore_file:
|
||||||
|
return pathspec.PathSpec.from_lines("gitwildmatch", gitignore_file)
|
||||||
|
else:
|
||||||
|
return pathspec.PathSpec.from_lines("gitwildmatch", [])
|
||||||
|
|
||||||
|
|
||||||
def structure_directory_content(input_dir, output_file=None, extensions=None):
|
def structure_directory_content(input_dir, output_file=None, extensions=None):
|
||||||
|
@ -12,20 +25,30 @@ def structure_directory_content(input_dir, output_file=None, extensions=None):
|
||||||
If None, 'data.txt' or 'data.<extension>' will be used.
|
If None, 'data.txt' or 'data.<extension>' will be used.
|
||||||
:param extensions: A list of file extensions to include. If None, all files are included.
|
:param extensions: A list of file extensions to include. If None, all files are included.
|
||||||
"""
|
"""
|
||||||
|
gitignore_spec = read_gitignore(input_dir)
|
||||||
|
|
||||||
if extensions:
|
if extensions:
|
||||||
extensions = [ext.strip() for ext in extensions.split(",") if ext.strip() != ""]
|
extensions = [ext.strip() for ext in extensions.split(",") if ext.strip() != ""]
|
||||||
# If only one extension is given and no output file is specified, use 'data.<extension>'
|
|
||||||
if not output_file and len(extensions) == 1:
|
if not output_file and len(extensions) == 1:
|
||||||
output_file = f"data.{extensions[0]}"
|
output_file = f"data.{extensions[0]}"
|
||||||
else:
|
else:
|
||||||
extensions = None
|
extensions = None
|
||||||
|
|
||||||
# If no output file is specified, default to 'data.txt'
|
|
||||||
if not output_file:
|
if not output_file:
|
||||||
output_file = "data.txt"
|
output_file = "data.txt"
|
||||||
|
|
||||||
with open(output_file, "w") as outfile:
|
with open(output_file, "w") as outfile:
|
||||||
for root, dirs, files in os.walk(input_dir):
|
for root, dirs, files in os.walk(input_dir):
|
||||||
|
files = [
|
||||||
|
f
|
||||||
|
for f in files
|
||||||
|
if not gitignore_spec.match_file(os.path.join(root, str(f)))
|
||||||
|
]
|
||||||
|
dirs[:] = [
|
||||||
|
d
|
||||||
|
for d in dirs
|
||||||
|
if not gitignore_spec.match_file(os.path.join(root, str(d)))
|
||||||
|
]
|
||||||
for file in files:
|
for file in files:
|
||||||
if extensions is None or any(
|
if extensions is None or any(
|
||||||
file.endswith(f".{ext}") for ext in extensions
|
file.endswith(f".{ext}") for ext in extensions
|
||||||
|
|
Loading…
Reference in New Issue
Block a user