file_management.py 4.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123
  1. from pathlib import Path
  2. import re
  3. class OverwriteError(Exception):
  4. pass
  5. def overwrite_protection(path: Path) -> None:
  6. if path.is_file():
  7. raise OverwriteError(f'File {path} already exists and should not be overwritten.')
  8. if path.is_dir():
  9. raise OverwriteError(f'Directory {path} already exists and should not be overwritten.')
  10. def rm_directory(path: Path) -> None:
  11. """Removes a directory with its entire content."""
  12. for child in path.iterdir():
  13. if child.is_file():
  14. child.unlink()
  15. else:
  16. rm_directory(child)
  17. path.rmdir()
  18. def recursive_dir_empty(path: Path, ignore_top_level_files=False) -> bool:
  19. """Check if the directory is empty."""
  20. if not path.exists():
  21. return True
  22. # Check if path is empty
  23. has_next = next(path.iterdir(), None)
  24. if has_next is None:
  25. return True
  26. # Iterate over items in dir_path
  27. for item in path.iterdir():
  28. if item.is_dir():
  29. # Recursively check if subdirectory is empty or contains only empty subdirectories
  30. if not recursive_dir_empty(item, ignore_top_level_files=False): # files in subdirectories are never allowed
  31. return False
  32. if item.is_file() and not ignore_top_level_files:
  33. return False
  34. return True
  35. def split_base_and_num(name: str, sep: str, no_num_return=0):
  36. separated = str(name).split(sep)
  37. try:
  38. num = int(separated[-1])
  39. return sep.join(separated[:-1]), num
  40. except ValueError:
  41. return sep.join(separated), no_num_return
  42. def get_unique_filename(file_path: Path) -> Path:
  43. # Get the base name and the extension
  44. ext = file_path.suffix # Get the file extension (e.g., .dat)
  45. base_name, current_suffix = split_base_and_num(file_path.stem, '_', no_num_return=0)
  46. directory = file_path.parent
  47. existing_files = list(directory.glob(f"{base_name}_*{ext}"))
  48. # Extract all existing suffixes (numbers) and find the highest one
  49. suffixes = []
  50. for file in existing_files:
  51. suffix_part = file.stem[len(base_name) + 1:] # Skip base name and underscore
  52. if suffix_part.isdigit():
  53. suffixes.append(int(suffix_part))
  54. # Find the next available suffix
  55. if suffixes:
  56. new_suffix = max(suffixes) + 1
  57. else:
  58. new_suffix = 1 # Start with _1 if no suffixes are found
  59. new_file_name = f"{base_name}_{new_suffix}{ext}"
  60. return directory / new_file_name
  61. def new_folder(folder_name: Path, sep='_', mkdir: bool = True) -> Path:
  62. """Create a new folder based on the given folder_name with unique (sequential) number added in the end."""
  63. folder_name = folder_name.resolve()
  64. if folder_name.is_file():
  65. raise NameError(f'{folder_name} is not a directory.')
  66. parent = folder_name.parent
  67. base_str, num = split_base_and_num(folder_name.name, sep=sep, no_num_return=0)
  68. pattern = re.compile(rf"^{base_str}{sep}\d+$")
  69. all_directory_nums = []
  70. for folder in parent.glob(f'{base_str}*'):
  71. if folder.is_dir() and pattern.match(folder.name):
  72. _, dir_num = split_base_and_num(folder.name, sep=sep, no_num_return=0)
  73. all_directory_nums.append(dir_num)
  74. try:
  75. max_num = max(all_directory_nums)
  76. except ValueError: # if all_directory_nums is empty (i.e. no file with such name exists)
  77. max_num = num
  78. new_folder_name = parent.joinpath(base_str + sep + str(max_num))
  79. if new_folder_name.exists(): # and not recursive_dir_empty(new_folder_name, ignore_top_level_files=ignore_files):
  80. new_folder_name = parent.joinpath(base_str + sep + str(max_num + 1))
  81. if mkdir:
  82. new_folder_name.mkdir(parents=True, exist_ok=True)
  83. return new_folder_name
  84. def new_folder_with_number(folder_name: Path, number: int, sep='_') -> Path:
  85. folder_name = folder_name.resolve()
  86. if folder_name.is_file():
  87. raise NameError(f'{folder_name} is not a directory.')
  88. parent = folder_name.parent
  89. base_str, num = split_base_and_num(folder_name.name, sep=sep, no_num_return=0)
  90. new_folder_name = parent.joinpath(base_str + sep + str(number))
  91. new_folder_name.mkdir(parents=True, exist_ok=True)
  92. return new_folder_name