# utils_fs.py (8.0 KB)

import os
import re
import shutil
  4. def get_path_stem(path):
  5. """
  6. References:
  7. `std::filesystem::path::stem` since C++17
  8. """
  9. return os.path.splitext(os.path.basename(path))[0]
  10. def replace_path_stem(path, new_stem):
  11. dirname, basename = os.path.split(path)
  12. stem, extension = os.path.splitext(basename)
  13. if isinstance(new_stem, str):
  14. return os.path.join(dirname, new_stem + extension)
  15. elif hasattr(new_stem, '__call__'):
  16. return os.path.join(dirname, new_stem(stem) + extension)
  17. else:
  18. raise ValueError('Unsupported Type!')
  19. def get_path_extension(path):
  20. """
  21. References:
  22. `std::filesystem::path::extension` since C++17
  23. Notes:
  24. Not fully consistent with `std::filesystem::path::extension`
  25. """
  26. return os.path.splitext(os.path.basename(path))[1]
  27. def replace_path_extension(path, new_extension=None):
  28. """Replaces the extension with new_extension or removes it when the default value is used.
  29. Firstly, if this path has an extension, it is removed. Then, a dot character is appended
  30. to the pathname, if new_extension is not empty or does not begin with a dot character.
  31. References:
  32. `std::filesystem::path::replace_extension` since C++17
  33. """
  34. filename_wo_ext = os.path.splitext(path)[0]
  35. if new_extension == '' or new_extension is None:
  36. return filename_wo_ext
  37. elif new_extension.startswith('.'):
  38. return ''.join([filename_wo_ext, new_extension])
  39. else:
  40. return '.'.join([filename_wo_ext, new_extension])
  41. def normalize_extension(extension):
  42. if extension.startswith('.'):
  43. new_extension = extension.lower()
  44. else:
  45. new_extension = '.' + extension.lower()
  46. return new_extension
  47. def is_path_in_extensions(path, extensions):
  48. if isinstance(extensions, str):
  49. extensions = [extensions]
  50. extensions = [normalize_extension(item) for item in extensions]
  51. extension = get_path_extension(path)
  52. return extension.lower() in extensions
  53. def makedirs(name, mode=0o755):
  54. """
  55. References:
  56. mmcv.mkdir_or_exist
  57. """
  58. if name == '':
  59. return
  60. name = os.path.expanduser(name)
  61. os.makedirs(name, mode=mode, exist_ok=True)
  62. def listdirs(paths, path_sep=None, full_path=True):
  63. """Enhancement on `os.listdir`
  64. """
  65. assert isinstance(paths, (str, tuple, list))
  66. if isinstance(paths, str):
  67. path_sep = path_sep or os.path.pathsep
  68. paths = paths.split(path_sep)
  69. all_filenames = []
  70. for path in paths:
  71. path_ex = os.path.expanduser(path)
  72. filenames = os.listdir(path_ex)
  73. if full_path:
  74. filenames = [os.path.join(path_ex, filename) for filename in filenames]
  75. all_filenames.extend(filenames)
  76. return all_filenames
  77. def get_all_filenames(path, extensions=None, is_valid_file=None):
  78. if (extensions is not None) and (is_valid_file is not None):
  79. raise ValueError("Both extensions and is_valid_file cannot "
  80. "be not None at the same time")
  81. if is_valid_file is None:
  82. if extensions is not None:
  83. def is_valid_file(filename):
  84. return is_path_in_extensions(filename, extensions)
  85. else:
  86. def is_valid_file(filename):
  87. return True
  88. all_filenames = []
  89. path_ex = os.path.expanduser(path)
  90. for root, _, filenames in sorted(os.walk(path_ex, followlinks=True)):
  91. for filename in sorted(filenames):
  92. fullname = os.path.join(root, filename)
  93. if is_valid_file(fullname):
  94. all_filenames.append(fullname)
  95. return all_filenames
  96. def get_top_level_dirs(path, full_path=True):
  97. if path is None:
  98. path = os.getcwd()
  99. path_ex = os.path.expanduser(path)
  100. filenames = os.listdir(path_ex)
  101. if full_path:
  102. return [os.path.join(path_ex, item) for item in filenames
  103. if os.path.isdir(os.path.join(path_ex, item))]
  104. else:
  105. return [item for item in filenames
  106. if os.path.isdir(os.path.join(path_ex, item))]
  107. def get_top_level_files(path, full_path=True):
  108. if path is None:
  109. path = os.getcwd()
  110. path_ex = os.path.expanduser(path)
  111. filenames = os.listdir(path_ex)
  112. if full_path:
  113. return [os.path.join(path_ex, item) for item in filenames
  114. if os.path.isfile(os.path.join(path_ex, item))]
  115. else:
  116. return [item for item in filenames
  117. if os.path.isfile(os.path.join(path_ex, item))]
  118. def get_folder_size(dirname):
  119. if not os.path.exists(dirname):
  120. raise ValueError("Incorrect path: {}".format(dirname))
  121. total_size = 0
  122. for root, _, filenames in os.walk(dirname):
  123. for name in filenames:
  124. total_size += os.path.getsize(os.path.join(root, name))
  125. return total_size
  126. def replace_invalid_filename_char(filename, new_char='_'):
  127. assert isinstance(new_char, str)
  128. control_chars = ''.join((map(chr, range(0x00, 0x20))))
  129. pattern = r'[\\/*?:"<>|{}]'.format(control_chars)
  130. return re.sub(pattern, new_char, filename)
  131. def copy_file(src, dst_dir, action_if_exist='rename'):
  132. """
  133. Args:
  134. src: source file path
  135. dst_dir: dest dir
  136. action_if_exist:
  137. None: same as shutil.copy
  138. rename: when dest file exists, rename it
  139. Returns:
  140. dest filename
  141. """
  142. src_basename = os.path.basename(src)
  143. src_stem, src_extension = os.path.splitext(src_basename)
  144. dst = os.path.join(dst_dir, src_basename)
  145. if action_if_exist is None:
  146. os.makedirs(dst_dir, exist_ok=True)
  147. shutil.copy(src, dst_dir)
  148. elif action_if_exist.lower() == 'rename':
  149. suffix = 2
  150. while os.path.exists(dst):
  151. dst_basename = '{} ({}){}'.format(src_stem, suffix, src_extension)
  152. dst = os.path.join(dst_dir, dst_basename)
  153. suffix += 1
  154. else:
  155. os.makedirs(dst_dir, exist_ok=True)
  156. shutil.copy(src, dst)
  157. else:
  158. raise ValueError('Invalid action_if_exist, got {}.'.format(action_if_exist))
  159. return dst
  160. def move_file(src, dst_dir, action_if_exist='rename'):
  161. """
  162. Args:
  163. src: source file path
  164. dst_dir: dest dir
  165. action_if_exist:
  166. None: same as shutil.move
  167. rename: when dest file exists, rename it
  168. Returns:
  169. dest filename
  170. """
  171. src_basename = os.path.basename(src)
  172. src_stem, src_extension = os.path.splitext(src_basename)
  173. dst = os.path.join(dst_dir, src_basename)
  174. if action_if_exist is None:
  175. os.makedirs(dst_dir, exist_ok=True)
  176. shutil.move(src, dst_dir)
  177. elif action_if_exist.lower() == 'rename':
  178. suffix = 2
  179. while os.path.exists(dst):
  180. dst_basename = '{} ({}){}'.format(src_stem, suffix, src_extension)
  181. dst = os.path.join(dst_dir, dst_basename)
  182. suffix += 1
  183. else:
  184. os.makedirs(dst_dir, exist_ok=True)
  185. shutil.move(src, dst)
  186. else:
  187. raise ValueError('Invalid action_if_exist, got {}.'.format(action_if_exist))
  188. return dst
  189. def rename_file(src, dst, action_if_exist='rename'):
  190. """
  191. Args:
  192. src: source file path
  193. dst: dest file path
  194. action_if_exist:
  195. None: same as os.rename
  196. rename: when dest file exists, rename it
  197. Returns:
  198. dest filename
  199. """
  200. if dst == src:
  201. return dst
  202. if action_if_exist is None:
  203. os.rename(src, dst)
  204. elif action_if_exist.lower() == 'rename':
  205. dirname, basename = os.path.split(dst)
  206. stem, extension = os.path.splitext(basename)
  207. suffix = 2
  208. while os.path.exists(dst):
  209. new_basename = '{} ({}){}'.format(stem, suffix, extension)
  210. dst = os.path.join(dirname, new_basename)
  211. suffix += 1
  212. os.makedirs(dirname, exist_ok=True)
  213. os.rename(src, dst)
  214. else:
  215. raise ValueError('Invalid action_if_exist, got {}.'.format(action_if_exist))
  216. return dst