system.py 4.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126
  1. from future.utils import viewitems
  2. from pypeflow.io import cd, capture
  3. import fnmatch
  4. import logging
  5. import os
  6. import pprint
  7. import random
  8. import time
  9. log = logging.getLogger(__name__)
  10. def only_these_symlinks(dir2paths):
  11. """Create symlinks, and delete all other symlinks for each directory.
  12. dir2paths := {dir: [paths]}
  13. ('paths' is usually a list of 1.)
  14. Use relative symlink targets.
  15. Possibly, log everything we do, as one log statement to avoid user complaints.
  16. """
  17. log.info('Symlink .las files for further merging:\n{}'.format(
  18. pprint.pformat(dict(dir2paths))))
  19. for (d, paths) in viewitems(dir2paths):
  20. bases = [os.path.basename(path) for path in paths]
  21. base2rel = {os.path.basename(path): os.path.relpath(
  22. path, d) for path in paths}
  23. assert len(base2rel) == len(
  24. bases), 'Non-unique basename in {}'.format(repr(paths))
  25. for existing_base in os.listdir(d):
  26. existing_path = os.path.join(d, existing_base)
  27. if os.path.islink(existing_path):
  28. if existing_base in base2rel:
  29. if os.readlink(existing_path) != base2rel[existing_base]:
  30. # Wrong target (or non-relative) so remove it.
  31. os.unlink(existing_path)
  32. else:
  33. del base2rel[existing_base] # Just keep it.
  34. else:
  35. os.unlink(existing_path) # Old? Remove it for safety.
  36. for (base, rel) in viewitems(base2rel):
  37. path = os.path.join(d, base)
  38. os.symlink(rel, path)
  39. def lfs_setstripe_maybe(path='.', stripe=12):
  40. path = os.path.abspath(path)
  41. cmd = 'lfs setstripe -c {:d} {!s}'.format(stripe, path)
  42. try:
  43. capture(cmd)
  44. log.info('Lustre filesystem detected. This lfs stripe ({}) should propagate to subdirs of {!r}.'.format(
  45. stripe, path))
  46. except Exception as exc:
  47. log.info('Apparently {!r} is not in lustre filesystem, which is fine.'.format(
  48. path))
  49. def find_files(root_path, pattern):
  50. """
  51. Finds all files with filenames formatted as the
  52. given pattern, descending down from root_path.
  53. raise Exception if root_path is not a directory.
  54. """
  55. if not os.path.isdir(root_path):
  56. raise Exception('Not a directory: {!r}'.format(root_path))
  57. for root, dirs, files in os.walk(root_path):
  58. dirs.sort()
  59. for filename in sorted(fnmatch.filter(files, pattern)):
  60. yield os.path.join(root, filename)
  61. def abs_fns(ifofns, idir=None):
  62. """Yield absolute filenames from a streamed file-of-filenames.
  63. """
  64. log.info('Absolutizing FOFN in dir={!r}'.format(os.path.abspath(idir)))
  65. for line in ifofns.read().split():
  66. ifn = line.strip()
  67. if not ifn:
  68. continue
  69. if not os.path.isabs(ifn):
  70. ifn = os.path.abspath(os.path.join(idir, ifn))
  71. yield ifn
  72. def make_fofn_abs(i_fofn_fn, o_fofn_fn):
  73. """Copy i_fofn to o_fofn, but with relative filenames expanded for the dir of i_fofn.
  74. """
  75. assert os.path.abspath(o_fofn_fn) != os.path.abspath(
  76. i_fofn_fn), '{!r} != {!r}'.format(o_fofn_fn, i_fofn_fn)
  77. with open(i_fofn_fn) as ifs, open(o_fofn_fn, 'w') as ofs:
  78. for fn in abs_fns(ifs, os.path.dirname(os.path.realpath(i_fofn_fn))):
  79. ofs.write(fn + '\n')
  80. # return o_fofn_fn
  81. def make_dirs(d):
  82. if not os.path.isdir(d):
  83. log.debug('mkdir -p {!r}'.format(d))
  84. os.makedirs(d)
  85. def touch(*paths):
  86. """touch a file.
  87. """
  88. msg = 'touch {!r}'.format(paths)
  89. log.debug(msg)
  90. for path in paths:
  91. if os.path.exists(path):
  92. os.utime(path, None)
  93. else:
  94. open(path, 'a').close()
  95. def make_executable(path):
  96. """http://stackoverflow.com/questions/12791997/how-do-you-do-a-simple-chmod-x-from-within-python
  97. """
  98. mode = os.stat(path).st_mode
  99. mode |= (mode & 0o444) >> 2 # copy R bits to X
  100. os.chmod(path, mode)
  101. def set_random_seed(seed):
  102. seed = seed if seed else int(time.time())
  103. random.seed(seed)
  104. log.info('Random seed: {}'.format(seed))