123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126 |
- from future.utils import viewitems
- from pypeflow.io import cd, capture
- import fnmatch
- import logging
- import os
- import pprint
- import random
- import time
- log = logging.getLogger(__name__)
- def only_these_symlinks(dir2paths):
- """Create symlinks, and delete all other symlinks for each directory.
- dir2paths := {dir: [paths]}
- ('paths' is usually a list of 1.)
- Use relative symlink targets.
- Possibly, log everything we do, as one log statement to avoid user complaints.
- """
- log.info('Symlink .las files for further merging:\n{}'.format(
- pprint.pformat(dict(dir2paths))))
- for (d, paths) in viewitems(dir2paths):
- bases = [os.path.basename(path) for path in paths]
- base2rel = {os.path.basename(path): os.path.relpath(
- path, d) for path in paths}
- assert len(base2rel) == len(
- bases), 'Non-unique basename in {}'.format(repr(paths))
- for existing_base in os.listdir(d):
- existing_path = os.path.join(d, existing_base)
- if os.path.islink(existing_path):
- if existing_base in base2rel:
- if os.readlink(existing_path) != base2rel[existing_base]:
- # Wrong target (or non-relative) so remove it.
- os.unlink(existing_path)
- else:
- del base2rel[existing_base] # Just keep it.
- else:
- os.unlink(existing_path) # Old? Remove it for safety.
- for (base, rel) in viewitems(base2rel):
- path = os.path.join(d, base)
- os.symlink(rel, path)
- def lfs_setstripe_maybe(path='.', stripe=12):
- path = os.path.abspath(path)
- cmd = 'lfs setstripe -c {:d} {!s}'.format(stripe, path)
- try:
- capture(cmd)
- log.info('Lustre filesystem detected. This lfs stripe ({}) should propagate to subdirs of {!r}.'.format(
- stripe, path))
- except Exception as exc:
- log.info('Apparently {!r} is not in lustre filesystem, which is fine.'.format(
- path))
- def find_files(root_path, pattern):
- """
- Finds all files with filenames formatted as the
- given pattern, descending down from root_path.
- raise Exception if root_path is not a directory.
- """
- if not os.path.isdir(root_path):
- raise Exception('Not a directory: {!r}'.format(root_path))
- for root, dirs, files in os.walk(root_path):
- dirs.sort()
- for filename in sorted(fnmatch.filter(files, pattern)):
- yield os.path.join(root, filename)
- def abs_fns(ifofns, idir=None):
- """Yield absolute filenames from a streamed file-of-filenames.
- """
- log.info('Absolutizing FOFN in dir={!r}'.format(os.path.abspath(idir)))
- for line in ifofns.read().split():
- ifn = line.strip()
- if not ifn:
- continue
- if not os.path.isabs(ifn):
- ifn = os.path.abspath(os.path.join(idir, ifn))
- yield ifn
- def make_fofn_abs(i_fofn_fn, o_fofn_fn):
- """Copy i_fofn to o_fofn, but with relative filenames expanded for the dir of i_fofn.
- """
- assert os.path.abspath(o_fofn_fn) != os.path.abspath(
- i_fofn_fn), '{!r} != {!r}'.format(o_fofn_fn, i_fofn_fn)
- with open(i_fofn_fn) as ifs, open(o_fofn_fn, 'w') as ofs:
- for fn in abs_fns(ifs, os.path.dirname(os.path.realpath(i_fofn_fn))):
- ofs.write(fn + '\n')
- # return o_fofn_fn
- def make_dirs(d):
- if not os.path.isdir(d):
- log.debug('mkdir -p {!r}'.format(d))
- os.makedirs(d)
- def touch(*paths):
- """touch a file.
- """
- msg = 'touch {!r}'.format(paths)
- log.debug(msg)
- for path in paths:
- if os.path.exists(path):
- os.utime(path, None)
- else:
- open(path, 'a').close()
- def make_executable(path):
- """http://stackoverflow.com/questions/12791997/how-do-you-do-a-simple-chmod-x-from-within-python
- """
- mode = os.stat(path).st_mode
- mode |= (mode & 0o444) >> 2 # copy R bits to X
- os.chmod(path, mode)
- def set_random_seed(seed):
- seed = seed if seed else int(time.time())
- random.seed(seed)
- log.info('Random seed: {}'.format(seed))
|