diff --git a/cosima_cookbook/database.py b/cosima_cookbook/database.py index a7388c4..8a46e22 100644 --- a/cosima_cookbook/database.py +++ b/cosima_cookbook/database.py @@ -5,6 +5,7 @@ import re import subprocess from tqdm import tqdm +import warnings import cftime from dask.distributed import as_completed @@ -22,6 +23,8 @@ from . import netcdf_utils from .database_utils import * +logging.captureWarnings(True) + __DB_VERSION__ = 2 __DEFAULT_DB__ = '/g/data/hh5/tmp/cosima/database/access-om2.db' @@ -295,12 +298,14 @@ def index_experiment(experiment_dir, session=None, client=None, update=False): # find all netCDF files in the hierarchy below this directory files = [] - try: - results = subprocess.check_output(['find', experiment_dir, '-name', '*.nc']) - results = [s for s in results.decode('utf-8').split()] - files.extend(results) - except Exception as e: - logging.error('Error occurred while finding output files: %s', e) + proc = subprocess.run(['find', experiment_dir, '-name', '*.nc'], + stdout=subprocess.PIPE, stderr=subprocess.PIPE, + encoding='utf-8') + if proc.returncode != 0: + warnings.warn('Some files or directories could not be read while finding output files: %s', UserWarning) + + results = [s for s in proc.stdout.split()] + files.extend(results) expt_path = Path(experiment_dir) expt = NCExperiment(experiment=str(expt_path.name), diff --git a/test/test_indexing.py b/test/test_indexing.py index 3659257..a793497 100644 --- a/test/test_indexing.py +++ b/test/test_indexing.py @@ -14,6 +14,24 @@ def session_db(tmpdir): s.close() +@pytest.fixture +def unreadable_dir(tmpdir): + expt_path = tmpdir / "expt_dir" + expt_path.mkdir() + idx_dir = expt_path / "unreadable" + idx_dir.mkdir() + idx_dir.chmod(0o300) + + yield idx_dir + + expt_path.remove(ignore_errors=True) + +def test_unreadable(session_db, unreadable_dir): + session, db = session_db + + with pytest.warns(UserWarning, match="Some files or directories could not be read"): + indexed = database.build_index(str(unreadable_dir), session) + def test_broken(session_db): session, db = session_db indexed = database.build_index('test/data/indexing/broken_file', session)