Skip to content

Commit c79313d

Browse files
authored
fix test_path issues (#160)
* fix test_path issues * changelog
1 parent 945841f commit c79313d

File tree

3 files changed

+35
-10
lines changed

3 files changed

+35
-10
lines changed

CHANGELOG.md

+2-1
Original file line numberDiff line numberDiff line change
@@ -2,8 +2,9 @@
22

33
## v1.0.2 - unreleased
44

5-
- Restore behavior of `FileContainer.search(key=None)` - passing `None` to `search` is ignored again [#143](https://github.com/mpytools/filefisher/issues/143).
5+
- Restore behavior of `FileContainer.search(key=None)` - passing `None` to `search` is ignored again ([#143](https://github.com/mpytools/filefisher/issues/143)).
66
- Added `FileContainer.search_single` to search for _exactly_ one path in a `FileContainer` ([#158](https://github.com/mpytools/filefisher/pull/158)).
7+
- Fixed issues of non-unique `test_path` ([#139](https://github.com/mpytools/filefisher/issues/139)).
78

89
## v1.0.1 - 16.01.205
910
This version patches a bug from v1.0.0. that broke `FileContainer.concat()`.

filefisher/_filefinder.py

+11-4
Original file line numberDiff line numberDiff line change
@@ -300,21 +300,28 @@ def __init__(
300300
self._full_pattern = self.full.pattern
301301

302302
if test_paths is not None:
303+
304+
if isinstance(test_paths, str):
305+
test_paths = [test_paths]
306+
307+
if len(test_paths) != len(set(test_paths)):
308+
raise ValueError("`test_paths` are not unique")
309+
303310
self._set_test_paths(test_paths)
304311

305312
def _set_test_paths(self, test_paths):
306313

307-
if isinstance(test_paths, str):
308-
test_paths = [test_paths]
309-
310314
self._test_paths = test_paths
311315

312316
# use fnmatch.filter to 'glob' pseudo-filenames
313317
def finder(pat):
314318

315319
# make fnmatch work (almost) the same as glob
316320
if pat.endswith(os.path.sep):
317-
paths_ = [os.path.dirname(s) + os.path.sep for s in test_paths]
321+
# remove duplicate paths (i.e. if the filename made it non-unique)
322+
paths_ = sorted(
323+
set(os.path.dirname(s) + os.path.sep for s in test_paths)
324+
)
318325
else:
319326
paths_ = test_paths
320327

filefisher/tests/test_filefinder.py

+22-5
Original file line numberDiff line numberDiff line change
@@ -134,6 +134,18 @@ def test_test_path_property():
134134
assert ff._test_paths == ["a", "b"]
135135

136136

137+
def test_test_path_assert_nonunique():
138+
139+
with pytest.raises(ValueError, match="`test_paths` are not unique"):
140+
FileFinder("a", "", test_paths=["a", "a"])
141+
142+
with pytest.raises(ValueError, match="`test_paths` are not unique"):
143+
FileFinder("a", "", test_paths=["a/", "a/"])
144+
145+
with pytest.raises(ValueError, match="`test_paths` are not unique"):
146+
FileFinder("a", "", test_paths=["a/b", "a/b"])
147+
148+
137149
def test_file_pattern_no_sep():
138150

139151
path_pattern = "path_pattern"
@@ -279,12 +291,15 @@ def test_find_path_none_found(tmp_path, test_paths):
279291

280292
def test_find_paths_non_unique():
281293

282-
# test raises error for non-unique metadata - AFAIK not possible for real paths
294+
# ensure find_paths works for duplicated folder names (made unique by the file name)
283295

284-
ff = FileFinder("{cat}", "", test_paths=["a/", "a/"])
296+
ff = FileFinder("{cat}", "", test_paths=["a/a", "a/b"])
285297

286-
with pytest.raises(ValueError, match="Non-unique metadata detected"):
287-
ff.find_paths()
298+
result = ff.find_paths()
299+
300+
expected = {"path": {0: "a/*"}, "cat": {0: "a"}}
301+
expected = pd.DataFrame.from_dict(expected).set_index("path")
302+
pd.testing.assert_frame_equal(result.df, expected)
288303

289304

290305
def test_find_paths_simple(tmp_path, test_paths):
@@ -460,7 +475,9 @@ def test_find_files_non_unique():
460475

461476
# test raises error for non-unique metadata - AFAIK not possible for real paths
462477

463-
ff = FileFinder("", "{cat}", test_paths=["/a", "/a"])
478+
ff = FileFinder("", "{cat}")
479+
# need to set via `_set_test_paths` to avoid duplicate check
480+
ff._set_test_paths(test_paths=["/a", "/a"])
464481

465482
with pytest.raises(ValueError, match="Non-unique metadata detected"):
466483
ff.find_files()

0 commit comments

Comments
 (0)