Skip to content

Commit 8f33085

Browse files
authored
FileContainer: add search_single (#158)
* `FileContainer`: add `search_single` * changelog
1 parent 98a94e8 commit 8f33085

File tree

3 files changed

+56
-1
lines changed

3 files changed

+56
-1
lines changed

CHANGELOG.md

+1
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@
33
## v1.0.2 - unreleased
44

55
- Restore behavior of `FileContainer.search(key=None)` - passing `None` to `search` is ignored again [#143](https://github.com/mpytools/filefisher/issues/143).
6+
- Added `FileContainer.search_single` to search for _exacly_ one path in a `FileContainer` ([#158](https://github.com/mpytools/filefisher/pull/158)).
67

78
## v1.0.1 - 16.01.205
89
This version patches a bug from v1.0.0. that broke `FileContainer.concat()`.

filefisher/_filefinder.py

+38-1
Original file line numberDiff line numberDiff line change
@@ -675,14 +675,18 @@ def _combine_by_keys(self, keys=None, sep="."):
675675

676676
return self.df[list(keys)].apply(lambda x: sep.join(x.map(str)), axis=1)
677677

678-
def search(self, **query):
678+
def search(self, **query) -> "FileContainer":
679679
"""subset paths given a search query
680680
681681
Parameters
682682
----------
683683
**query : Mapping[str, str | int | list[str | int]]
684684
Search query.
685685
686+
Returns
687+
-------
688+
search_result : FileContainer
689+
686690
Notes
687691
-----
688692
- individual conditions are combined with "and", e.g., ``model="a", exp="b"``
@@ -695,6 +699,39 @@ def search(self, **query):
695699
df = self._get_subset(**query)
696700
return type(self)(df)
697701

702+
def search_single(self, **query) -> "FileContainer":
703+
"""find exactly one path given a search query - raises an error otherwise
704+
705+
Parameters
706+
----------
707+
**query : Mapping[str, str | int | list[str | int]]
708+
Search query.
709+
710+
Returns
711+
-------
712+
search_result : FileContainer
713+
714+
See also
715+
--------
716+
FileContainer.search
717+
"""
718+
719+
fc = self.search(**query)
720+
721+
if len(fc) == 0:
722+
msg = "Found no paths"
723+
raise ValueError(msg)
724+
725+
if len(fc) > 1:
726+
n_found = len(fc)
727+
msg = (
728+
f"Found more than one ({n_found}) paths. Please adjust your"
729+
f" query.\nFirst five paths:\n{fc.df.head()}"
730+
)
731+
raise ValueError(msg)
732+
733+
return fc
734+
698735
def concat(self, other, drop_duplicates=True):
699736
"""concatenate two FileContainers
700737

filefisher/tests/test_filecontainer.py

+17
Original file line numberDiff line numberDiff line change
@@ -170,6 +170,23 @@ def test_filecontainer_search_none_key(example_df, example_fc):
170170
pd.testing.assert_frame_equal(result.df, expected)
171171

172172

173+
def test_filecontainer_search_single(example_df, example_fc):
174+
175+
# empty search query results in an empty FileContainer
176+
with pytest.raises(ValueError, match="Found no paths"):
177+
example_fc.search_single()
178+
179+
with pytest.raises(ValueError, match="Found more than one \(5\) paths"):
180+
example_fc.search_single(model=None)
181+
182+
with pytest.raises(ValueError, match="Found more than one \(2\) paths"):
183+
example_fc.search_single(model="a")
184+
185+
result = example_fc.search_single(model="a", scen="h")
186+
expected = example_df.iloc[[1]]
187+
pd.testing.assert_frame_equal(result.df, expected)
188+
189+
173190
def test_filecontainer_concat(example_fc):
174191

175192
with pytest.raises(ValueError, match="Can only concatenate two FileContainers."):

0 commit comments

Comments
 (0)