@@ -51,3 +51,47 @@ def sample_dataframe_parsed() -> pd.DataFrame:
5151 df ["parent_types" ] = df ["parent_types" ].apply (ast .literal_eval )
5252
5353 return df
54+
55+
@pytest.fixture
def sample_dataframe_match() -> pd.DataFrame:
    """Return the sample input DataFrame for batch processing with a matcher.

    The data is read from ``fixtures/sample_data_match.csv``, resolved
    relative to the directory that contains this file, using pandas'
    default CSV parsing options.
    """
    fixtures_dir = pathlib.Path(__file__).parent / "fixtures"
    csv_path = fixtures_dir / "sample_data_match.csv"
    return pd.read_csv(csv_path)
62+
63+
@pytest.fixture
def sample_dataframe_match_parsed() -> pd.DataFrame:
    """Return the expected parsed output for ``sample_dataframe_match``.

    The data is read from ``fixtures/sample_data_match_parsed.csv``, resolved
    relative to the directory that contains this file. Four columns are
    stored in the CSV as string representations of Python literals and are
    converted back with ``ast.literal_eval`` before the frame is returned.
    """
    csv_path = (
        pathlib.Path(__file__).parent / "fixtures" / "sample_data_match_parsed.csv"
    )
    parsed = pd.read_csv(csv_path)

    # CSV round-trips lists as their string repr; rebuild the real objects.
    literal_columns = (
        "parents",
        "parent_types",
        "matched_headings",
        "missing_headings",
    )
    for column in literal_columns:
        parsed[column] = parsed[column].apply(ast.literal_eval)

    return parsed
77+
78+
@pytest.fixture
def expected_json_files() -> dict[str, dict]:
    """Return the expected JSON outputs for the batch processing tests.

    Every ``*.json`` file directly inside ``fixtures/expected_json`` (resolved
    relative to the directory that contains this file) is parsed with
    ``json.load``.

    Returns:
        A mapping from file name (e.g. ``"doc.json"``) to the parsed JSON
        content, with entries inserted in sorted path order. The mapping is
        empty when no matching files are found.
    """
    json_dir = pathlib.Path(__file__).parent / "fixtures" / "expected_json"
    result = {}
    for json_file in sorted(json_dir.glob("*.json")):
        # Decode explicitly as UTF-8: without an encoding argument the file is
        # decoded with the platform's locale encoding, so non-ASCII content
        # would be read differently (or fail) depending on the machine.
        with json_file.open(encoding="utf-8") as f:
            result[json_file.name] = json.load(f)
    return result
88+
89+
@pytest.fixture
def expected_tree_files() -> dict[str, str]:
    """Return the expected tree outputs for the batch processing tests.

    Every ``*.txt`` file directly inside ``fixtures/expected_tree`` (resolved
    relative to the directory that contains this file) is read as text.

    Returns:
        A mapping from file name (e.g. ``"doc.txt"``) to the file's full text,
        with entries inserted in sorted path order. The mapping is empty when
        no matching files are found.
    """
    tree_dir = pathlib.Path(__file__).parent / "fixtures" / "expected_tree"
    result = {}
    for tree_file in sorted(tree_dir.glob("*.txt")):
        # Decode explicitly as UTF-8 rather than the platform's locale
        # encoding, so any non-ASCII characters in the expected output
        # (tree renderings may use box-drawing glyphs) compare identically
        # on every machine.
        result[tree_file.name] = tree_file.read_text(encoding="utf-8")
    return result
0 commit comments