@@ -20,20 +20,19 @@ def test_format_prompt_truncates_long_task():
2020 prompt = _format_prompt (long_task , "output" )
2121 assert len (long_task ) > 3000
2222 assert "..." in prompt
23- # Should be truncated to 3000 + "..."
24- task_section = prompt .split ("Task: " )[1 ].split ("\n \n " )[0 ]
23+ task_section = prompt .split ("<task>\n " , 1 )[1 ].split ("\n </task>" , 1 )[0 ]
2524 assert len (task_section ) == 3003 # 3000 + "..."
2625
2726
2827def test_format_prompt_empty_task ():
2928 prompt = _format_prompt ("" , "some output" )
30- assert "Task: \n " in prompt
29+ assert "<task> \n \n </task> " in prompt
3130 assert "some output" in prompt
3231
3332
34- def test_system_prompt_has_json_format ():
33+ def test_system_prompt_has_relevant_lines_format ():
3534 assert "relevant_lines" in SYSTEM_PROMPT
36- assert "JSON " in SYSTEM_PROMPT
35+ assert "<relevant_lines> " in SYSTEM_PROMPT
3736
3837
3938def test_load_config_returns_dict ():
@@ -53,8 +52,9 @@ def test_assign_split(self):
5352 from squeez .data .sample_assembler import _assign_split
5453
5554 assert _assign_split ("django__django" ) == "train"
56- assert _assign_split ("pydata__xarray" ) == "eval"
57- assert _assign_split ("pallets__flask" ) == "eval"
55+ assert _assign_split ("pydata__xarray" ) == "test"
56+ assert _assign_split ("pallets__flask" ) == "test"
57+ assert _assign_split ("psf__requests" ) == "dev"
5858 assert _assign_split ("scikit-learn__scikit-learn" ) == "train"
5959
6060 def test_format_prompt (self ):
0 commit comments