@@ -32,7 +32,7 @@ def setUp(self):
3232 "language" : "en" ,
3333 "authority" : "FAO" ,
3434 "confidence" : 1 ,
35- "place" : "Rome" ,
35+ "place" : 0 ,
3636 }
3737 ],
3838 "dc.contributor.author" : [
@@ -41,7 +41,7 @@ def setUp(self):
4141 "language" : "en" ,
4242 "authority" : "FAO" ,
4343 "confidence" : 1 ,
44- "place" : "Rome" ,
44+ "place" : 0 ,
4545 }
4646 ],
4747 "dc.description.abstract" : [
@@ -50,7 +50,7 @@ def setUp(self):
5050 "language" : "en" ,
5151 "authority" : "FAO" ,
5252 "confidence" : 1 ,
53- "place" : "Rome" ,
53+ "place" : 0 ,
5454 }
5555 ],
5656 "dc.identifier.doi" : [
@@ -59,7 +59,7 @@ def setUp(self):
5959 "language" : "en" ,
6060 "authority" : "FAO" ,
6161 "confidence" : 1 ,
62- "place" : "Rome" ,
62+ "place" : 0 ,
6363 }
6464 ],
6565 "dc.date.available" : [
@@ -68,7 +68,7 @@ def setUp(self):
6868 "language" : "en" ,
6969 "authority" : "FAO" ,
7070 "confidence" : 1 ,
71- "place" : "Rome" ,
71+ "place" : 0 ,
7272 }
7373 ],
7474 "dc.date.lastModified" : [
@@ -77,7 +77,7 @@ def setUp(self):
7777 "language" : "en" ,
7878 "authority" : "FAO" ,
7979 "confidence" : 1 ,
80- "place" : "Rome" ,
80+ "place" : 0 ,
8181 }
8282 ],
8383 "fao.taxonomy.type" : [
@@ -86,7 +86,7 @@ def setUp(self):
8686 "language" : "en" ,
8787 "authority" : "FAO" ,
8888 "confidence" : 1 ,
89- "place" : "Rome" ,
89+ "place" : 0 ,
9090 }
9191 ],
9292 },
@@ -140,17 +140,22 @@ def test_run_success(self, mock_get_metadata, mock_get_bundle, mock_get_pdf):
140140 # Simulate a successful run with valid PDF and metadata
141141 mock_get_metadata .return_value = self .item
142142 mock_get_bundle .return_value = [self .bundle ]
143- mock_get_pdf .return_value = "PDF content extracted."
143+ mock_get_pdf .return_value = "PDF content extracted. Lorem ispum "
144144 result = self .collector .run ([self .doc ])
145145 self .assertEqual (len (result ), 1 )
146146 doc_result = result [0 ]
147147 self .assertIsNone (doc_result .error_info )
148148 self .assertIsInstance (doc_result .document , WeLearnDocument )
149- self .assertEqual (doc_result .document .full_content , "PDF content extracted." )
149+ self .assertEqual (
150+ doc_result .document .full_content , "PDF content extracted. Lorem ispum"
151+ )
150152 self .assertEqual (doc_result .document .title , "FAO Document Title" )
151153 self .assertEqual (doc_result .document .description , "A description." )
152154 self .assertEqual (doc_result .document .details ["doi" ], "10.1234/fao.5678" )
153- self .assertEqual (doc_result .document .details ["license_url" ], "cc-by-4.0" )
155+ self .assertEqual (
156+ doc_result .document .details ["license_url" ],
157+ "https://creativecommons.org/licenses/by/4.0/" ,
158+ )
154159 self .assertEqual (doc_result .document .details ["type" ], "Report" )
155160 self .assertTrue (
156161 doc_result .document .details ["contrent_from_pdf" ]
@@ -238,19 +243,6 @@ def test_run_embargo(self, mock_get_metadata, mock_get_bundle, mock_get_pdf):
238243 self .assertIn ("unauthorized state" , result [0 ].error_info )
239244 self .assertTrue (result [0 ].is_error )
240245
241- # @patch.object(FAOOpenKnowledgeCollector, "_get_pdf_content")
242- # @patch.object(FAOOpenKnowledgeCollector, "get_bundle_json")
243- # @patch.object(FAOOpenKnowledgeCollector, "get_metadata_json")
244- # def test_run_pydantic_validation_error(
245- # self, mock_get_metadata, mock_get_bundle, mock_get_pdf
246- # ):
247- # # Simulate pydantic validation error
248- # mock_get_metadata.side_effect = pydantic.ValidationError([], "error")
249- # result = self.collector.run([self.doc])
250- # self.assertEqual(len(result), 1)
251- # self.assertIn("validation error", result[0].error_info)
252- # self.assertTrue(result[0].is_error)
253-
254246 @patch .object (FAOOpenKnowledgeCollector , "_get_pdf_content" )
255247 @patch .object (FAOOpenKnowledgeCollector , "get_bundle_json" )
256248 @patch .object (FAOOpenKnowledgeCollector , "get_metadata_json" )
0 commit comments