Merge pull request #1225 from Sage-Bionetworks/develop-fix-api-test

linglp · web-flow · commit 9fb2ba6185b5 · 2023-06-14T16:26:27.000-04:00
fix: fixed tests in test_api.py
diff --git a/.github/workflows/api_test.yml b/.github/workflows/api_test.yml
@@ -85,5 +85,4 @@ jobs:
         if: ${{ false == inputs.perform_benchmarking }}
         run: >
           source .venv/bin/activate;
-          pytest -m "schematic_api and not rule_benchmark"
-          
+          pytest -m "schematic_api and not rule_benchmark"
diff --git a/tests/data/mock_manifests/example_biospecimen_test.csv b/tests/data/mock_manifests/example_biospecimen_test.csv
@@ -0,0 +1,2 @@
+Sample ID,Patient ID,Tissue Status,Component
+123,1,Healthy,Biospecimen
diff --git a/tests/test_api.py b/tests/test_api.py
@@ -1,15 +1,20 @@
 
-import pytest
-from schematic_api.api import create_app
 import configparser
 import json
+import logging
 import os
 import re
+import time
 from math import ceil
-import logging
 from time import perf_counter
-import pandas as pd # third party library import
-from schematic.schemas.generator import SchemaGenerator #Local application/library specific imports.
+
+import numpy as np
+import pandas as pd  # third party library import
+import pytest
+
+from schematic.schemas.generator import \
+    SchemaGenerator  # Local application/library specific imports.
+from schematic_api.api import create_app
 
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
@@ -32,6 +37,11 @@ def test_manifest_csv(helpers):
     test_manifest_path = helpers.get_data_path("mock_manifests/Valid_Test_Manifest.csv")
     yield test_manifest_path
 
+@pytest.fixture(scope="class")
+def test_manifest_submit(helpers):
+    test_manifest_path = helpers.get_data_path("mock_manifests/example_biospecimen_test.csv")
+    yield test_manifest_path   
+
 @pytest.fixture(scope="class")
 def test_invalid_manifest(helpers):
     test_invalid_manifest = helpers.get_data_frame("mock_manifests/Invalid_Test_Manifest.csv", preserve_raw_input=False)
@@ -656,104 +666,105 @@ def test_dataset_manifest_download(self, client, as_json, syn_token, new_manifes
 
         if as_json: 
             response_json = json.loads(response_dt)
-            assert response_json == [{'Component': 'BulkRNA-seqAssay', 'File Format': 'CSV/TSV', 'Filename': 'Sample_A', 'Genome Build': 'GRCm38', 'Genome FASTA': None, 'Sample ID': 2022, 'entityId': 'syn28278954'}]
+            assert response_json[0]["Component"] == "BulkRNA-seqAssay"
+            assert response_json[0]["File Format"] == "CSV/TSV"
+            assert response_json[0]["Sample ID"] == 2022
+            assert response_json[0]["entityId"] == "syn28278954"
         else:
             # return a file path
             response_path = response_dt.decode('utf-8')
 
             assert isinstance(response_path, str)
             assert response_path.endswith(".csv")
 
-    @pytest.mark.parametrize("json_str", [None, '[{ "Patient ID": 123, "Sex": "Female", "Year of Birth": "", "Diagnosis": "Healthy", "Component": "Patient", "Cancer Type": "Breast", "Family History": "Breast, Lung", }]'])
-    @pytest.mark.parametrize("use_schema_label", ['true','false'])
-    @pytest.mark.parametrize("manifest_record_type", ['table_and_file', 'file_only'])
-    def test_submit_manifest(self, client, syn_token, data_model_jsonld, json_str, test_manifest_csv, use_schema_label, manifest_record_type):
+    def test_submit_manifest_table_and_file_replace(self, client, syn_token, data_model_jsonld, test_manifest_submit):
+        """Test submitting a CSV manifest as both a table and a file; only the table is replaced.
+        """
         params = {
             "access_token": syn_token,
             "schema_url": data_model_jsonld,
-            "data_type": "Patient",
+            "data_type": "Biospecimen",
             "restrict_rules": False, 
-            "manifest_record_type": manifest_record_type,
-            "asset_view": "syn44259375",
-            "dataset_id": "syn44259313",
+            "manifest_record_type": "table_and_file",
+            "asset_view": "syn51514344",
+            "dataset_id": "syn51514345",
             "table_manipulation": 'replace',
-            "use_schema_label": use_schema_label
+            "use_schema_label": True
         }
 
-        if json_str:
-            params["json_str"] = json_str
-            response = client.post('http://localhost:3001/v1/model/submit', query_string = params, data={"file_name":''})
-            assert response.status_code == 200
-        else: 
-            headers = {
-            'Content-Type': "multipart/form-data",
-            'Accept': "application/json"
-            }
-            params["data_type"] = "MockComponent"
-
-            # test uploading a csv file
-            response_csv = client.post('http://localhost:3001/v1/model/submit', query_string=params, data={"file_name": (open(test_manifest_csv, 'rb'), "test.csv")}, headers=headers)
-            assert response_csv.status_code == 200
+        response_csv = client.post('http://localhost:3001/v1/model/submit', query_string=params, data={"file_name": (open(test_manifest_submit, 'rb'), "test.csv")})
+        assert response_csv.status_code == 200
 
-    @pytest.mark.parametrize("json_str", [None, '[{ "Patient ID": 123, "Sex": "Female", "Year of Birth": "", "Diagnosis": "Healthy", "Component": "Patient", "Cancer Type": "Breast", "Family History": "Breast, Lung", }]'])
-    @pytest.mark.parametrize("manifest_record_type", ['file_and_entities', 'table_file_and_entities'])
-    def test_submit_manifest_w_entities(self, client, syn_token, data_model_jsonld, json_str, test_manifest_csv, manifest_record_type):
+    def test_submit_manifest_file_only_replace(self, client, syn_token, data_model_jsonld, test_manifest_submit):
+        """Test submitting a CSV manifest as a file only.
+        """
         params = {
             "access_token": syn_token,
             "schema_url": data_model_jsonld,
-            "data_type": "Patient",
+            "data_type": "Biospecimen",
             "restrict_rules": False, 
-            "manifest_record_type": manifest_record_type,
-            "asset_view": "syn44259375",
-            "dataset_id": "syn44259313",
+            "manifest_record_type": "file_only",
+            "asset_view": "syn51514344",
+            "dataset_id": "syn51514345",
             "table_manipulation": 'replace',
             "use_schema_label": True
         }
+        response_csv = client.post('http://localhost:3001/v1/model/submit', query_string=params, data={"file_name": (open(test_manifest_submit, 'rb'), "test.csv")})
+        assert response_csv.status_code == 200 
+    
+    def test_submit_manifest_json_str_replace(self, client, syn_token, data_model_jsonld):
+        """Test submitting a manifest given as a JSON string, stored as a file only.
+        """
+        json_str = '[{"Sample ID": 123, "Patient ID": 1,"Tissue Status": "Healthy","Component": "Biospecimen"}]'
+        params = {
+            "access_token": syn_token,
+            "schema_url": data_model_jsonld,
+            "data_type": "Biospecimen",
+            "json_str": json_str,
+            "restrict_rules": False, 
+            "manifest_record_type": "file_only",
+            "asset_view": "syn51514344",
+            "dataset_id": "syn51514345",
+            "table_manipulation": 'replace',
+            "use_schema_label": True
+        }
+        params["json_str"] = json_str
+        response = client.post('http://localhost:3001/v1/model/submit', query_string = params, data={"file_name":''})
+        assert response.status_code == 200
 
-        if json_str:
-            params["json_str"] = json_str
-            response = client.post('http://localhost:3001/v1/model/submit', query_string = params, data={"file_name":''})
-            assert response.status_code == 200
-        else: 
-            headers = {
-            'Content-Type': "multipart/form-data",
-            'Accept': "application/json"
-            }
-            params["data_type"] = "MockComponent"
+    def test_submit_manifest_w_file_and_entities(self, client, syn_token, data_model_jsonld, test_manifest_submit):
+        params = {
+            "access_token": syn_token,
+            "schema_url": data_model_jsonld,
+            "data_type": "Biospecimen",
+            "restrict_rules": False, 
+            "manifest_record_type": "file_and_entities",
+            "asset_view": "syn51514501",
+            "dataset_id": "syn51514523",
+            "table_manipulation": 'replace',
+            "use_schema_label": True
+        }
 
-            # test uploading a csv file
-            response_csv = client.post('http://localhost:3001/v1/model/submit', query_string=params, data={"file_name": (open(test_manifest_csv, 'rb'), "test.csv")}, headers=headers)
-            assert response_csv.status_code == 200  
+        # test uploading a csv file
+        response_csv = client.post('http://localhost:3001/v1/model/submit', query_string=params, data={"file_name": (open(test_manifest_submit, 'rb'), "test.csv")})
+        assert response_csv.status_code == 200
 
-    
-    @pytest.mark.parametrize("json_str", [None, '[{ "Component": "MockRDB", "MockRDB_id": 5 }]'])
-    def test_submit_manifest_upsert(self, client, syn_token, data_model_jsonld, json_str, test_upsert_manifest_csv, ):
+    def test_submit_manifest_table_and_file_upsert(self, client, syn_token, data_model_jsonld, test_upsert_manifest_csv, ):
         params = {
             "access_token": syn_token,
             "schema_url": data_model_jsonld,
             "data_type": "MockRDB",
             "restrict_rules": False, 
-            "manifest_record_type": "table",
-            "asset_view": "syn44259375",
-            "dataset_id": "syn44259313",
+            "manifest_record_type": "table_and_file",
+            "asset_view": "syn51514557",
+            "dataset_id": "syn51514551",
             "table_manipulation": 'upsert',
-            "use_schema_label": False
+            "use_schema_label": False # have to set use_schema_label to false to ensure upsert feature works
         }
 
-        if json_str:
-            params["json_str"] = json_str
-            response = client.post('http://localhost:3001/v1/model/submit', query_string = params, data={"file_name":''})
-            assert response.status_code == 200
-        else: 
-            headers = {
-            'Content-Type': "multipart/form-data",
-            'Accept': "application/json"
-            }
-            params["data_type"] = "MockRDB"
-
-            # test uploading a csv file
-            response_csv = client.post('http://localhost:3001/v1/model/submit', query_string=params, data={"file_name": (open(test_upsert_manifest_csv, 'rb'), "test.csv")}, headers=headers)            
-            assert response_csv.status_code == 200     
+        # test uploading a csv file
+        response_csv = client.post('http://localhost:3001/v1/model/submit', query_string=params, data={"file_name": (open(test_upsert_manifest_csv, 'rb'), "test.csv")},)            
+        assert response_csv.status_code == 200     
 
 @pytest.mark.schematic_api
 class TestSchemaVisualization:

| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -0,0 +1,2 @@` |
|  | `1` | `+Sample ID,Patient ID,Tissue Status,Component` |
|  | `2` | `+123,1,Healthy,Biospecimen` |