Sage-Bionetworks · GiaJordan · Dec 3, 2024 · Nov 23, 2024 · Nov 23, 2024 · Nov 23, 2024
diff --git a/schematic/store/synapse.py b/schematic/store/synapse.py
@@ -705,7 +705,10 @@ def getFilesInStorageDataset(
             ValueError: Dataset ID not found.
         """
         file_list = []
-
+        # HACK: force a requery of the fileview before reading it, since SynapseStorage otherwise
+        # uses the last queried state of the fileview, which may not contain newly added files or folders.
+        # This is a workaround for fileviews not always containing the latest information.
+        self.query_fileview(force_requery=True)
         # Get path to dataset folder by using childern to avoid cases where the dataset is the scope of the view
         child_path = self.storageFileviewTable.loc[
             self.storageFileviewTable["parentId"] == datasetId, "path"

diff --git a/tests/test_store.py b/tests/test_store.py
@@ -11,7 +11,7 @@
 import uuid
 from contextlib import nullcontext as does_not_raise
 from typing import Any, Callable, Generator
-from unittest.mock import AsyncMock, patch
+from unittest.mock import AsyncMock, MagicMock, patch
 
 import pandas as pd
 import pytest
@@ -464,49 +464,45 @@ def test_getDatasetProject(self, dataset_id, synapse_store):
             (
                 True,
                 [
-                    ("syn126", "schematic - main/parent_folder/test_file"),
+                    ("syn126", "syn_mock", "schematic - main/parent_folder/test_file"),
                     (
                         "syn125",
+                        "syn_mock",
                         "schematic - main/parent_folder/test_folder/test_file_2",
                     ),
                 ],
             ),
-            (False, [("syn126", "test_file"), ("syn125", "test_file_2")]),
+            (
+                False,
+                [
+                    ("syn126", "syn_mock", "test_file"),
+                    ("syn125", "syn_mock", "test_file_2"),
+                ],
+            ),
         ],
     )
     def test_getFilesInStorageDataset(self, synapse_store, full_path, expected):
-        mock_table_dataFrame_initial = pd.DataFrame(
-            {
-                "id": ["syn_mock"],
-                "path": ["schematic - main/parent_folder"],
-            }
-        )
-
-        mock_table_dataFrame_return = pd.DataFrame(
+        mock_table_dataframe_return = pd.DataFrame(
             {
                 "id": ["syn126", "syn125"],
+                "parentId": ["syn_mock", "syn_mock"],
                 "path": [
                     "schematic - main/parent_folder/test_file",
                     "schematic - main/parent_folder/test_folder/test_file_2",
                 ],
             }
         )
-        mock_table_return = build_table(
-            "Mock Table", "syn123", mock_table_dataFrame_return
-        )
 
-        with patch.object(synapse_store, "syn") as mocked_synapse_client:
-            with patch.object(
-                synapse_store, "storageFileviewTable"
-            ) as mocked_fileview_table:
-                mocked_fileview_table.storageFileviewTable.return_value = (
-                    mock_table_dataFrame_initial
-                )
-                mocked_synapse_client.tableQuery.return_value = mock_table_return
-                file_list = synapse_store.getFilesInStorageDataset(
-                    datasetId="syn_mock", fileNames=None, fullpath=full_path
-                )
-        assert file_list == expected
+        with patch.object(
+            synapse_store, "storageFileviewTable", mock_table_dataframe_return
+        ), patch.object(synapse_store, "query_fileview") as mocked_query:
+            # query_fileview is what getFilesInStorageDataset calls to refresh the fileview, so it is mocked here
+            mocked_query.return_value = mock_table_dataframe_return
+
+            file_list = synapse_store.getFilesInStorageDataset(
+                datasetId="syn_mock", fileNames=None, fullpath=full_path
+            )
+            assert file_list == expected
 
     @pytest.mark.parametrize(
         "full_path",
@@ -516,27 +512,25 @@ def test_getFilesInStorageDataset(self, synapse_store, full_path, expected):
         ],
     )
     def test_get_files_in_storage_dataset_exception(self, synapse_store, full_path):
-        mock_table_dataFrame_initial = pd.DataFrame(
+        mock_table_dataframe_return = pd.DataFrame(
             {
                 "id": ["child_syn_mock"],
                 "path": ["schematic - main/parent_folder/child_entity"],
                 "parentId": ["wrong_syn_mock"],
             }
         )
+        with patch.object(
+            synapse_store, "storageFileviewTable", mock_table_dataframe_return
+        ), patch.object(synapse_store, "query_fileview") as mocked_query:
+            # query_fileview is what getFilesInStorageDataset calls to refresh the fileview, so it is mocked here
+            mocked_query.return_value = mock_table_dataframe_return
 
-        with patch.object(synapse_store, "syn") as mocked_synapse_client:
-            with patch.object(
-                synapse_store, "storageFileviewTable"
-            ) as mocked_fileview_table:
-                mocked_fileview_table.storageFileviewTable.return_value = (
-                    mock_table_dataFrame_initial
+            with pytest.raises(
+                LookupError, match="Dataset syn_mock could not be found"
+            ):
+                synapse_store.getFilesInStorageDataset(
+                    datasetId="syn_mock", fileNames=None, fullpath=full_path
                 )
-                with pytest.raises(
-                    LookupError, match="Dataset syn_mock could not be found"
-                ):
-                    file_list = synapse_store.getFilesInStorageDataset(
-                        datasetId="syn_mock", fileNames=None, fullpath=full_path
-                    )
 
     @pytest.mark.parametrize("downloadFile", [True, False])
     def test_getDatasetManifest(self, synapse_store, downloadFile):