Skip to content

Commit 5bb5488

Browse files
authored
bugfix/index_chunks_not_updated (#216)
Allow generate_event_index_pipeline to overwrite existing index-chunks
1 parent 889e01a commit 5bb5488

File tree

3 files changed

+75
-8
lines changed

3 files changed

+75
-8
lines changed

cdp_backend/file_store/functions.py

+5-1
Original file line numberDiff line numberDiff line change
@@ -67,6 +67,7 @@ def upload_file(
6767
filepath: str,
6868
save_name: Optional[str] = None,
6969
remove_local: bool = False,
70+
overwrite: bool = False,
7071
) -> str:
7172
"""
7273
Uploads a file to a Google Cloud file store bucket.
@@ -88,6 +89,9 @@ def upload_file(
8889
The name to save the file as in the file store.
8990
remove_local: bool
9091
If True, remove the local file upon successful upload.
92+
overwrite: bool
93+
Boolean value indicating whether or not to overwrite the remote resource with
94+
the same name if it already exists.
9195
9296
Returns
9397
-------
@@ -107,7 +111,7 @@ def upload_file(
107111
uri = get_file_uri(bucket, save_name, credentials_file)
108112

109113
# Return existing uri and remove local copy if desired
110-
if uri:
114+
if uri and not overwrite:
111115
if remove_local:
112116
remove_local_file(resolved_filepath)
113117

cdp_backend/pipeline/generate_event_index_pipeline.py

+1
Original file line numberDiff line numberDiff line change
@@ -383,6 +383,7 @@ def chunk_index(
383383
bucket=bucket_name,
384384
filepath=str(local_chunk_path),
385385
save_name=f"{REMOTE_INDEX_CHUNK_DIR}/{save_filename}",
386+
overwrite=True,
386387
)
387388

388389

cdp_backend/tests/file_store/test_functions.py

+69-7
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717
BUCKET = "bucket"
1818
FILEPATH = "fake/path/" + FILENAME
1919
SAVE_NAME = "fakeSaveName"
20-
EXISTING_FILE_URI = "gs://bucket/existing_file.json"
20+
EXISTING_FILE_URI = "gs://bucket/" + SAVE_NAME
2121
GCS_FILE_URI = functions.GCS_URI.format(bucket=BUCKET, filename=FILENAME)
2222

2323
###############################################################################
@@ -56,19 +56,76 @@ def test_get_file_uri(
5656

5757

5858
@pytest.mark.parametrize(
59-
"bucket, filepath, save_name, remove_local, existing_file_uri, expected",
59+
"bucket, filepath, save_name, remove_local, overwrite, existing_file_uri, expected",
6060
[
61-
(BUCKET, FILEPATH, SAVE_NAME, True, EXISTING_FILE_URI, EXISTING_FILE_URI),
62-
(BUCKET, FILEPATH, SAVE_NAME, False, EXISTING_FILE_URI, EXISTING_FILE_URI),
63-
(BUCKET, FILEPATH, None, False, None, GCS_FILE_URI),
64-
(BUCKET, FILEPATH, None, True, None, GCS_FILE_URI),
61+
(
62+
BUCKET,
63+
FILEPATH,
64+
SAVE_NAME,
65+
True,
66+
True,
67+
EXISTING_FILE_URI,
68+
EXISTING_FILE_URI,
69+
),
70+
(
71+
BUCKET,
72+
FILEPATH,
73+
SAVE_NAME,
74+
True,
75+
True,
76+
None,
77+
EXISTING_FILE_URI,
78+
),
79+
(
80+
BUCKET,
81+
FILEPATH,
82+
SAVE_NAME,
83+
True,
84+
False,
85+
EXISTING_FILE_URI,
86+
EXISTING_FILE_URI,
87+
),
88+
(
89+
BUCKET,
90+
FILEPATH,
91+
SAVE_NAME,
92+
False,
93+
True,
94+
EXISTING_FILE_URI,
95+
EXISTING_FILE_URI,
96+
),
97+
(
98+
BUCKET,
99+
FILEPATH,
100+
SAVE_NAME,
101+
False,
102+
True,
103+
None,
104+
EXISTING_FILE_URI,
105+
),
106+
(
107+
BUCKET,
108+
FILEPATH,
109+
SAVE_NAME,
110+
False,
111+
False,
112+
EXISTING_FILE_URI,
113+
EXISTING_FILE_URI,
114+
),
115+
(BUCKET, FILEPATH, None, False, True, GCS_FILE_URI, GCS_FILE_URI),
116+
(BUCKET, FILEPATH, None, False, True, None, GCS_FILE_URI),
117+
(BUCKET, FILEPATH, None, False, False, None, GCS_FILE_URI),
118+
(BUCKET, FILEPATH, None, True, True, GCS_FILE_URI, GCS_FILE_URI),
119+
(BUCKET, FILEPATH, None, True, True, None, GCS_FILE_URI),
120+
(BUCKET, FILEPATH, None, True, False, None, GCS_FILE_URI),
65121
],
66122
)
67123
def test_upload_file(
68124
bucket: str,
69125
filepath: str,
70126
save_name: Optional[str],
71127
remove_local: bool,
128+
overwrite: bool,
72129
existing_file_uri: str,
73130
expected: str,
74131
) -> None:
@@ -82,7 +139,12 @@ def test_upload_file(
82139
mock_path.return_value.name = FILENAME
83140

84141
assert expected == functions.upload_file(
85-
"path/to/creds", bucket, filepath, save_name, remove_local
142+
"path/to/creds",
143+
bucket,
144+
filepath,
145+
save_name,
146+
remove_local,
147+
overwrite,
86148
)
87149

88150

0 commit comments

Comments
 (0)