@@ -134,6 +134,19 @@ def test_diff_and_filter_exports(self, tmp_path):
134
134
"missing_sample_size" : [Nans .DELETED ] + [Nans .NOT_MISSING ] * 2 ,
135
135
})
136
136
137
+ csv2_deleted = pd .DataFrame (
138
+ np .empty (0 , dtype = [
139
+ ("geo_id" , str ),
140
+ ("val" , float ),
141
+ ("se" , float ),
142
+ ("sample_size" , float ),
143
+ ("missing_val" , int ),
144
+ ("missing_se" , int ),
145
+ ("missing_sample_size" , int )
146
+ ]),
147
+ index = []
148
+ )
149
+
137
150
arch_diff = ArchiveDiffer (cache_dir , export_dir )
138
151
139
152
# Test diff_exports
@@ -163,7 +176,10 @@ def test_diff_and_filter_exports(self, tmp_path):
163
176
164
177
# Check filesystem for actual files
165
178
assert set (listdir (export_dir )) == {
166
- "csv0.csv" , "csv1.csv" , "csv1.csv.diff" , "csv3.csv" , "csv4.csv" , "csv4.csv.diff" }
179
+ "csv0.csv" , "csv1.csv" , "csv1.csv.diff" ,
180
+ "csv3.csv" , "csv4.csv" , "csv4.csv.diff" ,
181
+ "csv2.csv"
182
+ }
167
183
assert_frame_equal (
168
184
pd .read_csv (join (export_dir , "csv1.csv.diff" ), dtype = CSV_DTYPES ),
169
185
csv1_diff )
@@ -180,8 +196,11 @@ def test_diff_and_filter_exports(self, tmp_path):
180
196
181
197
arch_diff .filter_exports (common_diffs )
182
198
183
- # Check exports directory just has incremental changes
184
- assert set (listdir (export_dir )) == {"csv1.csv" , "csv3.csv" , "csv4.csv" }
199
+ # Check exports directory just has incremental and deleted changes
200
+ assert set (listdir (export_dir )) == {"csv1.csv" , "csv2.csv" , "csv3.csv" , "csv4.csv" }
201
+ assert_frame_equal (
202
+ pd .read_csv (join (export_dir , "csv2.csv" ), dtype = CSV_DTYPES ),
203
+ csv2_deleted )
185
204
assert_frame_equal (
186
205
pd .read_csv (join (export_dir , "csv1.csv" ), dtype = CSV_DTYPES ),
187
206
csv1_diff )
@@ -308,7 +327,7 @@ def test_run(self, tmp_path, s3_client):
308
327
assert_frame_equal (pd .read_csv (body , dtype = CSV_DTYPES ), df )
309
328
310
329
# Check exports directory just has incremental and deleted changes
311
- assert set (listdir (export_dir )) == {"csv1.csv" , "csv3.csv" , "csv4.csv" }
330
+ assert set (listdir (export_dir )) == {"csv1.csv" , "csv2.csv" , "csv3.csv" , "csv4.csv" }
312
331
csv1_diff = pd .DataFrame ({
313
332
"geo_id" : ["3" , "2" , "4" ],
314
333
"val" : [np .nan , 2.1 , 4.0 ],
@@ -321,6 +340,21 @@ def test_run(self, tmp_path, s3_client):
321
340
assert_frame_equal (
322
341
pd .read_csv (join (export_dir , "csv1.csv" ), dtype = CSV_DTYPES ),
323
342
csv1_diff )
343
+ csv2_deleted = pd .DataFrame (
344
+ np .empty (0 , dtype = [
345
+ ("geo_id" , str ),
346
+ ("val" , float ),
347
+ ("se" , float ),
348
+ ("sample_size" , float ),
349
+ ("missing_val" , int ),
350
+ ("missing_se" , int ),
351
+ ("missing_sample_size" , int )
352
+ ]),
353
+ index = []
354
+ )
355
+ assert_frame_equal (
356
+ pd .read_csv (join (export_dir , "csv2.csv" ), dtype = CSV_DTYPES ),
357
+ csv2_deleted )
324
358
325
359
326
360
class TestGitArchiveDiffer :
@@ -521,7 +555,7 @@ def test_run(self, tmp_path):
521
555
original_branch .checkout ()
522
556
523
557
# Check exports directory just has incremental and deleted changes
524
- assert set (listdir (export_dir )) == {"csv1.csv" , "csv3.csv" , "csv4.csv" }
558
+ assert set (listdir (export_dir )) == {"csv1.csv" , "csv2.csv" , "csv3.csv" , "csv4.csv" }
525
559
csv1_diff = pd .DataFrame ({
526
560
"geo_id" : ["3" , "2" , "4" ],
527
561
"val" : [np .nan , 2.1 , 4.0 ],
@@ -534,6 +568,22 @@ def test_run(self, tmp_path):
534
568
assert_frame_equal (
535
569
pd .read_csv (join (export_dir , "csv1.csv" ), dtype = CSV_DTYPES ),
536
570
csv1_diff )
571
+ csv2_deleted = pd .DataFrame (
572
+ np .empty (0 , dtype = [
573
+ ("geo_id" , str ),
574
+ ("val" , float ),
575
+ ("se" , float ),
576
+ ("sample_size" , float ),
577
+ ("missing_val" , int ),
578
+ ("missing_se" , int ),
579
+ ("missing_sample_size" , int )
580
+ ]),
581
+ index = []
582
+ )
583
+ assert_frame_equal (
584
+ pd .read_csv (join (export_dir , "csv2.csv" ), dtype = CSV_DTYPES ),
585
+ csv2_deleted )
586
+
537
587
538
588
539
589
class TestFromParams :
0 commit comments