@@ -135,16 +135,6 @@ def test_diff_and_filter_exports(self, tmp_path):
135
135
"missing_sample_size" : [Nans .DELETED ] + [Nans .NOT_MISSING ] * 2 ,
136
136
})
137
137
138
- csv2_deleted = pd .DataFrame ({
139
- "geo_id" : ["1" ],
140
- "val" : [np .nan ],
141
- "se" : [np .nan ],
142
- "sample_size" : [np .nan ],
143
- "missing_val" : [Nans .DELETED ],
144
- "missing_se" : [Nans .DELETED ],
145
- "missing_sample_size" : [Nans .DELETED ],
146
- })
147
-
148
138
arch_diff = ArchiveDiffer (cache_dir , export_dir )
149
139
150
140
# Test diff_exports
@@ -164,7 +154,7 @@ def test_diff_and_filter_exports(self, tmp_path):
164
154
deleted_files , common_diffs , new_files = arch_diff .diff_exports ()
165
155
166
156
# Check return values
167
- assert set (deleted_files ) == {join (export_dir , "csv2.csv" )}
157
+ assert set (deleted_files ) == {join (cache_dir , "csv2.csv" )}
168
158
assert set (common_diffs .keys ()) == {
169
159
join (export_dir , f ) for f in ["csv0.csv" , "csv1.csv" , "csv4.csv" ]}
170
160
assert set (new_files ) == {join (export_dir , "csv3.csv" )}
@@ -175,8 +165,7 @@ def test_diff_and_filter_exports(self, tmp_path):
175
165
# Check filesystem for actual files
176
166
assert set (listdir (export_dir )) == {
177
167
"csv0.csv" , "csv1.csv" , "csv1.csv.diff" ,
178
- "csv3.csv" , "csv4.csv" , "csv4.csv.diff" ,
179
- "csv2.csv"
168
+ "csv3.csv" , "csv4.csv" , "csv4.csv.diff"
180
169
}
181
170
assert_frame_equal (
182
171
pd .read_csv (join (export_dir , "csv1.csv.diff" ), dtype = CSV_DTYPES ),
@@ -194,11 +183,8 @@ def test_diff_and_filter_exports(self, tmp_path):
194
183
195
184
arch_diff .filter_exports (common_diffs )
196
185
197
- # Check exports directory just has incremental and deleted changes
198
- assert set (listdir (export_dir )) == {"csv1.csv" , "csv2.csv" , "csv3.csv" , "csv4.csv" }
199
- assert_frame_equal (
200
- pd .read_csv (join (export_dir , "csv2.csv" ), dtype = CSV_DTYPES ),
201
- csv2_deleted )
186
+ # Check exports directory just has incremental changes
187
+ assert set (listdir (export_dir )) == {"csv1.csv" , "csv3.csv" , "csv4.csv" }
202
188
assert_frame_equal (
203
189
pd .read_csv (join (export_dir , "csv1.csv" ), dtype = CSV_DTYPES ),
204
190
csv1_diff )
@@ -325,7 +311,7 @@ def test_run(self, tmp_path, s3_client):
325
311
assert_frame_equal (pd .read_csv (body , dtype = CSV_DTYPES ), df )
326
312
327
313
# Check exports directory just has incremental changes
328
- assert set (listdir (export_dir )) == {"csv1.csv" , "csv2.csv" , " csv3.csv" , "csv4.csv" }
314
+ assert set (listdir (export_dir )) == {"csv1.csv" , "csv3.csv" , "csv4.csv" }
329
315
csv1_diff = pd .DataFrame ({
330
316
"geo_id" : ["3" , "2" , "4" ],
331
317
"val" : [np .nan , 2.1 , 4.0 ],
@@ -338,18 +324,6 @@ def test_run(self, tmp_path, s3_client):
338
324
assert_frame_equal (
339
325
pd .read_csv (join (export_dir , "csv1.csv" ), dtype = CSV_DTYPES ),
340
326
csv1_diff )
341
- csv2_deleted = pd .DataFrame ({
342
- "geo_id" : ["1" ],
343
- "val" : [np .nan ],
344
- "se" : [np .nan ],
345
- "sample_size" : [np .nan ],
346
- "missing_val" : [Nans .DELETED ],
347
- "missing_se" : [Nans .DELETED ],
348
- "missing_sample_size" : [Nans .DELETED ],
349
- })
350
- assert_frame_equal (
351
- pd .read_csv (join (export_dir , "csv2.csv" ), dtype = CSV_DTYPES ),
352
- csv2_deleted )
353
327
354
328
355
329
class TestGitArchiveDiffer :
@@ -550,7 +524,7 @@ def test_run(self, tmp_path):
550
524
original_branch .checkout ()
551
525
552
526
# Check exports directory just has incremental changes
553
- assert set (listdir (export_dir )) == {"csv1.csv" , "csv2.csv" , " csv3.csv" , "csv4.csv" }
527
+ assert set (listdir (export_dir )) == {"csv1.csv" , "csv3.csv" , "csv4.csv" }
554
528
csv1_diff = pd .DataFrame ({
555
529
"geo_id" : ["3" , "2" , "4" ],
556
530
"val" : [np .nan , 2.1 , 4.0 ],
@@ -563,19 +537,6 @@ def test_run(self, tmp_path):
563
537
assert_frame_equal (
564
538
pd .read_csv (join (export_dir , "csv1.csv" ), dtype = CSV_DTYPES ),
565
539
csv1_diff )
566
- csv2_deleted = pd .DataFrame ({
567
- "geo_id" : ["1" ],
568
- "val" : [np .nan ],
569
- "se" : [np .nan ],
570
- "sample_size" : [np .nan ],
571
- "missing_val" : [Nans .DELETED ],
572
- "missing_se" : [Nans .DELETED ],
573
- "missing_sample_size" : [Nans .DELETED ],
574
- })
575
- assert_frame_equal (
576
- pd .read_csv (join (export_dir , "csv2.csv" ), dtype = CSV_DTYPES ),
577
- csv2_deleted )
578
-
579
540
580
541
581
542
class TestFromParams :
0 commit comments