@@ -137,18 +137,45 @@ async def test_prepare_non_compressed_dataset_with_path(httpserver):
137
137
138
138
139
139
@pytest.mark.asyncio
async def test_prepare_non_compressed_dataset_no_path_with_overwrite(httpserver):
    """Download a plain CSV without an explicit path, then again with overwrite.

    The first ``prepare_dataset`` call is made without ``overwrite`` and must
    create ``./test.csv``. The second call targets the same URL with
    ``overwrite=True`` and must leave a 540-byte file in place.
    """
    url = "/test.csv"
    expected_path = Path("./test.csv")

    # Clean up any previous test run so the first (non-overwriting) download
    # starts from a state where the target file does not exist.
    try:
        expected_path.unlink()
    except FileNotFoundError:
        pass

    try:
        # First download: no path argument and no overwrite.
        with open("tests/test.csv", "rb") as expected_data:
            httpserver.expect_request(url).respond_with_data(expected_data)
            await skillsnetwork.prepare_dataset(httpserver.url_for(url))
        assert expected_path.exists()
        httpserver.clear()

        # Second download: same URL, file already present, overwrite requested.
        with open("tests/test.csv", "rb") as expected_data:
            httpserver.expect_request(url).respond_with_data(expected_data)
            await skillsnetwork.prepare_dataset(
                httpserver.url_for(url), overwrite=True
            )
        assert expected_path.exists()
        assert expected_path.stat().st_size == 540
    finally:
        # Always remove the downloaded file, even when an assertion fails.
        # The existence guard keeps cleanup from masking the original error
        # if the download never produced the file.
        if expected_path.exists():
            expected_path.unlink()
154
+
155
+
156
@pytest.mark.asyncio
async def test_prepare_dataset_tar_no_path_with_overwrite(httpserver):
    """Download a tar.gz archive without an explicit path, then with overwrite.

    After each ``prepare_dataset`` call the ``test`` directory must exist and
    contain ``1.txt`` with the expected text. The second call passes
    ``overwrite=True`` while the directory from the first call is still
    present.
    """
    url = "/test.tar.gz"
    expected_directory = Path("test")

    # Clean up any previous test run; a missing directory is the normal case.
    try:
        shutil.rmtree(expected_directory)
    except FileNotFoundError:
        pass

    try:
        # First download: no path argument and no overwrite.
        with open("tests/test.tar.gz", "rb") as expected_data:
            httpserver.expect_request(url).respond_with_data(expected_data)
            await skillsnetwork.prepare_dataset(httpserver.url_for(url))

        assert expected_directory.is_dir()
        with open(expected_directory / "1.txt") as f:
            assert "I am the first test file" in f.read()
        httpserver.clear()

        # Second download: same URL, directory already present, overwrite on.
        with open("tests/test.tar.gz", "rb") as expected_data:
            httpserver.expect_request(url).respond_with_data(expected_data)
            await skillsnetwork.prepare_dataset(
                httpserver.url_for(url), overwrite=True
            )

        assert expected_directory.is_dir()
        with open(expected_directory / "1.txt") as f:
            assert "I am the first test file" in f.read()
    finally:
        # The extracted output is a directory, so Path.unlink() would raise;
        # remove the whole tree instead. ignore_errors keeps cleanup from
        # masking an earlier failure when the directory was never created.
        shutil.rmtree(expected_directory, ignore_errors=True)
0 commit comments