Added test for zipfiles with hidden folders

ml-evs · ml-evs · commit 37bdc8491060 · 2020-10-13T15:51:38.000+01:00
diff --git a/pandas/tests/io/test_pickle.py b/pandas/tests/io/test_pickle.py
@@ -376,6 +376,60 @@ def test_read_infer(self, ext, get_random_path):
 
             tm.assert_frame_equal(df, df2)
 
+<<<<<<< Updated upstream
+    @pytest.mark.parametrize("cruft", ["__MACOSX", ".DS_STORE"])
+=======
+<<<<<<< Updated upstream
+=======
+    @pytest.mark.parametrize("cruft", ["__MACOSX/", ".DS_STORE"])
+>>>>>>> Stashed changes
+    def test_load_zip_with_hidden_folders(self, cruft, get_random_path):
+        """Test loading .zip files that have extraneous metadata in hidden folders. """
+        base = get_random_path
+        path1 = base + ".raw"
+        path2 = base + ".zip"
+        dummy = base + ".dummy"
+        compression = "zip"
+
+        with tm.ensure_clean(path1) as p1, tm.ensure_clean(
+            path2
+        ) as p2, tm.ensure_clean(dummy) as d:
+            df = tm.makeDataFrame()
+
+            # write to uncompressed file
+            df.to_pickle(p1, compression=None)
+
+            # compress dataframe normally
+            self.compress_file(p1, p2, compression=compression)
+
+<<<<<<< Updated upstream
+            # add dummy file `{cruft}/{dummy}` to add to the archive
+            with zipfile.ZipFile(p2, "a", compression=zipfile.ZIP_DEFLATED) as f:
+                f.write(d, f"{cruft}/{dummy}")
+
+            # check the file was definitely added to the archive
+            with zipfile.ZipFile(p2, "r") as f:
+                assert f"{cruft}/{dummy}" in f.namelist()
+=======
+            # add dummy file `{cruft}{dummy}` to the archive
+            with zipfile.ZipFile(p2, "a", compression=zipfile.ZIP_DEFLATED) as f:
+                f.write(d, f"{cruft}{dummy}")
+
+            # check the file was definitely added to the archive
+            with zipfile.ZipFile(p2, "r") as f:
+                assert f"{cruft}{dummy}" in f.namelist()
+>>>>>>> Stashed changes
+
+            # compressed file by inferred compression method,
+            # dummy file should have been ignored
+            df2 = pd.read_pickle(p2)
+
+            tm.assert_frame_equal(df, df2)
+
+<<<<<<< Updated upstream
+=======
+>>>>>>> Stashed changes
+>>>>>>> Stashed changes
 
 # ---------------------
 # test pickle compression