Add test for bz2; mypy ignore non-typesafe use of kwargs

jessefarnham · jessefarnham · commit 0028df79e94c · 2020-04-08T12:55:03.000-04:00
diff --git a/pandas/io/common.py b/pandas/io/common.py
@@ -403,16 +403,20 @@ def get_handle(
         # GZ Compression
         if compression == "gzip":
             if is_path:
-                f = gzip.open(path_or_buf, mode, **compression_args)
+                f = gzip.open(
+                    path_or_buf, mode, **compression_args)  # type: ignore
             else:
-                f = gzip.GzipFile(fileobj=path_or_buf, **compression_args)
+                f = gzip.GzipFile(
+                    fileobj=path_or_buf, **compression_args)  # type: ignore
 
         # BZ Compression
         elif compression == "bz2":
             if is_path:
-                f = bz2.BZ2File(path_or_buf, mode, **compression_args)
+                f = bz2.BZ2File(
+                    path_or_buf, mode, **compression_args)  # type: ignore
             else:
-                f = bz2.BZ2File(path_or_buf, **compression_args)
+                f = bz2.BZ2File(
+                    path_or_buf, **compression_args)  # type: ignore
 
         # ZIP Compression
         elif compression == "zip":
diff --git a/pandas/tests/io/test_compression.py b/pandas/tests/io/test_compression.py
@@ -156,13 +156,33 @@ def test_with_missing_lzma_runtime():
     ],
 )
 @pytest.mark.parametrize("method", ["to_pickle", "to_json", "to_csv"])
-def test_gzip_compression_level_path(obj, method):
-    """GH#33398 Ideally this test should be repeated for bz2 as well,
-    but that is not practical because a file size of >100k is needed to see any
-    size difference between bz2 compression settings."""
+def test_gzip_compression_level(obj, method):
+    # GH33196
     with tm.ensure_clean() as path:
         getattr(obj, method)(path, compression="gzip")
         compressed_size_default = os.path.getsize(path)
-        getattr(obj, method)(path, compression={"method": "gzip", "compresslevel": 1})
+        getattr(obj, method)(
+            path, compression={ "method": "gzip", "compresslevel": 1})
         compressed_size_fast = os.path.getsize(path)
         assert compressed_size_default < compressed_size_fast
+
+
+@pytest.mark.parametrize(
+    "obj",
+    [
+        pd.DataFrame(
+            100 * [[0.123456, 0.234567, 0.567567], [12.32112, 123123.2, 321321.2]],
+            columns=["X", "Y", "Z"],
+        ),
+        pd.Series(100 * [0.123456, 0.234567, 0.567567], name="X"),
+    ],
+)
+@pytest.mark.parametrize("method", ["to_pickle", "to_json", "to_csv"])
+def test_bzip_compression_level(obj, method):
+    """GH33196: bz2 needs a file size > 100k to show a size difference between
+    compression levels, so here we only check that the call succeeds when
+    compression is passed as a dict.
+    """
+    with tm.ensure_clean() as path:
+        getattr(obj, method)(
+            path, compression={ "method": "bz2", "compresslevel": 1})