deps: require pyarrow for pandas support #314

Merged (4 commits) on Oct 12, 2020
4 changes: 0 additions & 4 deletions docs/snippets.py
@@ -26,10 +26,6 @@

import pytest

-try:
-    import fastparquet
-except (ImportError, AttributeError):
-    fastparquet = None
try:
    import pandas
except (ImportError, AttributeError):
3 changes: 1 addition & 2 deletions google/cloud/bigquery/client.py
@@ -2152,8 +2152,7 @@ def load_table_from_dataframe(
        Raises:
            ImportError:
                If a usable parquet engine cannot be found. This method
-                requires :mod:`pyarrow` or :mod:`fastparquet` to be
-                installed.
+                requires :mod:`pyarrow` to be installed.
            TypeError:
                If ``job_config`` is not an instance of :class:`~google.cloud.bigquery.job.LoadJobConfig`
                class.
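For context, a minimal usage sketch of the call this docstring documents (project, dataset, and table IDs are placeholders, not from this PR):

# Minimal usage sketch with placeholder IDs; with pyarrow installed the
# DataFrame is serialized to parquet and loaded, otherwise ImportError is raised.
import pandas
from google.cloud import bigquery

client = bigquery.Client()  # assumes default credentials are configured
dataframe = pandas.DataFrame({"name": ["alice", "bob"], "score": [1.0, 2.5]})
job = client.load_table_from_dataframe(dataframe, "my-project.my_dataset.my_table")
job.result()  # block until the load job finishes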
5 changes: 1 addition & 4 deletions noxfile.py
@@ -49,10 +49,7 @@ def default(session):
        constraints_path,
    )

-    # fastparquet is not included in .[all] because, in general, it's
-    # redundant with pyarrow. We still want to run some unit tests with
-    # fastparquet serialization, though.
-    session.install("-e", ".[all,fastparquet]", "-c", constraints_path)
+    session.install("-e", ".[all]", "-c", constraints_path)

    session.install("ipython", "-c", constraints_path)

8 changes: 0 additions & 8 deletions setup.py
@@ -53,7 +53,6 @@
"pyarrow >= 1.0.0, < 2.0dev",
],
"tqdm": ["tqdm >= 4.7.4, <5.0.0dev"],
"fastparquet": ["fastparquet", "python-snappy", "llvmlite>=0.34.0"],
Contributor:
I'd like to see us add "pyarrow" to the "pandas" extras now, since it's needed for both uploads and downloads to DataFrames.

We could also refactor the "pyarrow >= 1.0.0, < 2.0dev" pin into a variable, since it will now appear three times in setup.py.
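A sketch of what that suggestion could look like in setup.py (hypothetical; only the pyarrow pin comes from this PR, the other entries are illustrative):

# Hypothetical setup.py fragment sketching the suggestion above; only the
# pyarrow pin is taken from this PR, the surrounding entries are illustrative.
pyarrow_dep = "pyarrow >= 1.0.0, < 2.0dev"

extras = {
    "bqstorage": [pyarrow_dep],  # plus the BigQuery Storage client pin
    "pandas": ["pandas >= 0.23.0", pyarrow_dep],  # needed for uploads and downloads
    "tqdm": ["tqdm >= 4.7.4, <5.0.0dev"],
}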

"opentelemetry": [
"opentelemetry-api==0.9b0",
"opentelemetry-sdk==0.9b0",
@@ -64,13 +63,6 @@
all_extras = []

for extra in extras:
-    if extra in (
-        # Skip fastparquet from "all" because it is redundant with pyarrow and
-        # creates a dependency on pre-release versions of numpy. See:
-        # https://github.com/googleapis/google-cloud-python/issues/8549
-        "fastparquet",
-    ):
-        continue
    all_extras.extend(extras[extra])

extras["all"] = all_extras
1 change: 0 additions & 1 deletion testing/constraints-3.6.txt
@@ -1,4 +1,3 @@
-fastparquet==0.4.1
google-api-core==1.22.2
google-cloud-bigquery-storage==2.0.0
google-cloud-core==1.4.1
7 changes: 0 additions & 7 deletions tests/unit/test_client.py
@@ -32,10 +32,6 @@
import pytz
import pkg_resources

-try:
-    import fastparquet
-except (ImportError, AttributeError):  # pragma: NO COVER
-    fastparquet = None
try:
    import pandas
except (ImportError, AttributeError):  # pragma: NO COVER
@@ -7839,7 +7835,6 @@ def test_load_table_from_dataframe_unknown_table(self):
        )

    @unittest.skipIf(pandas is None, "Requires `pandas`")
-    @unittest.skipIf(fastparquet is None, "Requires `fastparquet`")
    def test_load_table_from_dataframe_no_pyarrow_warning(self):
Contributor:

I'm a bit surprised to see this test passing. I guess we still have some code that falls back to the default pandas parquet serialization?

Can you look into whether we can remove that code path?

Related: We should be able to simplify this docstring now:

    parquet_compression (Optional[str]):
        [Beta] The compression method to use if intermittently
        serializing ``dataframe`` to a parquet file.

        If ``pyarrow`` and job config schema are used, the argument
        is directly passed as the ``compression`` argument to the
        underlying ``pyarrow.parquet.write_table()`` method (the
        default value "snappy" gets converted to uppercase).
        https://arrow.apache.org/docs/python/generated/pyarrow.parquet.write_table.html#pyarrow-parquet-write-table

        If either ``pyarrow`` or job config schema are missing, the
        argument is directly passed as the ``compression`` argument
        to the underlying ``DataFrame.to_parquet()`` method.
        https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.to_parquet.html#pandas.DataFrame.to_parquet
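With pyarrow a hard requirement, the ``DataFrame.to_parquet()`` fallback branch (and the second half of that docstring) should be removable. A minimal sketch of the remaining pyarrow-only path, assuming a hypothetical helper name and signature:

# Hypothetical pyarrow-only serialization helper; name and signature are
# assumptions, not the library's actual code.
import pyarrow
import pyarrow.parquet

def dataframe_to_parquet(dataframe, filepath, parquet_compression="SNAPPY"):
    """Serialize a pandas DataFrame to parquet via pyarrow, with no pandas fallback."""
    arrow_table = pyarrow.Table.from_pandas(dataframe)
    pyarrow.parquet.write_table(arrow_table, filepath, compression=parquet_compression)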

        from google.cloud.bigquery.client import PyarrowMissingWarning

@@ -7875,7 +7870,6 @@ def test_load_table_from_dataframe_no_pyarrow_warning(self):
        assert matches, "A missing pyarrow deprecation warning was not raised."

    @unittest.skipIf(pandas is None, "Requires `pandas`")
-    @unittest.skipIf(fastparquet is None, "Requires `fastparquet`")
    def test_load_table_from_dataframe_no_schema_warning_wo_pyarrow(self):
        client = self._make_client()

@@ -8182,7 +8176,6 @@ def test_load_table_from_dataframe_w_partial_schema_extra_types(self):
assert "unknown_col" in message

@unittest.skipIf(pandas is None, "Requires `pandas`")
@unittest.skipIf(fastparquet is None, "Requires `fastparquet`")
def test_load_table_from_dataframe_w_partial_schema_missing_types(self):
from google.cloud.bigquery.client import _DEFAULT_NUM_RETRIES
from google.cloud.bigquery import job