8 changes: 6 additions & 2 deletions dask_bigquery/core.py
@@ -2,6 +2,7 @@

from contextlib import contextmanager
from functools import partial
from typing import List
Contributor:

Nitpick: I'm by no means a type annotation expert, but from reviewing dask/distributed#5328, I think the recommended approach for a list would be to add `from __future__ import annotations` and then just use the built-in `list` in the type annotation (i.e. `list[str]`). This isn't meant to be a blocking comment, as what you have here is valid. Just meant as an FYI.

Contributor Author:

Oh yeah, good call. I'm used to `list[]` for 3.9 but forgot about the `__future__` option.
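A minimal sketch of the style being discussed (hypothetical function; the point is that the `__future__` import turns all annotations into strings per PEP 563, so built-in generics like `list[str]` are legal even on Python 3.7/3.8):

```python
from __future__ import annotations  # postponed evaluation: list[str] is never evaluated eagerly


def select_columns(columns: list[str] = None) -> list[str]:
    # Hypothetical helper just to show the annotation style.
    return columns or []


# Annotations are stored as plain strings under PEP 563.
print(select_columns.__annotations__["columns"])  # 'list[str]'
```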


import pandas as pd
import pyarrow
@@ -88,7 +89,8 @@ def read_gbq(
project_id: str,
dataset_id: str,
table_id: str,
row_filter="",
row_filter: str = "",
columns: List[str] = None,
read_kwargs: dict = None,
):
"""Read table as dask dataframe using BigQuery Storage API via Arrow format.
@@ -104,6 +106,8 @@
BigQuery table within dataset
row_filter: str
SQL text filtering statement to pass to `row_restriction`
columns: list[str]
list of columns to load from the table
read_kwargs: dict
kwargs to pass to read_rows()

@@ -124,7 +128,7 @@ def make_create_read_session_request(row_filter=""):
read_session=bigquery_storage.types.ReadSession(
data_format=bigquery_storage.types.DataFormat.ARROW,
read_options=bigquery_storage.types.ReadSession.TableReadOptions(
row_restriction=row_filter,
row_restriction=row_filter, selected_fields=columns
),
table=table_ref.to_bqstorage(),
),
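A plain-Python analogue of what `selected_fields` accomplishes, using hypothetical example rows (the real filtering happens server-side in the BigQuery Storage API; this just illustrates the contract that each returned record is restricted to the requested columns):

```python
# Hypothetical rows standing in for a BigQuery table's records.
rows = [
    {"name": "alice", "number": 1},
    {"name": "bob", "number": 2},
]
columns = ["name"]

# Restrict every record to the requested columns, analogous to
# passing selected_fields=columns in TableReadOptions.
selected = [{field: row[field] for field in columns} for row in rows]
print(selected)  # [{'name': 'alice'}, {'name': 'bob'}]
```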
13 changes: 13 additions & 0 deletions dask_bigquery/tests/test_core.py
@@ -82,3 +82,16 @@ def test_read_kwargs(dataset, client):

with pytest.raises(Exception, match="504 Deadline Exceeded"):
ddf.compute()


def test_read_columns(df, dataset, client):
Contributor:

Overall this test looks great. One small suggestion: could we add

assert df.shape[1] > 1

to ensure that the original DataFrame has more than one column? Otherwise, the example DataFrame could later be updated to have only a single "name" column and this test would still pass (this is unlikely, but possible).

project_id, dataset_id, table_id = dataset
columns = ["name"]
ddf = read_gbq(
project_id=project_id,
dataset_id=dataset_id,
table_id=table_id,
columns=columns,
)

assert list(ddf.columns) == columns