Skip to content

Commit 55bf05c

Browse files
committed
Added udf_resource_uri parameter to read_gbq
Queries that rely on user-defined functions can now be processed.
1 parent 22d982a commit 55bf05c

File tree

2 files changed

+18
-3
lines changed

2 files changed

+18
-3
lines changed

doc/source/whatsnew/v0.19.0.txt

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -379,6 +379,7 @@ Google BigQuery Enhancements
379379

380380
- The :func:`read_gbq` method has gained the ``dialect`` argument to allow users to specify whether to use BigQuery's legacy SQL or BigQuery's standard SQL. See the :ref:`docs <io.bigquery_reader>` for more details (:issue:`13615`).
381381
- The :func:`~DataFrame.to_gbq` method now allows the DataFrame column order to differ from the destination table schema (:issue:`11359`).
382+
- The :func:`read_gbq` method has gained the ``udf_resource_uri`` argument to allow queries to use user-defined function resources loaded from Google Cloud Storage URIs.
382383

383384
.. _whatsnew_0190.errstate:
384385

pandas/io/gbq.py

Lines changed: 17 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -375,7 +375,7 @@ def process_insert_errors(self, insert_errors):
375375

376376
raise StreamingInsertError
377377

378-
def run_query(self, query):
378+
def run_query(self, query, udf_resource_uri=None):
379379
try:
380380
from googleapiclient.errors import HttpError
381381
except:
@@ -395,6 +395,14 @@ def run_query(self, query):
395395
}
396396
}
397397
}
398+
399+
if udf_resource_uri is not None:
400+
if not isinstance(udf_resource_uri, list):
401+
udf_resource_uri = [udf_resource_uri]
402+
403+
job_data['configuration']['query']['userDefinedFunctionResources'] = \
404+
[{'resourceUri': uri} for uri in udf_resource_uri]
405+
398406

399407
self._start_timer()
400408
try:
@@ -622,7 +630,7 @@ def _parse_entry(field_value, field_type):
622630

623631

624632
def read_gbq(query, project_id=None, index_col=None, col_order=None,
625-
reauth=False, verbose=True, private_key=None, dialect='legacy'):
633+
reauth=False, verbose=True, private_key=None, dialect='legacy', udf_resource_uri=None):
626634
"""Load data from Google BigQuery.
627635
628636
THIS IS AN EXPERIMENTAL LIBRARY
@@ -682,6 +690,12 @@ def read_gbq(query, project_id=None, index_col=None, col_order=None,
682690
683691
.. versionadded:: 0.19.0
684692
693+
udf_resource_uri : str or list of str, optional
694+
Google Cloud Storage URI, or list of URIs, of the code resource(s) to load.
695+
Describes user-defined function resources used in the query.
696+
697+
.. versionadded:: 0.19.0
698+
685699
Returns
686700
-------
687701
df: DataFrame
@@ -698,7 +712,7 @@ def read_gbq(query, project_id=None, index_col=None, col_order=None,
698712
connector = GbqConnector(project_id, reauth=reauth, verbose=verbose,
699713
private_key=private_key,
700714
dialect=dialect)
701-
schema, pages = connector.run_query(query)
715+
schema, pages = connector.run_query(query, udf_resource_uri)
702716
dataframe_list = []
703717
while len(pages) > 0:
704718
page = pages.pop()

0 commit comments

Comments
 (0)