googleapis
diff --git a/bigframes/core/blocks.py b/bigframes/core/blocks.py
Lines changed: 3 additions & 0 deletions
diff --git a/bigframes/dataframe.py b/bigframes/dataframe.py
Lines changed: 15 additions & 0 deletions
diff --git a/bigframes/display/anywidget.py b/bigframes/display/anywidget.py
Lines changed: 10 additions & 2 deletions
diff --git a/bigframes/display/table_widget.js b/bigframes/display/table_widget.js
Lines changed: 10 additions & 0 deletions
diff --git a/bigframes/formatting_helpers.py b/bigframes/formatting_helpers.py
Lines changed: 59 additions & 24 deletions
diff --git a/bigframes/pandas/io/api.py b/bigframes/pandas/io/api.py
Lines changed: 6 additions & 1 deletion
diff --git a/bigframes/session/__init__.py b/bigframes/session/__init__.py
Lines changed: 7 additions & 0 deletions
@@ -30,6 +30,7 @@
 import textwrap
 import typing
 from typing import (
+    Callable,
     Iterable,
     Iterator,
     List,
@@ -679,6 +680,7 @@ def to_pandas_batches(
         page_size: Optional[int] = None,
         max_results: Optional[int] = None,
         allow_large_results: Optional[bool] = None,
+        callback: Callable = lambda _: None,
     ) -> Iterator[pd.DataFrame]:
         """Download results one message at a time.
 
@@ -696,6 +698,7 @@ def to_pandas_batches(
                 promise_under_10gb=under_10gb,
                 ordered=True,
             ),
+            callback=callback,
         )
 
         # To reduce the number of edge cases to consider when working with the
 
@@ -1885,6 +1885,21 @@ def to_pandas_batches(
             allow_large_results=allow_large_results,
         )
 
+    def _to_pandas_batches_colab(
+        self,
+        page_size: Optional[int] = None,
+        max_results: Optional[int] = None,
+        *,
+        allow_large_results: Optional[bool] = None,
+        callback: Callable = lambda _: None,
+    ) -> Iterable[pandas.DataFrame]:
+        """Colab-internal batch download that also accepts a progress callback.
+
+        Every argument is handed, by keyword and unmodified, to
+        ``self._block.to_pandas_batches``; whatever that call returns is
+        returned as-is.
+
+        Args:
+            page_size: Forwarded unchanged as ``page_size``.
+            max_results: Forwarded unchanged as ``max_results``.
+            allow_large_results: Forwarded unchanged as
+                ``allow_large_results``. Keyword-only.
+            callback: Forwarded unchanged as ``callback``. Keyword-only;
+                defaults to a no-op taking one argument. Presumably invoked
+                with query progress events -- confirm against the
+                block-level implementation.
+
+        Returns:
+            The result of ``self._block.to_pandas_batches``.
+        """
+        forwarded = dict(
+            page_size=page_size,
+            max_results=max_results,
+            allow_large_results=allow_large_results,
+            callback=callback,
+        )
+        return self._block.to_pandas_batches(**forwarded)
+
     def _compute_dry_run(self) -> bigquery.QueryJob:
         _, query_job = self._block._compute_dry_run()
         return query_job
 
@@ -23,6 +23,7 @@
 import pandas as pd
 
 import bigframes
+import bigframes.dataframe
 import bigframes.display.html
 
 # anywidget and traitlets are optional dependencies. We don't want the import of this
@@ -73,7 +74,7 @@ def __init__(self, dataframe: bigframes.dataframe.DataFrame):
         initial_page_size = bigframes.options.display.max_rows
 
         # Initialize data fetching attributes.
-        self._batches = dataframe.to_pandas_batches(page_size=initial_page_size)
+        # self._batches = dataframe._to_pandas_batches_colab(page_size=initial_page_size, callback=self._update_progress)
 
         # set traitlets properties that trigger observers
         self.page_size = initial_page_size
@@ -100,6 +101,7 @@ def _css(self):
     page = traitlets.Int(0).tag(sync=True)
     page_size = traitlets.Int(25).tag(sync=True)
     row_count = traitlets.Int(0).tag(sync=True)
+    progress_html = traitlets.Unicode().tag(sync=True)
     table_html = traitlets.Unicode().tag(sync=True)
 
     @traitlets.validate("page")
@@ -145,6 +147,10 @@ def _validate_page_size(self, proposal: Dict[str, Any]) -> int:
         max_page_size = 1000
         return min(value, max_page_size)
 
+    def _update_progress(self, event):
+        """Publish a progress event to the front end via ``progress_html``.
+
+        The event's ``repr`` is HTML-escaped and wrapped in a complete
+        ``<code>...</code>`` element before being stored on the synced
+        ``progress_html`` trait.
+
+        Args:
+            event: Any object; only ``repr(event)`` is used.
+        """
+        # Function-scope import so this method does not depend on changes to
+        # the module's import block.
+        import html
+
+        # TODO: use formatting helpers here.
+        # The widget's JavaScript assigns this string to innerHTML, so any
+        # "<...>" inside the repr (e.g. "<Foo object at 0x...>") would be
+        # parsed as a tag unless escaped. The element is also closed so the
+        # fragment is well formed.
+        self.progress_html = f"<code>{html.escape(repr(event))}</code>"
+
     def _get_next_batch(self) -> bool:
         """
         Gets the next batch of data from the generator and appends to cache.
@@ -180,7 +186,9 @@ def _cached_data(self) -> pd.DataFrame:
 
     def _reset_batches_for_new_page_size(self):
         """Reset the batch iterator when page size changes."""
-        self._batches = self._dataframe.to_pandas_batches(page_size=self.page_size)
+        self._batches = self._dataframe._to_pandas_batches_colab(
+            page_size=self.page_size, callback=self._update_progress
+        )
         self._cached_batches = []
         self._batch_iter = None
         self._all_data_loaded = False
 
@@ -19,11 +19,13 @@ const ModelProperty = {
 	PAGE_SIZE: "page_size",
 	ROW_COUNT: "row_count",
 	TABLE_HTML: "table_html",
+	PROGRESS_HTML: "progress_html",
 };
 
 const Event = {
 	CHANGE: "change",
 	CHANGE_TABLE_HTML: `change:${ModelProperty.TABLE_HTML}`,
+	CHANGE_PROGRESS_HTML: `change:${ModelProperty.PROGRESS_HTML}`,
 	CLICK: "click",
 };
 
@@ -39,6 +41,7 @@ function render({ model, el }) {
 	el.classList.add("bigframes-widget");
 
 	// Structure
+	const progressContainer = document.createElement("div");
 	const tableContainer = document.createElement("div");
 	const footer = document.createElement("div");
 
@@ -119,6 +122,13 @@ function render({ model, el }) {
 		}
 	}
 
+	/**
+	 * Updates the HTML in the progress container.
+	 *
+	 * Named distinctly from handleTableHTMLChange: two function declarations
+	 * with the same name in one scope collapse to the later one, which would
+	 * silently discard this handler.
+	 *
+	 * NOTE(review): no listener registration or DOM attachment for the
+	 * progress container is visible in this hunk -- confirm this handler is
+	 * wired to Event.CHANGE_PROGRESS_HTML and that progressContainer is
+	 * appended to the widget element.
+	 */
+	function handleProgressHTMLChange() {
+		// innerHTML parses the value as markup. This assumes the Python side
+		// emits well-formed, HTML-escaped content -- TODO confirm.
+		progressContainer.innerHTML = model.get(ModelProperty.PROGRESS_HTML);
+	}
+
 	/** Updates the HTML in the table container and refreshes button states. */
 	function handleTableHTMLChange() {
 		// Note: Using innerHTML is safe here because the content is generated
 
@@ -13,15 +13,17 @@
 # limitations under the License.
 
 """Shared helper functions for formatting jobs related info."""
-# TODO(orrbradford): cleanup up typings and documenttion in this file
+
+from __future__ import annotations
 
 import datetime
 import random
-from typing import Any, Optional, Type, Union
+from typing import Any, Callable, Optional, Type, Union
 
 import bigframes_vendored.constants as constants
 import google.api_core.exceptions as api_core_exceptions
 import google.cloud.bigquery as bigquery
+import google.cloud.bigquery._job_helpers
 import humanize
 import IPython
 import IPython.display as display
@@ -124,6 +126,7 @@ def wait_for_query_job(
     max_results: Optional[int] = None,
     page_size: Optional[int] = None,
     progress_bar: Optional[str] = None,
+    callback: Callable = lambda _: None,
 ) -> bigquery.table.RowIterator:
     """Return query results. Displays a progress bar while the query is running
     Args:
@@ -141,35 +144,67 @@ def wait_for_query_job(
     if progress_bar == "auto":
         progress_bar = "notebook" if in_ipython() else "terminal"
 
-    try:
-        if progress_bar == "notebook":
-            display_id = str(random.random())
-            loading_bar = display.HTML(get_query_job_loading_html(query_job))
-            display.display(loading_bar, display_id=display_id)
-            query_result = query_job.result(
-                max_results=max_results, page_size=page_size
-            )
-            query_job.reload()
+    if progress_bar == "notebook":
+        loading_bar = display.HTML(get_query_job_loading_html(query_job))
+        display_id = str(random.random())
+        display.display(loading_bar, display_id=display_id)
+
+        def extended_callback(event):
+            callback(event)
             display.update_display(
                 display.HTML(get_query_job_loading_html(query_job)),
                 display_id=display_id,
             )
-        elif progress_bar == "terminal":
-            initial_loading_bar = get_query_job_loading_string(query_job)
-            print(initial_loading_bar)
-            query_result = query_job.result(
-                max_results=max_results, page_size=page_size
-            )
-            query_job.reload()
+
+    elif progress_bar == "terminal":
+        initial_loading_bar = get_query_job_loading_string(query_job)
+        print(initial_loading_bar)
+
+        def extended_callback(event):
+            callback(event)
+
             if initial_loading_bar != get_query_job_loading_string(query_job):
                 print(get_query_job_loading_string(query_job))
-        else:
-            # No progress bar.
-            query_result = query_job.result(
-                max_results=max_results, page_size=page_size
+
+    else:
+        extended_callback = callback
+
+    try:
+        extended_callback(
+            # DONOTSUBMIT: we should create our own events.
+            google.cloud.bigquery._job_helpers.QueryReceivedEvent(
+                billing_project=query_job.project,
+                location=query_job.location,
+                job_id=query_job.job_id,
+                statement_type=query_job.statement_type,
+                state=query_job.state,
+                query_plan=query_job.query_plan,
+                created=query_job.created,
+                started=query_job.started,
+                ended=query_job.ended,
             )
-            query_job.reload()
-        return query_result
+        )
+        query_results = query_job.result(
+            page_size=page_size,
+            max_results=max_results,
+        )
+        extended_callback(
+            # DONOTSUBMIT: we should create our own events.
+            google.cloud.bigquery._job_helpers.QueryFinishedEvent(
+                billing_project=query_job.project,
+                location=query_results.location,
+                query_id=query_results.query_id,
+                job_id=query_results.job_id,
+                total_rows=query_results.total_rows,
+                total_bytes_processed=query_results.total_bytes_processed,
+                slot_millis=query_results.slot_millis,
+                destination=query_job.destination,
+                created=query_job.created,
+                started=query_job.started,
+                ended=query_job.ended,
+            )
+        )
+        return query_results
     except api_core_exceptions.RetryError as exc:
         add_feedback_link(exc)
         raise
 
@@ -273,7 +273,8 @@ def _try_read_gbq_colab_sessionless_dry_run(
     with _default_location_lock:
         if not config.options.bigquery._session_started:
             return _run_read_gbq_colab_sessionless_dry_run(
-                query, pyformat_args=pyformat_args
+                query,
+                pyformat_args=pyformat_args,
             )
 
     # Explicitly return None to indicate that we didn't run the dry run query.
@@ -305,6 +306,7 @@ def _read_gbq_colab(
     *,
     pyformat_args: Optional[Dict[str, Any]] = None,
     dry_run: bool = False,
+    callback: Callable = lambda _: None,
 ) -> bigframes.dataframe.DataFrame | pandas.Series:
     """A Colab-specific version of read_gbq.
 
@@ -319,6 +321,8 @@ def _read_gbq_colab(
         dry_run (bool):
             If True, estimates the query results size without returning data.
             The return will be a pandas Series with query metadata.
+        callback (Callable):
+            A callback function used by bigframes to report query progress.
 
     Returns:
         Union[bigframes.dataframe.DataFrame, pandas.Series]:
@@ -364,6 +368,7 @@ def _read_gbq_colab(
         query_or_table,
         pyformat_args=pyformat_args,
         dry_run=dry_run,
+        callback=callback,
     )
 
 
 
@@ -512,6 +512,7 @@ def _read_gbq_colab(
         *,
         pyformat_args: Optional[Dict[str, Any]] = None,
         dry_run: bool = False,
+        callback: Callable = lambda _: None,
     ) -> Union[dataframe.DataFrame, pandas.Series]:
         """A version of read_gbq that has the necessary default values for use in colab integrations.
 
@@ -528,6 +529,11 @@ def _read_gbq_colab(
                 instead. Note: unlike read_gbq / read_gbq_query, even if set to
                 None, this function always assumes {var} refers to a variable
                 that is supposed to be supplied in this dictionary.
+            dry_run (bool):
+                If True, estimates the query results size without returning data.
+                The return will be a pandas Series with query metadata.
+            callback (Callable):
+                A callback function used by bigframes to report query progress.
         """
         if pyformat_args is None:
             pyformat_args = {}
@@ -547,6 +553,7 @@ def _read_gbq_colab(
             force_total_order=False,
             dry_run=typing.cast(Union[Literal[False], Literal[True]], dry_run),
             allow_large_results=allow_large_results,
+            callback=callback,
         )
 
     @overload