Issue 910 - Added timeout to BigQuery load_job.result() #981

Closed · wants to merge 4 commits
14 changes: 12 additions & 2 deletions parsons/google/google_bigquery.py
@@ -41,6 +41,9 @@
 # 100k rows per batch at ~1k bytes each = ~100MB per batch.
 QUERY_BATCH_SIZE = 100000
 
+# Max number of seconds to wait for a request before raising a timeout error
+MAX_TIMEOUT = 30
+
 
 def get_table_ref(client, table_name):
     # Helper function to build a TableReference for our table
@@ -464,7 +467,7 @@ def copy_from_gcs(
                 job_config=job_config,
                 **load_kwargs,
             )
-            load_job.result()
+            load_job.result(timeout=MAX_TIMEOUT)
Collaborator:
Instead of using a constant, perhaps this should be a keyword parameter that defaults to 30. Something like:

def get_table_ref(client, table_name, timeout=30):

That way, if 30 isn't enough for my use case, or is too long, I can adapt the behavior.
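For illustration, a minimal sketch of how that keyword-parameter approach could look, modeled on the copy_from_gcs code in this diff. This is not the PR's final code: the standalone function shape, the table_name-to-TableReference setup, and the timeout parameter with its default of 30 are assumptions drawn from this thread.

from google.cloud import bigquery

def copy_from_gcs(gcs_blob_uri, table_name, timeout=30, **load_kwargs):
    # Sketch only: in parsons this is a method on the BigQuery connector,
    # so the client/table_ref/job_config setup is simplified here.
    client = bigquery.Client()
    table_ref = bigquery.TableReference.from_string(table_name)
    job_config = bigquery.LoadJobConfig()
    load_job = client.load_table_from_uri(
        gcs_blob_uri,
        table_ref,
        job_config=job_config,
        **load_kwargs,
    )
    # Wait at most `timeout` seconds for the load job; callers can now pass
    # a larger or smaller value instead of relying on a module constant.
    load_job.result(timeout=timeout)

A caller who needs more headroom could then write copy_from_gcs(uri, table, timeout=300) without touching library code.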

Author:
Hi, for sure! I think that is a cleaner implementation; good suggestion.

         except exceptions.BadRequest as e:
             if "one of the files is larger than the maximum allowed size." in str(e):
                 logger.debug(
@@ -504,6 +507,10 @@ def copy_from_gcs(
             else:
                 raise e
 
+        except exceptions.DeadlineExceeded as e:
+            logger.error(f"Max timeout exceeded for {gcs_blob_uri.split('/')[-1]}")
+            raise e
+
     def copy_large_compressed_file_from_gcs(
         self,
         gcs_blob_uri: str,
@@ -632,7 +639,10 @@ def copy_large_compressed_file_from_gcs(
                 job_config=job_config,
                 **load_kwargs,
             )
-            load_job.result()
+            load_job.result(timeout=MAX_TIMEOUT)
Collaborator:
Same comment

+        except exceptions.DeadlineExceeded as e:
+            logger.error(f"Max timeout exceeded for {gcs_blob_uri.split('/')[-1]}")
+            raise e
         finally:
             if uncompressed_gcs_uri:
                 new_bucket_name, new_blob_name = gcs.split_uri(
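For context, a hedged sketch of what a caller sees once this change lands, assuming parsons' GoogleBigQuery connector and the copy_from_gcs(gcs_blob_uri, table_name, ...) signature shown in this diff (the bucket, file, and table names are illustrative):

from google.api_core import exceptions
from parsons import GoogleBigQuery

bq = GoogleBigQuery()
try:
    bq.copy_from_gcs("gs://my-bucket/my-file.csv", "my_dataset.my_table")
except exceptions.DeadlineExceeded:
    # With this patch, a load job that runs past MAX_TIMEOUT (30 seconds)
    # is logged and re-raised instead of blocking indefinitely.
    print("Load job timed out; retry with smaller files or a longer timeout.")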