feat(ingest/tableau): add retry on timeout #10995

Merged
merged 6 commits into from
Jul 31, 2024
Merged
Show file tree
Hide file tree
Changes from 1 commit
5 changes: 4 additions & 1 deletion metadata-ingestion/src/datahub/ingestion/api/source.py
@@ -137,7 +137,10 @@ def report_log(
             )

             # Add the simple exception details to the context.
-            context = f"{context}: {exc}"
+            if context:
+                context = f"{context} {type(exc)}: {exc}"
+            else:
+                context = f"{type(exc)}: {exc}"
         elif log:
             logger.log(level=level.value, msg=log_content, stacklevel=stacklevel)
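To make the effect of this change concrete, here is a minimal standalone sketch, using a hypothetical exception and context string (not taken from the PR), of how the reported context differs before and after:

exc = ValueError("connection dropped")  # hypothetical exception for illustration
context = "fetching workbook"           # hypothetical context string

old = f"{context}: {exc}"  # before: "fetching workbook: connection dropped"
new = f"{context} {type(exc)}: {exc}" if context else f"{type(exc)}: {exc}"
print(old)
print(new)  # after: "fetching workbook <class 'ValueError'>: connection dropped"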

@@ -298,7 +298,7 @@ def gen_removed_entity_workunits(self) -> Iterable[MetadataWorkUnit]:

         if copy_previous_state_and_fail:
             logger.info(
-                f"Copying urns from last state (size {last_checkpoint_state.urns}) to current state (size {cur_checkpoint_state.urns}) "
+                f"Copying urns from last state (size {len(last_checkpoint_state.urns)}) to current state (size {len(cur_checkpoint_state.urns)}) "
                 "to ensure stale entities from previous runs are deleted on the next successful run."
             )
             for urn in last_checkpoint_state.urns:
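For context, the old log line interpolated the URN sets themselves rather than their sizes. A tiny sketch with made-up URNs shows the difference:

urns = {"urn:li:dataset:a", "urn:li:dataset:b"}  # made-up URNs for illustration
print(f"size {urns}")       # before (set order may vary): size {'urn:li:dataset:a', 'urn:li:dataset:b'}
print(f"size {len(urns)}")  # after: size 2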
25 changes: 25 additions & 0 deletions metadata-ingestion/src/datahub/ingestion/source/tableau.py
@@ -1,5 +1,6 @@
 import logging
 import re
+import time
 from collections import OrderedDict
 from dataclasses import dataclass
 from datetime import datetime
@@ -1038,6 +1039,30 @@ def get_connection_object_page(
                 )

             else:
+                # As of Tableau Server 2024.2, the metadata API sporadically returns a 30 second
+                # timeout error. It doesn't reliably happen, so retrying a couple times makes sense.
+                if all(
+                    error.get("message")
+                    == "Execution canceled because timeout of 30000 millis was reached"
+                    for error in errors
+                ):
+                    # If it was only a timeout error, we can retry.
+                    if retries_remaining <= 0:
+                        raise
+                    logger.info(
+                        f"Query {connection_type} received a 30 second timeout error - will retry in a few seconds"
+                    )
+                    # This is a pretty dumb backoff mechanism, but it's good enough for now.
+                    time.sleep(60 / retries_remaining)
+                    return self.get_connection_object_page(
+                        query,
+                        connection_type,
+                        query_filter,
+                        count,
+                        offset,
+                        retry_on_auth_error=False,
+                        retries_remaining=retries_remaining - 1,
+                    )
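Note that this wait is not a classic backoff: time.sleep(60 / retries_remaining) sleeps longer as retries run out. A small sketch, assuming the call starts with three retries remaining (the actual default is not visible in this hunk), shows the schedule:

# Assumed starting value; the real default for retries_remaining is not shown in this diff.
for retries_remaining in (3, 2, 1):
    print(f"{retries_remaining} retries left -> sleep {60 / retries_remaining:.0f}s")
# 3 retries left -> sleep 20s
# 2 retries left -> sleep 30s
# 1 retries left -> sleep 60s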
Review comment from a Contributor:

Implement exponential backoff for retries.

The current retry mechanism uses a simple sleep function that spaces out retries based on the remaining attempts. An exponential backoff strategy would be more effective in handling transient errors and reducing load on the server.

-                    time.sleep(60 / retries_remaining)
+                    backoff_time = (self.config.max_retries - retries_remaining + 1) ** 2
+                    time.sleep(backoff_time)
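As a rough, self-contained illustration of the reviewer's suggestion (the proposed formula is quadratic in the attempt number rather than strictly exponential), here is a sketch of the delay schedule. The max_retries setting is an assumption: the suggestion references self.config.max_retries, which is not defined anywhere in this diff.

def quadratic_backoff(max_retries: int, retries_remaining: int) -> float:
    # First retry waits 1s, second 4s, third 9s, ...
    attempt = max_retries - retries_remaining + 1
    return float(attempt**2)

for remaining in (3, 2, 1):
    delay = quadratic_backoff(max_retries=3, retries_remaining=remaining)
    print(f"{remaining} retries left -> sleep {delay:.0f}s")
    # A real implementation would call time.sleep(delay) here.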

                 raise RuntimeError(f"Query {connection_type} error: {errors}")

         connection_object = query_data.get(c.DATA, {}).get(connection_type, {})