Celery: use on_retry to handle BuildMaxConcurrencyError #8917

Merged 3 commits on Feb 14, 2022

4 changes: 2 additions & 2 deletions readthedocs/core/utils/__init__.py
@@ -186,8 +186,8 @@ def prepare_build(
project_slug=project.slug,
version_slug=version.slug,
)
options['countdown'] = 5 * 60
Member

How does this code actually cancel the build? It seems it's just setting options on the task, and an error, but still triggering the build?

Also, it seems these aren't required, since it should take them from the task?

Member Author (@humitos, Feb 14, 2022)

This PR does not change the flow of this chunk of code; I just moved these numbers into Django settings.

That said, this code runs in the webs when the build is triggered, and it immediately sets a 5-minute delay because we already know this project is concurrency-limited at the moment. If we deleted this code, builders would grab each of these triggered tasks and retry them immediately. So we are just short-circuiting the process here.

Note that it does not cancel the build; it just adds a countdown so the build is delayed by 5 minutes. The error message communicates this delay to the user.

Member

Ah, interesting. That makes the comment above make a lot more sense. 👍

options['max_retries'] = 25
options['countdown'] = settings.RTD_BUILDS_RETRY_DELAY
Member

Suggested change
options['countdown'] = settings.RTD_BUILDS_RETRY_DELAY
# Delay the start of the build for the build retry delay.
# We're still triggering the task, but it won't run immediately,
# and the user will be alerted in the UI from the Error below.
options['countdown'] = settings.RTD_BUILDS_RETRY_DELAY

options['max_retries'] = settings.RTD_BUILDS_MAX_RETRIES
build.error = BuildMaxConcurrencyError.message.format(
limit=max_concurrent_builds,
)
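As the thread above explains, these options only delay the build, they don't cancel it. Here is a minimal, self-contained sketch of what `countdown` and `max_retries` do in Celery; the task name, argument, and broker are illustrative assumptions, not the project's actual code.

```python
# Sketch only, not Read the Docs code: `countdown` delays when a worker starts
# the task, and `max_retries` bounds how many times the task may be retried.
from celery import Celery

app = Celery("example", broker="memory://")

RTD_BUILDS_RETRY_DELAY = 5 * 60   # seconds, mirroring the setting added in this PR
RTD_BUILDS_MAX_RETRIES = 25       # mirroring the setting added in this PR


@app.task(bind=True, max_retries=RTD_BUILDS_MAX_RETRIES)
def update_docs_task(self, version_pk):
    # ... build the docs for `version_pk` ...
    return version_pk


# The task is queued immediately, but a worker will not execute it until
# RTD_BUILDS_RETRY_DELAY seconds have passed. The build is not cancelled,
# only delayed, which is why the error message is shown to the user meanwhile.
update_docs_task.apply_async(args=[1234], countdown=RTD_BUILDS_RETRY_DELAY)
```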
40 changes: 19 additions & 21 deletions readthedocs/projects/tasks/builds.py
@@ -31,6 +31,7 @@
BUILD_STATE_CLONING,
BUILD_STATE_FINISHED,
BUILD_STATE_INSTALLING,
BUILD_STATE_TRIGGERED,
BUILD_STATE_UPLOADING,
BUILD_STATUS_FAILURE,
BUILD_STATUS_SUCCESS,
@@ -217,8 +218,9 @@ class UpdateDocsTask(SyncRepositoryMixin, Task):
autoretry_for = (
BuildMaxConcurrencyError,
)
max_retries = 5 # 5 per normal builds, 25 per concurrency limited
default_retry_delay = 7 * 60
max_retries = settings.RTD_BUILDS_MAX_RETRIES
default_retry_delay = settings.RTD_BUILDS_RETRY_DELAY
retry_backoff = False

# Expected exceptions that will be logged as info only and not retried
throws = (
@@ -263,25 +265,12 @@ def _check_concurrency_limit(self):
max_concurrent_builds = settings.RTD_MAX_CONCURRENT_BUILDS

if concurrency_limit_reached:
# TODO: this could be handled in `on_retry` probably
log.warning(
'Delaying tasks due to concurrency limit.',
project_slug=self.data.project.slug,
version_slug=self.data.version.slug,
)

# This is done automatically on the environment context, but
# we are executing this code before creating one
api_v2.build(self.data.build['id']).patch({
'error': BuildMaxConcurrencyError.message.format(
# By raising this exception and using ``autoretry_for``, Celery
# will handle this automatically calling ``on_retry``
Member

This is a great comment!

raise BuildMaxConcurrencyError(
BuildMaxConcurrencyError.message.format(
limit=max_concurrent_builds,
),
'builder': socket.gethostname(),
})
self.retry(
exc=BuildMaxConcurrencyError,
# We want to retry this build more times
max_retries=25,
)
Contributor

Ooooh, I see what you were talking about now with autoretry_for. I wasn't familiar with this attribute when we last talked about this. I like this syntax; it makes more sense 👍

)

def _check_duplicated_build(self):
@@ -482,7 +471,16 @@ def on_success(self, retval, task_id, args, kwargs):
self.data.build['success'] = True

def on_retry(self, exc, task_id, args, kwargs, einfo):
Member

This task could use a docstring. When in the build flow is this triggered?

Member Author

I added a small docstring explaining when this Celery handler is called, mentioning both flows: raising a known exception to auto-retry, and calling self.retry explicitly.

log.warning('Retrying this task.')
log.info('Retrying this task.')

if isinstance(exc, BuildMaxConcurrencyError):
log.warning(
'Delaying tasks due to concurrency limit.',
project_slug=self.data.project.slug,
version_slug=self.data.version.slug,
)
self.data.build['error'] = exc.message
self.update_build(state=BUILD_STATE_TRIGGERED)

def after_return(self, status, retval, task_id, args, kwargs, einfo):
# Update build object
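For readers unfamiliar with these Celery hooks, here is a minimal, self-contained sketch of the `autoretry_for` / `on_retry` pattern the diff above relies on. The decorator-plus-base-class wiring, the exception class, and the message are simplified assumptions; the PR itself defines a `Task` subclass instead.

```python
# Sketch only, not the PR's code: raising an exception listed in
# `autoretry_for` makes Celery schedule a retry and call `on_retry`,
# exactly as an explicit `self.retry()` would.
from celery import Celery, Task

app = Celery("example", broker="memory://")

RTD_BUILDS_MAX_RETRIES = 25
RTD_BUILDS_RETRY_DELAY = 5 * 60  # seconds


class BuildMaxConcurrencyError(Exception):
    message = "Concurrency limit reached ({limit}), retrying later."


class BuildTaskBase(Task):

    def on_retry(self, exc, task_id, args, kwargs, einfo):
        """
        Celery handler called when the task is about to be retried,
        either because an `autoretry_for` exception was raised or
        because the task called `self.retry()` explicitly.
        """
        if isinstance(exc, BuildMaxConcurrencyError):
            # In the real task, this is where the build is put back into the
            # "triggered" state and the error message is shown to the user.
            print("Delaying task due to concurrency limit:", exc)


@app.task(
    bind=True,
    base=BuildTaskBase,
    autoretry_for=(BuildMaxConcurrencyError,),
    max_retries=RTD_BUILDS_MAX_RETRIES,
    default_retry_delay=RTD_BUILDS_RETRY_DELAY,
    retry_backoff=False,
)
def update_docs_task(self, version_pk):
    concurrency_limit_reached = True  # pretend the project hit its limit
    if concurrency_limit_reached:
        # No explicit self.retry() needed: raising is enough, Celery retries
        # after `default_retry_delay` and invokes `on_retry` above.
        raise BuildMaxConcurrencyError(
            BuildMaxConcurrencyError.message.format(limit=4),
        )
    # ... normal build flow ...
```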
2 changes: 2 additions & 0 deletions readthedocs/settings/base.py
@@ -125,6 +125,8 @@ def SESSION_COOKIE_SAMESITE(self):
RTD_STABLE_VERBOSE_NAME = 'stable'
RTD_CLEAN_AFTER_BUILD = False
RTD_MAX_CONCURRENT_BUILDS = 4
RTD_BUILDS_MAX_RETRIES = 25
Member

Is this a reasonable default? This probably isn't the place to change it, but it feels like a lot.

Member Author

I thought about this as well. I think you are right that 25 as a default for all retry cases is not perfect, and we should have a lower number for other cases. However, right now the only situation where we perform a retry is when the concurrency limit is reached, as far as I can tell.

But we should expand this to be:

  • RTD_BUILDS_MAX_RETRIES=5
  • RTD_BUILDS_CONCURRENT_LIMIT_MAX_RETRIES=25

or similar in case we need the default value for other cases.
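A hedged sketch of what that split could look like in the settings module; the RTD_BUILDS_CONCURRENT_LIMIT_MAX_RETRIES name comes from the suggestion above and is not something this PR adds.

```python
# Hypothetical follow-up, not part of this PR: keep a lower generic default
# and a dedicated, higher limit for the concurrency-limited case.
RTD_BUILDS_MAX_RETRIES = 5                    # generic retries for build tasks
RTD_BUILDS_CONCURRENT_LIMIT_MAX_RETRIES = 25  # retries while the concurrency limit is hit
RTD_BUILDS_RETRY_DELAY = 5 * 60               # seconds between retries
```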

RTD_BUILDS_RETRY_DELAY = 5 * 60 # seconds
RTD_BUILD_STATUS_API_NAME = 'docs/readthedocs'
RTD_ANALYTICS_DEFAULT_RETENTION_DAYS = 30 * 3
RTD_AUDITLOGS_DEFAULT_RETENTION_DAYS = 30 * 3