Zero downtime redeploys

When deploying, check whether a container with the same name already exists. If there is one, rename it to "<version>_<random_hex_string>" to remove the name clash with the new container we want to boot. We can then do the normal zero-downtime run/wait/stop. While implementing this, I discovered that --filter name=foo does a substring match for foo, so I've updated those filters to do an exact match instead.
2023-03-24 17:06:54 +00:00
parent 01a2b678d7
commit 05488e4c1e
12 changed files with 48 additions and 48 deletions
--- a/lib/mrsk/cli/app.rb
+++ b/lib/mrsk/cli/app.rb
@@ -15,22 +15,17 @@ class Mrsk::Cli::App < Mrsk::Cli::Base
            execute *MRSK.auditor(role: role).record("Booted app version #{version}"), verbosity: :debug

            begin
+              if capture_with_info(*MRSK.app(role: role).container_id_for_version(version)).present?
+                tmp_version = "#{version}_#{SecureRandom.hex(8)}"
+                info "Renaming container #{version} to #{tmp_version} as already deployed on #{host}"
+                execute *MRSK.auditor(role: role).record("Renaming container #{version} to #{tmp_version}"), verbosity: :debug
+                execute *MRSK.app(role: role).rename_container(version: version, new_version: tmp_version)
+              end
+
              old_version = capture_with_info(*MRSK.app(role: role).current_running_version).strip
              execute *MRSK.app(role: role).run
              sleep MRSK.config.readiness_delay
              execute *MRSK.app(role: role).stop(version: old_version), raise_on_non_zero_exit: false if old_version.present?
-
-            rescue SSHKit::Command::Failed => e
-              if e.message =~ /already in use/
-                error "Rebooting container with same version #{version} already deployed on #{host} (may cause gap in zero-downtime promise!)"
-                execute *MRSK.auditor(role: role).record("Rebooted app version #{version}"), verbosity: :debug
-
-                execute *MRSK.app(role: role).stop(version: version)
-                execute *MRSK.app(role: role).remove_container(version: version)
-                execute *MRSK.app(role: role).run
-              else
-                raise
-              end
            end
          end
        end