Don't panic in container list/remove/inspect race

Fixes #2802

While it's hard to reproduce, the theoretical race is:

1. This goroutine calls ListContainers()
2. Another goroutine removes a container X
3. This goroutine attempts to InspectContainer(X)

However, this bug could be hit in the much simpler case of InspectContainer() timing out. In those cases an error is returned along with a nil container, and the old code attempted to wrap the error using container.ID, dereferencing the now-nil container. Storing the listed container in a separate variable and using its ID fixes that panic.
2026-01-07 10:55:42 +03:00 · 2017-07-07 14:55:57 -07:00
parent 12b0c0da6a
commit c47860f928
1 changed files with 10 additions and 4 deletions
--- a/client/driver/docker.go
+++ b/client/driver/docker.go
@@ -1179,10 +1179,10 @@ CREATE:
 		// container names with a / pre-pended to the Nomad generated container names
 		containerName := "/" + config.Name
 		d.logger.Printf("[DEBUG] driver.docker: searching for container name %q to purge", containerName)
-		for _, container := range containers {
+		for _, shimContainer := range containers {
 			d.logger.Printf("[DEBUG] driver.docker: listed container %+v", container)
 			found := false
-			for _, name := range container.Names {
+			for _, name := range shimContainer.Names {
 				if name == containerName {
 					found = true
 					break
@@ -1195,9 +1195,15 @@ CREATE:

 			// Inspect the container and if the container isn't dead then return
 			// the container
-			container, err := client.InspectContainer(container.ID)
+			container, err := client.InspectContainer(shimContainer.ID)
 			if err != nil {
-				return nil, recoverableErrTimeouts(fmt.Errorf("Failed to inspect container %s: %s", container.ID, err))
+				err = fmt.Errorf("Failed to inspect container %s: %s", shimContainer.ID, err)
+
+				// This error is always recoverable as it could
+				// be caused by races between listing
+				// containers and this container being removed.
+				// See #2802
+				return nil, structs.NewRecoverableError(err, true)
 			}
 			if container != nil && (container.State.Running || container.State.FinishedAt.IsZero()) {
 				return container, nil