From 9068e8065c1a9ec7e9aefeb51a3c989a3693545d Mon Sep 17 00:00:00 2001
From: Codex <codex@users.noreply.github.com>
Date: Fri, 5 Jun 2026 13:12:18 +0800
Subject: [PATCH] feat: wire running service details to real status

---
 cmd/aima/tooldeps_deploy.go      |    6 +
 cmd/aima/tooldeps_deploy_test.go |   17 +-
 internal/k3s/client.go           |    7 +
 internal/k3s/client_test.go      |   37 +
 internal/runtime/docker.go       |  308 +++++++-
 internal/runtime/docker_test.go  |  119 ++++
 internal/runtime/k3s.go          |    1 +
 internal/runtime/runtime.go      |   33 +-
 internal/ui/handler_test.go      |   18 +-
 internal/ui/static/index.html    | 1117 ++++++++++++++++++++++++++----
 10 files changed, 1496 insertions(+), 167 deletions(-)

diff --git a/cmd/aima/tooldeps_deploy.go b/cmd/aima/tooldeps_deploy.go
index f8e8b051..8f0a955e 100644
--- a/cmd/aima/tooldeps_deploy.go
+++ b/cmd/aima/tooldeps_deploy.go
@@ -693,6 +693,7 @@ type deploymentOverview struct {
 	Name                string `json:"name"`
 	Model               string `json:"model"`
 	Engine              string `json:"engine,omitempty"`
+	Image               string `json:"image,omitempty"`
 	Slot                string `json:"slot,omitempty"`
 	Phase               string `json:"phase"`
 	Status              string `json:"status"`
@@ -704,6 +705,8 @@ type deploymentOverview struct {
 	Message             string `json:"message,omitempty"`
 	Restarts            int    `json:"restarts,omitempty"`
 	ExitCode            *int   `json:"exit_code,omitempty"`
+	GPUMemoryMiB        int    `json:"gpu_memory_mib,omitempty"`
+	GPUMemorySource     string `json:"gpu_memory_source,omitempty"`
 	StartupPhase        string `json:"startup_phase,omitempty"`
 	StartupProgress     int    `json:"startup_progress,omitempty"`
 	StartupMessage      string `json:"startup_message,omitempty"`
@@ -724,6 +727,7 @@ func deploymentOverviewFromStatus(status *runtime.DeploymentStatus, cat *knowled
 		Name:                status.Name,
 		Model:               status.Model,
 		Engine:              status.Engine,
+		Image:               status.Image,
 		Slot:                status.Slot,
 		Phase:               status.Phase,
 		Status:              status.Phase,
@@ -735,6 +739,8 @@ func deploymentOverviewFromStatus(status *runtime.DeploymentStatus, cat *knowled
 		Message:             status.Message,
 		Restarts:            status.Restarts,
 		ExitCode:            status.ExitCode,
+		GPUMemoryMiB:        status.GPUMemoryMiB,
+		GPUMemorySource:     status.GPUMemorySource,
 		StartupPhase:        status.StartupPhase,
 		StartupProgress:     status.StartupProgress,
 		StartupMessage:      status.StartupMessage,
diff --git a/cmd/aima/tooldeps_deploy_test.go b/cmd/aima/tooldeps_deploy_test.go
index 203999d7..ef14802c 100644
--- a/cmd/aima/tooldeps_deploy_test.go
+++ b/cmd/aima/tooldeps_deploy_test.go
@@ -36,12 +36,21 @@ func TestDeploymentOverviewIncludesCatalogModelType(t *testing.T) {
 		}},
 	}
 	overview := deploymentOverviewFromStatus(&runtime.DeploymentStatus{
-		Name:  "qwen3-tts-0.6b-qwen-tts-fastapi",
-		Model: "qwen3-tts-0.6b",
-		Phase: "running",
-		Ready: true,
+		Name:            "qwen3-tts-0.6b-qwen-tts-fastapi",
+		Model:           "qwen3-tts-0.6b",
+		Image:           "docker.1ms.run/example/qwen-tts:latest",
+		Phase:           "running",
+		Ready:           true,
+		GPUMemoryMiB:    1536,
+		GPUMemorySource: "nvidia-smi",
 	}, cat)
 	if overview.ModelType != "tts" {
 		t.Fatalf("ModelType = %q, want tts", overview.ModelType)
 	}
+	if overview.Image != "docker.1ms.run/example/qwen-tts:latest" {
+		t.Fatalf("Image = %q, want docker.1ms.run/example/qwen-tts:latest", overview.Image)
+	}
+	if overview.GPUMemoryMiB != 1536 || overview.GPUMemorySource != "nvidia-smi" {
+		t.Fatalf("GPU memory = %d/%q, want 1536/nvidia-smi", overview.GPUMemoryMiB, overview.GPUMemorySource)
+	}
 }
diff --git a/internal/k3s/client.go b/internal/k3s/client.go
index d7de31d2..183c7a8b 100644
--- a/internal/k3s/client.go
+++ b/internal/k3s/client.go
@@ -41,6 +41,7 @@ type PodStatus struct {
 	DeletionTimestamp string            `json:"deletion_timestamp,omitempty"`
 	Message           string            `json:"message,omitempty"`
 	ContainerPort     int               `json:"container_port,omitempty"`
+	ContainerImage    string            `json:"container_image,omitempty"`
 	RestartCount      int               `json:"restart_count,omitempty"`
 	ExitCode          *int              `json:"exit_code,omitempty"`         // from Terminated state
 	ContainerStarted  string            `json:"container_started,omitempty"` // when the current container instance started
@@ -270,6 +271,7 @@ type kubePod struct {
 	} `json:"metadata"`
 	Spec struct {
 		Containers []struct {
+			Image string `json:"image"`
 			Ports []struct {
 				ContainerPort int `json:"containerPort"`
 			} `json:"ports"`
@@ -357,8 +359,12 @@ func parsePodJSON(data []byte) (*PodStatus, error) {
 	}
 
 	containerPort := 0
+	containerImage := ""
 	if len(kp.Spec.Containers) > 0 && len(kp.Spec.Containers[0].Ports) > 0 {
+		containerImage = kp.Spec.Containers[0].Image
 		containerPort = kp.Spec.Containers[0].Ports[0].ContainerPort
+	} else if len(kp.Spec.Containers) > 0 {
+		containerImage = kp.Spec.Containers[0].Image
 	}
 
 	var conditions []PodCondition
@@ -376,6 +382,7 @@ func parsePodJSON(data []byte) (*PodStatus, error) {
 		DeletionTimestamp: kp.Metadata.DeletionTimestamp,
 		Message:           msg,
 		ContainerPort:     containerPort,
+		ContainerImage:    containerImage,
 		RestartCount:      restartCount,
 		ExitCode:          exitCode,
 		ContainerStarted:  containerStarted,
diff --git a/internal/k3s/client_test.go b/internal/k3s/client_test.go
index e9f4fe87..86791c14 100644
--- a/internal/k3s/client_test.go
+++ b/internal/k3s/client_test.go
@@ -195,6 +195,18 @@ const terminatingPodJSON = `{
       "aima.dev/model": "qwen3-8b"
     }
   },
+  "spec": {
+    "containers": [
+      {
+        "image": "nvcr.io/nvidia/vllm:26.01-py3",
+        "ports": [
+          {
+            "containerPort": 8000
+          }
+        ]
+      }
+    ]
+  },
   "status": {
     "phase": "Running",
     "podIP": "10.42.0.5",
@@ -217,6 +229,18 @@ const runningPodJSON = `{
       "aima.dev/model": "qwen3-8b"
     }
   },
+  "spec": {
+    "containers": [
+      {
+        "image": "nvcr.io/nvidia/vllm:26.01-py3",
+        "ports": [
+          {
+            "containerPort": 8000
+          }
+        ]
+      }
+    ]
+  },
   "status": {
     "phase": "Running",
     "podIP": "10.42.0.5",
@@ -621,3 +645,16 @@ func TestParsePodJSON_DeletionTimestamp(t *testing.T) {
 		t.Fatal("expected raw pod readiness to reflect container status before runtime mapping")
 	}
 }
+
+func TestParsePodJSON_ContainerImage(t *testing.T) { // image and port both come from spec.containers[0]
+	pod, err := parsePodJSON([]byte(runningPodJSON))
+	if err != nil {
+		t.Fatal(err)
+	}
+	if pod.ContainerImage != "nvcr.io/nvidia/vllm:26.01-py3" {
+		t.Fatalf("ContainerImage = %q, want nvcr.io/nvidia/vllm:26.01-py3", pod.ContainerImage)
+	}
+	if pod.ContainerPort != 8000 { // adding the image must not disturb port extraction
+		t.Fatalf("ContainerPort = %d, want 8000", pod.ContainerPort)
+	}
+}
diff --git a/internal/runtime/docker.go b/internal/runtime/docker.go
index 3fa06984..e076a831 100644
--- a/internal/runtime/docker.go
+++ b/internal/runtime/docker.go
@@ -295,6 +295,7 @@ func (r *DockerRuntime) Status(ctx context.Context, name string) (*DeploymentSta
 
 	di := inspects[0]
 	ds := r.inspectToStatus(di)
+	r.enrichGPUMemory(ctx, ds, di.ID, di.State.Pid)
 	asset := findEngineAsset(r.engineAssets, ds.Labels["aima.dev/engine"])
 	if asset != nil && ds.EstimatedTotalS == 0 && len(asset.TimeConstraints.ColdStartS) >= 2 {
 		ds.EstimatedTotalS = asset.TimeConstraints.ColdStartS[1]
@@ -357,6 +358,7 @@ func (r *DockerRuntime) List(ctx context.Context) ([]*DeploymentStatus, error) {
 
 		ds := &DeploymentStatus{
 			Name:    ps.Names,
+			Image:   ps.Image,
 			Phase:   phase,
 			Ready:   ready,
 			Address: addr,
@@ -402,6 +404,7 @@ func (r *DockerRuntime) Logs(ctx context.Context, name string, tailLines int) (s
 // --- internal types ---
 
 type dockerInspect struct {
+	ID    string `json:"Id"`
 	Name  string `json:"Name"`
 	State struct {
 		Status     string `json:"Status"` // running, created, exited, paused, restarting
@@ -409,19 +412,167 @@ type dockerInspect struct {
 		ExitCode   int    `json:"ExitCode"`
 		Running    bool   `json:"Running"`
 		Restarting bool   `json:"Restarting"`
+		Pid        int    `json:"Pid"`
 	} `json:"State"`
 	Config struct {
-		Labels map[string]string `json:"Labels"`
+		Entrypoint []string          `json:"Entrypoint"`
+		Cmd        []string          `json:"Cmd"`
+		Image      string            `json:"Image"`
+		Labels     map[string]string `json:"Labels"`
 	} `json:"Config"`
 }
 
 type dockerPsEntry struct {
+	ID        string `json:"ID"`
+	Image     string `json:"Image"`
 	Names     string `json:"Names"`
 	Status    string `json:"Status"`
 	Labels    string `json:"Labels"`
 	CreatedAt string `json:"CreatedAt"`
 }
 
+// enrichGPUMemory records on ds the GPU memory used by a running container's processes,
+// as reported by nvidia-smi. It is best effort: on any lookup failure ds is left unchanged.
+func (r *DockerRuntime) enrichGPUMemory(ctx context.Context, ds *DeploymentStatus, containerID string, containerPID int) {
+	if ds == nil || ds.Name == "" || ds.Phase != "running" {
+		return
+	}
+	if containerPID <= 0 || strings.TrimSpace(containerID) == "" {
+		pidOut, err := exec.CommandContext(ctx, "docker", "inspect", "--format", "{{.State.Pid}} {{.Id}}", ds.Name).Output()
+		if err == nil { // Output reads stdout only, so stderr warnings are never parsed as PID/ID
+			fields := strings.Fields(string(pidOut))
+			if len(fields) > 0 && containerPID <= 0 {
+				containerPID, _ = strconv.Atoi(fields[0]) // a parse failure leaves 0, i.e. "unknown"
+			}
+			if len(fields) > 1 && strings.TrimSpace(containerID) == "" {
+				containerID = fields[1]
+			}
+		}
+	}
+	if usedMiB := containerNvidiaGPUMemoryMiB(ctx, ds.Name, containerID, containerPID); usedMiB > 0 {
+		ds.GPUMemoryMiB = usedMiB
+		ds.GPUMemorySource = "nvidia-smi"
+	}
+}
+
+// containerNvidiaGPUMemoryMiB sums used_gpu_memory (MiB) over every nvidia-smi compute
+// process that belongs to the given container. It returns 0 when nothing identifies the
+// container or when nvidia-smi fails or exceeds its 2-second timeout.
+func containerNvidiaGPUMemoryMiB(ctx context.Context, containerName, containerID string, containerPID int) int {
+	if containerPID <= 0 && strings.TrimSpace(containerName) == "" && strings.TrimSpace(containerID) == "" {
+		return 0
+	}
+	smiCtx, cancel := context.WithTimeout(ctx, 2*time.Second)
+	defer cancel()
+	out, err := exec.CommandContext(smiCtx, "nvidia-smi",
+		"--query-compute-apps=pid,used_gpu_memory",
+		"--format=csv,noheader,nounits",
+	).Output()
+	if err != nil {
+		return 0
+	}
+	totalMiB := 0
+	for _, line := range strings.Split(strings.TrimSpace(string(out)), "\n") {
+		// Each row is "pid, used_gpu_memory"; rows without a comma or a positive size are skipped.
+		pidField, memField, ok := strings.Cut(strings.TrimSpace(line), ",")
+		pid, memMiB := strings.TrimSpace(pidField), parseNvidiaMemoryMiB(memField)
+		if !ok || pid == "" || memMiB <= 0 {
+			continue
+		}
+		if processBelongsToDockerContainer(ctx, pid, containerName, containerID, containerPID) {
+			totalMiB += memMiB
+		}
+	}
+	return totalMiB
+}
+
+// parseNvidiaMemoryMiB extracts the leading integer MiB count from an nvidia-smi memory
+// field such as "1700", "1700 MiB" or "1700MiB"; unparsable input yields 0.
+func parseNvidiaMemoryMiB(value string) int {
+	trimmed := strings.TrimSpace(strings.TrimSuffix(strings.TrimSpace(value), "MiB"))
+	tokens := strings.Fields(trimmed)
+	if len(tokens) == 0 {
+		return 0
+	}
+	if n, err := strconv.Atoi(tokens[0]); err == nil {
+		return n
+	}
+	return 0
+}
+
+// processBelongsToDockerContainer reports whether host process pid runs inside the given
+// container, judged first by its cgroup membership and then by PID ancestry.
+func processBelongsToDockerContainer(ctx context.Context, pid, containerName, containerID string, containerPID int) bool {
+	// Preferred signal: the container ID (or name) appears in /proc/<pid>/cgroup.
+	if raw, err := os.ReadFile(filepath.Join("/proc", pid, "cgroup")); err == nil {
+		haystack := strings.ToLower(string(raw))
+		for _, needle := range dockerContainerMatchTokens(containerName, containerID) {
+			if needle != "" && strings.Contains(haystack, needle) {
+				return true
+			}
+		}
+	}
+	// Fallback: pid is the container's main process or one of its descendants.
+	return containerPID > 0 && isDescendantPID(ctx, pid, strconv.Itoa(containerPID))
+}
+
+// dockerContainerMatchTokens returns the lowercase substrings to search for in a cgroup
+// file: the full and 12-character short container ID, or the bare name when no ID is known.
+func dockerContainerMatchTokens(containerName, containerID string) []string {
+	fullID := strings.ToLower(strings.TrimSpace(containerID))
+	if fullID == "" {
+		return []string{strings.ToLower(strings.TrimPrefix(strings.TrimSpace(containerName), "/"))}
+	}
+	if len(fullID) <= 12 {
+		return []string{fullID, fullID}
+	}
+	return []string{fullID, fullID[:12]}
+}
+
+// isDescendantPID reports whether childPID equals parentPID or has it as an ancestor,
+// following parent PIDs through /proc/<pid>/stat. The walk is capped at 16 levels and
+// gives up on PID 0/1, an unreadable stat file, or a cancelled context.
+func isDescendantPID(ctx context.Context, childPID, parentPID string) bool {
+	cursor, target := strings.TrimSpace(childPID), strings.TrimSpace(parentPID)
+	if cursor == "" || target == "" {
+		return false
+	}
+	if cursor == target {
+		return true
+	}
+	for depth := 0; depth < 16; depth++ {
+		if ctx.Err() != nil {
+			return false
+		}
+		raw, err := os.ReadFile(filepath.Join("/proc", cursor, "stat"))
+		if err != nil {
+			return false
+		}
+		switch next := parentPIDFromProcStat(string(raw)); next {
+		case "", "0", "1":
+			return false
+		case target:
+			return true
+		default:
+			cursor = next
+		}
+	}
+	return false
+}
+
+// parentPIDFromProcStat returns the PPID field of a /proc/<pid>/stat line, or "" if malformed.
+func parentPIDFromProcStat(stat string) string {
+	stat = strings.TrimSpace(stat)
+	closeParen := strings.LastIndex(stat, ")") // last ')': the comm field may hold spaces or ')'
+	if closeParen < 0 || closeParen+2 >= len(stat) {
+		return ""
+	}
+	if rest := strings.Fields(stat[closeParen+1:]); len(rest) >= 2 {
+		return rest[1] // rest[0] is the field right after comm; the PPID follows it
+	}
+	return ""
+}
+
 func (r *DockerRuntime) inspectToStatus(di dockerInspect) *DeploymentStatus {
 	labels := di.Config.Labels
 	port := 0
@@ -466,9 +617,11 @@ func (r *DockerRuntime) inspectToStatus(di dockerInspect) *DeploymentStatus {
 
 	ds := &DeploymentStatus{
 		Name:    name,
+		Image:   di.Config.Image,
 		Phase:   phase,
 		Ready:   ready,
 		Address: addr,
+		Config:  dockerLaunchConfigFromInspect(di),
 		Labels:  labels,
 		Runtime: "docker",
 	}
@@ -482,6 +635,159 @@ func (r *DockerRuntime) inspectToStatus(di dockerInspect) *DeploymentStatus {
 	return ds
 }
 
+// dockerLaunchConfigFromInspect derives launch flags from Entrypoint followed by Cmd,
+// preferring the script of a `sh -c`/`bash -c` wrapper when that script yields any flags.
+func dockerLaunchConfigFromInspect(di dockerInspect) map[string]any {
+	argv := append(append([]string(nil), di.Config.Entrypoint...), di.Config.Cmd...)
+	if inner := dockerShellCommandArgs(argv); len(inner) > 0 {
+		if parsed := parseLaunchConfigFlags(inner); len(parsed) > 0 {
+			return parsed
+		}
+	}
+	return parseLaunchConfigFlags(argv)
+}
+
+// dockerShellCommandArgs looks for a `sh`/`bash` executable followed by a `-c`-style flag
+// and returns the shell-split words of the script after it, keeping only what follows
+// the last " exec " (or a leading "exec "). It returns nil when no such script exists.
+func dockerShellCommandArgs(args []string) []string {
+	for i := 0; i+1 < len(args); i++ {
+		if shell := shellExecutableName(args[i]); shell != "bash" && shell != "sh" {
+			continue
+		}
+		for j := i + 1; j+1 < len(args); j++ {
+			if !isShellCommandFlag(args[j]) {
+				continue
+			}
+			// An empty script matches neither branch below and splits to nil.
+			script := strings.TrimSpace(args[j+1])
+			if at := strings.LastIndex(script, " exec "); at >= 0 {
+				script = script[at+len(" exec "):]
+			} else if strings.HasPrefix(script, "exec ") {
+				script = strings.TrimSpace(strings.TrimPrefix(script, "exec "))
+			}
+			return splitShellFields(script)
+		}
+	}
+	return nil
+}
+
+// isShellCommandFlag reports whether value is a single-dash option cluster containing `c`
+// (e.g. "-c", "-lc", "-ec"); long "--" options and bare words never match.
+func isShellCommandFlag(value string) bool {
+	flag := strings.TrimSpace(value)
+	if !strings.HasPrefix(flag, "-") || strings.HasPrefix(flag, "--") {
+		return false
+	}
+	// Everything after the dash is treated as a cluster of one-letter options.
+	return strings.ContainsRune(flag[1:], 'c')
+}
+
+// shellExecutableName returns the final path element of a command, treating both '/'
+// and '\' as separators; surrounding whitespace is trimmed first.
+func shellExecutableName(value string) string {
+	path := strings.TrimSpace(value)
+	// LastIndexAny yields -1 when there is no separator, so +1 slices from the start.
+	return path[strings.LastIndexAny(path, `/\`)+1:]
+}
+
+// parseLaunchConfigFlags turns `--flag value`, `--flag=value`, bare `--flag` and
+// `--no-flag` arguments into a config map whose keys are the flag names with dashes
+// replaced by underscores. Tokens not starting with "--" are ignored unless consumed as
+// the value of the preceding flag; bare flags map to true and bare `--no-` flags to false.
+func parseLaunchConfigFlags(args []string) map[string]any {
+	config := make(map[string]any)
+	for i := 0; i < len(args); i++ {
+		token := strings.TrimSpace(args[i])
+		if !strings.HasPrefix(token, "--") {
+			continue
+		}
+		key, value, hasValue := strings.Cut(token[2:], "=")
+		if key = strings.TrimSpace(key); key == "" {
+			continue
+		}
+		// A "no-" prefix negates a bare flag and is not part of the resulting key.
+		negated := strings.HasPrefix(key, "no-")
+		key = strings.ReplaceAll(strings.TrimPrefix(key, "no-"), "-", "_")
+		// Without "=", a following token that is not itself a "--" flag is the value.
+		if !hasValue && i+1 < len(args) && !strings.HasPrefix(strings.TrimSpace(args[i+1]), "--") {
+			i++
+			value, hasValue = args[i], true
+		}
+		if hasValue {
+			config[key] = parseLaunchConfigValue(value)
+		} else {
+			config[key] = !negated
+		}
+	}
+	return config
+}
+
+// splitShellFields splits input into words using simplified POSIX-shell rules:
+// whitespace separates words, single and double quotes group text and are removed,
+// and a backslash outside single quotes escapes the next rune. Quoted empty strings
+// such as '' are kept as empty words. A trailing lone backslash is kept literally.
+func splitShellFields(input string) []string {
+	var (
+		fields  []string
+		word    strings.Builder
+		quote   rune // active quote character, 0 when unquoted
+		escaped bool // the previous rune was a backslash awaiting its target
+		inWord  bool // a word is open, even if still empty (e.g. right after '')
+	)
+	for _, r := range input {
+		switch {
+		case escaped:
+			word.WriteRune(r)
+			escaped = false
+		case r == '\\' && quote != '\'':
+			escaped, inWord = true, true
+		case quote != 0 && r == quote:
+			quote = 0
+		case quote != 0:
+			word.WriteRune(r)
+		case r == '\'' || r == '"':
+			quote, inWord = r, true
+		case r == ' ' || r == '\t' || r == '\n' || r == '\r':
+			if inWord {
+				fields = append(fields, word.String())
+				word.Reset()
+				inWord = false
+			}
+		default:
+			word.WriteRune(r)
+			inWord = true
+		}
+	}
+	if escaped {
+		word.WriteRune('\\')
+	}
+	if inWord {
+		fields = append(fields, word.String())
+	}
+	return fields
+}
+
+// parseLaunchConfigValue converts a raw flag value into a JSON-friendly Go value:
+// a bool for "true"/"false" (any case), an int, a finite float64, or else the trimmed
+// string. "NaN"/"Inf" stay strings because encoding/json cannot encode those floats.
+func parseLaunchConfigValue(value string) any {
+	value = strings.TrimSpace(value)
+	switch {
+	case strings.EqualFold(value, "true"):
+		return true
+	case strings.EqualFold(value, "false"):
+		return false
+	}
+	if i, err := strconv.Atoi(value); err == nil {
+		return i
+	}
+	if f, err := strconv.ParseFloat(value, 64); err == nil && f*0 == 0 { // f*0 is NaN for NaN/±Inf
+		return f
+	}
+	return value
+}
+
 // enrichDockerProgress reads container logs and matches engine patterns.
 func (r *DockerRuntime) enrichDockerProgress(ctx context.Context, ds *DeploymentStatus) string {
 	engineName := ""
diff --git a/internal/runtime/docker_test.go b/internal/runtime/docker_test.go
index a24d8dd0..9e225bb7 100644
--- a/internal/runtime/docker_test.go
+++ b/internal/runtime/docker_test.go
@@ -1,6 +1,7 @@
 package runtime
 
 import (
+	"context"
 	"strings"
 	"testing"
 
@@ -378,6 +379,7 @@ func TestDockerInspectToStatus(t *testing.T) {
 					ExitCode   int    `json:"ExitCode"`
 					Running    bool   `json:"Running"`
 					Restarting bool   `json:"Restarting"`
+					Pid        int    `json:"Pid"`
 				}{Status: "running", Running: true, StartedAt: "2026-03-03T00:00:00Z"},
 			},
 			wantPhase: "running",
@@ -392,6 +394,7 @@ func TestDockerInspectToStatus(t *testing.T) {
 					ExitCode   int    `json:"ExitCode"`
 					Running    bool   `json:"Running"`
 					Restarting bool   `json:"Restarting"`
+					Pid        int    `json:"Pid"`
 				}{Status: "exited", ExitCode: 1},
 			},
 			wantPhase: "failed",
@@ -410,6 +413,7 @@ func TestDockerInspectToStatus(t *testing.T) {
 					ExitCode   int    `json:"ExitCode"`
 					Running    bool   `json:"Running"`
 					Restarting bool   `json:"Restarting"`
+					Pid        int    `json:"Pid"`
 				}{Status: "exited", ExitCode: 0},
 			},
 			wantPhase: "stopped",
@@ -424,6 +428,7 @@ func TestDockerInspectToStatus(t *testing.T) {
 					ExitCode   int    `json:"ExitCode"`
 					Running    bool   `json:"Running"`
 					Restarting bool   `json:"Restarting"`
+					Pid        int    `json:"Pid"`
 				}{Status: "restarting", ExitCode: 2, Restarting: true},
 			},
 			wantPhase: "failed",
@@ -442,6 +447,7 @@ func TestDockerInspectToStatus(t *testing.T) {
 					ExitCode   int    `json:"ExitCode"`
 					Running    bool   `json:"Running"`
 					Restarting bool   `json:"Restarting"`
+					Pid        int    `json:"Pid"`
 				}{Status: "created"},
 			},
 			wantPhase: "starting",
@@ -469,6 +475,119 @@ func TestDockerInspectToStatus(t *testing.T) {
 	}
 }
 
+func TestDockerInspectToStatusIncludesImageAndLaunchConfig(t *testing.T) { // direct (non-shell) entrypoint: flags are read from Entrypoint+Cmd
+	r := &DockerRuntime{}
+	di := dockerInspect{Name: "/test-vllm"}
+	di.State.Status = "running"
+	di.State.Running = true
+	di.Config.Entrypoint = []string{"vllm", "serve"}
+	di.Config.Cmd = []string{
+		"--gpu-memory-utilization", "0.6",
+		"--max-model-len=131072",
+		"--served-model-name", "GLM-4.6V-Flash-FP4",
+		"--trust-remote-code",
+		"--no-enable-prefix-caching",
+	}
+	di.Config.Image = "nvcr.io/nvidia/vllm:26.01-py3"
+	di.Config.Labels = map[string]string{"aima.dev/port": "8000"}
+	ds := r.inspectToStatus(di)
+
+	if ds.Image != "nvcr.io/nvidia/vllm:26.01-py3" {
+		t.Fatalf("Image = %q, want nvcr.io/nvidia/vllm:26.01-py3", ds.Image)
+	}
+	if got, ok := ds.Config["gpu_memory_utilization"].(float64); !ok || got != 0.6 { // space-separated value, parsed as float
+		t.Fatalf("gpu_memory_utilization = %#v, want 0.6", ds.Config["gpu_memory_utilization"])
+	}
+	if got, ok := ds.Config["max_model_len"].(int); !ok || got != 131072 { // "=" form, parsed as int
+		t.Fatalf("max_model_len = %#v, want 131072", ds.Config["max_model_len"])
+	}
+	if got := ds.Config["served_model_name"]; got != "GLM-4.6V-Flash-FP4" {
+		t.Fatalf("served_model_name = %#v, want GLM-4.6V-Flash-FP4", got)
+	}
+	if got, ok := ds.Config["trust_remote_code"].(bool); !ok || !got { // bare flag maps to true
+		t.Fatalf("trust_remote_code = %#v, want true", ds.Config["trust_remote_code"])
+	}
+	if got, ok := ds.Config["enable_prefix_caching"].(bool); !ok || got { // "--no-" prefix maps to false under the un-prefixed key
+		t.Fatalf("enable_prefix_caching = %#v, want false", ds.Config["enable_prefix_caching"])
+	}
+}
+
+func TestDockerInspectToStatusParsesShellLaunchConfig(t *testing.T) { // `bash -c <script>`: flags come from the command after the last " exec "
+	r := &DockerRuntime{}
+	di := dockerInspect{Name: "/test-vllm-shell"}
+	di.State.Status = "running"
+	di.State.Running = true
+	di.Config.Entrypoint = []string{"/bin/bash"}
+	di.Config.Cmd = []string{
+		"-c",
+		"python - <<'PY'\nprint('init')\nPY\n && exec vllm serve /models --gpu-memory-utilization 0.6 --served-model-name 'GLM-4.6V-Flash-FP4'",
+	}
+	di.Config.Image = "nvcr.io/nvidia/vllm:26.01-py3"
+	di.Config.Labels = map[string]string{"aima.dev/port": "8000"}
+	ds := r.inspectToStatus(di)
+
+	if got, ok := ds.Config["gpu_memory_utilization"].(float64); !ok || got != 0.6 {
+		t.Fatalf("gpu_memory_utilization = %#v, want 0.6", ds.Config["gpu_memory_utilization"])
+	}
+	if got := ds.Config["served_model_name"]; got != "GLM-4.6V-Flash-FP4" { // single quotes in the script are stripped
+		t.Fatalf("served_model_name = %#v, want GLM-4.6V-Flash-FP4", got)
+	}
+}
+
+func TestDockerInspectToStatusParsesCombinedShellCommandFlag(t *testing.T) { // clustered "-lc" must be recognised like "-c"
+	r := &DockerRuntime{}
+	di := dockerInspect{Name: "/test-vllm-shell-lc"}
+	di.State.Status = "running"
+	di.State.Running = true
+	di.Config.Entrypoint = []string{"/bin/bash"}
+	di.Config.Cmd = []string{"-lc", "exec vllm serve /models --gpu-memory-utilization 0.7 --max-model-len 65536"}
+	di.Config.Image = "nvcr.io/nvidia/vllm:26.01-py3"
+	di.Config.Labels = map[string]string{"aima.dev/port": "8000"}
+	ds := r.inspectToStatus(di)
+
+	if got, ok := ds.Config["gpu_memory_utilization"].(float64); !ok || got != 0.7 {
+		t.Fatalf("gpu_memory_utilization = %#v, want 0.7", ds.Config["gpu_memory_utilization"])
+	}
+	if got, ok := ds.Config["max_model_len"].(int); !ok || got != 65536 {
+		t.Fatalf("max_model_len = %#v, want 65536", ds.Config["max_model_len"])
+	}
+}
+
+func TestParseNvidiaMemoryMiB(t *testing.T) { // bare, unit-suffixed, padded, N/A and empty fields
+	tests := map[string]int{
+		"1700":     1700,
+		"1700 MiB": 1700,
+		" 42 ":     42,
+		"N/A":      0,
+		"":         0,
+	}
+	for input, want := range tests {
+		if got := parseNvidiaMemoryMiB(input); got != want {
+			t.Errorf("parseNvidiaMemoryMiB(%q) = %d, want %d", input, got, want) // Errorf: map order is random, so report every failing case
+		}
+	}
+}
+
+func TestDockerContainerMatchTokensPrefersContainerID(t *testing.T) { // with an ID present the name must not become a token
+	tokens := dockerContainerMatchTokens("qwen3-vllm", "abcdef1234567890")
+	if strings.Join(tokens, ",") != "abcdef1234567890,abcdef123456" { // full ID, then its 12-char prefix
+		t.Fatalf("tokens = %#v, want full and short container IDs only", tokens)
+	}
+}
+
+func TestParentPIDFromProcStat(t *testing.T) { // the comm field "(python worker)" contains a space
+	stat := "12345 (python worker) S 6789 1 1 0 -1 4194560"
+	if got := parentPIDFromProcStat(stat); got != "6789" { // second field after the closing ')'
+		t.Fatalf("parentPIDFromProcStat = %q, want 6789", got)
+	}
+}
+
+func TestIsDescendantPIDIncludesSelf(t *testing.T) { // equal PIDs match before /proc is ever read
+	if !isDescendantPID(context.Background(), "12345", "12345") {
+		t.Fatal("expected a container main PID to match itself")
+	}
+}
+
 func TestParseLabelString(t *testing.T) {
 	tests := []struct {
 		name  string
diff --git a/internal/runtime/k3s.go b/internal/runtime/k3s.go
index ba0cf286..055aba24 100644
--- a/internal/runtime/k3s.go
+++ b/internal/runtime/k3s.go
@@ -246,6 +246,7 @@ func podToStatus(pod *k3s.PodStatus) *DeploymentStatus {
 
 	ds := &DeploymentStatus{
 		Name:     pod.Name,
+		Image:    pod.ContainerImage,
 		Phase:    phase,
 		Ready:    ready,
 		Address:  addr,
diff --git a/internal/runtime/runtime.go b/internal/runtime/runtime.go
index b75f3f52..a70aa02b 100644
--- a/internal/runtime/runtime.go
+++ b/internal/runtime/runtime.go
@@ -53,21 +53,24 @@ type DeployRequest struct {
 
 // DeploymentStatus is the unified status across runtimes.
 type DeploymentStatus struct {
-	Name          string            `json:"name"`
-	Model         string            `json:"model,omitempty"`
-	Engine        string            `json:"engine,omitempty"`
-	Slot          string            `json:"slot,omitempty"`
-	Phase         string            `json:"phase"` // running / starting / stopped / failed
-	Ready         bool              `json:"ready"`
-	Address       string            `json:"address"` // host:port
-	Config        map[string]any    `json:"config,omitempty"`
-	Labels        map[string]string `json:"labels"`
-	StartTime     string            `json:"start_time"`
-	StartedAtUnix int64             `json:"started_at_unix,omitempty"`
-	Message       string            `json:"message,omitempty"`
-	Runtime       string            `json:"runtime"` // "k3s", "docker", or "native"
-	Restarts      int               `json:"restarts,omitempty"`
-	ExitCode      *int              `json:"exit_code,omitempty"`
+	Name            string            `json:"name"`
+	Model           string            `json:"model,omitempty"`
+	Engine          string            `json:"engine,omitempty"`
+	Image           string            `json:"image,omitempty"`
+	Slot            string            `json:"slot,omitempty"`
+	Phase           string            `json:"phase"` // running / starting / stopped / failed
+	Ready           bool              `json:"ready"`
+	Address         string            `json:"address"` // host:port
+	Config          map[string]any    `json:"config,omitempty"`
+	Labels          map[string]string `json:"labels"`
+	StartTime       string            `json:"start_time"`
+	StartedAtUnix   int64             `json:"started_at_unix,omitempty"`
+	Message         string            `json:"message,omitempty"`
+	Runtime         string            `json:"runtime"` // "k3s", "docker", or "native"
+	Restarts        int               `json:"restarts,omitempty"`
+	ExitCode        *int              `json:"exit_code,omitempty"`
+	GPUMemoryMiB    int               `json:"gpu_memory_mib,omitempty"`
+	GPUMemorySource string            `json:"gpu_memory_source,omitempty"`
 
 	StartupPhase    string `json:"startup_phase,omitempty"`    // scheduling/pulling_image/initializing/loading_weights/cuda_graphs/ready
 	StartupProgress int    `json:"startup_progress,omitempty"` // 0-100
diff --git a/internal/ui/handler_test.go b/internal/ui/handler_test.go
index 5aee95c7..932b7740 100644
--- a/internal/ui/handler_test.go
+++ b/internal/ui/handler_test.go
@@ -284,10 +284,10 @@ func TestRegisterRoutes_IndexShowsAPIAccessWithoutRenderingPrivateIP(t *testing.
 		`api_access`,
 		`api_access_desc`,
 		`apiBaseDisplay()`,
-		`apiDeploymentChatCapable(dep)`,
+		`apiDeploymentChatCapable(deploymentDetailData)`,
 		`api_non_chat_hint`,
 		`copyCurrentAPIBaseURL($event)`,
-		`copyAPICurl(dep, $event)`,
+		`copyAPICurl(deploymentDetailData, $event)`,
 		`apiCurlTemplate(dep)`,
 		`api_public_unconfigured`,
 	} {
@@ -493,11 +493,19 @@ func TestRegisterRoutes_IndexIncludesDeploymentStageFeedback(t *testing.T) {
 	body := rec.Body.String()
 	for _, token := range []string{
 		"startup_progress",
-		"startup_message || dep.startup_phase || 'Initializing...'",
-		"dep.eta ? '~' + dep.eta",
+		"deployment-service-card",
+		"deploymentShowProgress(dep)",
+		"deploymentProgressValue(dep)",
+		"deploymentProgressText(dep)",
+		"openDeploymentDetail(dep)",
+		"deploymentDetailOpen",
+		"deploymentDetailRequestSeq",
+		"this.callTool('deploy.status', { name })",
+		"clearMissingGpuMemory: true",
+		"deploymentGpuMemoryMiB(d)",
+		"handleDeploymentStopClick($event, deploymentDetailData.name, { closeDetail: true })",
 		"failure_detail: this.summarizeDeploymentFailure(d)",
 		"summarizeDeploymentFailure(dep)",
-		"dep.phase === 'running' && dep.ready && dep.address",
 	} {
 		if !strings.Contains(body, token) {
 			t.Fatalf("body missing %q", token)
diff --git a/internal/ui/static/index.html b/internal/ui/static/index.html
index 446f79b2..30d896cf 100644
--- a/internal/ui/static/index.html
+++ b/internal/ui/static/index.html
@@ -483,12 +483,303 @@
   border-color: var(--accent);
   background: var(--accent);
 }
+.api-copy-btn.icon-only {
+  width: 28px;
+  height: 28px;
+  padding: 0;
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+}
 .api-public-note {
   margin-top: 8px;
   color: var(--text-tertiary);
   font-size: 11px;
   line-height: 1.45;
 }
+.deployment-services-panel .panel-title {
+  font-size: 15px;
+  padding-bottom: 10px;
+}
+.deployment-service-list {
+  display: flex;
+  flex-direction: column;
+  gap: 12px;
+}
+.deployment-service-card {
+  padding: 14px;
+  border: 1px solid var(--border-medium);
+  border-radius: var(--radius-md);
+  background:
+    linear-gradient(135deg, rgba(255, 255, 255, 0.055), rgba(255, 255, 255, 0.025)),
+    var(--bg-panel);
+  box-shadow: inset 0 1px 0 rgba(255, 255, 255, 0.04);
+}
+.deployment-service-content {
+  min-width: 0;
+}
+.deployment-service-head {
+  display: flex;
+  align-items: center;
+  gap: 10px;
+}
+.deployment-service-head::before {
+  content: "";
+  width: 8px;
+  height: 8px;
+  border-radius: 999px;
+  flex-shrink: 0;
+  background: var(--warning);
+  box-shadow: 0 0 12px currentColor;
+  color: var(--warning);
+}
+.deployment-service-card:has(.deployment-service-badge.ready) .deployment-service-head::before {
+  background: var(--success);
+  color: var(--success);
+}
+.deployment-service-card:has(.deployment-service-badge.failed) .deployment-service-head::before {
+  background: var(--error);
+  color: var(--error);
+}
+.deployment-service-main {
+  min-width: 0;
+}
+.deployment-service-name {
+  color: var(--text);
+  font-size: 13px;
+  font-weight: 700;
+  line-height: 1.3;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+.deployment-service-row {
+  display: grid;
+  align-items: center;
+  gap: 10px;
+  margin-top: 12px;
+}
+.deployment-service-row.ready {
+  grid-template-columns: auto auto auto;
+}
+.deployment-service-row.starting {
+  grid-template-columns: auto minmax(0, 1fr) auto;
+}
+.deployment-service-row.failed {
+  grid-template-columns: minmax(0, 1fr) auto auto;
+}
+.deployment-service-badge {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  flex-shrink: 0;
+  min-width: 48px;
+  height: 24px;
+  padding: 0 10px;
+  border-radius: 999px;
+  font-size: 11px;
+  font-weight: 700;
+  line-height: 1;
+  white-space: nowrap;
+}
+.deployment-service-badge.ready {
+  color: var(--success);
+  background: rgba(48, 209, 88, 0.14);
+}
+.deployment-service-badge.starting {
+  color: var(--warning);
+  background: rgba(255, 159, 10, 0.14);
+}
+.deployment-service-badge.failed {
+  color: var(--error);
+  background: rgba(255, 69, 58, 0.14);
+}
+.deployment-service-progress {
+  display: grid;
+  grid-template-columns: minmax(0, 1fr) auto;
+  align-items: center;
+  gap: 10px;
+  min-width: 0;
+}
+.deployment-service-progress .deploy-progress {
+  height: 7px;
+  margin-top: 0;
+}
+.deployment-service-progress span {
+  color: var(--text-dim);
+  font-family: var(--font-mono);
+  font-size: 12px;
+}
+.deployment-service-error {
+  min-width: 0;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+.deployment-service-row .deployment-service-error {
+  margin-top: 0;
+  padding-left: 0;
+}
+.deployment-service-row .deployment-service-action-btn {
+  min-width: 52px;
+  height: 24px;
+  padding: 0 10px;
+  font-size: 11px;
+  line-height: 1;
+  white-space: nowrap;
+}
+.deployment-service-btn {
+  min-width: 54px;
+  height: 32px;
+  padding: 0 12px;
+  border: 1px solid var(--border-medium);
+  border-radius: 9px;
+  background: var(--input-bg);
+  color: var(--text-dim);
+  font-family: var(--font-sans);
+  font-size: 12px;
+  font-weight: 700;
+  cursor: pointer;
+}
+.deployment-service-btn:hover:not(:disabled) { /* a disabled button must not light up on hover */
+  color: var(--text);
+  border-color: rgba(255, 255, 255, 0.24);
+  background: var(--btn-icon-hover);
+}
+.deployment-service-btn:disabled {
+  opacity: 0.4;
+  cursor: not-allowed;
+}
+.deployment-service-btn.danger:hover:not(:disabled) { /* same guard for the destructive variant */
+  color: var(--error);
+  border-color: rgba(255, 69, 58, 0.5);
+  background: rgba(255, 69, 58, 0.1);
+}
+@media (max-width: 520px) {
+  .deployment-service-row.ready,
+  .deployment-service-row.starting,
+  .deployment-service-row.failed {
+    grid-template-columns: minmax(0, 1fr) auto;
+  }
+  .deployment-service-row.starting .deployment-service-progress {
+    grid-column: 1 / -1;
+  }
+}
+.deployment-service-modal {
+  width: min(920px, calc(100vw - 64px));
+}
+.deployment-service-modal .api-access-row {
+  grid-template-columns: 110px minmax(0, 1fr) auto;
+  min-height: 38px;
+  padding: 0 10px;
+  border-bottom: 1px solid var(--border-light);
+}
+.deployment-service-modal .api-access-row:last-child {
+  border-bottom: none;
+}
+.deployment-service-modal .api-copy-btn:hover {
+  color: var(--text);
+  border-color: var(--border-medium);
+  background: var(--btn-icon-hover);
+}
+.deployment-detail-status-bar {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  min-width: 0;
+  color: var(--text-dim);
+  font-size: 12px;
+  font-weight: 600;
+}
+.deployment-detail-status-dot {
+  width: 8px;
+  height: 8px;
+  border-radius: 999px;
+  flex-shrink: 0;
+}
+.deployment-detail-status-dot.ready { background: var(--success); box-shadow: 0 0 10px rgba(48, 209, 88, 0.45); }
+.deployment-detail-status-dot.starting { background: var(--warning); box-shadow: 0 0 10px rgba(255, 159, 10, 0.42); }
+.deployment-detail-status-dot.failed { background: var(--error); box-shadow: 0 0 10px rgba(255, 69, 58, 0.42); }
+.deployment-diagnostics-table {
+  display: grid;
+  grid-template-columns: repeat(2, minmax(0, 1fr));
+  border: 1px solid var(--border-light);
+  border-radius: var(--radius-sm);
+  overflow: hidden;
+  background: var(--input-bg);
+}
+.deployment-config-table {
+  display: grid;
+  grid-template-columns: repeat(2, minmax(300px, 1fr));
+  border: 1px solid var(--border-light);
+  border-radius: var(--radius-sm);
+  overflow: hidden;
+  background: var(--input-bg);
+}
+.deployment-diagnostics-row {
+  display: grid;
+  grid-template-columns: minmax(120px, 0.8fr) minmax(0, 1fr);
+  gap: 10px;
+  align-items: center;
+  min-height: 44px;
+  padding: 9px 12px;
+  border-right: 1px solid var(--border-light);
+  border-bottom: 1px solid var(--border-light);
+}
+.deployment-config-row {
+  display: grid;
+  grid-template-columns: minmax(0, 1fr) minmax(132px, max-content);
+  column-gap: 36px;
+  align-items: center;
+  min-height: 44px;
+  padding: 9px 28px 9px 24px;
+  border-right: 1px solid var(--border-light);
+  border-bottom: 1px solid var(--border-light);
+}
+.deployment-config-row:nth-child(2n),
+.deployment-diagnostics-row:nth-child(2n) {
+  border-right: none;
+}
+.deployment-config-row:nth-last-child(-n + 2),
+.deployment-diagnostics-row:nth-last-child(-n + 2) {
+  border-bottom: none;
+}
+.deployment-config-key,
+.deployment-diagnostics-key {
+  color: var(--text-tertiary);
+  font-size: 12px;
+}
+.deployment-config-key {
+  min-width: 0;
+  overflow-wrap: anywhere;
+}
+.deployment-config-value,
+.deployment-diagnostics-value {
+  color: var(--text);
+  font-family: var(--font-mono);
+  font-size: 12px;
+  overflow-wrap: anywhere;
+}
+.deployment-config-value {
+  min-width: 0;
+  justify-self: start;
+  padding-left: 10px;
+}
+.deployment-diagnostics-value {
+  color: var(--text-dim);
+}
+.deployment-service-footer {
+  padding-top: 12px;
+}
+.deployment-service-footer .modal-btn.danger {
+  color: var(--error);
+  border-color: rgba(255, 69, 58, 0.45);
+  background: rgba(255, 69, 58, 0.08);
+}
+.deployment-service-footer .modal-btn.danger:hover {
+  border-color: var(--error);
+  background: rgba(255, 69, 58, 0.14);
+}
 .model-list-item {
   display: flex;
   align-items: flex-start;
@@ -2794,11 +3085,25 @@
   }
   .deploy-chip-row,
   .deploy-grid,
+  .deployment-config-table,
+  .deployment-diagnostics-table,
   .deploy-vram-top,
   .deploy-form-grid,
   .deploy-vram-breakdown {
     grid-template-columns: 1fr;
   }
+  .deployment-config-row,
+  .deployment-diagnostics-row {
+    border-right: none;
+  }
+  .deployment-config-row:nth-last-child(-n + 2),
+  .deployment-diagnostics-row:nth-last-child(-n + 2) {
+    border-bottom: 1px solid var(--border-light);
+  }
+  .deployment-config-row:last-child,
+  .deployment-diagnostics-row:last-child {
+    border-bottom: none;
+  }
   .deploy-param-row {
     grid-template-columns: 1fr;
   }
@@ -5054,86 +5359,77 @@ <h3 x-text="t('wiz_complete_title')"></h3>
       </div>
 
       <!-- Deployments Panel -->
-      <div class="panel">
-        <div class="panel-title">&#x25B2; <span x-text="t('deployments')"></span><span class="panel-title-actions"><button type="button" class="panel-action-btn" :disabled="deploymentScanning" @click="scanDeployments()" x-text="deploymentScanning ? t('scanning_label') : t('scan_label')"></button></span></div>
+      <div class="panel deployment-services-panel">
+        <div class="panel-title">&#x25B2; <span x-text="t('running_services')"></span><span class="panel-title-actions"><button type="button" class="panel-action-btn" :disabled="deploymentScanning" @click="scanDeployments()" x-text="deploymentScanning ? t('scanning_label') : t('refresh_label')"></button></span></div>
         <template x-if="deployments.length === 0">
           <div class="empty" x-text="t('no_deployments')"></div>
         </template>
-        <ul class="panel-list">
+        <div class="deployment-service-list">
           <template x-for="dep in deployments" :key="dep.name || dep.model || dep.address || dep.detail">
-            <li :class="{ starting: dep.startup_progress > 0 && dep.startup_progress < 100 }">
-              <span class="dot" :class="dep.phase === 'running' && dep.ready ? 'dot-green' : dep.phase === 'failed' ? 'dot-red' : 'dot-orange'"></span>
-              <div style="flex:1;overflow:hidden">
-                <div x-text="dep.name" style="text-overflow:ellipsis;overflow:hidden"></div>
-                <div style="font-size:10px;color:var(--text-dim)" x-text="dep.detail"></div>
-                <!-- Startup progress - show when starting or has progress -->
-                <template x-if="(dep.phase === 'starting' || dep.startup_progress > 0) && !dep.ready">
-                  <div style="margin-top:6px">
-                    <div class="deploy-progress">
-                      <div class="deploy-progress-fill starting" :style="'width:' + Math.max(5, Math.min(dep.startup_progress || 5, 95)) + '%'"></div>
-                    </div>
-                    <div class="deploy-phase-text">
-                      <span>
-                        <span class="deploy-phase-icon">◐</span>
-                        <span x-text="dep.startup_message || dep.startup_phase || 'Initializing...'"></span>
-                      </span>
-                      <span class="deploy-eta" x-text="dep.eta ? '~' + dep.eta : (dep.startup_progress || 5) + '%'"></span>
+            <div class="deployment-service-card">
+              <div class="deployment-service-content">
+                <div class="deployment-service-head">
+                  <div class="deployment-service-main">
+                    <div class="deployment-service-name" x-text="apiDeploymentModel(dep)" :title="dep.name || apiDeploymentModel(dep)"></div>
+                  </div>
+                </div>
+                <template x-if="deploymentShowProgress(dep)">
+                  <div class="deployment-service-row starting">
+                    <span class="deployment-service-badge" :class="deploymentTone(dep)" x-text="deploymentStatusLabel(dep)"></span>
+                    <div class="deployment-service-progress">
+                      <div class="deploy-progress" role="progressbar" aria-valuemin="0" aria-valuemax="100" :aria-valuenow="deploymentProgressValue(dep)" :aria-label="deploymentStatusLabel(dep)"><!-- a11y: progressbar semantics; assumes deploymentProgressValue() is a 0-100 number, as its use for the fill width implies -->
+                        <div class="deploy-progress-fill starting" :style="'width:' + deploymentProgressValue(dep) + '%'"></div>
+                      </div>
+                      <span x-text="deploymentProgressText(dep)"></span>
                     </div>
+                    <template x-if="dep.name">
+                      <button
+                        type="button"
+                        class="model-deploy-btn deployment-service-action-btn is-stop"
+                        :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                        :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                        @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                        x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                    </template>
                   </div>
                 </template>
-                <!-- Ready indicator -->
-                <template x-if="dep.phase === 'running' && dep.ready && dep.address">
-                  <div style="font-size:10px;color:var(--success);margin-top:2px;display:flex;align-items:center;gap:4px">
-                    <span>●</span>
-                    <span x-text="t('backend_ready')"></span>
+                <template x-if="!deploymentShowProgress(dep) && dep.phase !== 'failed'">
+                  <div class="deployment-service-row ready">
+                    <span class="deployment-service-badge" :class="deploymentTone(dep)" x-text="deploymentStatusLabel(dep)"></span>
+                    <button type="button" class="model-deploy-btn deployment-service-action-btn" @click.stop.prevent="openDeploymentDetail(dep)" x-text="t('deployment_detail_action')"></button>
+                    <template x-if="dep.name">
+                      <button
+                        type="button"
+                        class="model-deploy-btn deployment-service-action-btn is-stop"
+                        :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                        :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                        @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                        x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                    </template>
                   </div>
                 </template>
-                <template x-if="dep.phase === 'running' && dep.ready">
-                  <div class="api-access-inline">
-                    <div class="api-access-head">
-                      <span class="api-access-title" x-text="t('api_access')"></span>
-                      <span class="api-access-desc" x-text="t('api_access_desc')"></span>
-                    </div>
-                    <div class="api-access-row">
-                      <span class="api-access-label" x-text="t('api_base_url')"></span>
-                      <code class="api-access-value" x-text="apiBaseDisplay()"></code>
-                      <button type="button" class="api-copy-btn" @click="copyCurrentAPIBaseURL($event)" x-text="t('wiz_copy')"></button>
-                    </div>
-                    <div class="api-access-row">
-                      <span class="api-access-label" x-text="t('api_model')"></span>
-                      <code class="api-access-value" x-text="apiDeploymentModel(dep)"></code>
-                      <button type="button" class="api-copy-btn" @click="wizCopyText(apiDeploymentModel(dep), $event)" x-text="t('wiz_copy')"></button>
-                    </div>
-                    <div class="api-access-row">
-                      <span class="api-access-label" x-text="t('api_key')"></span>
-                      <code class="api-access-value" x-text="apiKeyDisplay()"></code>
-                      <button type="button" class="api-copy-btn" @click="copyCurrentAPIKey($event)" x-text="t('wiz_copy')"></button>
-                    </div>
-                    <div class="api-access-actions" x-show="apiDeploymentChatCapable(dep)">
-                      <button type="button" class="api-copy-btn" @click="copyAPICurl(dep, $event)" x-text="t('api_copy_curl')"></button>
-                      <button type="button" class="api-copy-btn" @click="copyOpenAISDKExample(dep, $event)" x-text="t('api_copy_openai')"></button>
-                    </div>
-                    <div class="api-public-note" x-show="!apiDeploymentChatCapable(dep)" x-text="apiNonChatHint(dep)"></div>
-                    <div class="api-public-note" x-text="t('api_public_unconfigured')"></div>
+                <template x-if="dep.phase === 'failed'">
+                  <div class="deployment-service-row failed">
+                    <div class="deploy-error-lines deployment-service-error" x-text="deploymentFailureText(dep) || deploymentStatusLabel(dep)" :title="dep.error_lines || deploymentFailureText(dep)"></div>
+                    <button type="button" class="model-deploy-btn deployment-service-action-btn" @click.stop.prevent="openDeploymentDetail(dep)" x-text="t('deployment_detail_action')"></button>
+                    <template x-if="dep.name">
+                      <button
+                        type="button"
+                        class="model-deploy-btn deployment-service-action-btn is-stop"
+                        :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                        :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                        @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                        x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                    </template>
                   </div>
                 </template>
-                <!-- Error display -->
-                <template x-if="dep.phase === 'failed' && dep.failure_detail">
-                  <div class="deploy-error-lines" x-text="dep.failure_detail" :title="dep.error_lines || dep.failure_detail"></div>
+                <template x-if="deploymentStopFeedback[dep.name]">
+                  <div class="modal-feedback deploy-modal-feedback deployment-service-error" :class="deploymentStopFeedback[dep.name].type" x-text="deploymentStopFeedback[dep.name].text"></div>
                 </template>
               </div>
-              <template x-if="dep.name">
-                <button
-                  type="button"
-                  class="model-deploy-btn is-stop"
-                  :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
-                  :disabled="deploymentStopping[dep.name]"
-                  @click="stopDeployment(dep.name)"
-                  x-text="deploymentStopping[dep.name] ? t('deploying_label') : t('stop_label')"></button>
-              </template>
-            </li>
+            </div>
           </template>
-        </ul>
+        </div>
       </div>
 
       <!-- Fleet Panel -->
@@ -5222,83 +5518,77 @@ <h3 x-text="t('wiz_complete_title')"></h3>
             <span class="agent-info-value clickable" @click="openSettings()" x-text="t('configure')"></span>
           </div>
         </div>
-        <div class="panel">
-          <div class="panel-title">&#x25B2; <span x-text="t('deployments')"></span><span class="panel-title-actions"><button type="button" class="panel-action-btn" :disabled="deploymentScanning" @click="scanDeployments()" x-text="deploymentScanning ? t('scanning_label') : t('scan_label')"></button></span></div>
+        <div class="panel deployment-services-panel">
+          <div class="panel-title">&#x25B2; <span x-text="t('running_services')"></span><span class="panel-title-actions"><button type="button" class="panel-action-btn" :disabled="deploymentScanning" @click="scanDeployments()" x-text="deploymentScanning ? t('scanning_label') : t('refresh_label')"></button></span></div>
           <template x-if="deployments.length === 0">
             <div class="empty" x-text="t('no_deployments')"></div>
           </template>
-          <ul class="panel-list">
+          <div class="deployment-service-list">
             <template x-for="dep in deployments" :key="dep.name || dep.model || dep.address || dep.detail">
-              <li :class="{ starting: dep.startup_progress > 0 && dep.startup_progress < 100 }" style="flex-wrap:wrap">
-                <span class="dot" :class="dep.phase === 'running' && dep.ready ? 'dot-green' : dep.phase === 'failed' ? 'dot-red' : 'dot-orange'"></span>
-                <div style="flex:1;min-width:0">
-                  <div x-text="dep.name" style="text-overflow:ellipsis;overflow:hidden"></div>
-                  <div style="font-size:10px;color:var(--text-dim)" x-text="dep.detail"></div>
-                  <template x-if="dep.phase === 'running' && dep.ready && dep.address">
-                    <div style="font-size:10px;color:var(--success);margin-top:2px;display:flex;align-items:center;gap:4px">
-                      <span>●</span>
-                      <span x-text="t('backend_ready')"></span>
+              <div class="deployment-service-card">
+                <div class="deployment-service-content">
+                  <div class="deployment-service-head">
+                    <div class="deployment-service-main">
+                      <div class="deployment-service-name" x-text="apiDeploymentModel(dep)" :title="dep.name || apiDeploymentModel(dep)"></div>
                     </div>
-                  </template>
-                  <template x-if="dep.phase === 'running' && dep.ready">
-                    <div class="api-access-inline">
-                      <div class="api-access-head">
-                        <span class="api-access-title" x-text="t('api_access')"></span>
-                        <span class="api-access-desc" x-text="t('api_access_desc')"></span>
-                      </div>
-                      <div class="api-access-row">
-                        <span class="api-access-label" x-text="t('api_base_url')"></span>
-                        <code class="api-access-value" x-text="apiBaseDisplay()"></code>
-                        <button type="button" class="api-copy-btn" @click="copyCurrentAPIBaseURL($event)" x-text="t('wiz_copy')"></button>
-                      </div>
-                      <div class="api-access-row">
-                        <span class="api-access-label" x-text="t('api_model')"></span>
-                        <code class="api-access-value" x-text="apiDeploymentModel(dep)"></code>
-                        <button type="button" class="api-copy-btn" @click="wizCopyText(apiDeploymentModel(dep), $event)" x-text="t('wiz_copy')"></button>
-                      </div>
-                      <div class="api-access-row">
-                        <span class="api-access-label" x-text="t('api_key')"></span>
-                        <code class="api-access-value" x-text="apiKeyDisplay()"></code>
-                        <button type="button" class="api-copy-btn" @click="copyCurrentAPIKey($event)" x-text="t('wiz_copy')"></button>
-                      </div>
-                      <div class="api-access-actions" x-show="apiDeploymentChatCapable(dep)">
-                        <button type="button" class="api-copy-btn" @click="copyAPICurl(dep, $event)" x-text="t('api_copy_curl')"></button>
-                        <button type="button" class="api-copy-btn" @click="copyOpenAISDKExample(dep, $event)" x-text="t('api_copy_openai')"></button>
+                  </div>
+                  <template x-if="deploymentShowProgress(dep)">
+                    <div class="deployment-service-row starting">
+                      <span class="deployment-service-badge" :class="deploymentTone(dep)" x-text="deploymentStatusLabel(dep)"></span>
+                      <div class="deployment-service-progress">
+                        <div class="deploy-progress" role="progressbar" aria-valuemin="0" aria-valuemax="100" :aria-valuenow="deploymentProgressValue(dep)" :aria-label="deploymentStatusLabel(dep)"><!-- a11y: progressbar semantics; assumes deploymentProgressValue() is a 0-100 number, as its use for the fill width implies -->
+                          <div class="deploy-progress-fill starting" :style="'width:' + deploymentProgressValue(dep) + '%'"></div>
+                        </div>
+                        <span x-text="deploymentProgressText(dep)"></span>
                       </div>
-                      <div class="api-public-note" x-show="!apiDeploymentChatCapable(dep)" x-text="apiNonChatHint(dep)"></div>
-                      <div class="api-public-note" x-text="t('api_public_unconfigured')"></div>
+                      <template x-if="dep.name">
+                        <button
+                          type="button"
+                          class="model-deploy-btn deployment-service-action-btn is-stop"
+                          :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                          :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                          @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                          x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                      </template>
                     </div>
                   </template>
-                  <template x-if="(dep.phase === 'starting' || dep.startup_progress > 0) && !dep.ready">
-                    <div style="margin-top:6px">
-                      <div class="deploy-progress">
-                        <div class="deploy-progress-fill starting" :style="'width:' + Math.max(5, Math.min(dep.startup_progress || 5, 95)) + '%'"></div>
-                      </div>
-                      <div class="deploy-phase-text">
-                        <span>
-                          <span class="deploy-phase-icon">◐</span>
-                          <span x-text="dep.startup_message || dep.startup_phase || 'Initializing...'"></span>
-                        </span>
-                        <span class="deploy-eta" x-text="dep.eta ? '~' + dep.eta : (dep.startup_progress || 5) + '%'"></span>
-                      </div>
+                  <template x-if="!deploymentShowProgress(dep) && dep.phase !== 'failed'">
+                    <div class="deployment-service-row ready">
+                      <span class="deployment-service-badge" :class="deploymentTone(dep)" x-text="deploymentStatusLabel(dep)"></span>
+                      <button type="button" class="model-deploy-btn deployment-service-action-btn" @click.stop.prevent="openDeploymentDetail(dep)" x-text="t('deployment_detail_action')"></button>
+                      <template x-if="dep.name">
+                        <button
+                          type="button"
+                          class="model-deploy-btn deployment-service-action-btn is-stop"
+                          :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                          :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                          @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                          x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                      </template>
                     </div>
                   </template>
-                <template x-if="dep.phase === 'failed' && dep.failure_detail">
-                  <div class="deploy-error-lines" x-text="dep.failure_detail" :title="dep.error_lines || dep.failure_detail"></div>
-                </template>
+                  <template x-if="dep.phase === 'failed'">
+                    <div class="deployment-service-row failed">
+                      <div class="deploy-error-lines deployment-service-error" x-text="deploymentFailureText(dep) || deploymentStatusLabel(dep)" :title="dep.error_lines || deploymentFailureText(dep)"></div>
+                      <button type="button" class="model-deploy-btn deployment-service-action-btn" @click.stop.prevent="openDeploymentDetail(dep)" x-text="t('deployment_detail_action')"></button>
+                      <template x-if="dep.name">
+                        <button
+                          type="button"
+                          class="model-deploy-btn deployment-service-action-btn is-stop"
+                          :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                          :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                          @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                          x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                      </template>
+                    </div>
+                  </template>
+                  <template x-if="deploymentStopFeedback[dep.name]">
+                    <div class="modal-feedback deploy-modal-feedback deployment-service-error" :class="deploymentStopFeedback[dep.name].type" x-text="deploymentStopFeedback[dep.name].text"></div>
+                  </template>
+                </div>
               </div>
-              <template x-if="dep.name">
-                <button
-                  type="button"
-                  class="model-deploy-btn is-stop"
-                  :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
-                  :disabled="deploymentStopping[dep.name]"
-                  @click="stopDeployment(dep.name)"
-                  x-text="deploymentStopping[dep.name] ? t('deploying_label') : t('stop_label')"></button>
-              </template>
-              </li>
             </template>
-          </ul>
+          </div>
         </div>
         <div class="panel">
           <div class="panel-title">&#x25A0; <span x-text="t('hardware')"></span></div>
@@ -5419,9 +5709,77 @@ <h3 x-text="t('wiz_complete_title')"></h3>
           <div class="panel-title">&#x25C9; <span x-text="t('fleet')"></span></div>
           <template x-for="(d, fi) in fleet" :key="d.id || d.addr || fi"><div class="fleet-device"><span class="status-dot" :class="d.online ? 'online' : 'offline'" style="width:6px;height:6px"></span><div><div class="name" x-text="d.name || d.id"></div><div class="meta" x-text="d.meta || ''"></div></div></div></template>
         </div>
-        <div class="panel">
-          <div class="panel-title">&#x25B2; <span x-text="t('deployments')"></span><span class="panel-title-actions"><button type="button" class="panel-action-btn" :disabled="deploymentScanning" @click="scanDeployments()" x-text="deploymentScanning ? t('scanning_label') : t('scan_label')"></button></span></div>
-          <ul class="panel-list"><template x-for="dep in deployments" :key="dep.name || dep.model || dep.address || dep.detail"><li style="flex-wrap:wrap"><span class="dot" :class="dep.phase === 'running' && dep.ready ? 'dot-green' : dep.phase === 'failed' ? 'dot-red' : 'dot-orange'"></span><span x-text="dep.name"></span><span class="item-detail" x-text="dep.phase === 'failed' ? (dep.failure_detail || dep.detail) : (dep.startup_message || dep.phase)"></span><template x-if="dep.startup_progress > 0 && dep.startup_progress < 100"><div style="width:100%;margin-top:2px"><div class="deploy-progress"><div class="deploy-progress-fill" :style="'width:' + dep.startup_progress + '%'"></div></div></div></template></li></template></ul>
+        <div class="panel deployment-services-panel">
+          <div class="panel-title">&#x25B2; <span x-text="t('running_services')"></span><span class="panel-title-actions"><button type="button" class="panel-action-btn" :disabled="deploymentScanning" @click="scanDeployments()" x-text="deploymentScanning ? t('scanning_label') : t('refresh_label')"></button></span></div>
+          <template x-if="deployments.length === 0">
+            <div class="empty" x-text="t('no_deployments')"></div>
+          </template>
+          <div class="deployment-service-list">
+            <template x-for="dep in deployments" :key="dep.name || dep.model || dep.address || dep.detail">
+              <div class="deployment-service-card">
+                <div class="deployment-service-content">
+                  <div class="deployment-service-head">
+                    <div class="deployment-service-main">
+                      <div class="deployment-service-name" x-text="apiDeploymentModel(dep)" :title="dep.name || apiDeploymentModel(dep)"></div>
+                    </div>
+                  </div>
+                  <template x-if="deploymentShowProgress(dep)">
+                    <div class="deployment-service-row starting">
+                      <span class="deployment-service-badge" :class="deploymentTone(dep)" x-text="deploymentStatusLabel(dep)"></span>
+                      <div class="deployment-service-progress">
+                        <div class="deploy-progress" role="progressbar" aria-valuemin="0" aria-valuemax="100" :aria-valuenow="deploymentProgressValue(dep)" :aria-label="deploymentStatusLabel(dep)"><!-- a11y: progressbar semantics; assumes deploymentProgressValue() is a 0-100 number, as its use for the fill width implies -->
+                          <div class="deploy-progress-fill starting" :style="'width:' + deploymentProgressValue(dep) + '%'"></div>
+                        </div>
+                        <span x-text="deploymentProgressText(dep)"></span>
+                      </div>
+                      <template x-if="dep.name">
+                        <button
+                          type="button"
+                          class="model-deploy-btn deployment-service-action-btn is-stop"
+                          :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                          :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                          @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                          x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                      </template>
+                    </div>
+                  </template>
+                  <template x-if="!deploymentShowProgress(dep) && dep.phase !== 'failed'">
+                    <div class="deployment-service-row ready">
+                      <span class="deployment-service-badge" :class="deploymentTone(dep)" x-text="deploymentStatusLabel(dep)"></span>
+                      <button type="button" class="model-deploy-btn deployment-service-action-btn" @click.stop.prevent="openDeploymentDetail(dep)" x-text="t('deployment_detail_action')"></button>
+                      <template x-if="dep.name">
+                        <button
+                          type="button"
+                          class="model-deploy-btn deployment-service-action-btn is-stop"
+                          :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                          :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                          @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                          x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                      </template>
+                    </div>
+                  </template>
+                  <template x-if="dep.phase === 'failed'">
+                    <div class="deployment-service-row failed">
+                      <div class="deploy-error-lines deployment-service-error" x-text="deploymentFailureText(dep) || deploymentStatusLabel(dep)" :title="dep.error_lines || deploymentFailureText(dep)"></div>
+                      <button type="button" class="model-deploy-btn deployment-service-action-btn" @click.stop.prevent="openDeploymentDetail(dep)" x-text="t('deployment_detail_action')"></button>
+                      <template x-if="dep.name">
+                        <button
+                          type="button"
+                          class="model-deploy-btn deployment-service-action-btn is-stop"
+                          :class="deploymentStopping[dep.name] ? 'is-busy' : ''"
+                          :aria-busy="deploymentStopping[dep.name] ? 'true' : 'false'"
+                          @click.stop.prevent="handleDeploymentStopClick($event, dep.name)"
+                          x-text="deploymentStopping[dep.name] ? t('stop_service_progress') : t('stop_label')"></button>
+                      </template>
+                    </div>
+                  </template>
+                  <template x-if="deploymentStopFeedback[dep.name]">
+                    <div class="modal-feedback deploy-modal-feedback deployment-service-error" :class="deploymentStopFeedback[dep.name].type" x-text="deploymentStopFeedback[dep.name].text"></div>
+                  </template>
+                </div>
+              </div>
+            </template>
+          </div>
         </div>
       </div>
     </template>
@@ -5661,6 +6019,131 @@ <h3 x-text="deployDetailTitle()"></h3>
     </div>
   </template>
 
+  <!-- Deployment Detail Modal -->
+  <template x-if="deploymentDetailOpen">
+    <div class="modal-overlay deploy-modal-overlay" :class="{ minimized: deploymentDetailMinimized }" @click.self="closeDeploymentDetail()">
+      <div class="modal deploy-modal deployment-service-modal" :class="{ maximized: deploymentDetailMaximized && !deploymentDetailMinimized, minimized: deploymentDetailMinimized }" role="dialog" aria-modal="true" :aria-label="deploymentDetailTitle()">
+        <div class="deploy-modal-header">
+          <div class="deploy-modal-title">
+            <h3 x-text="deploymentDetailTitle()"></h3>
+            <div class="deploy-modal-subtitle" x-text="deploymentDetailSubtitle()"></div>
+          </div>
+          <div class="deploy-window-controls">
+            <button type="button" class="deploy-window-btn" @click="toggleDeploymentDetailMinimized()" :aria-label="deploymentDetailMinimized ? t('deploy_restore_modal') : t('deploy_minimize_modal')" :title="deploymentDetailMinimized ? t('deploy_restore_modal') : t('deploy_minimize_modal')" x-text="deploymentDetailMinimized ? '□' : '−'"></button>
+            <button type="button" class="deploy-window-btn" x-show="!deploymentDetailMinimized" @click="toggleDeploymentDetailMaximized()" :aria-label="deploymentDetailMaximized ? t('deploy_restore_modal') : t('deploy_maximize_modal')" :title="deploymentDetailMaximized ? t('deploy_restore_modal') : t('deploy_maximize_modal')" x-text="deploymentDetailMaximized ? '▣' : '□'"></button>
+            <button type="button" class="deploy-close-btn" @click="closeDeploymentDetail()" :aria-label="t('close_label')" :title="t('close_label')">×</button>
+          </div>
+        </div>
+
+        <template x-if="deploymentDetailFeedback && !deploymentDetailMinimized">
+          <div class="modal-feedback deploy-modal-feedback" :class="deploymentDetailFeedback.type" x-text="deploymentDetailFeedback.text"></div>
+        </template>
+
+        <div class="deploy-scroll-body" x-show="!deploymentDetailMinimized">
+          <div class="modal-section">
+            <div class="modal-section-title" x-text="t('deployment_service_overview')"></div>
+            <div class="deploy-grid">
+              <div class="deploy-info-card">
+                <span class="deploy-info-label" x-text="t('wiz_engine_label')"></span>
+                <span class="deploy-info-value" x-text="deploymentEngineLabel(deploymentDetailData)"></span>
+              </div>
+              <div class="deploy-info-card">
+                <span class="deploy-info-label" x-text="t('deployment_actual_image')"></span>
+                <span class="deploy-info-value" x-text="deploymentImageLabel(deploymentDetailData)"></span>
+              </div>
+              <div class="deploy-info-card">
+                <span class="deploy-info-label" x-text="t('deploy_port')"></span>
+                <span class="deploy-info-value" x-text="deploymentPortLabel(deploymentDetailData)"></span>
+              </div>
+              <div class="deploy-info-card">
+                <span class="deploy-info-label" x-text="t('deploy_runtime')"></span>
+                <span class="deploy-info-value" x-text="deploymentDetailData && deploymentDetailData.runtime ? deploymentDetailData.runtime : '-'"></span>
+              </div>
+              <div class="deploy-info-card">
+                <span class="deploy-info-label" x-text="t('deployment_uptime')"></span>
+                <span class="deploy-info-value" x-text="deploymentUptimeLabel(deploymentDetailData)"></span>
+              </div>
+              <div class="deploy-info-card">
+                <span class="deploy-info-label" x-text="t('deployment_gpu_memory')"></span>
+                <span class="deploy-info-value" x-text="deploymentGpuUsedLabel()"></span>
+              </div>
+            </div>
+          </div>
+
+          <div class="modal-section" x-show="deploymentDetailData && deploymentDetailData.ready">
+            <div class="modal-section-title" x-text="t('api_access')"></div>
+            <div class="api-access-card">
+              <div class="api-access-row">
+                <span class="api-access-label" x-text="t('api_base_url')"></span>
+                <code class="api-access-value" x-text="apiBaseDisplay()"></code>
+                <button type="button" class="api-copy-btn icon-only" @click="copyCurrentAPIBaseURL($event)" :aria-label="t('wiz_copy')" title="Copy" aria-hidden="false">&#10697;</button>
+              </div>
+              <div class="api-access-row">
+                <span class="api-access-label" x-text="t('api_model')"></span>
+                <code class="api-access-value" x-text="apiDeploymentModel(deploymentDetailData)"></code>
+                <button type="button" class="api-copy-btn icon-only" @click="wizCopyText(apiDeploymentModel(deploymentDetailData), $event)" :aria-label="t('wiz_copy')" title="Copy" aria-hidden="false">&#10697;</button>
+              </div>
+              <div class="api-access-row">
+                <span class="api-access-label" x-text="t('api_key')"></span>
+                <code class="api-access-value" x-text="apiKeyDisplay()"></code>
+                <button type="button" class="api-copy-btn icon-only" @click="copyCurrentAPIKey($event)" :aria-label="t('wiz_copy')" title="Copy" aria-hidden="false">&#10697;</button>
+              </div>
+              <div class="api-access-actions" x-show="apiDeploymentChatCapable(deploymentDetailData)">
+                <button type="button" class="api-copy-btn" @click="copyAPICurl(deploymentDetailData, $event)" x-text="t('api_copy_curl')"></button>
+                <button type="button" class="api-copy-btn" @click="copyOpenAISDKExample(deploymentDetailData, $event)" x-text="t('api_copy_openai')"></button>
+              </div>
+              <div class="api-public-note" x-show="!apiDeploymentChatCapable(deploymentDetailData)" x-text="apiNonChatHint(deploymentDetailData)"></div>
+              <div class="api-public-note" x-text="t('api_public_unconfigured')"></div>
+            </div>
+          </div>
+
+          <div class="modal-section" x-show="deploymentConfigRows().length > 0">
+            <div class="modal-section-title" x-text="t('deployment_launch_config')"></div>
+            <div class="deployment-config-table">
+              <template x-for="row in deploymentConfigRows()" :key="row.key">
+                <div class="deployment-config-row">
+                  <span class="deployment-config-key" x-text="row.key"></span>
+                  <span class="deployment-config-value" x-text="row.value"></span>
+                </div>
+              </template>
+            </div>
+          </div>
+
+          <div class="modal-section">
+            <div class="modal-section-title" x-text="t('deployment_diagnostics')"></div>
+            <div class="deployment-diagnostics-table">
+              <template x-for="row in deploymentDiagnosticsRows()" :key="row.key">
+                <div class="deployment-diagnostics-row">
+                  <span class="deployment-diagnostics-key" x-text="row.label"></span>
+                  <span class="deployment-diagnostics-value" x-text="row.value"></span>
+                </div>
+              </template>
+            </div>
+          </div>
+
+          <div class="modal-section" x-show="deploymentFailureText(deploymentDetailData)">
+            <div class="modal-section-title" x-text="t('deploy_failed')"></div>
+            <div class="deploy-error-lines" x-text="deploymentFailureText(deploymentDetailData)"></div>
+          </div>
+        </div>
+
+        <div class="modal-actions deploy-sticky-actions deployment-service-footer" x-show="!deploymentDetailMinimized">
+          <div class="deployment-detail-status-bar">
+            <span class="deployment-detail-status-dot" :class="deploymentTone(deploymentDetailData)"></span>
+            <span x-text="deploymentFooterStatusText()"></span>
+          </div>
+          <div class="deploy-action-buttons">
+            <button class="modal-btn" @click="refreshDeploymentDetail()" :disabled="deploymentDetailLoading" x-text="deploymentDetailLoading ? t('loading') : t('refresh_status')"></button>
+            <template x-if="deploymentDetailData && deploymentDetailData.name">
+              <button type="button" class="model-deploy-btn deployment-service-action-btn is-stop" :class="deploymentStopping[deploymentDetailData.name] ? 'is-busy' : ''" :aria-busy="deploymentStopping[deploymentDetailData.name] ? 'true' : 'false'" @click.stop.prevent="handleDeploymentStopClick($event, deploymentDetailData.name, { closeDetail: true })" x-text="deploymentStopping[deploymentDetailData.name] ? t('stop_service_progress') : t('stop_service')"></button>
+            </template>
+            <button class="modal-btn" @click="closeDeploymentDetail()" x-text="t('close_label')"></button>
+          </div>
+        </div>
+      </div>
+    </div>
+  </template>
+
   <!-- Settings Modal -->
   <template x-if="showSettings">
     <div class="modal-overlay" @click.self="showSettings = false">
@@ -6121,6 +6604,31 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
     no_deployments: 'No active deployments',
     private_address_hidden: 'Private address hidden',
     backend_ready: 'Backend ready',
+    running_services: 'Running services',
+    refresh_label: 'Refresh',
+    close_label: 'Close',
+    refresh_status: 'Refresh status',
+    stop_service: 'Stop service',
+    stop_service_progress: 'Stopping service',
+    stop_service_failed: 'Stop failed:',
+    stop_service_done: 'Stopped service',
+    stop_deploy_progress: 'Stopping deployment',
+    stop_deploy_failed: 'Stop failed:',
+    stop_deploy_done: 'Stopped deployment',
+    deployment_detail_action: 'Details',
+    deployment_detail_title: 'Service details',
+    deployment_detail_subtitle: 'Runtime status, API access, and actual running parameters.',
+    deployment_service_overview: 'Service overview',
+    deployment_status: 'Status',
+    deployment_actual_image: 'Actual image',
+    deployment_uptime: 'Runtime',
+    deployment_gpu_memory: 'Service GPU memory',
+    deployment_gpu_memory_hint: 'GPU memory currently attributed to this service.',
+    deployment_launch_config: 'Running parameters',
+    deployment_diagnostics: 'Diagnostics',
+    deployment_detail_loading: 'Loading service details...',
+    deployment_detail_failed: 'Could not load full service details. Showing latest overview.',
+    deployment_detail_updated: 'Updated',
     api_access: 'API Access',
     api_access_desc: 'Call the model through the AIMA OpenAI-compatible proxy. Do not call the backend engine address directly.',
     api_base_url: 'Base URL',
@@ -6498,6 +7006,31 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
     no_deployments: '\u65E0\u6D3B\u52A8\u90E8\u7F72',
     private_address_hidden: '\u79C1\u7F51\u5730\u5740\u5DF2\u9690\u85CF',
     backend_ready: '\u540E\u7AEF\u5DF2\u5C31\u7EEA',
+    running_services: '\u8FD0\u884C\u670D\u52A1',
+    refresh_label: '\u5237\u65B0',
+    close_label: '\u5173\u95ED',
+    refresh_status: '\u5237\u65B0\u72B6\u6001',
+    stop_service: '\u505C\u6B62\u670D\u52A1',
+    stop_service_progress: '\u6B63\u5728\u505C\u6B62\u670D\u52A1',
+    stop_service_failed: '\u505C\u6B62\u5931\u8D25\uFF1A',
+    stop_service_done: '\u5DF2\u505C\u6B62\u670D\u52A1',
+    stop_deploy_progress: '\u6B63\u5728\u505C\u6B62\u90E8\u7F72',
+    stop_deploy_failed: '\u505C\u6B62\u5931\u8D25\uFF1A',
+    stop_deploy_done: '\u5DF2\u505C\u6B62\u90E8\u7F72',
+    deployment_detail_action: '\u8BE6\u60C5',
+    deployment_detail_title: '\u670D\u52A1\u8BE6\u60C5',
+    deployment_detail_subtitle: '\u67E5\u770B\u8FD0\u884C\u72B6\u6001\u3001API \u63A5\u5165\u548C\u5B9E\u9645\u8FD0\u884C\u53C2\u6570\u3002',
+    deployment_service_overview: '\u670D\u52A1\u6982\u89C8',
+    deployment_status: '\u72B6\u6001',
+    deployment_actual_image: '\u5B9E\u9645\u955C\u50CF',
+    deployment_uptime: '\u8FD0\u884C\u65F6\u957F',
+    deployment_gpu_memory: '\u8BE5\u670D\u52A1\u663E\u5B58\u5360\u7528',
+    deployment_gpu_memory_hint: '\u540E\u7AEF\u6309\u8FD9\u4E2A\u8FD0\u884C\u670D\u52A1\u7EDF\u8BA1\u7684 GPU \u663E\u5B58\u5360\u7528\u3002',
+    deployment_launch_config: '\u8FD0\u884C\u53C2\u6570',
+    deployment_diagnostics: '\u8BCA\u65AD',
+    deployment_detail_loading: '\u6B63\u5728\u8BFB\u53D6\u670D\u52A1\u8BE6\u60C5...',
+    deployment_detail_failed: '\u6682\u65F6\u8BFB\u53D6\u4E0D\u5230\u5B8C\u6574\u8BE6\u60C5\uFF0C\u5148\u663E\u793A\u6700\u65B0\u6982\u89C8\u3002',
+    deployment_detail_updated: '\u5DF2\u66F4\u65B0',
     api_access: 'API \u63A5\u5165',
     api_access_desc: '\u901A\u8FC7 AIMA \u7684 OpenAI \u517C\u5BB9\u4EE3\u7406\u8C03\u7528\u6A21\u578B\uFF0C\u4E0D\u8981\u76F4\u63A5\u8C03\u7528\u540E\u7AEF\u5F15\u64CE\u5730\u5740\u3002',
     api_base_url: 'Base URL',
@@ -7357,6 +7890,7 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
     deploymentScanning: false,
     modelDeploying: {},
     deploymentStopping: {},
+    deploymentStopFeedback: {},
     deployDetailOpen: false,
     deployDetailLoading: false,
     deployDetailSubmitting: false,
@@ -7374,6 +7908,14 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
     deployDefaultsApplied: false,
     deployDefaultsAvailable: false,
     deploySavedDefaults: null,
+    deploymentDetailOpen: false,
+    deploymentDetailLoading: false,
+    deploymentDetailFeedback: null,
+    deploymentDetailData: null,
+    deploymentDetailUpdatedAt: '',
+    deploymentDetailMinimized: false,
+    deploymentDetailMaximized: false,
+    deploymentDetailRequestSeq: 0,
     fleet: [],
     // View toggle (chat / support / explorer)
     currentView: 'chat',
@@ -10198,6 +10740,225 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
       return this.lang === 'zh' ? '组件' : 'Component';
     },
 
+    deploymentStatusLabel(dep) {
+      if (!dep) return '-';
+      if (dep.phase === 'running' && dep.ready) return this.t('running_label');
+      if (dep.phase === 'failed') return this.t('deploy_failed');
+      if (dep.phase === 'starting' || (dep.phase === 'running' && !dep.ready)) return this.t('deploying_label');
+      return dep.phase || '-';
+    },
+
+    deploymentTone(dep) {
+      if (!dep) return 'starting';
+      if (dep.phase === 'failed') return 'failed';
+      if (dep.phase === 'running' && dep.ready) return 'ready';
+      return 'starting';
+    },
+
+    deploymentSummaryText(dep) {
+      if (!dep) return '';
+      if (dep.phase === 'failed') return dep.failure_detail || dep.message || dep.detail || dep.phase || '';
+      return dep.startup_message || dep.detail || dep.address || dep.phase || '';
+    },
+
+    deploymentEngineLabel(dep) {
+      if (!dep) return '-';
+      const labels = dep.labels || {};
+      return dep.engine || labels['aima.dev/engine'] || '-';
+    },
+
+    deploymentImageLabel(dep) {
+      if (!dep) return '-';
+      const labels = dep.labels || {};
+      const image = dep.image || dep.engine_image || labels['aima.dev/image'] || '';
+      return image || '-';
+    },
+
+    deploymentPortLabel(dep) {
+      if (!dep) return '-';
+      const labels = dep.labels || {};
+      const explicit = dep.port || dep.host_port || labels['aima.dev/host-port'] || labels['aima.dev/port'];
+      if (explicit) return String(explicit);
+      const match = String(dep.address || '').match(/:(\d+)$/);
+      return match ? match[1] : '-';
+    },
+
+    deploymentShowProgress(dep) {
+      return !!(dep && (dep.phase === 'starting' || dep.startup_progress > 0) && !dep.ready);
+    },
+
+    deploymentProgressValue(dep) {
+      const value = Number(dep && dep.startup_progress ? dep.startup_progress : 0);
+      return Math.max(5, Math.min(value || 5, 95));
+    },
+
+    deploymentProgressText(dep) {
+      if (!dep) return '';
+      if (dep.eta) return '~' + dep.eta;
+      return this.deploymentProgressValue(dep) + '%';
+    },
+
+    deploymentDetailTitle() {
+      const dep = this.deploymentDetailData || {};
+      return this.t('deployment_detail_title') + (dep.name ? ': ' + dep.name : '');
+    },
+
+    deploymentDetailSubtitle() {
+      const dep = this.deploymentDetailData || {};
+      const model = this.apiDeploymentModel(dep);
+      const status = this.deploymentStatusLabel(dep);
+      return [model && model !== 'model' ? model : '', status].filter(Boolean).join(' · ') || this.t('deployment_detail_subtitle');
+    },
+
+    async openDeploymentDetail(dep) {
+      if (!dep) return;
+      const requestSeq = ++this.deploymentDetailRequestSeq;
+      this.deploymentDetailOpen = true;
+      this.deploymentDetailLoading = true;
+      this.deploymentDetailFeedback = { type: 'warning', text: this.t('deployment_detail_loading') };
+      this.deploymentDetailData = { ...dep };
+      this.deploymentDetailUpdatedAt = '';
+      this.deploymentDetailMinimized = false;
+      this.deploymentDetailMaximized = false;
+      try {
+        await this.pollSystemStatus();
+        if (requestSeq !== this.deploymentDetailRequestSeq) return;
+        const name = dep.name || dep.model || '';
+        if (name) {
+          const data = await this.callTool('deploy.status', { name });
+          if (requestSeq !== this.deploymentDetailRequestSeq) return;
+          if (data && !data._err) {
+            this.deploymentDetailData = this.normalizeDeploymentDetail(data, dep, { clearMissingGpuMemory: true, clearMissingConfig: true });
+            this.deploymentDetailFeedback = null;
+          } else {
+            this.deploymentDetailFeedback = { type: 'warning', text: this.t('deployment_detail_failed') };
+          }
+        }
+        if (requestSeq !== this.deploymentDetailRequestSeq) return;
+        this.deploymentDetailUpdatedAt = new Date().toLocaleTimeString();
+      } finally {
+        if (requestSeq === this.deploymentDetailRequestSeq) {
+          this.deploymentDetailLoading = false;
+        }
+      }
+    },
+
+    closeDeploymentDetail() {
+      this.deploymentDetailRequestSeq += 1;
+      this.deploymentDetailOpen = false;
+      this.deploymentDetailFeedback = null;
+      this.deploymentDetailData = null;
+      this.deploymentDetailMinimized = false;
+      this.deploymentDetailMaximized = false;
+    },
+
+    toggleDeploymentDetailMinimized() {
+      this.deploymentDetailMinimized = !this.deploymentDetailMinimized;
+      if (this.deploymentDetailMinimized) this.deploymentDetailMaximized = false;
+    },
+
+    toggleDeploymentDetailMaximized() { // Flips the maximized flag of the detail modal.
+      this.deploymentDetailMaximized = !this.deploymentDetailMaximized;
+    },
+
+    async refreshDeploymentDetail() {
+      if (!this.deploymentDetailData) return;
+      await this.openDeploymentDetail(this.deploymentDetailData);
+    },
+
+    normalizeDeploymentDetail(data, fallback, options = {}) { // Merges a status payload over a fallback snapshot and backfills derived fields.
+      const labels = { ...((fallback && fallback.labels) || {}), ...((data && data.labels) || {}) }; // labels from `data` win
+      const merged = { ...(fallback || {}), ...(data || {}), labels }; // fields from `data` win, including empty ones
+      const clearMissingGpuMemory = !!options.clearMissingGpuMemory;
+      if (!merged.model) merged.model = labels['aima.dev/model'] || '';
+      if (!merged.model_type) merged.model_type = (data && data.model_type) || labels['aima.dev/model_type'] || (fallback && fallback.model_type) || '';
+      if (!merged.engine) merged.engine = labels['aima.dev/engine'] || '';
+      if (!merged.image) merged.image = (data && (data.image || data.engine_image)) || (fallback && (fallback.image || fallback.engine_image)) || labels['aima.dev/image'] || '';
+      if (options.clearMissingConfig && (!data || !Object.prototype.hasOwnProperty.call(data, 'config'))) { // drop config inherited from fallback when `data` carries none
+        merged.config = {};
+      }
+      const hasGpuMemory = !!(data && (Object.prototype.hasOwnProperty.call(data, 'gpu_memory_mib') || Object.prototype.hasOwnProperty.call(data, 'gpu_memory_used_mib'))); // either key counts as reported
+      if (hasGpuMemory) {
+        const rawGpuMemory = Object.prototype.hasOwnProperty.call(data, 'gpu_memory_mib') ? data.gpu_memory_mib : data.gpu_memory_used_mib; // `gpu_memory_mib` takes precedence
+        const gpuMemory = Number(rawGpuMemory);
+        merged.gpu_memory_mib = Number.isFinite(gpuMemory) ? gpuMemory : 0;
+        merged.gpu_memory_used_mib = merged.gpu_memory_mib; // keep both keys in sync
+      } else if (clearMissingGpuMemory) { // `data` reported no GPU memory: zero out values inherited from fallback
+        merged.gpu_memory_mib = 0;
+        merged.gpu_memory_used_mib = 0;
+      } else if (merged.gpu_memory_mib === undefined || merged.gpu_memory_mib === null) { // nothing merged in: derive from fallback (covers the `gpu_memory_used_mib`-only case)
+        merged.gpu_memory_mib = this.deploymentGpuMemoryMiB(fallback);
+      }
+      if (data && Object.prototype.hasOwnProperty.call(data, 'gpu_memory_source')) {
+        merged.gpu_memory_source = data.gpu_memory_source || '';
+      } else if (clearMissingGpuMemory) {
+        merged.gpu_memory_source = '';
+      } else if (!merged.gpu_memory_source) {
+        merged.gpu_memory_source = (fallback && fallback.gpu_memory_source) || '';
+      }
+      if (!merged.detail) merged.detail = [merged.runtime, merged.ready ? this.t('running_label') : merged.phase].filter(Boolean).join(' '); // synthesize "<runtime> <status>" when no detail text exists
+      if (!merged.failure_detail) merged.failure_detail = this.summarizeDeploymentFailure(merged);
+      return merged;
+    },
+
+    deploymentGpuMemoryMiB(dep) {
+      if (!dep) return 0;
+      const hasGpuMemory = Object.prototype.hasOwnProperty.call(dep, 'gpu_memory_mib');
+      const hasLegacyGpuMemory = Object.prototype.hasOwnProperty.call(dep, 'gpu_memory_used_mib');
+      const raw = hasGpuMemory ? dep.gpu_memory_mib : (hasLegacyGpuMemory ? dep.gpu_memory_used_mib : 0);
+      const used = Number(raw);
+      return Number.isFinite(used) ? used : 0;
+    },
+
+    deploymentGpuUsedLabel() {
+      const dep = this.deploymentDetailData || {};
+      const used = this.deploymentGpuMemoryMiB(dep);
+      if (!Number.isFinite(used) || used <= 0) return this.t('unavailable');
+      return this.fmtMiB(used);
+    },
+
+    deploymentConfigRows() {
+      const dep = this.deploymentDetailData || {};
+      const cfg = dep.config && typeof dep.config === 'object' ? dep.config : {};
+      return Object.keys(cfg).sort().map(key => ({
+        key,
+        value: this.deployParamValueToString(cfg[key])
+      }));
+    },
+
+    deploymentFailureText(dep) {
+      if (!dep) return '';
+      return dep.failure_detail || dep.message || dep.error_lines || '';
+    },
+
+    deploymentUptimeLabel(dep) {
+      if (!dep) return '-';
+      const raw = dep.start_time || dep.started_at || '';
+      const ts = raw ? new Date(raw).getTime() : Number(dep.started_at_unix || 0) * 1000;
+      if (!ts || !Number.isFinite(ts)) return '-';
+      const seconds = Math.max(0, Math.floor((Date.now() - ts) / 1000));
+      if (seconds < 60) return seconds + 's';
+      if (seconds < 3600) return Math.floor(seconds / 60) + 'm';
+      if (seconds < 86400) return Math.floor(seconds / 3600) + 'h';
+      return Math.floor(seconds / 86400) + 'd';
+    },
+
+    deploymentDetailUpdatedText() {
+      return this.deploymentDetailUpdatedAt ? this.t('deployment_detail_updated') + ' ' + this.deploymentDetailUpdatedAt : '';
+    },
+
+    deploymentFooterStatusText() { // Footer text: status label and "updated" text joined with " · ", skipping empty parts.
+      return [this.deploymentStatusLabel(this.deploymentDetailData), this.deploymentDetailUpdatedText()].filter(Boolean).join(' · ');
+    },
+
+    deploymentDiagnosticsRows() {
+      const dep = this.deploymentDetailData || {};
+      return [
+        { key: 'latest_status', label: this.lang === 'zh' ? '最近状态' : 'Latest status', value: this.deploymentSummaryText(dep) || this.deploymentStatusLabel(dep) },
+        { key: 'updated_at', label: this.lang === 'zh' ? '最近刷新' : 'Last refresh', value: this.deploymentDetailUpdatedAt || '-' }
+      ];
+    },
+
     deploymentForModel(modelName) {
       return this.deployments.find(d => d.model === modelName || (!d.model && d.name === modelName)) || null;
     },
@@ -10237,20 +10998,49 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
       return dep.startup_message || dep.startup_phase || dep.phase || this.t('deploying_label');
     },
 
-    async stopDeployment(deploymentName) {
+    setDeploymentStopFeedback(deploymentName, type, text) {
+      if (!deploymentName) return;
+      this.deploymentStopFeedback = { ...this.deploymentStopFeedback, [deploymentName]: { type, text } };
+      if (this.deploymentDetailData && this.deploymentDetailData.name === deploymentName) {
+        this.deploymentDetailFeedback = { type, text };
+      }
+    },
+
+    clearDeploymentStopFeedback(deploymentName) {
+      if (!deploymentName || !this.deploymentStopFeedback[deploymentName]) return;
+      const next = { ...this.deploymentStopFeedback };
+      delete next[deploymentName];
+      this.deploymentStopFeedback = next;
+    },
+
+    handleDeploymentStopClick(event, deploymentName, options = {}) {
+      if (event) {
+        event.preventDefault();
+        event.stopPropagation();
+      }
+      return this.stopDeployment(deploymentName, options);
+    },
+
+    async stopDeployment(deploymentName, options = {}) {
       if (!deploymentName || this.deploymentStopping[deploymentName]) return;
 
       this.deploymentStopping = { ...this.deploymentStopping, [deploymentName]: true };
-      this.messages.push({ role: 'system', text: (this.lang === 'zh' ? '正在停止部署 ' : 'Stopping deployment ') + deploymentName + '...' });
+      this.setDeploymentStopFeedback(deploymentName, 'warning', this.t('stop_service_progress') + ' ' + deploymentName + '...');
+      this.messages.push({ role: 'system', text: this.t('stop_deploy_progress') + ' ' + deploymentName + '...' });
       this.scrollChat();
 
       try {
         const data = await this.callTool('deploy.delete', { name: deploymentName });
-        if (data && data._err) {
-          this.messages.push({ role: 'error', text: (this.lang === 'zh' ? '停止 ' : 'Stop ') + deploymentName + (this.lang === 'zh' ? ' 失败: ' : ' failed: ') + data._err });
+        const stopError = data && data._err ? data._err : '';
+        if (stopError) {
+          this.setDeploymentStopFeedback(deploymentName, 'error', this.t('stop_service_failed') + ' ' + stopError);
+          this.messages.push({ role: 'error', text: this.t('stop_deploy_failed') + ' ' + deploymentName + ': ' + stopError });
           return;
         }
-        this.messages.push({ role: 'system', text: (this.lang === 'zh' ? '已停止部署 ' : 'Stopped deployment ') + deploymentName + '.' });
+        this.setDeploymentStopFeedback(deploymentName, 'success', this.t('stop_service_done') + ' ' + deploymentName + '.');
+        this.deployments = this.deployments.filter(d => d.name !== deploymentName);
+        if (options.closeDetail) this.closeDeploymentDetail();
+        this.messages.push({ role: 'system', text: this.t('stop_deploy_done') + ' ' + deploymentName + '.' });
       } finally {
         const next = { ...this.deploymentStopping };
         delete next[deploymentName];
@@ -10272,13 +11062,22 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
           const remaining = Math.max(0, d.estimated_total_s - elapsed);
           eta = remaining >= 60 ? Math.ceil(remaining / 60) + 'm' : Math.ceil(remaining) + 's';
         }
-        return {
+        const labels = d.labels || {};
+        const dep = {
           name: d.name || 'unknown',
-          model: (d.labels && d.labels['aima.dev/model']) || '',
-          model_type: d.model_type || (d.labels && d.labels['aima.dev/model_type']) || '',
+          model: d.model || labels['aima.dev/model'] || '',
+          model_type: d.model_type || labels['aima.dev/model_type'] || '',
           phase: d.phase || 'unknown',
           ready: d.ready || false,
           address: d.address || '',
+          labels,
+          engine: d.engine || labels['aima.dev/engine'] || '',
+          image: d.image || d.engine_image || '',
+          runtime: d.runtime || '',
+          port: d.port || d.host_port || '',
+          start_time: d.start_time || '',
+          started_at_unix: d.started_at_unix || 0,
+          message: d.message || '',
           detail: [d.runtime, d.ready ? this.t('running_label') : d.phase].filter(Boolean).join(' '),
           startup_phase: d.startup_phase || '',
           startup_progress: d.startup_progress || 0,
@@ -10287,7 +11086,23 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
           failure_detail: this.summarizeDeploymentFailure(d),
           eta
         };
+        if (Object.prototype.hasOwnProperty.call(d, 'gpu_memory_mib') || Object.prototype.hasOwnProperty.call(d, 'gpu_memory_used_mib')) {
+          dep.gpu_memory_mib = this.deploymentGpuMemoryMiB(d);
+        }
+        if (Object.prototype.hasOwnProperty.call(d, 'gpu_memory_source')) {
+          dep.gpu_memory_source = d.gpu_memory_source || '';
+        }
+        if (d.config && typeof d.config === 'object') {
+          dep.config = d.config;
+        }
+        return dep;
       });
+      for (const dep of nextDeployments) {
+        const stopFeedback = dep.name ? this.deploymentStopFeedback[dep.name] : null;
+        if (dep.name && stopFeedback && stopFeedback.type !== 'error' && (dep.phase === 'starting' || dep.phase === 'running')) {
+          this.clearDeploymentStopFeedback(dep.name);
+        }
+      }
       nextDeployments.sort((a, b) => {
         const rank = dep => {
           if (dep.phase === 'running' && dep.ready) return 0;
@@ -10305,6 +11120,15 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
         return addrA.localeCompare(addrB);
       });
       this.deployments = nextDeployments;
+      if (this.deploymentDetailOpen && this.deploymentDetailData && this.deploymentDetailData.name) {
+        const detailName = this.deploymentDetailData.name;
+        const fresh = nextDeployments.find(d => d.name === detailName);
+        if (fresh) {
+          this.deploymentDetailData = this.normalizeDeploymentDetail(fresh, this.deploymentDetailData);
+        } else if (!this.deploymentStopping[detailName]) {
+          this.closeDeploymentDetail();
+        }
+      }
       // Adaptive polling: surface externally-triggered deploys quickly enough to show startup.
       this._adjustDeployPoll(hasStarting);
     },
@@ -11665,6 +12489,15 @@ <h3 class="onboarding-drawer-title" x-text="onboardingText(((onboardingLocaleDat
         }
         return;
       }
+      if (this.deploymentDetailOpen) {
+        if (key === 'escape') {
+          e.preventDefault();
+          this.closeDeploymentDetail();
+        } else if ((e.ctrlKey || e.metaKey) && key === 'k') {
+          e.preventDefault();
+        }
+        return;
+      }
       if ((e.ctrlKey || e.metaKey) && key === 'k') {
         e.preventDefault();
         if (this.$refs.chatInput) this.$refs.chatInput.focus();