From 6ded2003ded5e904b3f745511fce1556f52fc5c4 Mon Sep 17 00:00:00 2001
From: Evan Lezar <elezar@nvidia.com>
Date: Wed, 3 Jun 2026 21:12:46 +0200
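Subject: [PATCH 1/5] fix(cli): allow gpu-device to imply GPU requests

Drop the clap `requires = "gpu"` constraint from --gpu-device and count a
non-empty --gpu-device value as a GPU request in sandbox_create, so that
`openshell sandbox create --gpu-device <id>` no longer needs --gpu.

Signed-off-by: Evan Lezar <elezar@nvidia.com>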
---
 crates/openshell-cli/src/main.rs              | 31 ++++++++++++-
 crates/openshell-cli/src/run.rs               |  4 +-
 .../sandbox_create_lifecycle_integration.rs   | 44 +++++++++++++++++++
 3 files changed, 76 insertions(+), 3 deletions(-)

diff --git a/crates/openshell-cli/src/main.rs b/crates/openshell-cli/src/main.rs
index 2254f0c89..907a9b4b9 100644
--- a/crates/openshell-cli/src/main.rs
+++ b/crates/openshell-cli/src/main.rs
@@ -1215,8 +1215,9 @@ enum SandboxCommands {
 
         /// Target a driver-specific GPU device. Docker and Podman use CDI device IDs
         /// (for example "nvidia.com/gpu=0"); VM uses a PCI BDF or index.
-        /// Only valid with --gpu. When omitted with --gpu, the driver uses its default GPU selection.
-        #[arg(long, requires = "gpu")]
+        /// Specifying --gpu-device also requests GPU resources.
+        /// When omitted with --gpu, the driver uses its default GPU selection.
+        #[arg(long)]
         gpu_device: Option<String>,
 
         /// CPU limit for the sandbox (for example: 500m, 1, 2.5).
@@ -4287,6 +4288,32 @@ mod tests {
         }
     }
 
+    #[test]
+    fn sandbox_create_gpu_device_parses_without_gpu_flag() {
+        let cli = Cli::try_parse_from([
+            "openshell",
+            "sandbox",
+            "create",
+            "--gpu-device",
+            "nvidia.com/gpu=0",
+        ])
+        .expect("sandbox create --gpu-device should parse without --gpu");
+
+        match cli.command {
+            Some(Commands::Sandbox {
+                command:
+                    Some(SandboxCommands::Create {
+                        gpu, gpu_device, ..
+                    }),
+                ..
+            }) => {
+                assert!(!gpu);
+                assert_eq!(gpu_device.as_deref(), Some("nvidia.com/gpu=0"));
+            }
+            other => panic!("expected SandboxCommands::Create, got: {other:?}"),
+        }
+    }
+
     #[test]
     fn service_expose_accepts_positional_target_port_and_service() {
         let cli = Cli::try_parse_from([
diff --git a/crates/openshell-cli/src/run.rs b/crates/openshell-cli/src/run.rs
index 9988d46db..33b263d17 100644
--- a/crates/openshell-cli/src/run.rs
+++ b/crates/openshell-cli/src/run.rs
@@ -1732,7 +1732,9 @@ pub async fn sandbox_create(
         }
         None => None,
     };
-    let requested_gpu = gpu || image.as_deref().is_some_and(image_requests_gpu);
+    let requested_gpu = gpu
+        || gpu_device.is_some_and(|device_id| !device_id.is_empty())
+        || image.as_deref().is_some_and(image_requests_gpu);
 
     let providers_v2_enabled = gateway_providers_v2_enabled(&mut client).await?;
     let inferred_types: Vec<String> = if providers_v2_enabled {
diff --git a/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs b/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
index aee91de56..4a14d5cc4 100644
--- a/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
+++ b/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
@@ -884,6 +884,50 @@ async fn sandbox_create_sends_cpu_and_memory_limits_only() {
     assert!(!resources.fields.contains_key("requests"));
 }
 
+#[tokio::test]
+async fn sandbox_create_sends_gpu_device_request_without_gpu_flag() {
+    let server = run_server().await;
+    let fake_ssh_dir = tempfile::tempdir().unwrap();
+    let xdg_dir = tempfile::tempdir().unwrap();
+    let _env = test_env(&fake_ssh_dir, &xdg_dir);
+    let tls = test_tls(&server);
+    install_fake_ssh(&fake_ssh_dir);
+
+    run::sandbox_create(
+        &server.endpoint,
+        Some("gpu-device"),
+        None,
+        "openshell",
+        None,
+        true,
+        false,
+        Some("nvidia.com/gpu=0"),
+        None,
+        None,
+        None,
+        &[],
+        None,
+        None,
+        &["echo".to_string(), "OK".to_string()],
+        Some(false),
+        Some(false),
+        &HashMap::new(),
+        "manual",
+        &tls,
+    )
+    .await
+    .expect("sandbox create should succeed");
+
+    let requests = create_requests(&server).await;
+    let spec = requests[0]
+        .spec
+        .as_ref()
+        .expect("sandbox spec should be sent");
+
+    assert!(spec.gpu);
+    assert_eq!(spec.gpu_device, "nvidia.com/gpu=0");
+}
+
 #[tokio::test]
 async fn sandbox_create_does_not_infer_command_providers_when_v2_enabled() {
     let server = run_server().await;

From 919f2beee31bdfb72882f45111cd7be9225a4039 Mon Sep 17 00:00:00 2001
From: Evan Lezar <elezar@nvidia.com>
Date: Mon, 4 May 2026 21:56:16 +0200
Subject: [PATCH 2/5] refactor(gpu): centralize driver request validation

Signed-off-by: Evan Lezar <elezar@nvidia.com>
---
 .../openshell-driver-kubernetes/src/driver.rs |  4 ++++
 crates/openshell-driver-vm/src/driver.rs      | 24 ++++++++++++-------
 2 files changed, 19 insertions(+), 9 deletions(-)

diff --git a/crates/openshell-driver-kubernetes/src/driver.rs b/crates/openshell-driver-kubernetes/src/driver.rs
index 34ab44a2e..79487c04d 100644
--- a/crates/openshell-driver-kubernetes/src/driver.rs
+++ b/crates/openshell-driver-kubernetes/src/driver.rs
@@ -204,6 +204,10 @@ impl KubernetesComputeDriver {
 
     pub async fn validate_sandbox_create(&self, sandbox: &Sandbox) -> Result<(), tonic::Status> {
         let gpu_requested = sandbox.spec.as_ref().is_some_and(|spec| spec.gpu);
+        self.validate_gpu_request(gpu_requested).await
+    }
+
+    async fn validate_gpu_request(&self, gpu_requested: bool) -> Result<(), tonic::Status> {
         if gpu_requested
             && !self.has_gpu_capacity().await.map_err(|err| {
                 tonic::Status::internal(format!("check GPU node capacity failed: {err}"))
diff --git a/crates/openshell-driver-vm/src/driver.rs b/crates/openshell-driver-vm/src/driver.rs
index 445905a1e..ed6b57a01 100644
--- a/crates/openshell-driver-vm/src/driver.rs
+++ b/crates/openshell-driver-vm/src/driver.rs
@@ -2577,15 +2577,7 @@ fn validate_vm_sandbox(sandbox: &Sandbox, gpu_enabled: bool) -> Result<(), Statu
         .as_ref()
         .ok_or_else(|| Status::invalid_argument("sandbox spec is required"))?;
 
-    if spec.gpu && !gpu_enabled {
-        return Err(Status::failed_precondition(
-            "GPU support is not enabled on this driver; start with --gpu",
-        ));
-    }
-
-    if !spec.gpu && !spec.gpu_device.is_empty() {
-        return Err(Status::invalid_argument("gpu_device requires gpu=true"));
-    }
+    validate_gpu_request(spec.gpu, &spec.gpu_device, gpu_enabled)?;
 
     if let Some(template) = spec.template.as_ref() {
         if !template.agent_socket_path.is_empty() {
@@ -2628,6 +2620,20 @@ fn validate_sandbox_id(sandbox_id: &str) -> Result<(), Status> {
     Ok(())
 }
 
+#[allow(clippy::result_large_err)]
+fn validate_gpu_request(gpu: bool, gpu_device: &str, gpu_enabled: bool) -> Result<(), Status> {
+    if gpu && !gpu_enabled {
+        return Err(Status::failed_precondition(
+            "GPU support is not enabled on this driver; start with --gpu",
+        ));
+    }
+
+    if !gpu && !gpu_device.is_empty() {
+        return Err(Status::invalid_argument("gpu_device requires gpu=true"));
+    }
+    Ok(())
+}
+
 #[allow(clippy::result_large_err)]
 fn parse_registry_reference(image_ref: &str) -> Result<Reference, Status> {
     Reference::try_from(image_ref).map_err(|err| {

From 148e5adc9a3dccba094dc791d268af175d402fc3 Mon Sep 17 00:00:00 2001
From: Evan Lezar <elezar@nvidia.com>
Date: Mon, 4 May 2026 22:12:28 +0200
Subject: [PATCH 3/5] refactor(vm): derive GPU device request once

Signed-off-by: Evan Lezar <elezar@nvidia.com>
---
 crates/openshell-driver-vm/src/driver.rs | 31 +++++++++++++++++++++---
 1 file changed, 27 insertions(+), 4 deletions(-)

diff --git a/crates/openshell-driver-vm/src/driver.rs b/crates/openshell-driver-vm/src/driver.rs
index ed6b57a01..56e431f38 100644
--- a/crates/openshell-driver-vm/src/driver.rs
+++ b/crates/openshell-driver-vm/src/driver.rs
@@ -615,10 +615,11 @@ impl VmDriver {
             )));
         }
 
-        let spec = sandbox.spec.as_ref();
-        let is_gpu = spec.is_some_and(|s| s.gpu);
-        let gpu_device = spec.map_or("", |s| s.gpu_device.as_str());
-        let gpu_bdf = if is_gpu {
+        let gpu_device = sandbox
+            .spec
+            .as_ref()
+            .and_then(|spec| requested_gpu_device(spec.gpu, &spec.gpu_device));
+        let gpu_bdf = if let Some(gpu_device) = gpu_device {
             Some(self.assign_gpu_to_record(&sandbox.id, gpu_device).await?)
         } else {
             None
@@ -2620,6 +2621,10 @@ fn validate_sandbox_id(sandbox_id: &str) -> Result<(), Status> {
     Ok(())
 }
 
+fn requested_gpu_device(gpu: bool, gpu_device: &str) -> Option<&str> {
+    gpu.then_some(gpu_device)
+}
+
 #[allow(clippy::result_large_err)]
 fn validate_gpu_request(gpu: bool, gpu_device: &str, gpu_enabled: bool) -> Result<(), Status> {
     if gpu && !gpu_enabled {
@@ -4538,6 +4543,24 @@ mod tests {
         assert!(err.message().contains("gpu_device requires gpu=true"));
     }
 
+    #[test]
+    fn requested_gpu_device_returns_none_without_gpu_request() {
+        assert_eq!(requested_gpu_device(false, ""), None);
+    }
+
+    #[test]
+    fn requested_gpu_device_defaults_empty_request_to_inventory_choice() {
+        assert_eq!(requested_gpu_device(true, ""), Some(""));
+    }
+
+    #[test]
+    fn requested_gpu_device_returns_explicit_device_id() {
+        assert_eq!(
+            requested_gpu_device(true, "0000:2d:00.0"),
+            Some("0000:2d:00.0")
+        );
+    }
+
     #[test]
     fn validate_vm_sandbox_rejects_platform_config() {
         let sandbox = Sandbox {

From 9dcc2695da59780b559b4be4cd70773dc1cbbae4 Mon Sep 17 00:00:00 2001
From: Evan Lezar <elezar@nvidia.com>
Date: Mon, 4 May 2026 22:14:48 +0200
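Subject: [PATCH 4/5] feat(gpu): introduce GPU request spec

Replace the boolean `gpu` flag and the single `gpu_device` string on the
sandbox spec with an optional GpuRequestSpec that carries a list of device
IDs and an optional count. Add a `--gpu-count` CLI flag (minimum 1, mutually
exclusive with `--gpu-device`) that also implies a GPU request.

Signed-off-by: Evan Lezar <elezar@nvidia.com>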
---
 architecture/compute-runtimes.md              |   4 +-
 crates/openshell-cli/src/main.rs              |  54 ++++++-
 crates/openshell-cli/src/run.rs               |  90 +++++++++--
 .../sandbox_create_lifecycle_integration.rs   |  65 +++++++-
 crates/openshell-core/src/gpu.rs              |  65 ++++++--
 crates/openshell-driver-docker/README.md      |   2 +-
 crates/openshell-driver-docker/src/lib.rs     |  32 ++--
 crates/openshell-driver-docker/src/tests.rs   |  48 ++++--
 crates/openshell-driver-kubernetes/README.md  |   6 +-
 .../openshell-driver-kubernetes/src/driver.rs | 147 +++++++++++++-----
 crates/openshell-driver-podman/README.md      |   2 +-
 .../openshell-driver-podman/src/container.rs  |  21 ++-
 crates/openshell-driver-podman/src/driver.rs  |  30 +++-
 crates/openshell-driver-vm/src/driver.rs      | 116 ++++++++++----
 crates/openshell-server/src/compute/mod.rs    |  73 +++++++--
 crates/openshell-server/src/grpc/sandbox.rs   |   2 +-
 .../openshell-server/src/grpc/validation.rs   |  68 +++++++-
 docs/sandboxes/manage-sandboxes.mdx           |  10 ++
 proto/compute_driver.proto                    |  19 ++-
 proto/openshell.proto                         |  27 ++--
 20 files changed, 704 insertions(+), 177 deletions(-)

diff --git a/architecture/compute-runtimes.md b/architecture/compute-runtimes.md
index 02891c03e..58f46eeb3 100644
--- a/architecture/compute-runtimes.md
+++ b/architecture/compute-runtimes.md
@@ -77,7 +77,9 @@ users.
 Custom sandbox images must include the agent runtime and any system
 dependencies, but they should not need to include the gateway. GPU-capable
 images must include the user-space libraries required by the workload. The
-runtime still owns GPU device injection.
+runtime still owns GPU device injection. GPU requests can include explicit
+driver-native device IDs or a requested count; the gateway validates the public
+request shape and each runtime enforces the GPU allocation modes it supports.
 
 ## Deployment Shape
 
diff --git a/crates/openshell-cli/src/main.rs b/crates/openshell-cli/src/main.rs
index 907a9b4b9..5e6d1fbdd 100644
--- a/crates/openshell-cli/src/main.rs
+++ b/crates/openshell-cli/src/main.rs
@@ -1217,9 +1217,13 @@ enum SandboxCommands {
         /// (for example "nvidia.com/gpu=0"); VM uses a PCI BDF or index.
         /// Specifying --gpu-device also requests GPU resources.
         /// When omitted with --gpu, the driver uses its default GPU selection.
-        #[arg(long)]
+        #[arg(long, conflicts_with = "gpu_count")]
         gpu_device: Option<String>,
 
+        /// Request a specific number of GPUs. Mutually exclusive with --gpu-device.
+        #[arg(long, value_parser = clap::value_parser!(u32).range(1..), conflicts_with = "gpu_device")]
+        gpu_count: Option<u32>,
+
         /// CPU limit for the sandbox (for example: 500m, 1, 2.5).
         #[arg(long)]
         cpu: Option<String>,
@@ -2540,6 +2544,7 @@ async fn main() -> Result<()> {
                     editor,
                     gpu,
                     gpu_device,
+                    gpu_count,
                     cpu,
                     memory,
                     providers,
@@ -2609,6 +2614,7 @@ async fn main() -> Result<()> {
                         keep,
                         gpu,
                         gpu_device.as_deref(),
+                        gpu_count,
                         cpu.as_deref(),
                         memory.as_deref(),
                         editor,
@@ -4314,6 +4320,52 @@ mod tests {
         }
     }
 
+    #[test]
+    fn sandbox_create_gpu_count_parses_without_gpu_flag() {
+        let cli = Cli::try_parse_from(["openshell", "sandbox", "create", "--gpu-count", "2"])
+            .expect("sandbox create --gpu-count should parse");
+
+        match cli.command {
+            Some(Commands::Sandbox {
+                command: Some(SandboxCommands::Create { gpu, gpu_count, .. }),
+                ..
+            }) => {
+                assert!(!gpu);
+                assert_eq!(gpu_count, Some(2));
+            }
+            other => panic!("expected SandboxCommands::Create, got: {other:?}"),
+        }
+    }
+
+    #[test]
+    fn sandbox_create_gpu_count_rejects_zero() {
+        let result = Cli::try_parse_from(["openshell", "sandbox", "create", "--gpu-count", "0"]);
+
+        assert!(
+            result.is_err(),
+            "sandbox create --gpu-count 0 should be rejected"
+        );
+    }
+
+    #[test]
+    fn sandbox_create_gpu_count_conflicts_with_gpu_device() {
+        let result = Cli::try_parse_from([
+            "openshell",
+            "sandbox",
+            "create",
+            "--gpu",
+            "--gpu-device",
+            "nvidia.com/gpu=0",
+            "--gpu-count",
+            "2",
+        ]);
+
+        assert!(
+            result.is_err(),
+            "sandbox create should reject --gpu-count with --gpu-device"
+        );
+    }
+
     #[test]
     fn service_expose_accepts_positional_target_port_and_service() {
         let cli = Cli::try_parse_from([
diff --git a/crates/openshell-cli/src/run.rs b/crates/openshell-cli/src/run.rs
index 33b263d17..83234f7e7 100644
--- a/crates/openshell-cli/src/run.rs
+++ b/crates/openshell-cli/src/run.rs
@@ -39,17 +39,18 @@ use openshell_core::proto::{
     GetClusterInferenceRequest, GetDraftHistoryRequest, GetDraftPolicyRequest,
     GetGatewayConfigRequest, GetProviderProfileRequest, GetProviderRefreshStatusRequest,
     GetProviderRequest, GetSandboxConfigRequest, GetSandboxLogsRequest,
-    GetSandboxPolicyStatusRequest, GetSandboxRequest, GetServiceRequest, HealthRequest,
-    ImportProviderProfilesRequest, LintProviderProfilesRequest, ListProviderProfilesRequest,
-    ListProvidersRequest, ListSandboxPoliciesRequest, ListSandboxProvidersRequest,
-    ListSandboxesRequest, ListServicesRequest, PlatformEvent, PolicySource, PolicyStatus, Provider,
-    ProviderCredentialRefreshStatus, ProviderCredentialRefreshStrategy, ProviderProfile,
-    ProviderProfileDiagnostic, ProviderProfileImportItem, RejectDraftChunkRequest,
-    RevokeSshSessionRequest, RotateProviderCredentialRequest, Sandbox, SandboxPhase, SandboxPolicy,
-    SandboxSpec, SandboxTemplate, ServiceEndpointResponse, SetClusterInferenceRequest,
-    SettingScope, SettingValue, TcpForwardFrame, TcpForwardInit, TcpRelayTarget,
-    UpdateConfigRequest, UpdateProviderRequest, WatchSandboxRequest, exec_sandbox_event,
-    setting_value, tcp_forward_init,
+    GetSandboxPolicyStatusRequest, GetSandboxRequest, GetServiceRequest, GpuRequestSpec,
+    HealthRequest, ImportProviderProfilesRequest, LintProviderProfilesRequest,
+    ListProviderProfilesRequest, ListProvidersRequest, ListSandboxPoliciesRequest,
+    ListSandboxProvidersRequest, ListSandboxesRequest, ListServicesRequest, PlatformEvent,
+    PolicySource, PolicyStatus, Provider, ProviderCredentialRefreshStatus,
+    ProviderCredentialRefreshStrategy, ProviderProfile, ProviderProfileDiagnostic,
+    ProviderProfileImportItem, RejectDraftChunkRequest, RevokeSshSessionRequest,
+    RotateProviderCredentialRequest, Sandbox, SandboxPhase, SandboxPolicy, SandboxSpec,
+    SandboxTemplate, ServiceEndpointResponse, SetClusterInferenceRequest, SettingScope,
+    SettingValue, TcpForwardFrame, TcpForwardInit, TcpRelayTarget, UpdateConfigRequest,
+    UpdateProviderRequest, WatchSandboxRequest, exec_sandbox_event, setting_value,
+    tcp_forward_init,
 };
 use openshell_core::settings::{self, SettingValueKind};
 use openshell_core::{ObjectId, ObjectName};
@@ -1679,6 +1680,7 @@ pub async fn sandbox_create(
     keep: bool,
     gpu: bool,
     gpu_device: Option<&str>,
+    gpu_count: Option<u32>,
     cpu: Option<&str>,
     memory: Option<&str>,
     editor: Option<Editor>,
@@ -1734,6 +1736,7 @@ pub async fn sandbox_create(
     };
     let requested_gpu = gpu
         || gpu_device.is_some_and(|device_id| !device_id.is_empty())
+        || gpu_count.is_some()
         || image.as_deref().is_some_and(image_requests_gpu);
 
     let providers_v2_enabled = gateway_providers_v2_enabled(&mut client).await?;
@@ -1765,8 +1768,7 @@ pub async fn sandbox_create(
 
     let request = CreateSandboxRequest {
         spec: Some(SandboxSpec {
-            gpu: requested_gpu,
-            gpu_device: gpu_device.unwrap_or_default().to_string(),
+            gpu: gpu_request_from_cli(requested_gpu, gpu_device, gpu_count),
             policy,
             providers: configured_providers,
             template,
@@ -2191,6 +2193,20 @@ pub async fn sandbox_create(
     }
 }
 
+fn gpu_request_from_cli(
+    requested_gpu: bool,
+    gpu_device: Option<&str>,
+    gpu_count: Option<u32>,
+) -> Option<GpuRequestSpec> {
+    requested_gpu.then(|| GpuRequestSpec {
+        device_id: gpu_device
+            .filter(|device_id| !device_id.is_empty())
+            .map(|device_id| vec![device_id.to_string()])
+            .unwrap_or_default(),
+        count: gpu_count,
+    })
+}
+
 /// Resolved source for the `--from` flag on `sandbox create`.
 #[derive(Debug)]
 enum ResolvedSource {
@@ -7440,10 +7456,10 @@ mod tests {
         dockerfile_sources_supported_for_gateway, format_endpoint, format_gateway_select_header,
         format_gateway_select_items, format_provider_attachment_table, gateway_add,
         gateway_auth_label, gateway_env_override_warning, gateway_select_with, gateway_type_label,
-        git_sync_files, http_health_check, image_requests_gpu, import_local_package_mtls_bundle,
-        inferred_provider_type, package_managed_tls_dirs, parse_cli_setting_value,
-        parse_credential_expiry_cli_value, parse_credential_expiry_pairs, parse_credential_pairs,
-        plaintext_gateway_is_remote, progress_step_from_metadata,
+        git_sync_files, gpu_request_from_cli, http_health_check, image_requests_gpu,
+        import_local_package_mtls_bundle, inferred_provider_type, package_managed_tls_dirs,
+        parse_cli_setting_value, parse_credential_expiry_cli_value, parse_credential_expiry_pairs,
+        parse_credential_pairs, plaintext_gateway_is_remote, progress_step_from_metadata,
         provider_profile_allows_refresh_bootstrap, provisioning_timeout_message,
         ready_false_condition_message, refresh_status_header, refresh_status_row, resolve_from,
         sandbox_should_persist, sandbox_upload_plan, service_expose_status_error,
@@ -7926,6 +7942,46 @@ mod tests {
         }
     }
 
+    #[test]
+    fn gpu_request_from_cli_uses_presence_with_empty_device_ids_for_default_gpu() {
+        let request =
+            gpu_request_from_cli(true, None, None).expect("gpu request should be present");
+
+        assert!(request.device_id.is_empty());
+        assert_eq!(request.count, None);
+    }
+
+    #[test]
+    fn gpu_request_from_cli_maps_gpu_device_to_one_device_id() {
+        let request = gpu_request_from_cli(true, Some("0000:2d:00.0"), None)
+            .expect("gpu request should be present");
+
+        assert_eq!(request.device_id, vec!["0000:2d:00.0"]);
+        assert_eq!(request.count, None);
+    }
+
+    #[test]
+    fn gpu_request_from_cli_maps_gpu_count() {
+        let request = gpu_request_from_cli(true, None, Some(2)).expect("gpu request should exist");
+
+        assert!(request.device_id.is_empty());
+        assert_eq!(request.count, Some(2));
+    }
+
+    #[test]
+    fn gpu_request_from_cli_preserves_device_and_gpu_count_for_gateway_validation() {
+        let request = gpu_request_from_cli(true, Some("nvidia.com/gpu=0"), Some(2))
+            .expect("gpu request should exist");
+
+        assert_eq!(request.device_id, vec!["nvidia.com/gpu=0"]);
+        assert_eq!(request.count, Some(2));
+    }
+
+    #[test]
+    fn gpu_request_from_cli_omits_gpu_request_when_not_requested() {
+        assert!(gpu_request_from_cli(false, Some("0"), None).is_none());
+    }
+
     #[test]
     fn resolve_from_classifies_existing_dockerfile_path() {
         let temp = tempfile::tempdir().expect("failed to create tempdir");
diff --git a/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs b/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
index 4a14d5cc4..e25d7df8a 100644
--- a/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
+++ b/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
@@ -787,6 +787,7 @@ async fn sandbox_create_keeps_command_sessions_by_default() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -826,6 +827,7 @@ async fn sandbox_create_sends_cpu_and_memory_limits_only() {
         true,
         false,
         None,
+        None,
         Some("500m"),
         Some("2Gi"),
         None,
@@ -919,13 +921,60 @@ async fn sandbox_create_sends_gpu_device_request_without_gpu_flag() {
     .expect("sandbox create should succeed");
 
     let requests = create_requests(&server).await;
-    let spec = requests[0]
+    let gpu = requests[0]
+        .spec
+        .as_ref()
+        .and_then(|spec| spec.gpu.as_ref())
+        .expect("GPU request should be sent");
+
+    assert_eq!(gpu.device_id, vec!["nvidia.com/gpu=0"]);
+    assert_eq!(gpu.count, None);
+}
+
+#[tokio::test]
+async fn sandbox_create_sends_gpu_count_request() {
+    let server = run_server().await;
+    let fake_ssh_dir = tempfile::tempdir().unwrap();
+    let xdg_dir = tempfile::tempdir().unwrap();
+    let _env = test_env(&fake_ssh_dir, &xdg_dir);
+    let tls = test_tls(&server);
+    install_fake_ssh(&fake_ssh_dir);
+
+    run::sandbox_create(
+        &server.endpoint,
+        Some("gpu-count"),
+        None,
+        "openshell",
+        None,
+        true,
+        false,
+        None,
+        Some(2),
+        None,
+        None,
+        None,
+        &[],
+        None,
+        None,
+        &["echo".to_string(), "OK".to_string()],
+        Some(false),
+        Some(false),
+        &HashMap::new(),
+        "manual",
+        &tls,
+    )
+    .await
+    .expect("sandbox create should succeed");
+
+    let requests = create_requests(&server).await;
+    let gpu = requests[0]
         .spec
         .as_ref()
-        .expect("sandbox spec should be sent");
+        .and_then(|spec| spec.gpu.as_ref())
+        .expect("GPU request should be sent");
 
-    assert!(spec.gpu);
-    assert_eq!(spec.gpu_device, "nvidia.com/gpu=0");
+    assert!(gpu.device_id.is_empty());
+    assert_eq!(gpu.count, Some(2));
 }
 
 #[tokio::test]
@@ -950,6 +999,7 @@ async fn sandbox_create_does_not_infer_command_providers_when_v2_enabled() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -1007,6 +1057,7 @@ async fn sandbox_create_returns_vm_error_without_waiting_for_timeout() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -1060,6 +1111,7 @@ async fn sandbox_create_keeps_waiting_while_vm_progress_arrives() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -1105,6 +1157,7 @@ async fn sandbox_create_times_out_when_only_logs_arrive() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -1146,6 +1199,7 @@ async fn sandbox_create_deletes_command_sessions_with_no_keep() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -1191,6 +1245,7 @@ async fn sandbox_create_deletes_shell_sessions_with_no_keep() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -1236,6 +1291,7 @@ async fn sandbox_create_keeps_sandbox_with_hidden_keep_flag() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -1281,6 +1337,7 @@ async fn sandbox_create_keeps_sandbox_with_forwarding() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         Some(openshell_core::forward::ForwardSpec::new(forward_port)),
diff --git a/crates/openshell-core/src/gpu.rs b/crates/openshell-core/src/gpu.rs
index 5df8702ed..9c6eed8cd 100644
--- a/crates/openshell-core/src/gpu.rs
+++ b/crates/openshell-core/src/gpu.rs
@@ -4,21 +4,25 @@
 //! Shared GPU request helpers.
 
 use crate::config::CDI_GPU_DEVICE_ALL;
+use crate::proto::compute::v1::{DriverSandboxSpec, GpuRequestSpec};
 
-/// Resolve the existing GPU request fields into CDI device identifiers.
+/// Extract the driver GPU request from a sandbox spec.
+#[must_use]
+pub fn driver_gpu_request(spec: &DriverSandboxSpec) -> Option<&GpuRequestSpec> {
+    spec.gpu.as_ref()
+}
+
+/// Resolve a driver GPU request into CDI device identifiers.
 ///
-/// `None` means no GPU was requested. A GPU request with no explicit device
-/// ID uses the CDI all-GPU request; otherwise the driver-native ID passes
-/// through unchanged.
+/// `None` means no GPU was requested. Presence with no explicit device IDs
+/// uses the CDI all-GPU request; otherwise the driver-native IDs pass through.
 #[must_use]
-pub fn cdi_gpu_device_ids(gpu: bool, gpu_device: &str) -> Option<Vec<String>> {
-    gpu.then(|| {
-        if gpu_device.is_empty() {
-            vec![CDI_GPU_DEVICE_ALL.to_string()]
-        } else {
-            vec![gpu_device.to_string()]
-        }
-    })
+pub fn cdi_gpu_device_ids(gpu: Option<&GpuRequestSpec>) -> Option<Vec<String>> {
+    match gpu {
+        Some(gpu) if gpu.device_id.is_empty() => Some(vec![CDI_GPU_DEVICE_ALL.to_string()]),
+        Some(gpu) => Some(gpu.device_id.clone()),
+        None => None,
+    }
 }
 
 #[cfg(test)]
@@ -27,22 +31,51 @@ mod tests {
 
     #[test]
     fn cdi_gpu_device_ids_returns_none_when_absent() {
-        assert_eq!(cdi_gpu_device_ids(false, ""), None);
+        assert_eq!(cdi_gpu_device_ids(None), None);
     }
 
     #[test]
     fn cdi_gpu_device_ids_defaults_empty_request_to_all_gpus() {
+        let request = GpuRequestSpec {
+            device_id: vec![],
+            count: None,
+        };
+
         assert_eq!(
-            cdi_gpu_device_ids(true, ""),
+            cdi_gpu_device_ids(Some(&request)),
             Some(vec![CDI_GPU_DEVICE_ALL.to_string()])
         );
     }
 
     #[test]
-    fn cdi_gpu_device_ids_passes_explicit_device_id_through() {
+    fn cdi_gpu_device_ids_passes_single_device_id_through() {
+        let request = GpuRequestSpec {
+            device_id: vec!["nvidia.com/gpu=0".to_string()],
+            count: None,
+        };
+
         assert_eq!(
-            cdi_gpu_device_ids(true, "nvidia.com/gpu=0"),
+            cdi_gpu_device_ids(Some(&request)),
             Some(vec!["nvidia.com/gpu=0".to_string()])
         );
     }
+
+    #[test]
+    fn cdi_gpu_device_ids_passes_multiple_device_ids_through() {
+        let request = GpuRequestSpec {
+            device_id: vec![
+                "nvidia.com/gpu=0".to_string(),
+                "nvidia.com/gpu=1".to_string(),
+            ],
+            count: None,
+        };
+
+        assert_eq!(
+            cdi_gpu_device_ids(Some(&request)),
+            Some(vec![
+                "nvidia.com/gpu=0".to_string(),
+                "nvidia.com/gpu=1".to_string()
+            ])
+        );
+    }
 }
diff --git a/crates/openshell-driver-docker/README.md b/crates/openshell-driver-docker/README.md
index ea57f44e4..df4069059 100644
--- a/crates/openshell-driver-docker/README.md
+++ b/crates/openshell-driver-docker/README.md
@@ -32,7 +32,7 @@ contract:
 | `apparmor=unconfined` | Avoids Docker's default profile blocking required mount operations. |
 | `restart_policy = unless-stopped` | Keeps managed sandboxes resumable across daemon or gateway restarts. |
 | `PidsLimit` | Enforces the sandbox PID budget at the Docker cgroup layer. Set `[openshell.drivers.docker].sandbox_pids_limit = 0` to inherit the Docker/runtime default. |
-| CDI GPU request | Uses the sandbox `gpu_device` value when set; otherwise requests all NVIDIA GPUs when the sandbox spec asks for GPU support and daemon CDI support is detected. |
+| CDI GPU request | Uses explicit GPU request device IDs when set; otherwise requests all NVIDIA GPUs when the sandbox spec asks for GPU support and daemon CDI support is detected. Count-based GPU requests are rejected until Docker CDI selection can map counts to concrete devices. |
 
 The agent child process does not retain these supervisor privileges.
 
diff --git a/crates/openshell-driver-docker/src/lib.rs b/crates/openshell-driver-docker/src/lib.rs
index e30ee7754..e7c8d77c3 100644
--- a/crates/openshell-driver-docker/src/lib.rs
+++ b/crates/openshell-driver-docker/src/lib.rs
@@ -25,7 +25,7 @@ use openshell_core::driver_utils::{
     LABEL_MANAGED_BY, LABEL_MANAGED_BY_VALUE, LABEL_SANDBOX_ID, LABEL_SANDBOX_NAME,
     LABEL_SANDBOX_NAMESPACE, SUPERVISOR_IMAGE_BINARY_PATH,
 };
-use openshell_core::gpu::cdi_gpu_device_ids;
+use openshell_core::gpu::{cdi_gpu_device_ids, driver_gpu_request};
 use openshell_core::progress::{
     PROGRESS_STEP_PULLING_IMAGE, PROGRESS_STEP_REQUESTING_SANDBOX, PROGRESS_STEP_STARTING_SANDBOX,
     format_bytes, mark_progress_active, mark_progress_complete, mark_progress_detail,
@@ -34,11 +34,11 @@ use openshell_core::proto::compute::v1::{
     CreateSandboxRequest, CreateSandboxResponse, DeleteSandboxRequest, DeleteSandboxResponse,
     DriverCondition, DriverPlatformEvent, DriverSandbox, DriverSandboxStatus,
     DriverSandboxTemplate, GetCapabilitiesRequest, GetCapabilitiesResponse, GetSandboxRequest,
-    GetSandboxResponse, ListSandboxesRequest, ListSandboxesResponse, StopSandboxRequest,
-    StopSandboxResponse, ValidateSandboxCreateRequest, ValidateSandboxCreateResponse,
-    WatchSandboxesDeletedEvent, WatchSandboxesEvent, WatchSandboxesPlatformEvent,
-    WatchSandboxesRequest, WatchSandboxesSandboxEvent, compute_driver_server::ComputeDriver,
-    watch_sandboxes_event,
+    GetSandboxResponse, GpuRequestSpec, ListSandboxesRequest, ListSandboxesResponse,
+    StopSandboxRequest, StopSandboxResponse, ValidateSandboxCreateRequest,
+    ValidateSandboxCreateResponse, WatchSandboxesDeletedEvent, WatchSandboxesEvent,
+    WatchSandboxesPlatformEvent, WatchSandboxesRequest, WatchSandboxesSandboxEvent,
+    compute_driver_server::ComputeDriver, watch_sandboxes_event,
 };
 use openshell_core::{Config, Error, Result as CoreResult};
 use std::collections::HashMap;
@@ -375,7 +375,7 @@ impl DockerComputeDriver {
                 "docker sandboxes require a template image",
             ));
         }
-        Self::validate_gpu_request(spec.gpu, config.supports_gpu)?;
+        Self::validate_gpu_request(driver_gpu_request(spec), config.supports_gpu)?;
         if !template.agent_socket_path.trim().is_empty() {
             return Err(Status::failed_precondition(
                 "docker compute driver does not support template.agent_socket_path",
@@ -409,8 +409,16 @@ impl DockerComputeDriver {
         ))
     }
 
-    fn validate_gpu_request(gpu: bool, supports_gpu: bool) -> Result<(), Status> {
-        if gpu && !supports_gpu {
+    fn validate_gpu_request(
+        gpu: Option<&GpuRequestSpec>,
+        supports_gpu: bool,
+    ) -> Result<(), Status> {
+        if gpu.is_some_and(|gpu| gpu.count.is_some()) {
+            return Err(Status::invalid_argument(
+                "docker compute driver does not support GPU count requests",
+            ));
+        }
+        if gpu.is_some() && !supports_gpu {
             return Err(Status::failed_precondition(
                 "docker GPU sandboxes require Docker CDI support. Enable CDI on the Docker daemon, then restart the OpenShell gateway/server so GPU capability is detected.",
             ));
@@ -1713,8 +1721,8 @@ fn build_environment(sandbox: &DriverSandbox, config: &DockerDriverRuntimeConfig
         .collect()
 }
 
-fn docker_gpu_device_requests(gpu: bool, gpu_device: &str) -> Option<Vec<DeviceRequest>> {
-    cdi_gpu_device_ids(gpu, gpu_device).map(|device_ids| {
+fn docker_gpu_device_requests(gpu: Option<&GpuRequestSpec>) -> Option<Vec<DeviceRequest>> {
+    cdi_gpu_device_ids(gpu).map(|device_ids| {
         vec![DeviceRequest {
             driver: Some("cdi".to_string()),
             device_ids: Some(device_ids),
@@ -1765,7 +1773,7 @@ fn build_container_create_body(
             nano_cpus: resource_limits.nano_cpus,
             memory: resource_limits.memory_bytes,
             pids_limit: docker_pids_limit(config.sandbox_pids_limit)?,
-            device_requests: docker_gpu_device_requests(spec.gpu, &spec.gpu_device),
+            device_requests: docker_gpu_device_requests(driver_gpu_request(spec)),
             binds: Some(build_binds(sandbox, config)?),
             restart_policy: Some(RestartPolicy {
                 name: Some(RestartPolicyNameEnum::UNLESS_STOPPED),
diff --git a/crates/openshell-driver-docker/src/tests.rs b/crates/openshell-driver-docker/src/tests.rs
index c9b34ff8f..07a68177e 100644
--- a/crates/openshell-driver-docker/src/tests.rs
+++ b/crates/openshell-driver-docker/src/tests.rs
@@ -13,7 +13,7 @@ use openshell_core::progress::{
     PROGRESS_STEP_STARTING_SANDBOX,
 };
 use openshell_core::proto::compute::v1::{
-    DriverResourceRequirements, DriverSandboxSpec, DriverSandboxTemplate,
+    DriverResourceRequirements, DriverSandboxSpec, DriverSandboxTemplate, GpuRequestSpec,
 };
 use std::fs;
 use std::net::{IpAddr, Ipv4Addr, SocketAddr};
@@ -42,8 +42,7 @@ fn test_sandbox() -> DriverSandbox {
                 resources: None,
                 platform_config: None,
             }),
-            gpu: false,
-            gpu_device: String::new(),
+            gpu: None,
             sandbox_token: String::new(),
         }),
         status: None,
@@ -605,7 +604,10 @@ fn build_container_create_body_clears_inherited_cmd() {
 fn validate_sandbox_rejects_gpu_when_cdi_unavailable() {
     let config = runtime_config();
     let mut sandbox = test_sandbox();
-    sandbox.spec.as_mut().unwrap().gpu = true;
+    sandbox.spec.as_mut().unwrap().gpu = Some(GpuRequestSpec {
+        device_id: vec![],
+        count: None,
+    });
 
     let err = DockerComputeDriver::validate_sandbox(&sandbox, &config).unwrap_err();
 
@@ -613,6 +615,22 @@ fn validate_sandbox_rejects_gpu_when_cdi_unavailable() {
     assert!(err.message().contains("Docker CDI"));
 }
 
+#[test]
+fn validate_sandbox_rejects_gpu_count() {
+    let mut config = runtime_config();
+    config.supports_gpu = true;
+    let mut sandbox = test_sandbox();
+    sandbox.spec.as_mut().unwrap().gpu = Some(GpuRequestSpec {
+        device_id: vec![],
+        count: Some(2),
+    });
+
+    let err = DockerComputeDriver::validate_sandbox(&sandbox, &config).unwrap_err();
+
+    assert_eq!(err.code(), tonic::Code::InvalidArgument);
+    assert!(err.message().contains("does not support GPU count"));
+}
+
 #[test]
 fn validate_sandbox_auth_requires_gateway_token() {
     let mut sandbox = test_sandbox();
@@ -640,7 +658,10 @@ fn build_container_create_body_maps_gpu_to_all_cdi_device() {
     let mut config = runtime_config();
     config.supports_gpu = true;
     let mut sandbox = test_sandbox();
-    sandbox.spec.as_mut().unwrap().gpu = true;
+    sandbox.spec.as_mut().unwrap().gpu = Some(GpuRequestSpec {
+        device_id: vec![],
+        count: None,
+    });
 
     let create_body = build_container_create_body(&sandbox, &config).unwrap();
     let request = create_body
@@ -658,13 +679,17 @@ fn build_container_create_body_maps_gpu_to_all_cdi_device() {
 }
 
 #[test]
-fn build_container_create_body_passes_explicit_cdi_device_id_through() {
+fn build_container_create_body_passes_explicit_cdi_device_ids_through() {
     let mut config = runtime_config();
     config.supports_gpu = true;
     let mut sandbox = test_sandbox();
-    let spec = sandbox.spec.as_mut().unwrap();
-    spec.gpu = true;
-    spec.gpu_device = "nvidia.com/gpu=0".to_string();
+    sandbox.spec.as_mut().unwrap().gpu = Some(GpuRequestSpec {
+        device_id: vec![
+            "nvidia.com/gpu=0".to_string(),
+            "nvidia.com/gpu=1".to_string(),
+        ],
+        count: None,
+    });
 
     let create_body = build_container_create_body(&sandbox, &config).unwrap();
     let request = create_body
@@ -677,7 +702,10 @@ fn build_container_create_body_passes_explicit_cdi_device_id_through() {
     assert_eq!(request.driver.as_deref(), Some("cdi"));
     assert_eq!(
         request.device_ids.as_ref().unwrap(),
-        &vec!["nvidia.com/gpu=0".to_string()]
+        &vec![
+            "nvidia.com/gpu=0".to_string(),
+            "nvidia.com/gpu=1".to_string()
+        ]
     );
 }
 
diff --git a/crates/openshell-driver-kubernetes/README.md b/crates/openshell-driver-kubernetes/README.md
index 1d45a1d83..329cde120 100644
--- a/crates/openshell-driver-kubernetes/README.md
+++ b/crates/openshell-driver-kubernetes/README.md
@@ -50,6 +50,6 @@ pods do not need direct external ingress for SSH.
 ## GPU Support
 
 When a sandbox requests GPU support, the driver checks node allocatable capacity
-for `nvidia.com/gpu` and requests one GPU resource in the workload spec. The
-sandbox image must provide the user-space libraries needed by the agent
-workload.
+for `nvidia.com/gpu` and sets the workload's `nvidia.com/gpu` resource limit.
+Requests without an explicit count use one GPU; explicit GPU device IDs are rejected.
+The sandbox image must provide the user-space libraries needed by the agent workload.
diff --git a/crates/openshell-driver-kubernetes/src/driver.rs b/crates/openshell-driver-kubernetes/src/driver.rs
index 79487c04d..d35046b82 100644
--- a/crates/openshell-driver-kubernetes/src/driver.rs
+++ b/crates/openshell-driver-kubernetes/src/driver.rs
@@ -17,6 +17,7 @@ use kube::{Client, Error as KubeError};
 use openshell_core::driver_utils::{
     LABEL_MANAGED_BY, LABEL_MANAGED_BY_VALUE, LABEL_SANDBOX_ID, SUPERVISOR_IMAGE_BINARY_PATH,
 };
+use openshell_core::gpu::driver_gpu_request;
 use openshell_core::progress::{
     PROGRESS_STEP_PULLING_IMAGE, PROGRESS_STEP_REQUESTING_SANDBOX, PROGRESS_STEP_STARTING_SANDBOX,
     format_bytes, mark_progress_active, mark_progress_complete, mark_progress_detail,
@@ -25,7 +26,7 @@ use openshell_core::proto::compute::v1::{
     DriverCondition as SandboxCondition, DriverPlatformEvent as PlatformEvent,
     DriverSandbox as Sandbox, DriverSandboxSpec as SandboxSpec,
     DriverSandboxStatus as SandboxStatus, DriverSandboxTemplate as SandboxTemplate,
-    GetCapabilitiesResponse, WatchSandboxesDeletedEvent, WatchSandboxesEvent,
+    GetCapabilitiesResponse, GpuRequestSpec, WatchSandboxesDeletedEvent, WatchSandboxesEvent,
     WatchSandboxesPlatformEvent, WatchSandboxesSandboxEvent, watch_sandboxes_event,
 };
 use std::collections::BTreeMap;
@@ -77,7 +78,11 @@ const SANDBOX_VERSION: &str = "v1alpha1";
 pub const SANDBOX_KIND: &str = "Sandbox";
 
 const GPU_RESOURCE_NAME: &str = "nvidia.com/gpu";
-const GPU_RESOURCE_QUANTITY: &str = "1";
+const DEFAULT_GPU_COUNT: u32 = 1;
+
+fn gpu_has_explicit_device_ids(gpu: Option<&GpuRequestSpec>) -> bool {
+    gpu.is_some_and(|gpu| !gpu.device_id.is_empty())
+}
 
 // ---------------------------------------------------------------------------
 // Default workspace persistence (temporary — will be replaced by snapshotting)
@@ -203,12 +208,20 @@ impl KubernetesComputeDriver {
     }
 
     pub async fn validate_sandbox_create(&self, sandbox: &Sandbox) -> Result<(), tonic::Status> {
-        let gpu_requested = sandbox.spec.as_ref().is_some_and(|spec| spec.gpu);
-        self.validate_gpu_request(gpu_requested).await
+        let gpu = sandbox.spec.as_ref().and_then(driver_gpu_request);
+        self.validate_gpu_request(gpu).await
     }
 
-    async fn validate_gpu_request(&self, gpu_requested: bool) -> Result<(), tonic::Status> {
-        if gpu_requested
+    async fn validate_gpu_request(
+        &self,
+        gpu: Option<&GpuRequestSpec>,
+    ) -> Result<(), tonic::Status> {
+        if gpu_has_explicit_device_ids(gpu) {
+            return Err(tonic::Status::invalid_argument(
+                "kubernetes compute driver does not support explicit GPU device IDs",
+            ));
+        }
+        if gpu.is_some()
             && !self.has_gpu_capacity().await.map_err(|err| {
                 tonic::Status::internal(format!("check GPU node capacity failed: {err}"))
             })?
@@ -300,6 +313,14 @@ impl KubernetesComputeDriver {
     }
 
     pub async fn create_sandbox(&self, sandbox: &Sandbox) -> Result<(), KubernetesDriverError> {
+        // Explicit device IDs cannot be expressed as a `nvidia.com/gpu` resource limit, so
+        // reject them up front with the same rule `validate_gpu_request` applies.
+        if gpu_has_explicit_device_ids(sandbox.spec.as_ref().and_then(driver_gpu_request)) {
+            return Err(KubernetesDriverError::Precondition(
+                "kubernetes compute driver does not support explicit GPU device IDs".to_string(),
+            ));
+        }
+
         let name = sandbox.name.as_str();
         info!(
             sandbox_id = %sandbox.id,
@@ -1109,7 +1130,13 @@ fn sandbox_to_k8s_spec(
         if let Some(template) = spec.template.as_ref() {
             root.insert(
                 "podTemplate".to_string(),
-                sandbox_template_to_k8s(template, spec.gpu, &pod_env, inject_workspace, params),
+                sandbox_template_to_k8s(
+                    template,
+                    driver_gpu_request(spec),
+                    &pod_env,
+                    inject_workspace,
+                    params,
+                ),
             );
             if !template.agent_socket_path.is_empty() {
                 root.insert(
@@ -1141,7 +1168,7 @@ fn sandbox_to_k8s_spec(
             "podTemplate".to_string(),
             sandbox_template_to_k8s(
                 &SandboxTemplate::default(),
-                spec.is_some_and(|s| s.gpu),
+                spec.and_then(driver_gpu_request),
                 &pod_env,
                 inject_workspace,
                 params,
@@ -1156,7 +1183,7 @@ fn sandbox_to_k8s_spec(
 
 fn sandbox_template_to_k8s(
     template: &SandboxTemplate,
-    gpu: bool,
+    gpu: Option<&GpuRequestSpec>,
     spec_environment: &std::collections::HashMap<String, String>,
     inject_workspace: bool,
     params: &SandboxPodParams<'_>,
@@ -1214,7 +1241,7 @@ fn sandbox_template_to_k8s(
 
     if use_user_namespaces {
         spec.insert("hostUsers".to_string(), serde_json::json!(false));
-        if gpu {
+        if gpu.is_some() {
             warn!(
                 "GPU sandbox with user namespaces enabled — \
                  NVIDIA device plugin compatibility is unverified"
@@ -1395,7 +1422,10 @@ fn image_pull_secret_refs(secrets: &[String]) -> Vec<serde_json::Value> {
         .collect()
 }
 
-fn container_resources(template: &SandboxTemplate, gpu: bool) -> Option<serde_json::Value> {
+fn container_resources(
+    template: &SandboxTemplate,
+    gpu: Option<&GpuRequestSpec>,
+) -> Option<serde_json::Value> {
     // Start from the raw resources passthrough in platform_config (preserves
     // custom resource types like GPU limits that users set via the public API
     // Struct), then overlay the typed DriverResourceRequirements on top.
@@ -1428,8 +1458,8 @@ fn container_resources(template: &SandboxTemplate, gpu: bool) -> Option<serde_js
         apply("requests", "memory", memory_request);
     }
 
-    if gpu {
-        apply_gpu_limit(&mut resources);
+    if let Some(gpu) = gpu {
+        apply_gpu_limit(&mut resources, gpu.count.unwrap_or(DEFAULT_GPU_COUNT));
     }
     if resources.as_object().is_some_and(serde_json::Map::is_empty) {
         None
@@ -1438,10 +1468,10 @@ fn container_resources(template: &SandboxTemplate, gpu: bool) -> Option<serde_js
     }
 }
 
-fn apply_gpu_limit(resources: &mut serde_json::Value) {
+fn apply_gpu_limit(resources: &mut serde_json::Value, count: u32) {
     let Some(resources_obj) = resources.as_object_mut() else {
         *resources = serde_json::json!({});
-        return apply_gpu_limit(resources);
+        return apply_gpu_limit(resources, count);
     };
 
     let limits = resources_obj
@@ -1449,12 +1479,12 @@ fn apply_gpu_limit(resources: &mut serde_json::Value) {
         .or_insert_with(|| serde_json::json!({}));
     let Some(limits_obj) = limits.as_object_mut() else {
         *limits = serde_json::json!({});
-        return apply_gpu_limit(resources);
+        return apply_gpu_limit(resources, count);
     };
 
     limits_obj.insert(
         GPU_RESOURCE_NAME.to_string(),
-        serde_json::json!(GPU_RESOURCE_QUANTITY),
+        serde_json::json!(count.to_string()),
     );
 }
 
@@ -1694,6 +1724,13 @@ mod tests {
     static ENV_LOCK: std::sync::LazyLock<std::sync::Mutex<()>> =
         std::sync::LazyLock::new(|| std::sync::Mutex::new(()));
 
+    fn gpu_request(count: Option<u32>) -> GpuRequestSpec {
+        GpuRequestSpec {
+            device_id: vec![],
+            count,
+        }
+    }
+
     #[test]
     fn kube_pulling_event_adds_image_progress_metadata() {
         let mut metadata = std::collections::HashMap::new();
@@ -2005,7 +2042,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &SandboxTemplate::default(),
-                true,
+                Some(&gpu_request(None)),
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2018,10 +2055,44 @@ mod tests {
         );
         assert_eq!(
             pod_template["spec"]["containers"][0]["resources"]["limits"][GPU_RESOURCE_NAME],
-            serde_json::json!(GPU_RESOURCE_QUANTITY)
+            serde_json::json!(DEFAULT_GPU_COUNT.to_string())
+        );
+    }
+
+    #[test]
+    fn gpu_sandbox_uses_requested_gpu_count() {
+        let pod_template = {
+            let params = SandboxPodParams::default();
+            sandbox_template_to_k8s(
+                &SandboxTemplate::default(),
+                Some(&gpu_request(Some(2))),
+                &std::collections::HashMap::new(),
+                true,
+                &params,
+            )
+        };
+
+        assert_eq!(
+            pod_template["spec"]["containers"][0]["resources"]["limits"][GPU_RESOURCE_NAME],
+            serde_json::json!("2")
         );
     }
 
+    #[test]
+    fn gpu_has_explicit_device_ids_only_when_ids_are_present() {
+        // No request, an empty request, and a count-only request name no device.
+        assert!(!gpu_has_explicit_device_ids(None));
+        assert!(!gpu_has_explicit_device_ids(Some(&gpu_request(None))));
+        assert!(!gpu_has_explicit_device_ids(Some(&gpu_request(Some(2)))));
+
+        // Only a non-empty `device_id` list makes the request explicit.
+        let explicit = GpuRequestSpec {
+            device_id: vec!["nvidia.com/gpu=0".to_string()],
+            count: None,
+        };
+        assert!(gpu_has_explicit_device_ids(Some(&explicit)));
+    }
+
     #[test]
     fn gpu_sandbox_uses_template_runtime_class_name_when_set() {
         let template = SandboxTemplate {
@@ -2041,7 +2112,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                true,
+                Some(&gpu_request(None)),
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2073,7 +2144,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2179,7 +2250,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                true,
+                Some(&gpu_request(None)),
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2190,7 +2261,7 @@ mod tests {
         assert_eq!(limits["cpu"], serde_json::json!("2"));
         assert_eq!(
             limits[GPU_RESOURCE_NAME],
-            serde_json::json!(GPU_RESOURCE_QUANTITY)
+            serde_json::json!(DEFAULT_GPU_COUNT.to_string())
         );
     }
 
@@ -2210,7 +2281,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2233,7 +2304,7 @@ mod tests {
             };
             sandbox_template_to_k8s(
                 &SandboxTemplate::default(),
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2258,7 +2329,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &SandboxTemplate::default(),
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2281,7 +2352,7 @@ mod tests {
             };
             sandbox_template_to_k8s(
                 &template,
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2420,7 +2491,7 @@ mod tests {
         };
         let pod_template = sandbox_template_to_k8s(
             &SandboxTemplate::default(),
-            false,
+            None,
             &std::collections::HashMap::new(),
             false, // user provided custom VCTs
             &params,
@@ -2458,7 +2529,7 @@ mod tests {
         };
         sandbox_template_to_k8s(
             &SandboxTemplate::default(),
-            false,
+            None,
             &std::collections::HashMap::new(),
             true,
             &params,
@@ -2523,7 +2594,7 @@ mod tests {
         let params = SandboxPodParams::default(); // cluster default is off
         let pod_template = sandbox_template_to_k8s(
             &template,
-            false,
+            None,
             &std::collections::HashMap::new(),
             true,
             &params,
@@ -2561,7 +2632,7 @@ mod tests {
         };
         let pod_template = sandbox_template_to_k8s(
             &template,
-            false,
+            None,
             &std::collections::HashMap::new(),
             true,
             &params,
@@ -2587,7 +2658,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &SandboxTemplate::default(),
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2609,7 +2680,7 @@ mod tests {
         };
         let pod_template = sandbox_template_to_k8s(
             &SandboxTemplate::default(),
-            false,
+            None,
             &std::collections::HashMap::new(),
             true,
             &params,
@@ -2631,7 +2702,7 @@ mod tests {
     fn sandbox_template_omits_empty_image_pull_secrets() {
         let pod_template = sandbox_template_to_k8s(
             &SandboxTemplate::default(),
-            false,
+            None,
             &std::collections::HashMap::new(),
             true,
             &SandboxPodParams::default(),
@@ -2656,7 +2727,7 @@ mod tests {
         };
         let pod_template = sandbox_template_to_k8s(
             &SandboxTemplate::default(),
-            false,
+            None,
             &std::collections::HashMap::new(),
             true,
             &params,
@@ -2685,7 +2756,7 @@ mod tests {
         };
         let pod_template = sandbox_template_to_k8s(
             &template,
-            false,
+            None,
             &std::collections::HashMap::new(),
             true,
             &params,
@@ -2813,7 +2884,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 false,
                 &params,
@@ -2874,7 +2945,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 false,
                 &params,
diff --git a/crates/openshell-driver-podman/README.md b/crates/openshell-driver-podman/README.md
index 77b42ba37..e4183f75b 100644
--- a/crates/openshell-driver-podman/README.md
+++ b/crates/openshell-driver-podman/README.md
@@ -46,7 +46,7 @@ The container spec in `container.rs` sets these security-critical fields:
 | `no_new_privileges` | `true` | Prevents privilege escalation after exec. |
 | `seccomp_profile_path` | `unconfined` | The supervisor installs its own policy-aware BPF filter. A container-level profile can block Landlock/seccomp syscalls during setup. |
 | `mounts` | Private tmpfs at `/run/netns` | Lets the supervisor create named network namespaces in rootless Podman. |
-| CDI GPU devices | Sandbox `gpu_device` value when set, otherwise all NVIDIA GPUs | Exposes requested GPUs to GPU-enabled sandbox containers. |
+| CDI GPU devices | Explicit device IDs from the GPU request when set, otherwise all NVIDIA GPUs | Exposes requested GPUs to GPU-enabled sandbox containers. Count-based GPU requests are rejected until Podman CDI selection can map counts to concrete devices. |
 
 The restricted agent child does not retain these supervisor privileges.
 
diff --git a/crates/openshell-driver-podman/src/container.rs b/crates/openshell-driver-podman/src/container.rs
index 13f053e93..3c2bd7791 100644
--- a/crates/openshell-driver-podman/src/container.rs
+++ b/crates/openshell-driver-podman/src/container.rs
@@ -4,7 +4,7 @@
 //! Container spec construction for the Podman driver.
 
 use crate::config::PodmanComputeConfig;
-use openshell_core::gpu::cdi_gpu_device_ids;
+use openshell_core::gpu::{cdi_gpu_device_ids, driver_gpu_request};
 use openshell_core::proto::compute::v1::DriverSandbox;
 use serde::Serialize;
 use serde_json::Value;
@@ -379,8 +379,8 @@ fn podman_pids_limit(value: i64) -> Option<i64> {
 
 /// Build CDI GPU device list if GPU is requested.
 fn build_devices(sandbox: &DriverSandbox) -> Option<Vec<LinuxDevice>> {
-    let spec = sandbox.spec.as_ref()?;
-    cdi_gpu_device_ids(spec.gpu, &spec.gpu_device).map(|device_ids| {
+    let gpu = sandbox.spec.as_ref().and_then(driver_gpu_request);
+    cdi_gpu_device_ids(gpu).map(|device_ids| {
         device_ids
             .into_iter()
             .map(|path| LinuxDevice { path })
@@ -808,11 +808,14 @@ mod tests {
     #[test]
     fn container_spec_maps_empty_gpu_request_to_all_cdi_device() {
         use openshell_core::config::CDI_GPU_DEVICE_ALL;
-        use openshell_core::proto::compute::v1::DriverSandboxSpec;
+        use openshell_core::proto::compute::v1::{DriverSandboxSpec, GpuRequestSpec};
 
         let mut sandbox = test_sandbox("test-id", "test-name");
         sandbox.spec = Some(DriverSandboxSpec {
-            gpu: true,
+            gpu: Some(GpuRequestSpec {
+                device_id: vec![],
+                count: None,
+            }),
             ..Default::default()
         });
         let config = test_config();
@@ -826,12 +829,14 @@ mod tests {
 
     #[test]
     fn container_spec_passes_explicit_cdi_device_id_through() {
-        use openshell_core::proto::compute::v1::DriverSandboxSpec;
+        use openshell_core::proto::compute::v1::{DriverSandboxSpec, GpuRequestSpec};
 
         let mut sandbox = test_sandbox("test-id", "test-name");
         sandbox.spec = Some(DriverSandboxSpec {
-            gpu: true,
-            gpu_device: "nvidia.com/gpu=0".to_string(),
+            gpu: Some(GpuRequestSpec {
+                device_id: vec!["nvidia.com/gpu=0".to_string()],
+                count: None,
+            }),
             ..Default::default()
         });
         let config = test_config();
diff --git a/crates/openshell-driver-podman/src/driver.rs b/crates/openshell-driver-podman/src/driver.rs
index e2deb1c63..9593c4b87 100644
--- a/crates/openshell-driver-podman/src/driver.rs
+++ b/crates/openshell-driver-podman/src/driver.rs
@@ -10,7 +10,8 @@ use crate::watcher::{
     self, WatchStream, driver_sandbox_from_inspect, driver_sandbox_from_list_entry,
 };
 use openshell_core::ComputeDriverError;
-use openshell_core::proto::compute::v1::{DriverSandbox, GetCapabilitiesResponse};
+use openshell_core::gpu::driver_gpu_request;
+use openshell_core::proto::compute::v1::{DriverSandbox, GetCapabilitiesResponse, GpuRequestSpec};
 use std::path::PathBuf;
 use std::time::Duration;
 use tracing::{info, warn};
@@ -280,12 +281,17 @@ impl PodmanComputeDriver {
         &self,
         sandbox: &DriverSandbox,
     ) -> Result<(), ComputeDriverError> {
-        let gpu_requested = sandbox.spec.as_ref().is_some_and(|s| s.gpu);
-        Self::validate_gpu_request(gpu_requested)
+        let gpu = sandbox.spec.as_ref().and_then(driver_gpu_request);
+        Self::validate_gpu_request(gpu)
     }
 
-    fn validate_gpu_request(gpu_requested: bool) -> Result<(), ComputeDriverError> {
-        if gpu_requested && !Self::has_gpu_capacity() {
+    fn validate_gpu_request(gpu: Option<&GpuRequestSpec>) -> Result<(), ComputeDriverError> {
+        if gpu.is_some_and(|gpu| gpu.count.is_some()) {
+            return Err(ComputeDriverError::Precondition(
+                "podman compute driver does not support GPU count requests".to_string(),
+            ));
+        }
+        if gpu.is_some() && !Self::has_gpu_capacity() {
             return Err(ComputeDriverError::Precondition(
                 "GPU sandbox requested, but no NVIDIA GPU devices are available.".to_string(),
             ));
@@ -305,6 +311,7 @@ impl PodmanComputeDriver {
                 "sandbox id is required".into(),
             ));
         }
+        self.validate_sandbox_create(sandbox)?;
 
         // Validate the composed container name early, before creating any
         // resources (volume), so we don't leave orphans when the name is
@@ -667,6 +674,19 @@ mod tests {
         assert!(matches!(err, ComputeDriverError::Message(_)));
     }
 
+    #[test]
+    fn validate_gpu_request_rejects_count() {
+        let err = PodmanComputeDriver::validate_gpu_request(Some(&GpuRequestSpec {
+            device_id: vec![],
+            count: Some(2),
+        }))
+        .expect_err("GPU count should be rejected");
+
+        assert!(
+            matches!(err, ComputeDriverError::Precondition(message) if message.contains("does not support GPU count"))
+        );
+    }
+
     // ── grpc_endpoint auto-detection ───────────────────────────────────
     //
     // PodmanComputeDriver::new() fills grpc_endpoint when it is empty.
diff --git a/crates/openshell-driver-vm/src/driver.rs b/crates/openshell-driver-vm/src/driver.rs
index 56e431f38..dc257eda7 100644
--- a/crates/openshell-driver-vm/src/driver.rs
+++ b/crates/openshell-driver-vm/src/driver.rs
@@ -24,6 +24,7 @@ use oci_client::manifest::{
 };
 use oci_client::secrets::RegistryAuth;
 use oci_client::{Reference, RegistryOperation};
+use openshell_core::gpu::driver_gpu_request;
 use openshell_core::progress::{
     PROGRESS_STEP_PULLING_IMAGE, PROGRESS_STEP_REQUESTING_SANDBOX, PROGRESS_STEP_STARTING_SANDBOX,
     format_bytes, mark_progress_active, mark_progress_complete, mark_progress_detail,
@@ -32,11 +33,11 @@ use openshell_core::proto::compute::v1::{
     CreateSandboxRequest, CreateSandboxResponse, DeleteSandboxRequest, DeleteSandboxResponse,
     DriverCondition as SandboxCondition, DriverPlatformEvent as PlatformEvent,
     DriverSandbox as Sandbox, DriverSandboxStatus as SandboxStatus, GetCapabilitiesRequest,
-    GetCapabilitiesResponse, GetSandboxRequest, GetSandboxResponse, ListSandboxesRequest,
-    ListSandboxesResponse, StopSandboxRequest, StopSandboxResponse, ValidateSandboxCreateRequest,
-    ValidateSandboxCreateResponse, WatchSandboxesDeletedEvent, WatchSandboxesEvent,
-    WatchSandboxesPlatformEvent, WatchSandboxesRequest, WatchSandboxesSandboxEvent,
-    compute_driver_server::ComputeDriver, watch_sandboxes_event,
+    GetCapabilitiesResponse, GetSandboxRequest, GetSandboxResponse, GpuRequestSpec,
+    ListSandboxesRequest, ListSandboxesResponse, StopSandboxRequest, StopSandboxResponse,
+    ValidateSandboxCreateRequest, ValidateSandboxCreateResponse, WatchSandboxesDeletedEvent,
+    WatchSandboxesEvent, WatchSandboxesPlatformEvent, WatchSandboxesRequest,
+    WatchSandboxesSandboxEvent, compute_driver_server::ComputeDriver, watch_sandboxes_event,
 };
 use openshell_vfio::SysfsRoot;
 use prost::Message;
@@ -618,7 +619,7 @@ impl VmDriver {
         let gpu_device = sandbox
             .spec
             .as_ref()
-            .and_then(|spec| requested_gpu_device(spec.gpu, &spec.gpu_device));
+            .and_then(|spec| requested_gpu_device(driver_gpu_request(spec)));
         let gpu_bdf = if let Some(gpu_device) = gpu_device {
             Some(self.assign_gpu_to_record(&sandbox.id, gpu_device).await?)
         } else {
@@ -2578,7 +2579,7 @@ fn validate_vm_sandbox(sandbox: &Sandbox, gpu_enabled: bool) -> Result<(), Statu
         .as_ref()
         .ok_or_else(|| Status::invalid_argument("sandbox spec is required"))?;
 
-    validate_gpu_request(spec.gpu, &spec.gpu_device, gpu_enabled)?;
+    validate_gpu_request(driver_gpu_request(spec), gpu_enabled)?;
 
     if let Some(template) = spec.template.as_ref() {
         if !template.agent_socket_path.is_empty() {
@@ -2621,20 +2622,29 @@ fn validate_sandbox_id(sandbox_id: &str) -> Result<(), Status> {
     Ok(())
 }
 
-fn requested_gpu_device(gpu: bool, gpu_device: &str) -> Option<&str> {
-    gpu.then_some(gpu_device)
+fn requested_gpu_device(gpu: Option<&GpuRequestSpec>) -> Option<&str> {
+    let gpu = gpu?;
+    Some(gpu.device_id.first().map_or("", String::as_str))
 }
 
 #[allow(clippy::result_large_err)]
-fn validate_gpu_request(gpu: bool, gpu_device: &str, gpu_enabled: bool) -> Result<(), Status> {
-    if gpu && !gpu_enabled {
+fn validate_gpu_request(gpu: Option<&GpuRequestSpec>, gpu_enabled: bool) -> Result<(), Status> {
+    if gpu.is_some() && !gpu_enabled {
         return Err(Status::failed_precondition(
             "GPU support is not enabled on this driver; start with --gpu",
         ));
     }
 
-    if !gpu && !gpu_device.is_empty() {
-        return Err(Status::invalid_argument("gpu_device requires gpu=true"));
+    if gpu.is_some_and(|gpu| gpu.count.is_some_and(|count| count > 1)) {
+        return Err(Status::invalid_argument(
+            "vm compute driver supports at most one GPU",
+        ));
+    }
+
+    if gpu.is_some_and(|gpu| gpu.device_id.len() > 1) {
+        return Err(Status::invalid_argument(
+            "vm compute driver supports at most one GPU device ID",
+        ));
     }
     Ok(())
 }
@@ -4423,7 +4433,7 @@ mod tests {
         PROGRESS_COMPLETE_STEP_KEY,
     };
     use openshell_core::proto::compute::v1::{
-        DriverSandboxSpec as SandboxSpec, DriverSandboxTemplate as SandboxTemplate,
+        DriverSandboxSpec as SandboxSpec, DriverSandboxTemplate as SandboxTemplate, GpuRequestSpec,
     };
     use prost_types::{Struct, Value, value::Kind};
     use std::fs;
@@ -4502,7 +4512,10 @@ mod tests {
         let sandbox = Sandbox {
             id: "sandbox-123".to_string(),
             spec: Some(SandboxSpec {
-                gpu: true,
+                gpu: Some(GpuRequestSpec {
+                    device_id: vec![],
+                    count: None,
+                }),
                 ..Default::default()
             }),
             ..Default::default()
@@ -4518,7 +4531,10 @@ mod tests {
         let sandbox = Sandbox {
             id: "sandbox-123".to_string(),
             spec: Some(SandboxSpec {
-                gpu: true,
+                gpu: Some(GpuRequestSpec {
+                    device_id: vec![],
+                    count: None,
+                }),
                 ..Default::default()
             }),
             ..Default::default()
@@ -4527,38 +4543,82 @@ mod tests {
     }
 
     #[test]
-    fn validate_vm_sandbox_rejects_gpu_device_without_gpu() {
+    fn validate_vm_sandbox_accepts_gpu_count_one_when_enabled() {
+        let sandbox = Sandbox {
+            id: "sandbox-123".to_string(),
+            spec: Some(SandboxSpec {
+                gpu: Some(GpuRequestSpec {
+                    device_id: vec![],
+                    count: Some(1),
+                }),
+                ..Default::default()
+            }),
+            ..Default::default()
+        };
+        validate_vm_sandbox(&sandbox, true).expect("gpu count one should be accepted");
+    }
+
+    #[test]
+    fn validate_vm_sandbox_rejects_gpu_count_greater_than_one() {
         let sandbox = Sandbox {
             id: "sandbox-123".to_string(),
             spec: Some(SandboxSpec {
-                gpu: false,
-                gpu_device: "0000:2d:00.0".to_string(),
+                gpu: Some(GpuRequestSpec {
+                    device_id: vec![],
+                    count: Some(2),
+                }),
+                ..Default::default()
+            }),
+            ..Default::default()
+        };
+        let err =
+            validate_vm_sandbox(&sandbox, true).expect_err("gpu count > 1 should be rejected");
+        assert_eq!(err.code(), Code::InvalidArgument);
+        assert!(err.message().contains("at most one GPU"));
+    }
+
+    #[test]
+    fn validate_vm_sandbox_rejects_multiple_gpu_device_ids() {
+        let sandbox = Sandbox {
+            id: "sandbox-123".to_string(),
+            spec: Some(SandboxSpec {
+                gpu: Some(GpuRequestSpec {
+                    device_id: vec!["0000:2d:00.0".to_string(), "0000:3d:00.0".to_string()],
+                    count: None,
+                }),
                 ..Default::default()
             }),
             ..Default::default()
         };
         let err = validate_vm_sandbox(&sandbox, true)
-            .expect_err("gpu_device without gpu should be rejected");
+            .expect_err("multiple GPU device IDs should be rejected");
         assert_eq!(err.code(), Code::InvalidArgument);
-        assert!(err.message().contains("gpu_device requires gpu=true"));
+        assert!(err.message().contains("at most one GPU device ID"));
     }
 
     #[test]
     fn requested_gpu_device_returns_none_without_gpu_request() {
-        assert_eq!(requested_gpu_device(false, ""), None);
+        assert_eq!(requested_gpu_device(None), None);
     }
 
     #[test]
     fn requested_gpu_device_defaults_empty_request_to_inventory_choice() {
-        assert_eq!(requested_gpu_device(true, ""), Some(""));
+        let gpu = GpuRequestSpec {
+            device_id: vec![],
+            count: None,
+        };
+
+        assert_eq!(requested_gpu_device(Some(&gpu)), Some(""));
     }
 
     #[test]
-    fn requested_gpu_device_returns_explicit_device_id() {
-        assert_eq!(
-            requested_gpu_device(true, "0000:2d:00.0"),
-            Some("0000:2d:00.0")
-        );
+    fn requested_gpu_device_returns_first_explicit_device_id() {
+        let gpu = GpuRequestSpec {
+            device_id: vec!["0000:2d:00.0".to_string()],
+            count: None,
+        };
+
+        assert_eq!(requested_gpu_device(Some(&gpu)), Some("0000:2d:00.0"));
     }
 
     #[test]
diff --git a/crates/openshell-server/src/compute/mod.rs b/crates/openshell-server/src/compute/mod.rs
index 0122f9178..ac85f7269 100644
--- a/crates/openshell-server/src/compute/mod.rs
+++ b/crates/openshell-server/src/compute/mod.rs
@@ -19,10 +19,10 @@ use openshell_core::ComputeDriverKind;
 use openshell_core::proto::compute::v1::{
     CreateSandboxRequest, DeleteSandboxRequest, DriverCondition, DriverPlatformEvent,
     DriverResourceRequirements, DriverSandbox, DriverSandboxSpec, DriverSandboxStatus,
-    DriverSandboxTemplate, GetCapabilitiesRequest, GetSandboxRequest, ListSandboxesRequest,
-    ValidateSandboxCreateRequest, WatchSandboxesEvent, WatchSandboxesRequest,
-    compute_driver_client::ComputeDriverClient, compute_driver_server::ComputeDriver,
-    watch_sandboxes_event,
+    DriverSandboxTemplate, GetCapabilitiesRequest, GetSandboxRequest,
+    GpuRequestSpec as DriverGpuRequestSpec, ListSandboxesRequest, ValidateSandboxCreateRequest,
+    WatchSandboxesEvent, WatchSandboxesRequest, compute_driver_client::ComputeDriverClient,
+    compute_driver_server::ComputeDriver, watch_sandboxes_event,
 };
 use openshell_core::proto::{
     PlatformEvent, Sandbox, SandboxCondition, SandboxPhase, SandboxSpec, SandboxStatus,
@@ -1267,8 +1267,10 @@ fn driver_sandbox_spec_from_public(spec: &SandboxSpec) -> DriverSandboxSpec {
             .template
             .as_ref()
             .map(driver_sandbox_template_from_public),
-        gpu: spec.gpu,
-        gpu_device: spec.gpu_device.clone(),
+        gpu: spec.gpu.as_ref().map(|gpu| DriverGpuRequestSpec {
+            device_id: gpu.device_id.clone(),
+            count: gpu.count,
+        }),
         sandbox_token: String::new(),
     }
 }
@@ -1623,7 +1625,7 @@ fn derive_phase(status: Option<&DriverSandboxStatus>) -> SandboxPhase {
 }
 
 fn rewrite_user_facing_conditions(status: &mut Option<SandboxStatus>, spec: Option<&SandboxSpec>) {
-    let gpu_requested = spec.is_some_and(|sandbox_spec| sandbox_spec.gpu);
+    let gpu_requested = spec.is_some_and(|sandbox_spec| sandbox_spec.gpu.is_some());
     if !gpu_requested {
         return;
     }
@@ -1781,6 +1783,7 @@ pub async fn new_test_runtime(store: Arc<Store>) -> ComputeRuntime {
 mod tests {
     use super::*;
     use futures::stream;
+    use openshell_core::proto::GpuRequestSpec;
     use openshell_core::proto::compute::v1::{
         CreateSandboxResponse, DeleteSandboxResponse, GetCapabilitiesResponse, GetSandboxRequest,
         GetSandboxResponse, StopSandboxRequest, StopSandboxResponse, ValidateSandboxCreateResponse,
@@ -1801,6 +1804,48 @@ mod tests {
         }
     }
 
+    #[test]
+    fn driver_sandbox_spec_from_public_preserves_gpu_request_device_ids() {
+        let public = SandboxSpec {
+            gpu: Some(GpuRequestSpec {
+                device_id: vec!["nvidia.com/gpu=0".to_string()],
+                count: None,
+            }),
+            ..Default::default()
+        };
+
+        let driver = driver_sandbox_spec_from_public(&public);
+
+        assert_eq!(
+            driver
+                .gpu
+                .expect("driver GPU request should be present")
+                .device_id,
+            vec!["nvidia.com/gpu=0".to_string()]
+        );
+    }
+
+    #[test]
+    fn driver_sandbox_spec_from_public_preserves_gpu_count() {
+        let public = SandboxSpec {
+            gpu: Some(GpuRequestSpec {
+                device_id: vec![],
+                count: Some(2),
+            }),
+            ..Default::default()
+        };
+
+        let driver = driver_sandbox_spec_from_public(&public);
+
+        assert_eq!(
+            driver
+                .gpu
+                .expect("driver GPU request should be present")
+                .count,
+            Some(2)
+        );
+    }
+
     fn struct_value(
         fields: impl IntoIterator<Item = (impl Into<String>, prost_types::Value)>,
     ) -> prost_types::Value {
@@ -2258,7 +2303,10 @@ mod tests {
         rewrite_user_facing_conditions(
             &mut status,
             Some(&SandboxSpec {
-                gpu: true,
+                gpu: Some(GpuRequestSpec {
+                    device_id: vec![],
+                    count: None,
+                }),
                 ..Default::default()
             }),
         );
@@ -2289,7 +2337,7 @@ mod tests {
         rewrite_user_facing_conditions(
             &mut status,
             Some(&SandboxSpec {
-                gpu: false,
+                gpu: None,
                 ..Default::default()
             }),
         );
@@ -2571,7 +2619,10 @@ mod tests {
 
         let sandbox = Sandbox {
             spec: Some(SandboxSpec {
-                gpu: true,
+                gpu: Some(GpuRequestSpec {
+                    device_id: vec![],
+                    count: None,
+                }),
                 ..Default::default()
             }),
             ..sandbox_record("sb-1", "sandbox-a", SandboxPhase::Provisioning)
@@ -2594,7 +2645,7 @@ mod tests {
             SandboxPhase::try_from(stored.phase()).unwrap(),
             SandboxPhase::Ready
         );
-        assert!(stored.spec.as_ref().is_some_and(|spec| spec.gpu));
+        assert!(stored.spec.as_ref().is_some_and(|spec| spec.gpu.is_some()));
     }
 
     #[tokio::test]
diff --git a/crates/openshell-server/src/grpc/sandbox.rs b/crates/openshell-server/src/grpc/sandbox.rs
index e60ce3995..4413e3ce7 100644
--- a/crates/openshell-server/src/grpc/sandbox.rs
+++ b/crates/openshell-server/src/grpc/sandbox.rs
@@ -100,7 +100,7 @@ fn emit_sandbox_create_telemetry(
     };
     openshell_core::telemetry::emit_sandbox_create(
         outcome,
-        spec.gpu,
+        spec.gpu.is_some(),
         spec.providers.len() as u64,
         spec.policy.is_some(),
         template_source,
diff --git a/crates/openshell-server/src/grpc/validation.rs b/crates/openshell-server/src/grpc/validation.rs
index 53f292053..a9f1e984f 100644
--- a/crates/openshell-server/src/grpc/validation.rs
+++ b/crates/openshell-server/src/grpc/validation.rs
@@ -131,6 +131,11 @@ pub(super) fn validate_sandbox_spec(
         validate_sandbox_template(tmpl)?;
     }
 
+    // --- spec.gpu ---
+    if let Some(ref gpu) = spec.gpu {
+        validate_gpu_request(gpu)?;
+    }
+
     // --- spec.policy serialized size ---
     if let Some(ref policy) = spec.policy {
         let size = policy.encoded_len();
@@ -144,6 +149,18 @@ pub(super) fn validate_sandbox_spec(
     Ok(())
 }
 
+fn validate_gpu_request(gpu: &openshell_core::proto::GpuRequestSpec) -> Result<(), Status> {
+    if gpu.count.is_some() && !gpu.device_id.is_empty() {
+        return Err(Status::invalid_argument(
+            "gpu.count is mutually exclusive with gpu.device_id",
+        ));
+    }
+    if gpu.count == Some(0) {
+        return Err(Status::invalid_argument("gpu.count must be greater than 0"));
+    }
+    Ok(())
+}
+
 /// Validate template-level field sizes.
 fn validate_sandbox_template(tmpl: &SandboxTemplate) -> Result<(), Status> {
     // String fields.
@@ -661,7 +678,7 @@ pub(super) fn level_matches(log_level: &str, min_level: &str) -> bool {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use openshell_core::proto::SandboxSpec;
+    use openshell_core::proto::{GpuRequestSpec, SandboxSpec};
     use std::collections::HashMap;
     use tonic::Code;
 
@@ -687,12 +704,59 @@ mod tests {
     #[test]
     fn validate_sandbox_spec_accepts_gpu_flag() {
         let spec = SandboxSpec {
-            gpu: true,
+            gpu: Some(GpuRequestSpec {
+                device_id: vec![],
+                count: None,
+            }),
             ..Default::default()
         };
         assert!(validate_sandbox_spec("gpu-sandbox", &spec).is_ok());
     }
 
+    #[test]
+    fn validate_sandbox_spec_accepts_gpu_count() {
+        let spec = SandboxSpec {
+            gpu: Some(GpuRequestSpec {
+                device_id: vec![],
+                count: Some(2),
+            }),
+            ..Default::default()
+        };
+        assert!(validate_sandbox_spec("gpu-count-sandbox", &spec).is_ok());
+    }
+
+    #[test]
+    fn validate_sandbox_spec_rejects_zero_gpu_count() {
+        let spec = SandboxSpec {
+            gpu: Some(GpuRequestSpec {
+                device_id: vec![],
+                count: Some(0),
+            }),
+            ..Default::default()
+        };
+
+        let err = validate_sandbox_spec("gpu-count-sandbox", &spec).unwrap_err();
+
+        assert_eq!(err.code(), Code::InvalidArgument);
+        assert!(err.message().contains("count must be greater than 0"));
+    }
+
+    #[test]
+    fn validate_sandbox_spec_rejects_gpu_count_with_device_id() {
+        let spec = SandboxSpec {
+            gpu: Some(GpuRequestSpec {
+                device_id: vec!["nvidia.com/gpu=0".to_string()],
+                count: Some(1),
+            }),
+            ..Default::default()
+        };
+
+        let err = validate_sandbox_spec("gpu-count-sandbox", &spec).unwrap_err();
+
+        assert_eq!(err.code(), Code::InvalidArgument);
+        assert!(err.message().contains("mutually exclusive"));
+    }
+
     #[test]
     fn validate_sandbox_spec_accepts_empty_defaults() {
         assert!(validate_sandbox_spec("", &default_spec()).is_ok());
diff --git a/docs/sandboxes/manage-sandboxes.mdx b/docs/sandboxes/manage-sandboxes.mdx
index 512abfd3d..0b8469612 100644
--- a/docs/sandboxes/manage-sandboxes.mdx
+++ b/docs/sandboxes/manage-sandboxes.mdx
@@ -51,10 +51,20 @@ To request GPU resources, add `--gpu`:
 openshell sandbox create --gpu -- claude
 ```
 
+Request a specific number of GPUs with `--gpu-count`:
+
+```shell
+openshell sandbox create --gpu-count 2 -- claude
+```
+
 For Docker-backed sandboxes, GPU injection uses Docker CDI. If you enable Docker
 CDI after the gateway starts, restart the gateway so OpenShell can detect the
 updated Docker daemon capability.
 
+Kubernetes gateways honor `--gpu-count` by setting the `nvidia.com/gpu` resource
+limit. Docker and Podman support explicit CDI device IDs through `--gpu-device`
+but do not support count-based selection yet. VM gateways accept only one GPU.
+
 ### Custom Containers
 
 Use `--from` to create a sandbox from the base image, another pre-built sandbox name, a local directory, or a container image:
diff --git a/proto/compute_driver.proto b/proto/compute_driver.proto
index 610d491c7..3ac04380c 100644
--- a/proto/compute_driver.proto
+++ b/proto/compute_driver.proto
@@ -77,18 +77,16 @@ message DriverSandbox {
 
 // Driver-owned provisioning inputs required to create a sandbox.
 message DriverSandboxSpec {
+  reserved 10;
+
   // Log level exposed to processes running inside the sandbox.
   string log_level = 1;
   // Environment variables injected into the sandbox runtime.
   map<string, string> environment = 5;
   // Runtime template consumed by the driver during provisioning.
   DriverSandboxTemplate template = 6;
-  // Request NVIDIA GPU resources for this sandbox.
-  bool gpu = 9;
-  // Optional PCI BDF address (e.g. "0000:2d:00.0") or device index
-  // (e.g. "0", "1"). When empty with gpu=true, the driver assigns the
-  // first available GPU.
-  string gpu_device = 10;
+  // Request GPU resources for this sandbox. Presence indicates a GPU request.
+  GpuRequestSpec gpu = 9;
   // Gateway-minted JWT identifying this sandbox to the gateway. Set by
   // the gateway on create; the driver materialises it via its native
   // secret mechanism (Docker/Podman/VM bind-mount a per-sandbox file;
@@ -98,6 +96,15 @@ message DriverSandboxSpec {
   string sandbox_token = 11;
 }
 
+// Driver-native GPU request details.
+message GpuRequestSpec {
+  // Optional number of GPUs requested. Mutually exclusive with device_id.
+  optional uint32 count = 1;
+  // Optional driver-native device identifiers. Mutually exclusive with count.
+  // Empty means the driver chooses its default GPU assignment behavior.
+  repeated string device_id = 2;
+}
+
 // Driver-owned runtime template consumed by the compute platform.
 //
 // This message describes the sandbox workload in backend-neutral terms.
diff --git a/proto/openshell.proto b/proto/openshell.proto
index a8ead0d31..b15001586 100644
--- a/proto/openshell.proto
+++ b/proto/openshell.proto
@@ -307,6 +307,9 @@ message Sandbox {
 
 // Desired sandbox configuration provided through the public API.
 message SandboxSpec {
+  reserved 10, 11;
+  reserved "gpu_device", "proposal_approval_mode";
+
   // Log level exposed to processes running inside the sandbox.
   string log_level = 1;
   // Environment variables injected into the sandbox runtime.
@@ -317,18 +320,18 @@ message SandboxSpec {
   openshell.sandbox.v1.SandboxPolicy policy = 7;
   // Provider names to attach to this sandbox.
   repeated string providers = 8;
-  // Request NVIDIA GPU resources for this sandbox.
-  bool gpu = 9;
-  // Optional PCI BDF address (e.g. "0000:2d:00.0") or device index
-  // (e.g. "0", "1"). When empty with gpu=true, the driver assigns the
-  // first available GPU.
-  string gpu_device = 10;
-  // Field 11 was `proposal_approval_mode`. The approval mode is now a
-  // runtime setting (gateway or sandbox scope) read via UpdateConfig /
-  // GetSandboxConfig, so it can be flipped on a running sandbox and
-  // managed fleet-wide.
-  reserved 11;
-  reserved "proposal_approval_mode";
+  // Request GPU resources for this sandbox. Presence indicates a GPU request.
+  GpuRequestSpec gpu = 9;
+}
+
+// Public GPU request details. Device identifiers are interpreted by the
+// selected compute driver.
+message GpuRequestSpec {
+  // Optional number of GPUs requested. Mutually exclusive with device_id.
+  optional uint32 count = 1;
+  // Optional driver-native device identifiers. Mutually exclusive with count.
+  // Empty means the driver chooses its default GPU assignment behavior.
+  repeated string device_id = 2;
 }
 
 // Public sandbox template mapped onto compute-driver template inputs.

From cec0e213f9618dc0d35de7ad458bfff859fade66 Mon Sep 17 00:00:00 2001
From: Evan Lezar <elezar@nvidia.com>
Date: Wed, 3 Jun 2026 14:59:26 +0200
Subject: [PATCH 5/5] refactor(gpu): use resource requirements for GPU requests

Signed-off-by: Evan Lezar <elezar@nvidia.com>
---
 architecture/compute-runtimes.md              |   3 +
 crates/openshell-cli/src/run.rs               | 126 +++++++++++-------
 .../sandbox_create_lifecycle_integration.rs   |  11 +-
 crates/openshell-core/src/gpu.rs              |  31 +++--
 crates/openshell-driver-docker/README.md      |   2 +-
 crates/openshell-driver-docker/src/lib.rs     |  18 +--
 crates/openshell-driver-docker/src/tests.rs   |  40 +++---
 crates/openshell-driver-kubernetes/README.md  |   8 +-
 .../openshell-driver-kubernetes/src/driver.rs | 104 ++++++++-------
 crates/openshell-driver-podman/README.md      |   2 +-
 .../openshell-driver-podman/src/container.rs  |  32 +++--
 crates/openshell-driver-podman/src/driver.rs  |  16 ++-
 crates/openshell-driver-vm/README.md          |   5 +-
 crates/openshell-driver-vm/src/driver.rs      |  89 +++++++------
 crates/openshell-server/src/compute/mod.rs    | 100 +++++++++-----
 crates/openshell-server/src/grpc/sandbox.rs   |   4 +-
 .../openshell-server/src/grpc/validation.rs   |  61 ++++++---
 docs/sandboxes/manage-sandboxes.mdx           |  23 +++-
 proto/compute_driver.proto                    |  21 +--
 proto/openshell.proto                         |  23 ++--
 20 files changed, 438 insertions(+), 281 deletions(-)

diff --git a/architecture/compute-runtimes.md b/architecture/compute-runtimes.md
index 58f46eeb3..31356a86f 100644
--- a/architecture/compute-runtimes.md
+++ b/architecture/compute-runtimes.md
@@ -40,6 +40,9 @@ template resource limits. Docker and Podman apply them as runtime limits.
 Kubernetes mirrors each limit into the matching request. VM accepts the fields
 but currently ignores them.
 
+GPU requests enter the driver layer through
+`SandboxSpec.resource_requirements.gpu`.
+
 VM runtime state paths are derived only from driver-validated sandbox IDs
 matching `[A-Za-z0-9._-]{1,128}`. The gateway-owned VM driver socket uses a
 private `run/` directory plus Unix peer UID/PID checks. Standalone
diff --git a/crates/openshell-cli/src/run.rs b/crates/openshell-cli/src/run.rs
index 83234f7e7..e5ad32ce2 100644
--- a/crates/openshell-cli/src/run.rs
+++ b/crates/openshell-cli/src/run.rs
@@ -39,18 +39,18 @@ use openshell_core::proto::{
     GetClusterInferenceRequest, GetDraftHistoryRequest, GetDraftPolicyRequest,
     GetGatewayConfigRequest, GetProviderProfileRequest, GetProviderRefreshStatusRequest,
     GetProviderRequest, GetSandboxConfigRequest, GetSandboxLogsRequest,
-    GetSandboxPolicyStatusRequest, GetSandboxRequest, GetServiceRequest, GpuRequestSpec,
+    GetSandboxPolicyStatusRequest, GetSandboxRequest, GetServiceRequest, GpuResourceRequirement,
     HealthRequest, ImportProviderProfilesRequest, LintProviderProfilesRequest,
     ListProviderProfilesRequest, ListProvidersRequest, ListSandboxPoliciesRequest,
     ListSandboxProvidersRequest, ListSandboxesRequest, ListServicesRequest, PlatformEvent,
     PolicySource, PolicyStatus, Provider, ProviderCredentialRefreshStatus,
     ProviderCredentialRefreshStrategy, ProviderProfile, ProviderProfileDiagnostic,
     ProviderProfileImportItem, RejectDraftChunkRequest, RevokeSshSessionRequest,
-    RotateProviderCredentialRequest, Sandbox, SandboxPhase, SandboxPolicy, SandboxSpec,
-    SandboxTemplate, ServiceEndpointResponse, SetClusterInferenceRequest, SettingScope,
-    SettingValue, TcpForwardFrame, TcpForwardInit, TcpRelayTarget, UpdateConfigRequest,
-    UpdateProviderRequest, WatchSandboxRequest, exec_sandbox_event, setting_value,
-    tcp_forward_init,
+    RotateProviderCredentialRequest, Sandbox, SandboxPhase, SandboxPolicy,
+    SandboxResourceRequirements, SandboxSpec, SandboxTemplate, ServiceEndpointResponse,
+    SetClusterInferenceRequest, SettingScope, SettingValue, TcpForwardFrame, TcpForwardInit,
+    TcpRelayTarget, UpdateConfigRequest, UpdateProviderRequest, WatchSandboxRequest,
+    exec_sandbox_event, setting_value, tcp_forward_init,
 };
 use openshell_core::settings::{self, SettingValueKind};
 use openshell_core::{ObjectId, ObjectName};
@@ -1734,11 +1734,6 @@ pub async fn sandbox_create(
         }
         None => None,
     };
-    let requested_gpu = gpu
-        || gpu_device.is_some_and(|device_id| !device_id.is_empty())
-        || gpu_count.is_some()
-        || image.as_deref().is_some_and(image_requests_gpu);
-
     let providers_v2_enabled = gateway_providers_v2_enabled(&mut client).await?;
     let inferred_types: Vec<String> = if providers_v2_enabled {
         Vec::new()
@@ -1755,6 +1750,11 @@ pub async fn sandbox_create(
 
     let policy = load_sandbox_policy(policy)?;
     let resource_limits = build_sandbox_resource_limits(cpu, memory)?;
+    let resource_requirements =
+        resource_requirements_from_cli(image.as_deref(), gpu, gpu_device, gpu_count);
+    let requested_gpu = resource_requirements
+        .as_ref()
+        .is_some_and(|requirements| requirements.gpu.is_some());
 
     let template = if image.is_some() || resource_limits.is_some() {
         Some(SandboxTemplate {
@@ -1768,7 +1768,7 @@ pub async fn sandbox_create(
 
     let request = CreateSandboxRequest {
         spec: Some(SandboxSpec {
-            gpu: gpu_request_from_cli(requested_gpu, gpu_device, gpu_count),
+            resource_requirements,
             policy,
             providers: configured_providers,
             template,
@@ -2193,17 +2193,26 @@ pub async fn sandbox_create(
     }
 }
 
-fn gpu_request_from_cli(
-    requested_gpu: bool,
+fn resource_requirements_from_cli(
+    image: Option<&str>,
+    gpu: bool,
     gpu_device: Option<&str>,
     gpu_count: Option<u32>,
-) -> Option<GpuRequestSpec> {
-    requested_gpu.then(|| GpuRequestSpec {
-        device_id: gpu_device
-            .filter(|device_id| !device_id.is_empty())
-            .map(|device_id| vec![device_id.to_string()])
-            .unwrap_or_default(),
-        count: gpu_count,
+) -> Option<SandboxResourceRequirements> {
+    let device_ids = gpu_device
+        .filter(|device_id| !device_id.is_empty())
+        .map(|device_id| vec![device_id.to_string()])
+        .unwrap_or_default();
+    let requested_gpu = gpu
+        || gpu_count.is_some()
+        || !device_ids.is_empty()
+        || image.is_some_and(image_requests_gpu);
+
+    requested_gpu.then_some(SandboxResourceRequirements {
+        gpu: Some(GpuResourceRequirement {
+            device_ids,
+            count: gpu_count,
+        }),
     })
 }
 
@@ -7456,14 +7465,14 @@ mod tests {
         dockerfile_sources_supported_for_gateway, format_endpoint, format_gateway_select_header,
         format_gateway_select_items, format_provider_attachment_table, gateway_add,
         gateway_auth_label, gateway_env_override_warning, gateway_select_with, gateway_type_label,
-        git_sync_files, gpu_request_from_cli, http_health_check, image_requests_gpu,
-        import_local_package_mtls_bundle, inferred_provider_type, package_managed_tls_dirs,
-        parse_cli_setting_value, parse_credential_expiry_cli_value, parse_credential_expiry_pairs,
-        parse_credential_pairs, plaintext_gateway_is_remote, progress_step_from_metadata,
+        git_sync_files, http_health_check, image_requests_gpu, import_local_package_mtls_bundle,
+        inferred_provider_type, package_managed_tls_dirs, parse_cli_setting_value,
+        parse_credential_expiry_cli_value, parse_credential_expiry_pairs, parse_credential_pairs,
+        plaintext_gateway_is_remote, progress_step_from_metadata,
         provider_profile_allows_refresh_bootstrap, provisioning_timeout_message,
         ready_false_condition_message, refresh_status_header, refresh_status_row, resolve_from,
-        sandbox_should_persist, sandbox_upload_plan, service_expose_status_error,
-        service_url_for_gateway,
+        resource_requirements_from_cli, sandbox_should_persist, sandbox_upload_plan,
+        service_expose_status_error, service_url_for_gateway,
     };
     use crate::TEST_ENV_LOCK;
     use hyper::StatusCode;
@@ -7943,43 +7952,64 @@ mod tests {
     }
 
     #[test]
-    fn gpu_request_from_cli_uses_presence_with_empty_device_ids_for_default_gpu() {
-        let request =
-            gpu_request_from_cli(true, None, None).expect("gpu request should be present");
+    fn resource_requirements_from_cli_uses_presence_for_default_gpu() {
+        let requirements = resource_requirements_from_cli(None, true, None, None)
+            .expect("resource requirements should be present");
+        let gpu = requirements.gpu.expect("GPU requirement should be present");
 
-        assert!(request.device_id.is_empty());
-        assert_eq!(request.count, None);
+        assert!(gpu.device_ids.is_empty());
+        assert_eq!(gpu.count, None);
     }
 
     #[test]
-    fn gpu_request_from_cli_maps_gpu_device_to_one_device_id() {
-        let request = gpu_request_from_cli(true, Some("0000:2d:00.0"), None)
-            .expect("gpu request should be present");
+    fn resource_requirements_from_cli_maps_gpu_device_to_one_device_id() {
+        let requirements = resource_requirements_from_cli(None, false, Some("0000:2d:00.0"), None)
+            .expect("resource requirements should be present");
+        let gpu = requirements.gpu.expect("GPU requirement should be present");
 
-        assert_eq!(request.device_id, vec!["0000:2d:00.0"]);
-        assert_eq!(request.count, None);
+        assert_eq!(gpu.device_ids, vec!["0000:2d:00.0"]);
+        assert_eq!(gpu.count, None);
     }
 
     #[test]
-    fn gpu_request_from_cli_maps_gpu_count() {
-        let request = gpu_request_from_cli(true, None, Some(2)).expect("gpu request should exist");
+    fn resource_requirements_from_cli_maps_gpu_count() {
+        let requirements = resource_requirements_from_cli(None, false, None, Some(2))
+            .expect("requirements should exist");
+        let gpu = requirements.gpu.expect("GPU requirement should be present");
 
-        assert!(request.device_id.is_empty());
-        assert_eq!(request.count, Some(2));
+        assert!(gpu.device_ids.is_empty());
+        assert_eq!(gpu.count, Some(2));
     }
 
     #[test]
-    fn gpu_request_from_cli_preserves_device_and_gpu_count_for_gateway_validation() {
-        let request = gpu_request_from_cli(true, Some("nvidia.com/gpu=0"), Some(2))
-            .expect("gpu request should exist");
+    fn resource_requirements_from_cli_preserves_device_and_gpu_count_for_gateway_validation() {
+        let requirements =
+            resource_requirements_from_cli(None, false, Some("nvidia.com/gpu=0"), Some(2))
+                .expect("requirements should exist");
+        let gpu = requirements.gpu.expect("GPU requirement should be present");
 
-        assert_eq!(request.device_id, vec!["nvidia.com/gpu=0"]);
-        assert_eq!(request.count, Some(2));
+        assert_eq!(gpu.device_ids, vec!["nvidia.com/gpu=0"]);
+        assert_eq!(gpu.count, Some(2));
     }
 
     #[test]
-    fn gpu_request_from_cli_omits_gpu_request_when_not_requested() {
-        assert!(gpu_request_from_cli(false, Some("0"), None).is_none());
+    fn resource_requirements_from_cli_omits_gpu_request_when_not_requested() {
+        assert!(resource_requirements_from_cli(None, false, Some(""), None).is_none());
+    }
+
+    #[test]
+    fn resource_requirements_from_cli_infers_gpu_from_image() {
+        let requirements = resource_requirements_from_cli(
+            Some("ghcr.io/nvidia/openshell-community/sandboxes/nvidia-gpu:latest"),
+            false,
+            None,
+            None,
+        )
+        .expect("resource requirements should be present");
+        let gpu = requirements.gpu.expect("GPU requirement should be present");
+
+        assert!(gpu.device_ids.is_empty());
+        assert_eq!(gpu.count, None);
     }
 
     #[test]
diff --git a/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs b/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
index e25d7df8a..ea08abb4f 100644
--- a/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
+++ b/crates/openshell-cli/tests/sandbox_create_lifecycle_integration.rs
@@ -907,6 +907,7 @@ async fn sandbox_create_sends_gpu_device_request_without_gpu_flag() {
         None,
         None,
         None,
+        None,
         &[],
         None,
         None,
@@ -924,10 +925,11 @@ async fn sandbox_create_sends_gpu_device_request_without_gpu_flag() {
     let gpu = requests[0]
         .spec
         .as_ref()
-        .and_then(|spec| spec.gpu.as_ref())
+        .and_then(|spec| spec.resource_requirements.as_ref())
+        .and_then(|requirements| requirements.gpu.as_ref())
         .expect("GPU request should be sent");
 
-    assert_eq!(gpu.device_id, vec!["nvidia.com/gpu=0"]);
+    assert_eq!(gpu.device_ids, vec!["nvidia.com/gpu=0"]);
     assert_eq!(gpu.count, None);
 }
 
@@ -970,10 +972,11 @@ async fn sandbox_create_sends_gpu_count_request() {
     let gpu = requests[0]
         .spec
         .as_ref()
-        .and_then(|spec| spec.gpu.as_ref())
+        .and_then(|spec| spec.resource_requirements.as_ref())
+        .and_then(|requirements| requirements.gpu.as_ref())
         .expect("GPU request should be sent");
 
-    assert!(gpu.device_id.is_empty());
+    assert!(gpu.device_ids.is_empty());
     assert_eq!(gpu.count, Some(2));
 }
 
diff --git a/crates/openshell-core/src/gpu.rs b/crates/openshell-core/src/gpu.rs
index 9c6eed8cd..59e1ca3f3 100644
--- a/crates/openshell-core/src/gpu.rs
+++ b/crates/openshell-core/src/gpu.rs
@@ -4,23 +4,26 @@
 //! Shared GPU request helpers.
 
 use crate::config::CDI_GPU_DEVICE_ALL;
-use crate::proto::compute::v1::{DriverSandboxSpec, GpuRequestSpec};
+use crate::proto::compute::v1::{DriverGpuResourceRequirement, DriverSandboxSpec};
 
-/// Extract the driver GPU request from a sandbox spec.
+/// Extract the driver GPU requirement from a sandbox spec.
 #[must_use]
-pub fn driver_gpu_request(spec: &DriverSandboxSpec) -> Option<&GpuRequestSpec> {
-    spec.gpu.as_ref()
+pub fn driver_gpu_requirement(spec: &DriverSandboxSpec) -> Option<&DriverGpuResourceRequirement> {
+    spec.resource_requirements
+        .as_ref()
+        .and_then(|requirements| requirements.gpu.as_ref())
 }
 
 /// Resolve a driver GPU request into CDI device identifiers.
 ///
 /// `None` means no GPU was requested. Presence with no explicit device IDs
-/// uses the CDI all-GPU request; otherwise the driver-native IDs pass through.
+/// uses the CDI all-GPU request ([`CDI_GPU_DEVICE_ALL`]), the default GPU selection;
+/// otherwise the driver-native IDs pass through.
 #[must_use]
-pub fn cdi_gpu_device_ids(gpu: Option<&GpuRequestSpec>) -> Option<Vec<String>> {
+pub fn cdi_gpu_device_ids(gpu: Option<&DriverGpuResourceRequirement>) -> Option<Vec<String>> {
     match gpu {
-        Some(gpu) if gpu.device_id.is_empty() => Some(vec![CDI_GPU_DEVICE_ALL.to_string()]),
-        Some(gpu) => Some(gpu.device_id.clone()),
+        Some(gpu) if gpu.device_ids.is_empty() => Some(vec![CDI_GPU_DEVICE_ALL.to_string()]),
+        Some(gpu) => Some(gpu.device_ids.clone()),
         None => None,
     }
 }
@@ -36,8 +39,8 @@ mod tests {
 
     #[test]
     fn cdi_gpu_device_ids_defaults_empty_request_to_all_gpus() {
-        let request = GpuRequestSpec {
-            device_id: vec![],
+        let request = DriverGpuResourceRequirement {
+            device_ids: vec![],
             count: None,
         };
 
@@ -49,8 +52,8 @@ mod tests {
 
     #[test]
     fn cdi_gpu_device_ids_passes_single_device_id_through() {
-        let request = GpuRequestSpec {
-            device_id: vec!["nvidia.com/gpu=0".to_string()],
+        let request = DriverGpuResourceRequirement {
+            device_ids: vec!["nvidia.com/gpu=0".to_string()],
             count: None,
         };
 
@@ -62,8 +65,8 @@ mod tests {
 
     #[test]
     fn cdi_gpu_device_ids_passes_multiple_device_ids_through() {
-        let request = GpuRequestSpec {
-            device_id: vec![
+        let request = DriverGpuResourceRequirement {
+            device_ids: vec![
                 "nvidia.com/gpu=0".to_string(),
                 "nvidia.com/gpu=1".to_string(),
             ],
diff --git a/crates/openshell-driver-docker/README.md b/crates/openshell-driver-docker/README.md
index df4069059..b44c7056f 100644
--- a/crates/openshell-driver-docker/README.md
+++ b/crates/openshell-driver-docker/README.md
@@ -32,7 +32,7 @@ contract:
 | `apparmor=unconfined` | Avoids Docker's default profile blocking required mount operations. |
 | `restart_policy = unless-stopped` | Keeps managed sandboxes resumable across daemon or gateway restarts. |
 | `PidsLimit` | Enforces the sandbox PID budget at the Docker cgroup layer. Set `[openshell.drivers.docker].sandbox_pids_limit = 0` to inherit the Docker/runtime default. |
-| CDI GPU request | Uses explicit GPU request device IDs when set; otherwise requests all NVIDIA GPUs when the sandbox spec asks for GPU support and daemon CDI support is detected. Count-based GPU requests are rejected until Docker CDI selection can map counts to concrete devices. |
+| CDI GPU request | Uses explicit `resource_requirements.gpu.device_ids` when set; otherwise requests all NVIDIA GPUs when `resource_requirements.gpu` is present and daemon CDI support is detected. Count-based GPU requests are rejected until Docker CDI selection can map counts to concrete devices. |
 
 The agent child process does not retain these supervisor privileges.
 
diff --git a/crates/openshell-driver-docker/src/lib.rs b/crates/openshell-driver-docker/src/lib.rs
index e7c8d77c3..4f12a3110 100644
--- a/crates/openshell-driver-docker/src/lib.rs
+++ b/crates/openshell-driver-docker/src/lib.rs
@@ -25,16 +25,16 @@ use openshell_core::driver_utils::{
     LABEL_MANAGED_BY, LABEL_MANAGED_BY_VALUE, LABEL_SANDBOX_ID, LABEL_SANDBOX_NAME,
     LABEL_SANDBOX_NAMESPACE, SUPERVISOR_IMAGE_BINARY_PATH,
 };
-use openshell_core::gpu::{cdi_gpu_device_ids, driver_gpu_request};
+use openshell_core::gpu::{cdi_gpu_device_ids, driver_gpu_requirement};
 use openshell_core::progress::{
     PROGRESS_STEP_PULLING_IMAGE, PROGRESS_STEP_REQUESTING_SANDBOX, PROGRESS_STEP_STARTING_SANDBOX,
     format_bytes, mark_progress_active, mark_progress_complete, mark_progress_detail,
 };
 use openshell_core::proto::compute::v1::{
     CreateSandboxRequest, CreateSandboxResponse, DeleteSandboxRequest, DeleteSandboxResponse,
-    DriverCondition, DriverPlatformEvent, DriverSandbox, DriverSandboxStatus,
-    DriverSandboxTemplate, GetCapabilitiesRequest, GetCapabilitiesResponse, GetSandboxRequest,
-    GetSandboxResponse, GpuRequestSpec, ListSandboxesRequest, ListSandboxesResponse,
+    DriverCondition, DriverGpuResourceRequirement, DriverPlatformEvent, DriverSandbox,
+    DriverSandboxStatus, DriverSandboxTemplate, GetCapabilitiesRequest, GetCapabilitiesResponse,
+    GetSandboxRequest, GetSandboxResponse, ListSandboxesRequest, ListSandboxesResponse,
     StopSandboxRequest, StopSandboxResponse, ValidateSandboxCreateRequest,
     ValidateSandboxCreateResponse, WatchSandboxesDeletedEvent, WatchSandboxesEvent,
     WatchSandboxesPlatformEvent, WatchSandboxesRequest, WatchSandboxesSandboxEvent,
@@ -375,7 +375,7 @@ impl DockerComputeDriver {
                 "docker sandboxes require a template image",
             ));
         }
-        Self::validate_gpu_request(driver_gpu_request(spec), config.supports_gpu)?;
+        Self::validate_gpu_request(driver_gpu_requirement(spec), config.supports_gpu)?;
         if !template.agent_socket_path.trim().is_empty() {
             return Err(Status::failed_precondition(
                 "docker compute driver does not support template.agent_socket_path",
@@ -410,7 +410,7 @@ impl DockerComputeDriver {
     }
 
     fn validate_gpu_request(
-        gpu: Option<&GpuRequestSpec>,
+        gpu: Option<&DriverGpuResourceRequirement>,
         supports_gpu: bool,
     ) -> Result<(), Status> {
         if gpu.is_some_and(|gpu| gpu.count.is_some()) {
@@ -1721,7 +1721,9 @@ fn build_environment(sandbox: &DriverSandbox, config: &DockerDriverRuntimeConfig
         .collect()
 }
 
-fn docker_gpu_device_requests(gpu: Option<&GpuRequestSpec>) -> Option<Vec<DeviceRequest>> {
+fn docker_gpu_device_requests(
+    gpu: Option<&DriverGpuResourceRequirement>,
+) -> Option<Vec<DeviceRequest>> {
     cdi_gpu_device_ids(gpu).map(|device_ids| {
         vec![DeviceRequest {
             driver: Some("cdi".to_string()),
@@ -1773,7 +1775,7 @@ fn build_container_create_body(
             nano_cpus: resource_limits.nano_cpus,
             memory: resource_limits.memory_bytes,
             pids_limit: docker_pids_limit(config.sandbox_pids_limit)?,
-            device_requests: docker_gpu_device_requests(driver_gpu_request(spec)),
+            device_requests: docker_gpu_device_requests(driver_gpu_requirement(spec)),
             binds: Some(build_binds(sandbox, config)?),
             restart_policy: Some(RestartPolicy {
                 name: Some(RestartPolicyNameEnum::UNLESS_STOPPED),
diff --git a/crates/openshell-driver-docker/src/tests.rs b/crates/openshell-driver-docker/src/tests.rs
index 07a68177e..308605fae 100644
--- a/crates/openshell-driver-docker/src/tests.rs
+++ b/crates/openshell-driver-docker/src/tests.rs
@@ -13,7 +13,8 @@ use openshell_core::progress::{
     PROGRESS_STEP_STARTING_SANDBOX,
 };
 use openshell_core::proto::compute::v1::{
-    DriverResourceRequirements, DriverSandboxSpec, DriverSandboxTemplate, GpuRequestSpec,
+    DriverGpuResourceRequirement, DriverResourceRequirements, DriverSandboxResourceRequirements,
+    DriverSandboxSpec, DriverSandboxTemplate,
 };
 use std::fs;
 use std::net::{IpAddr, Ipv4Addr, SocketAddr};
@@ -23,6 +24,15 @@ use tempfile::TempDir;
 const TLS_MOUNT_DIR: &str = "/etc/openshell/tls/client";
 static ENV_LOCK: LazyLock<Mutex<()>> = LazyLock::new(|| Mutex::new(()));
 
+fn gpu_resource_requirements(
+    device_ids: Vec<String>,
+    count: Option<u32>,
+) -> DriverSandboxResourceRequirements {
+    DriverSandboxResourceRequirements {
+        gpu: Some(DriverGpuResourceRequirement { device_ids, count }),
+    }
+}
+
 fn test_sandbox() -> DriverSandbox {
     // Mirrors the gateway-supplied request: the public `Sandbox` API no
     // longer carries `namespace`, so the gateway elides the field and the
@@ -42,8 +52,8 @@ fn test_sandbox() -> DriverSandbox {
                 resources: None,
                 platform_config: None,
             }),
-            gpu: None,
             sandbox_token: String::new(),
+            resource_requirements: None,
         }),
         status: None,
     }
@@ -604,10 +614,8 @@ fn build_container_create_body_clears_inherited_cmd() {
 fn validate_sandbox_rejects_gpu_when_cdi_unavailable() {
     let config = runtime_config();
     let mut sandbox = test_sandbox();
-    sandbox.spec.as_mut().unwrap().gpu = Some(GpuRequestSpec {
-        device_id: vec![],
-        count: None,
-    });
+    sandbox.spec.as_mut().unwrap().resource_requirements =
+        Some(gpu_resource_requirements(vec![], None));
 
     let err = DockerComputeDriver::validate_sandbox(&sandbox, &config).unwrap_err();
 
@@ -620,10 +628,8 @@ fn validate_sandbox_rejects_gpu_count() {
     let mut config = runtime_config();
     config.supports_gpu = true;
     let mut sandbox = test_sandbox();
-    sandbox.spec.as_mut().unwrap().gpu = Some(GpuRequestSpec {
-        device_id: vec![],
-        count: Some(2),
-    });
+    sandbox.spec.as_mut().unwrap().resource_requirements =
+        Some(gpu_resource_requirements(vec![], Some(2)));
 
     let err = DockerComputeDriver::validate_sandbox(&sandbox, &config).unwrap_err();
 
@@ -658,10 +664,8 @@ fn build_container_create_body_maps_gpu_to_all_cdi_device() {
     let mut config = runtime_config();
     config.supports_gpu = true;
     let mut sandbox = test_sandbox();
-    sandbox.spec.as_mut().unwrap().gpu = Some(GpuRequestSpec {
-        device_id: vec![],
-        count: None,
-    });
+    sandbox.spec.as_mut().unwrap().resource_requirements =
+        Some(gpu_resource_requirements(vec![], None));
 
     let create_body = build_container_create_body(&sandbox, &config).unwrap();
     let request = create_body
@@ -683,13 +687,13 @@ fn build_container_create_body_passes_explicit_cdi_device_ids_through() {
     let mut config = runtime_config();
     config.supports_gpu = true;
     let mut sandbox = test_sandbox();
-    sandbox.spec.as_mut().unwrap().gpu = Some(GpuRequestSpec {
-        device_id: vec![
+    sandbox.spec.as_mut().unwrap().resource_requirements = Some(gpu_resource_requirements(
+        vec![
             "nvidia.com/gpu=0".to_string(),
             "nvidia.com/gpu=1".to_string(),
         ],
-        count: None,
-    });
+        None,
+    ));
 
     let create_body = build_container_create_body(&sandbox, &config).unwrap();
     let request = create_body
diff --git a/crates/openshell-driver-kubernetes/README.md b/crates/openshell-driver-kubernetes/README.md
index 329cde120..a57b7453d 100644
--- a/crates/openshell-driver-kubernetes/README.md
+++ b/crates/openshell-driver-kubernetes/README.md
@@ -49,7 +49,7 @@ pods do not need direct external ingress for SSH.
 
 ## GPU Support
 
-When a sandbox requests GPU support, the driver checks node allocatable capacity
-for `nvidia.com/gpu` and sets the workload's `nvidia.com/gpu` resource limit.
-Requests without an explicit count use one GPU. The sandbox image must provide
-the user-space libraries needed by the agent workload.
+When `resource_requirements.gpu` is present, the driver checks node allocatable
+capacity for `nvidia.com/gpu` and sets the workload's `nvidia.com/gpu` resource
+limit. Requests without an explicit count use one GPU, and explicit device IDs
+are rejected. The sandbox image must provide the user-space libraries needed by the agent workload.
diff --git a/crates/openshell-driver-kubernetes/src/driver.rs b/crates/openshell-driver-kubernetes/src/driver.rs
index d35046b82..35df394a9 100644
--- a/crates/openshell-driver-kubernetes/src/driver.rs
+++ b/crates/openshell-driver-kubernetes/src/driver.rs
@@ -17,17 +17,18 @@ use kube::{Client, Error as KubeError};
 use openshell_core::driver_utils::{
     LABEL_MANAGED_BY, LABEL_MANAGED_BY_VALUE, LABEL_SANDBOX_ID, SUPERVISOR_IMAGE_BINARY_PATH,
 };
-use openshell_core::gpu::driver_gpu_request;
+use openshell_core::gpu::driver_gpu_requirement;
 use openshell_core::progress::{
     PROGRESS_STEP_PULLING_IMAGE, PROGRESS_STEP_REQUESTING_SANDBOX, PROGRESS_STEP_STARTING_SANDBOX,
     format_bytes, mark_progress_active, mark_progress_complete, mark_progress_detail,
 };
 use openshell_core::proto::compute::v1::{
-    DriverCondition as SandboxCondition, DriverPlatformEvent as PlatformEvent,
-    DriverSandbox as Sandbox, DriverSandboxSpec as SandboxSpec,
-    DriverSandboxStatus as SandboxStatus, DriverSandboxTemplate as SandboxTemplate,
-    GetCapabilitiesResponse, GpuRequestSpec, WatchSandboxesDeletedEvent, WatchSandboxesEvent,
-    WatchSandboxesPlatformEvent, WatchSandboxesSandboxEvent, watch_sandboxes_event,
+    DriverCondition as SandboxCondition, DriverGpuResourceRequirement,
+    DriverPlatformEvent as PlatformEvent, DriverSandbox as Sandbox,
+    DriverSandboxSpec as SandboxSpec, DriverSandboxStatus as SandboxStatus,
+    DriverSandboxTemplate as SandboxTemplate, GetCapabilitiesResponse, WatchSandboxesDeletedEvent,
+    WatchSandboxesEvent, WatchSandboxesPlatformEvent, WatchSandboxesSandboxEvent,
+    watch_sandboxes_event,
 };
 use std::collections::BTreeMap;
 use std::pin::Pin;
@@ -79,9 +80,23 @@ pub const SANDBOX_KIND: &str = "Sandbox";
 
 const GPU_RESOURCE_NAME: &str = "nvidia.com/gpu";
 const DEFAULT_GPU_COUNT: u32 = 1;
+const EXPLICIT_GPU_DEVICE_IDS_UNSUPPORTED_MESSAGE: &str =
+    "kubernetes compute driver does not support explicit GPU device IDs";
 
-fn gpu_has_explicit_device_ids(gpu: Option<&GpuRequestSpec>) -> bool {
-    gpu.is_some_and(|gpu| !gpu.device_id.is_empty())
+fn gpu_has_explicit_device_ids(gpu: Option<&DriverGpuResourceRequirement>) -> bool {
+    gpu.is_some_and(|gpu| !gpu.device_ids.is_empty())
+}
+
+#[allow(clippy::result_large_err)]
+fn validate_gpu_request_shape(
+    gpu: Option<&DriverGpuResourceRequirement>,
+) -> Result<(), tonic::Status> {
+    if gpu_has_explicit_device_ids(gpu) {
+        return Err(tonic::Status::invalid_argument(
+            EXPLICIT_GPU_DEVICE_IDS_UNSUPPORTED_MESSAGE,
+        ));
+    }
+    Ok(())
 }
 
 // ---------------------------------------------------------------------------
@@ -208,19 +223,15 @@ impl KubernetesComputeDriver {
     }
 
     pub async fn validate_sandbox_create(&self, sandbox: &Sandbox) -> Result<(), tonic::Status> {
-        let gpu = sandbox.spec.as_ref().and_then(driver_gpu_request);
+        let gpu = sandbox.spec.as_ref().and_then(driver_gpu_requirement);
         self.validate_gpu_request(gpu).await
     }
 
     async fn validate_gpu_request(
         &self,
-        gpu: Option<&GpuRequestSpec>,
+        gpu: Option<&DriverGpuResourceRequirement>,
     ) -> Result<(), tonic::Status> {
-        if gpu_has_explicit_device_ids(gpu) {
-            return Err(tonic::Status::invalid_argument(
-                "kubernetes compute driver does not support explicit GPU device IDs",
-            ));
-        }
+        validate_gpu_request_shape(gpu)?;
         if gpu.is_some()
             && !self.has_gpu_capacity().await.map_err(|err| {
                 tonic::Status::internal(format!("check GPU node capacity failed: {err}"))
@@ -313,11 +324,11 @@ impl KubernetesComputeDriver {
     }
 
     pub async fn create_sandbox(&self, sandbox: &Sandbox) -> Result<(), KubernetesDriverError> {
-        if let Some(gpu) = sandbox.spec.as_ref().and_then(driver_gpu_request)
+        if let Some(gpu) = sandbox.spec.as_ref().and_then(driver_gpu_requirement)
             && gpu_has_explicit_device_ids(Some(gpu))
         {
             return Err(KubernetesDriverError::Precondition(
-                "kubernetes compute driver does not support explicit GPU device IDs".to_string(),
+                EXPLICIT_GPU_DEVICE_IDS_UNSUPPORTED_MESSAGE.to_string(),
             ));
         }
 
@@ -1132,7 +1143,7 @@ fn sandbox_to_k8s_spec(
                 "podTemplate".to_string(),
                 sandbox_template_to_k8s(
                     template,
-                    driver_gpu_request(spec),
+                    driver_gpu_requirement(spec),
                     &pod_env,
                     inject_workspace,
                     params,
@@ -1168,7 +1179,7 @@ fn sandbox_to_k8s_spec(
             "podTemplate".to_string(),
             sandbox_template_to_k8s(
                 &SandboxTemplate::default(),
-                spec.and_then(|s| s.gpu.as_ref()),
+                spec.and_then(driver_gpu_requirement),
                 &pod_env,
                 inject_workspace,
                 params,
@@ -1183,7 +1194,7 @@ fn sandbox_to_k8s_spec(
 
 fn sandbox_template_to_k8s(
     template: &SandboxTemplate,
-    gpu: Option<&GpuRequestSpec>,
+    gpu: Option<&DriverGpuResourceRequirement>,
     spec_environment: &std::collections::HashMap<String, String>,
     inject_workspace: bool,
     params: &SandboxPodParams<'_>,
@@ -1424,7 +1435,7 @@ fn image_pull_secret_refs(secrets: &[String]) -> Vec<serde_json::Value> {
 
 fn container_resources(
     template: &SandboxTemplate,
-    gpu: Option<&GpuRequestSpec>,
+    gpu: Option<&DriverGpuResourceRequirement>,
 ) -> Option<serde_json::Value> {
     // Start from the raw resources passthrough in platform_config (preserves
     // custom resource types like GPU limits that users set via the public API
@@ -1724,13 +1735,31 @@ mod tests {
     static ENV_LOCK: std::sync::LazyLock<std::sync::Mutex<()>> =
         std::sync::LazyLock::new(|| std::sync::Mutex::new(()));
 
-    fn gpu_request(count: Option<u32>) -> GpuRequestSpec {
-        GpuRequestSpec {
-            device_id: vec![],
+    fn gpu_request(count: Option<u32>) -> DriverGpuResourceRequirement {
+        DriverGpuResourceRequirement {
+            device_ids: vec![],
             count,
         }
     }
 
+    fn default_gpu_request() -> DriverGpuResourceRequirement {
+        gpu_request(None)
+    }
+
+    #[test]
+    fn validate_gpu_request_shape_rejects_explicit_device_ids() {
+        let gpu = DriverGpuResourceRequirement {
+            device_ids: vec!["nvidia.com/gpu=0".to_string()],
+            count: None,
+        };
+
+        let err = validate_gpu_request_shape(Some(&gpu))
+            .expect_err("explicit GPU device IDs should be rejected");
+
+        assert_eq!(err.code(), tonic::Code::InvalidArgument);
+        assert_eq!(err.message(), EXPLICIT_GPU_DEVICE_IDS_UNSUPPORTED_MESSAGE);
+    }
+
     #[test]
     fn kube_pulling_event_adds_image_progress_metadata() {
         let mut metadata = std::collections::HashMap::new();
@@ -2042,7 +2071,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &SandboxTemplate::default(),
-                Some(&gpu_request(None)),
+                Some(&default_gpu_request()),
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2078,21 +2107,6 @@ mod tests {
         );
     }
 
-    #[test]
-    fn gpu_has_explicit_device_ids_only_when_ids_are_present() {
-        use openshell_core::proto::compute::v1::GpuRequestSpec;
-
-        assert!(!gpu_has_explicit_device_ids(None));
-        assert!(!gpu_has_explicit_device_ids(Some(&GpuRequestSpec {
-            device_id: vec![],
-            count: None,
-        })));
-        assert!(gpu_has_explicit_device_ids(Some(&GpuRequestSpec {
-            device_id: vec!["nvidia.com/gpu=0".to_string()],
-            count: None,
-        })));
-    }
-
     #[test]
     fn gpu_sandbox_uses_template_runtime_class_name_when_set() {
         let template = SandboxTemplate {
@@ -2112,7 +2126,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                Some(&gpu_request(None)),
+                Some(&default_gpu_request()),
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2167,7 +2181,7 @@ mod tests {
             };
             sandbox_template_to_k8s(
                 &template,
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2202,7 +2216,7 @@ mod tests {
             };
             sandbox_template_to_k8s(
                 &template,
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2222,7 +2236,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                false,
+                None,
                 &std::collections::HashMap::new(),
                 true,
                 &params,
@@ -2250,7 +2264,7 @@ mod tests {
             let params = SandboxPodParams::default();
             sandbox_template_to_k8s(
                 &template,
-                Some(&gpu_request(None)),
+                Some(&default_gpu_request()),
                 &std::collections::HashMap::new(),
                 true,
                 &params,
diff --git a/crates/openshell-driver-podman/README.md b/crates/openshell-driver-podman/README.md
index e4183f75b..7bca6e653 100644
--- a/crates/openshell-driver-podman/README.md
+++ b/crates/openshell-driver-podman/README.md
@@ -46,7 +46,7 @@ The container spec in `container.rs` sets these security-critical fields:
 | `no_new_privileges` | `true` | Prevents privilege escalation after exec. |
 | `seccomp_profile_path` | `unconfined` | The supervisor installs its own policy-aware BPF filter. A container-level profile can block Landlock/seccomp syscalls during setup. |
 | `mounts` | Private tmpfs at `/run/netns` | Lets the supervisor create named network namespaces in rootless Podman. |
-| CDI GPU devices | Explicit GPU request device IDs when set, otherwise all NVIDIA GPUs | Exposes requested GPUs to GPU-enabled sandbox containers. Count-based GPU requests are rejected until Podman CDI selection can map counts to concrete devices. |
+| CDI GPU devices | Explicit `resource_requirements.gpu.device_ids` when set, otherwise all NVIDIA GPUs | Exposes requested GPUs to GPU-enabled sandbox containers. Count-based GPU requests are rejected until Podman CDI selection can map counts to concrete devices. |
 
 The restricted agent child does not retain these supervisor privileges.
 
diff --git a/crates/openshell-driver-podman/src/container.rs b/crates/openshell-driver-podman/src/container.rs
index 3c2bd7791..a392fd772 100644
--- a/crates/openshell-driver-podman/src/container.rs
+++ b/crates/openshell-driver-podman/src/container.rs
@@ -4,7 +4,7 @@
 //! Container spec construction for the Podman driver.
 
 use crate::config::PodmanComputeConfig;
-use openshell_core::gpu::{cdi_gpu_device_ids, driver_gpu_request};
+use openshell_core::gpu::{cdi_gpu_device_ids, driver_gpu_requirement};
 use openshell_core::proto::compute::v1::DriverSandbox;
 use serde::Serialize;
 use serde_json::Value;
@@ -379,7 +379,7 @@ fn podman_pids_limit(value: i64) -> Option<i64> {
 
 /// Build CDI GPU device list if GPU is requested.
 fn build_devices(sandbox: &DriverSandbox) -> Option<Vec<LinuxDevice>> {
-    let gpu = sandbox.spec.as_ref().and_then(driver_gpu_request);
+    let gpu = sandbox.spec.as_ref().and_then(driver_gpu_requirement);
     cdi_gpu_device_ids(gpu).map(|device_ids| {
         device_ids
             .into_iter()
@@ -699,6 +699,13 @@ mod tests {
     static ENV_LOCK: std::sync::LazyLock<std::sync::Mutex<()>> =
         std::sync::LazyLock::new(|| std::sync::Mutex::new(()));
 
+    fn default_gpu_request() -> openshell_core::proto::compute::v1::DriverGpuResourceRequirement {
+        openshell_core::proto::compute::v1::DriverGpuResourceRequirement {
+            device_ids: vec![],
+            count: None,
+        }
+    }
+
     #[test]
     fn parse_cpu_millicore() {
         assert_eq!(parse_cpu_to_microseconds("500m"), Some(50_000));
@@ -808,13 +815,14 @@ mod tests {
     #[test]
     fn container_spec_maps_empty_gpu_request_to_all_cdi_device() {
         use openshell_core::config::CDI_GPU_DEVICE_ALL;
-        use openshell_core::proto::compute::v1::{DriverSandboxSpec, GpuRequestSpec};
+        use openshell_core::proto::compute::v1::{
+            DriverSandboxResourceRequirements, DriverSandboxSpec,
+        };
 
         let mut sandbox = test_sandbox("test-id", "test-name");
         sandbox.spec = Some(DriverSandboxSpec {
-            gpu: Some(GpuRequestSpec {
-                device_id: vec![],
-                count: None,
+            resource_requirements: Some(DriverSandboxResourceRequirements {
+                gpu: Some(default_gpu_request()),
             }),
             ..Default::default()
         });
@@ -829,13 +837,17 @@ mod tests {
 
     #[test]
     fn container_spec_passes_explicit_cdi_device_id_through() {
-        use openshell_core::proto::compute::v1::{DriverSandboxSpec, GpuRequestSpec};
+        use openshell_core::proto::compute::v1::{
+            DriverGpuResourceRequirement, DriverSandboxResourceRequirements, DriverSandboxSpec,
+        };
 
         let mut sandbox = test_sandbox("test-id", "test-name");
         sandbox.spec = Some(DriverSandboxSpec {
-            gpu: Some(GpuRequestSpec {
-                device_id: vec!["nvidia.com/gpu=0".to_string()],
-                count: None,
+            resource_requirements: Some(DriverSandboxResourceRequirements {
+                gpu: Some(DriverGpuResourceRequirement {
+                    device_ids: vec!["nvidia.com/gpu=0".to_string()],
+                    count: None,
+                }),
             }),
             ..Default::default()
         });
diff --git a/crates/openshell-driver-podman/src/driver.rs b/crates/openshell-driver-podman/src/driver.rs
index 9593c4b87..c14fade65 100644
--- a/crates/openshell-driver-podman/src/driver.rs
+++ b/crates/openshell-driver-podman/src/driver.rs
@@ -10,8 +10,10 @@ use crate::watcher::{
     self, WatchStream, driver_sandbox_from_inspect, driver_sandbox_from_list_entry,
 };
 use openshell_core::ComputeDriverError;
-use openshell_core::gpu::driver_gpu_request;
-use openshell_core::proto::compute::v1::{DriverSandbox, GetCapabilitiesResponse, GpuRequestSpec};
+use openshell_core::gpu::driver_gpu_requirement;
+use openshell_core::proto::compute::v1::{
+    DriverGpuResourceRequirement, DriverSandbox, GetCapabilitiesResponse,
+};
 use std::path::PathBuf;
 use std::time::Duration;
 use tracing::{info, warn};
@@ -281,11 +283,13 @@ impl PodmanComputeDriver {
         &self,
         sandbox: &DriverSandbox,
     ) -> Result<(), ComputeDriverError> {
-        let gpu = sandbox.spec.as_ref().and_then(driver_gpu_request);
+        let gpu = sandbox.spec.as_ref().and_then(driver_gpu_requirement);
         Self::validate_gpu_request(gpu)
     }
 
-    fn validate_gpu_request(gpu: Option<&GpuRequestSpec>) -> Result<(), ComputeDriverError> {
+    fn validate_gpu_request(
+        gpu: Option<&DriverGpuResourceRequirement>,
+    ) -> Result<(), ComputeDriverError> {
         if gpu.is_some_and(|gpu| gpu.count.is_some()) {
             return Err(ComputeDriverError::Precondition(
                 "podman compute driver does not support GPU count requests".to_string(),
@@ -676,8 +680,8 @@ mod tests {
 
     #[test]
     fn validate_gpu_request_rejects_count() {
-        let err = PodmanComputeDriver::validate_gpu_request(Some(&GpuRequestSpec {
-            device_id: vec![],
+        let err = PodmanComputeDriver::validate_gpu_request(Some(&DriverGpuResourceRequirement {
+            device_ids: vec![],
             count: Some(2),
         }))
         .expect_err("GPU count should be rejected");
diff --git a/crates/openshell-driver-vm/README.md b/crates/openshell-driver-vm/README.md
index 724bde06c..c5860f9cd 100644
--- a/crates/openshell-driver-vm/README.md
+++ b/crates/openshell-driver-vm/README.md
@@ -52,8 +52,9 @@ sudo -E env "PATH=$PATH" mise run gateway:vm -- --gpu
 ```
 
 GPU passthrough uses VFIO and requires host support for IOMMU, root privileges
-for bind/unbind operations, and a compatible sandbox image. The public GPU
-overview lives in the repository `README.md`.
+for bind/unbind operations, and a compatible sandbox image. Sandbox GPU requests
+arrive as `resource_requirements.gpu`; the VM driver accepts a request with no
+device IDs or count, one explicit device ID, or a count of one.
 
 Point the CLI at the gateway with one of:
 
diff --git a/crates/openshell-driver-vm/src/driver.rs b/crates/openshell-driver-vm/src/driver.rs
index dc257eda7..759895dcd 100644
--- a/crates/openshell-driver-vm/src/driver.rs
+++ b/crates/openshell-driver-vm/src/driver.rs
@@ -24,20 +24,21 @@ use oci_client::manifest::{
 };
 use oci_client::secrets::RegistryAuth;
 use oci_client::{Reference, RegistryOperation};
-use openshell_core::gpu::driver_gpu_request;
+use openshell_core::gpu::driver_gpu_requirement;
 use openshell_core::progress::{
     PROGRESS_STEP_PULLING_IMAGE, PROGRESS_STEP_REQUESTING_SANDBOX, PROGRESS_STEP_STARTING_SANDBOX,
     format_bytes, mark_progress_active, mark_progress_complete, mark_progress_detail,
 };
 use openshell_core::proto::compute::v1::{
     CreateSandboxRequest, CreateSandboxResponse, DeleteSandboxRequest, DeleteSandboxResponse,
-    DriverCondition as SandboxCondition, DriverPlatformEvent as PlatformEvent,
-    DriverSandbox as Sandbox, DriverSandboxStatus as SandboxStatus, GetCapabilitiesRequest,
-    GetCapabilitiesResponse, GetSandboxRequest, GetSandboxResponse, GpuRequestSpec,
-    ListSandboxesRequest, ListSandboxesResponse, StopSandboxRequest, StopSandboxResponse,
-    ValidateSandboxCreateRequest, ValidateSandboxCreateResponse, WatchSandboxesDeletedEvent,
-    WatchSandboxesEvent, WatchSandboxesPlatformEvent, WatchSandboxesRequest,
-    WatchSandboxesSandboxEvent, compute_driver_server::ComputeDriver, watch_sandboxes_event,
+    DriverCondition as SandboxCondition, DriverGpuResourceRequirement,
+    DriverPlatformEvent as PlatformEvent, DriverSandbox as Sandbox,
+    DriverSandboxStatus as SandboxStatus, GetCapabilitiesRequest, GetCapabilitiesResponse,
+    GetSandboxRequest, GetSandboxResponse, ListSandboxesRequest, ListSandboxesResponse,
+    StopSandboxRequest, StopSandboxResponse, ValidateSandboxCreateRequest,
+    ValidateSandboxCreateResponse, WatchSandboxesDeletedEvent, WatchSandboxesEvent,
+    WatchSandboxesPlatformEvent, WatchSandboxesRequest, WatchSandboxesSandboxEvent,
+    compute_driver_server::ComputeDriver, watch_sandboxes_event,
 };
 use openshell_vfio::SysfsRoot;
 use prost::Message;
@@ -619,7 +620,8 @@ impl VmDriver {
         let gpu_device = sandbox
             .spec
             .as_ref()
-            .and_then(|spec| requested_gpu_device(driver_gpu_request(spec)));
+            .and_then(driver_gpu_requirement)
+            .and_then(|gpu| requested_gpu_device(Some(gpu)));
         let gpu_bdf = if let Some(gpu_device) = gpu_device {
             Some(self.assign_gpu_to_record(&sandbox.id, gpu_device).await?)
         } else {
@@ -2579,7 +2581,7 @@ fn validate_vm_sandbox(sandbox: &Sandbox, gpu_enabled: bool) -> Result<(), Statu
         .as_ref()
         .ok_or_else(|| Status::invalid_argument("sandbox spec is required"))?;
 
-    validate_gpu_request(driver_gpu_request(spec), gpu_enabled)?;
+    validate_gpu_request(driver_gpu_requirement(spec), gpu_enabled)?;
 
     if let Some(template) = spec.template.as_ref() {
         if !template.agent_socket_path.is_empty() {
@@ -2622,26 +2624,33 @@ fn validate_sandbox_id(sandbox_id: &str) -> Result<(), Status> {
     Ok(())
 }
 
-fn requested_gpu_device(gpu: Option<&GpuRequestSpec>) -> Option<&str> {
+fn requested_gpu_device(gpu: Option<&DriverGpuResourceRequirement>) -> Option<&str> {
     let gpu = gpu?;
-    Some(gpu.device_id.first().map_or("", String::as_str))
+    Some(gpu.device_ids.first().map_or("", String::as_str))
 }
 
 #[allow(clippy::result_large_err)]
-fn validate_gpu_request(gpu: Option<&GpuRequestSpec>, gpu_enabled: bool) -> Result<(), Status> {
-    if gpu.is_some() && !gpu_enabled {
+fn validate_gpu_request(
+    gpu: Option<&DriverGpuResourceRequirement>,
+    gpu_enabled: bool,
+) -> Result<(), Status> {
+    let Some(gpu) = gpu else {
+        return Ok(());
+    };
+
+    if !gpu_enabled {
         return Err(Status::failed_precondition(
             "GPU support is not enabled on this driver; start with --gpu",
         ));
     }
 
-    if gpu.is_some_and(|gpu| gpu.count.is_some_and(|count| count > 1)) {
+    if gpu.count.is_some_and(|count| count > 1) {
         return Err(Status::invalid_argument(
             "vm compute driver supports at most one GPU",
         ));
     }
 
-    if gpu.is_some_and(|gpu| gpu.device_id.len() > 1) {
+    if gpu.device_ids.len() > 1 {
         return Err(Status::invalid_argument(
             "vm compute driver supports at most one GPU device ID",
         ));
@@ -4433,7 +4442,8 @@ mod tests {
         PROGRESS_COMPLETE_STEP_KEY,
     };
     use openshell_core::proto::compute::v1::{
-        DriverSandboxSpec as SandboxSpec, DriverSandboxTemplate as SandboxTemplate, GpuRequestSpec,
+        DriverGpuResourceRequirement, DriverSandboxResourceRequirements,
+        DriverSandboxSpec as SandboxSpec, DriverSandboxTemplate as SandboxTemplate,
     };
     use prost_types::{Struct, Value, value::Kind};
     use std::fs;
@@ -4445,6 +4455,15 @@ mod tests {
     static ENV_LOCK: std::sync::LazyLock<std::sync::Mutex<()>> =
         std::sync::LazyLock::new(|| std::sync::Mutex::new(()));
 
+    fn gpu_resource_requirements(
+        device_ids: Vec<String>,
+        count: Option<u32>,
+    ) -> DriverSandboxResourceRequirements {
+        DriverSandboxResourceRequirements {
+            gpu: Some(DriverGpuResourceRequirement { device_ids, count }),
+        }
+    }
+
     #[test]
     fn vm_pulling_layer_event_adds_progress_detail_metadata() {
         let mut event = platform_event(
@@ -4512,10 +4531,7 @@ mod tests {
         let sandbox = Sandbox {
             id: "sandbox-123".to_string(),
             spec: Some(SandboxSpec {
-                gpu: Some(GpuRequestSpec {
-                    device_id: vec![],
-                    count: None,
-                }),
+                resource_requirements: Some(gpu_resource_requirements(vec![], None)),
                 ..Default::default()
             }),
             ..Default::default()
@@ -4531,10 +4547,7 @@ mod tests {
         let sandbox = Sandbox {
             id: "sandbox-123".to_string(),
             spec: Some(SandboxSpec {
-                gpu: Some(GpuRequestSpec {
-                    device_id: vec![],
-                    count: None,
-                }),
+                resource_requirements: Some(gpu_resource_requirements(vec![], None)),
                 ..Default::default()
             }),
             ..Default::default()
@@ -4547,10 +4560,7 @@ mod tests {
         let sandbox = Sandbox {
             id: "sandbox-123".to_string(),
             spec: Some(SandboxSpec {
-                gpu: Some(GpuRequestSpec {
-                    device_id: vec![],
-                    count: Some(1),
-                }),
+                resource_requirements: Some(gpu_resource_requirements(vec![], Some(1))),
                 ..Default::default()
             }),
             ..Default::default()
@@ -4563,10 +4573,7 @@ mod tests {
         let sandbox = Sandbox {
             id: "sandbox-123".to_string(),
             spec: Some(SandboxSpec {
-                gpu: Some(GpuRequestSpec {
-                    device_id: vec![],
-                    count: Some(2),
-                }),
+                resource_requirements: Some(gpu_resource_requirements(vec![], Some(2))),
                 ..Default::default()
             }),
             ..Default::default()
@@ -4582,10 +4589,10 @@ mod tests {
         let sandbox = Sandbox {
             id: "sandbox-123".to_string(),
             spec: Some(SandboxSpec {
-                gpu: Some(GpuRequestSpec {
-                    device_id: vec!["0000:2d:00.0".to_string(), "0000:3d:00.0".to_string()],
-                    count: None,
-                }),
+                resource_requirements: Some(gpu_resource_requirements(
+                    vec!["0000:2d:00.0".to_string(), "0000:3d:00.0".to_string()],
+                    None,
+                )),
                 ..Default::default()
             }),
             ..Default::default()
@@ -4603,8 +4610,8 @@ mod tests {
 
     #[test]
     fn requested_gpu_device_defaults_empty_request_to_inventory_choice() {
-        let gpu = GpuRequestSpec {
-            device_id: vec![],
+        let gpu = DriverGpuResourceRequirement {
+            device_ids: vec![],
             count: None,
         };
 
@@ -4613,8 +4620,8 @@ mod tests {
 
     #[test]
     fn requested_gpu_device_returns_first_explicit_device_id() {
-        let gpu = GpuRequestSpec {
-            device_id: vec!["0000:2d:00.0".to_string()],
+        let gpu = DriverGpuResourceRequirement {
+            device_ids: vec!["0000:2d:00.0".to_string()],
             count: None,
         };
 
diff --git a/crates/openshell-server/src/compute/mod.rs b/crates/openshell-server/src/compute/mod.rs
index ac85f7269..666a7174a 100644
--- a/crates/openshell-server/src/compute/mod.rs
+++ b/crates/openshell-server/src/compute/mod.rs
@@ -17,12 +17,13 @@ use crate::tracing_bus::TracingLogBus;
 use futures::{Stream, StreamExt};
 use openshell_core::ComputeDriverKind;
 use openshell_core::proto::compute::v1::{
-    CreateSandboxRequest, DeleteSandboxRequest, DriverCondition, DriverPlatformEvent,
-    DriverResourceRequirements, DriverSandbox, DriverSandboxSpec, DriverSandboxStatus,
-    DriverSandboxTemplate, GetCapabilitiesRequest, GetSandboxRequest,
-    GpuRequestSpec as DriverGpuRequestSpec, ListSandboxesRequest, ValidateSandboxCreateRequest,
-    WatchSandboxesEvent, WatchSandboxesRequest, compute_driver_client::ComputeDriverClient,
-    compute_driver_server::ComputeDriver, watch_sandboxes_event,
+    CreateSandboxRequest, DeleteSandboxRequest, DriverCondition, DriverGpuResourceRequirement,
+    DriverPlatformEvent, DriverResourceRequirements, DriverSandbox,
+    DriverSandboxResourceRequirements, DriverSandboxSpec, DriverSandboxStatus,
+    DriverSandboxTemplate, GetCapabilitiesRequest, GetSandboxRequest, ListSandboxesRequest,
+    ValidateSandboxCreateRequest, WatchSandboxesEvent, WatchSandboxesRequest,
+    compute_driver_client::ComputeDriverClient, compute_driver_server::ComputeDriver,
+    watch_sandboxes_event,
 };
 use openshell_core::proto::{
     PlatformEvent, Sandbox, SandboxCondition, SandboxPhase, SandboxSpec, SandboxStatus,
@@ -1267,14 +1268,28 @@ fn driver_sandbox_spec_from_public(spec: &SandboxSpec) -> DriverSandboxSpec {
             .template
             .as_ref()
             .map(driver_sandbox_template_from_public),
-        gpu: spec.gpu.as_ref().map(|gpu| DriverGpuRequestSpec {
-            device_id: gpu.device_id.clone(),
-            count: gpu.count,
-        }),
+        resource_requirements: spec
+            .resource_requirements
+            .as_ref()
+            .map(driver_resource_requirements_from_public),
         sandbox_token: String::new(),
     }
 }
 
+fn driver_resource_requirements_from_public(
+    requirements: &openshell_core::proto::SandboxResourceRequirements,
+) -> DriverSandboxResourceRequirements {
+    DriverSandboxResourceRequirements {
+        gpu: requirements
+            .gpu
+            .as_ref()
+            .map(|gpu| DriverGpuResourceRequirement {
+                device_ids: gpu.device_ids.clone(),
+                count: gpu.count,
+            }),
+    }
+}
+
 fn driver_sandbox_template_from_public(template: &SandboxTemplate) -> DriverSandboxTemplate {
     DriverSandboxTemplate {
         image: template.image.clone(),
@@ -1625,7 +1640,12 @@ fn derive_phase(status: Option<&DriverSandboxStatus>) -> SandboxPhase {
 }
 
 fn rewrite_user_facing_conditions(status: &mut Option<SandboxStatus>, spec: Option<&SandboxSpec>) {
-    let gpu_requested = spec.is_some_and(|sandbox_spec| sandbox_spec.gpu.is_some());
+    let gpu_requested = spec.is_some_and(|sandbox_spec| {
+        sandbox_spec
+            .resource_requirements
+            .as_ref()
+            .is_some_and(|requirements| requirements.gpu.is_some())
+    });
     if !gpu_requested {
         return;
     }
@@ -1783,11 +1803,11 @@ pub async fn new_test_runtime(store: Arc<Store>) -> ComputeRuntime {
 mod tests {
     use super::*;
     use futures::stream;
-    use openshell_core::proto::GpuRequestSpec;
     use openshell_core::proto::compute::v1::{
         CreateSandboxResponse, DeleteSandboxResponse, GetCapabilitiesResponse, GetSandboxRequest,
         GetSandboxResponse, StopSandboxRequest, StopSandboxResponse, ValidateSandboxCreateResponse,
     };
+    use openshell_core::proto::{GpuResourceRequirement, SandboxResourceRequirements};
     use std::collections::HashMap;
     use std::sync::Arc;
     use tokio::sync::{mpsc, oneshot};
@@ -1807,9 +1827,11 @@ mod tests {
     #[test]
     fn driver_sandbox_spec_from_public_preserves_gpu_request_device_ids() {
         let public = SandboxSpec {
-            gpu: Some(GpuRequestSpec {
-                device_id: vec!["nvidia.com/gpu=0".to_string()],
-                count: None,
+            resource_requirements: Some(SandboxResourceRequirements {
+                gpu: Some(GpuResourceRequirement {
+                    device_ids: vec!["nvidia.com/gpu=0".to_string()],
+                    count: None,
+                }),
             }),
             ..Default::default()
         };
@@ -1818,9 +1840,11 @@ mod tests {
 
         assert_eq!(
             driver
+                .resource_requirements
+                .expect("driver resource requirements should be present")
                 .gpu
-                .expect("driver GPU request should be present")
-                .device_id,
+                .expect("driver GPU requirement should be present")
+                .device_ids,
             vec!["nvidia.com/gpu=0".to_string()]
         );
     }
@@ -1828,9 +1852,11 @@ mod tests {
     #[test]
     fn driver_sandbox_spec_from_public_preserves_gpu_count() {
         let public = SandboxSpec {
-            gpu: Some(GpuRequestSpec {
-                device_id: vec![],
-                count: Some(2),
+            resource_requirements: Some(SandboxResourceRequirements {
+                gpu: Some(GpuResourceRequirement {
+                    device_ids: vec![],
+                    count: Some(2),
+                }),
             }),
             ..Default::default()
         };
@@ -1839,8 +1865,10 @@ mod tests {
 
         assert_eq!(
             driver
+                .resource_requirements
+                .expect("driver resource requirements should be present")
                 .gpu
-                .expect("driver GPU request should be present")
+                .expect("driver GPU requirement should be present")
                 .count,
             Some(2)
         );
@@ -2303,9 +2331,11 @@ mod tests {
         rewrite_user_facing_conditions(
             &mut status,
             Some(&SandboxSpec {
-                gpu: Some(GpuRequestSpec {
-                    device_id: vec![],
-                    count: None,
+                resource_requirements: Some(SandboxResourceRequirements {
+                    gpu: Some(GpuResourceRequirement {
+                        device_ids: vec![],
+                        count: None,
+                    }),
                 }),
                 ..Default::default()
             }),
@@ -2334,13 +2364,7 @@ mod tests {
             ..Default::default()
         });
 
-        rewrite_user_facing_conditions(
-            &mut status,
-            Some(&SandboxSpec {
-                gpu: None,
-                ..Default::default()
-            }),
-        );
+        rewrite_user_facing_conditions(&mut status, Some(&SandboxSpec::default()));
 
         assert_eq!(status.unwrap().conditions[0].message, original);
     }
@@ -2619,9 +2643,11 @@ mod tests {
 
         let sandbox = Sandbox {
             spec: Some(SandboxSpec {
-                gpu: Some(GpuRequestSpec {
-                    device_id: vec![],
-                    count: None,
+                resource_requirements: Some(SandboxResourceRequirements {
+                    gpu: Some(GpuResourceRequirement {
+                        device_ids: vec![],
+                        count: None,
+                    }),
                 }),
                 ..Default::default()
             }),
@@ -2645,7 +2671,11 @@ mod tests {
             SandboxPhase::try_from(stored.phase()).unwrap(),
             SandboxPhase::Ready
         );
-        assert!(stored.spec.as_ref().is_some_and(|spec| spec.gpu.is_some()));
+        assert!(stored.spec.as_ref().is_some_and(|spec| {
+            spec.resource_requirements
+                .as_ref()
+                .is_some_and(|requirements| requirements.gpu.is_some())
+        }));
     }
 
     #[tokio::test]
diff --git a/crates/openshell-server/src/grpc/sandbox.rs b/crates/openshell-server/src/grpc/sandbox.rs
index 4413e3ce7..3e8ed0e1e 100644
--- a/crates/openshell-server/src/grpc/sandbox.rs
+++ b/crates/openshell-server/src/grpc/sandbox.rs
@@ -100,7 +100,9 @@ fn emit_sandbox_create_telemetry(
     };
     openshell_core::telemetry::emit_sandbox_create(
         outcome,
-        spec.gpu.is_some(),
+        spec.resource_requirements
+            .as_ref()
+            .is_some_and(|requirements| requirements.gpu.is_some()),
         spec.providers.len() as u64,
         spec.policy.is_some(),
         template_source,
diff --git a/crates/openshell-server/src/grpc/validation.rs b/crates/openshell-server/src/grpc/validation.rs
index a9f1e984f..0f3b3fd7c 100644
--- a/crates/openshell-server/src/grpc/validation.rs
+++ b/crates/openshell-server/src/grpc/validation.rs
@@ -131,9 +131,9 @@ pub(super) fn validate_sandbox_spec(
         validate_sandbox_template(tmpl)?;
     }
 
-    // --- spec.gpu ---
-    if let Some(ref gpu) = spec.gpu {
-        validate_gpu_request(gpu)?;
+    // --- spec.resource_requirements ---
+    if let Some(ref requirements) = spec.resource_requirements {
+        validate_resource_requirements(requirements)?;
     }
 
     // --- spec.policy serialized size ---
@@ -149,14 +149,27 @@ pub(super) fn validate_sandbox_spec(
     Ok(())
 }
 
-fn validate_gpu_request(gpu: &openshell_core::proto::GpuRequestSpec) -> Result<(), Status> {
-    if gpu.count.is_some() && !gpu.device_id.is_empty() {
+fn validate_resource_requirements(
+    requirements: &openshell_core::proto::SandboxResourceRequirements,
+) -> Result<(), Status> {
+    if let Some(ref gpu) = requirements.gpu {
+        validate_gpu_requirement(gpu)?;
+    }
+    Ok(())
+}
+
+fn validate_gpu_requirement(
+    gpu: &openshell_core::proto::GpuResourceRequirement,
+) -> Result<(), Status> {
+    if gpu.count.is_some() && !gpu.device_ids.is_empty() {
         return Err(Status::invalid_argument(
-            "gpu.count is mutually exclusive with gpu.device_id",
+            "resource_requirements.gpu.count is mutually exclusive with resource_requirements.gpu.device_ids",
         ));
     }
     if gpu.count == Some(0) {
-        return Err(Status::invalid_argument("gpu.count must be greater than 0"));
+        return Err(Status::invalid_argument(
+            "resource_requirements.gpu.count must be greater than 0",
+        ));
     }
     Ok(())
 }
@@ -678,7 +691,7 @@ pub(super) fn level_matches(log_level: &str, min_level: &str) -> bool {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use openshell_core::proto::{GpuRequestSpec, SandboxSpec};
+    use openshell_core::proto::{GpuResourceRequirement, SandboxResourceRequirements, SandboxSpec};
     use std::collections::HashMap;
     use tonic::Code;
 
@@ -704,9 +717,11 @@ mod tests {
     #[test]
     fn validate_sandbox_spec_accepts_gpu_flag() {
         let spec = SandboxSpec {
-            gpu: Some(GpuRequestSpec {
-                device_id: vec![],
-                count: None,
+            resource_requirements: Some(SandboxResourceRequirements {
+                gpu: Some(GpuResourceRequirement {
+                    device_ids: vec![],
+                    count: None,
+                }),
             }),
             ..Default::default()
         };
@@ -716,9 +731,11 @@ mod tests {
     #[test]
     fn validate_sandbox_spec_accepts_gpu_count() {
         let spec = SandboxSpec {
-            gpu: Some(GpuRequestSpec {
-                device_id: vec![],
-                count: Some(2),
+            resource_requirements: Some(SandboxResourceRequirements {
+                gpu: Some(GpuResourceRequirement {
+                    device_ids: vec![],
+                    count: Some(2),
+                }),
             }),
             ..Default::default()
         };
@@ -728,9 +745,11 @@ mod tests {
     #[test]
     fn validate_sandbox_spec_rejects_zero_gpu_count() {
         let spec = SandboxSpec {
-            gpu: Some(GpuRequestSpec {
-                device_id: vec![],
-                count: Some(0),
+            resource_requirements: Some(SandboxResourceRequirements {
+                gpu: Some(GpuResourceRequirement {
+                    device_ids: vec![],
+                    count: Some(0),
+                }),
             }),
             ..Default::default()
         };
@@ -744,9 +763,11 @@ mod tests {
     #[test]
     fn validate_sandbox_spec_rejects_gpu_count_with_device_id() {
         let spec = SandboxSpec {
-            gpu: Some(GpuRequestSpec {
-                device_id: vec!["nvidia.com/gpu=0".to_string()],
-                count: Some(1),
+            resource_requirements: Some(SandboxResourceRequirements {
+                gpu: Some(GpuResourceRequirement {
+                    device_ids: vec!["nvidia.com/gpu=0".to_string()],
+                    count: Some(1),
+                }),
             }),
             ..Default::default()
         };
diff --git a/docs/sandboxes/manage-sandboxes.mdx b/docs/sandboxes/manage-sandboxes.mdx
index 0b8469612..8ec69c709 100644
--- a/docs/sandboxes/manage-sandboxes.mdx
+++ b/docs/sandboxes/manage-sandboxes.mdx
@@ -57,13 +57,26 @@ Request a specific number of GPUs with `--gpu-count`:
 openshell sandbox create --gpu-count 2 -- claude
 ```
 
+Request a specific GPU device with `--gpu-device`. The flag implies a GPU
+request, so you do not need to pass `--gpu` as well:
+
+```shell
+openshell sandbox create --gpu-device nvidia.com/gpu=0 -- claude
+```
+
+Support for `--gpu-count` and `--gpu-device` is driver-dependent:
+
+| Driver     | `--gpu` default request       | `--gpu-count`         | `--gpu-device`                                |
+| ---------- | ----------------------------- | --------------------- | --------------------------------------------- |
+| Docker     | All CDI GPU devices           | Not supported         | One CDI device ID, such as `nvidia.com/gpu=0` |
+| Podman     | All CDI GPU devices           | Not supported         | One CDI device ID, such as `nvidia.com/gpu=0` |
+| Kubernetes | One `nvidia.com/gpu` resource | Supported             | Not supported                                 |
+| VM         | One GPU                       | Only `1` is supported | One PCI BDF or GPU index                      |
+
 For Docker-backed sandboxes, GPU injection uses Docker CDI. If you enable Docker
 CDI after the gateway starts, restart the gateway so OpenShell can detect the
-updated Docker daemon capability.
-
-Kubernetes gateways honor `--gpu-count` by setting the `nvidia.com/gpu` resource
-limit. Docker and Podman support explicit CDI device IDs through `--gpu-device`
-but do not support count-based selection yet. VM gateways accept only one GPU.
+updated Docker daemon capability. In the API, `--gpu`, `--gpu-count`, and
+`--gpu-device` populate `SandboxSpec.resource_requirements.gpu`.
 
 ### Custom Containers
 
diff --git a/proto/compute_driver.proto b/proto/compute_driver.proto
index 3ac04380c..79bff06e2 100644
--- a/proto/compute_driver.proto
+++ b/proto/compute_driver.proto
@@ -77,16 +77,14 @@ message DriverSandbox {
 
 // Driver-owned provisioning inputs required to create a sandbox.
 message DriverSandboxSpec {
-  reserved 10;
-
   // Log level exposed to processes running inside the sandbox.
   string log_level = 1;
   // Environment variables injected into the sandbox runtime.
   map<string, string> environment = 5;
   // Runtime template consumed by the driver during provisioning.
   DriverSandboxTemplate template = 6;
-  // Request GPU resources for this sandbox. Presence indicates a GPU request.
-  GpuRequestSpec gpu = 9;
+  // Portable resource requirements for this sandbox.
+  DriverSandboxResourceRequirements resource_requirements = 9;
   // Gateway-minted JWT identifying this sandbox to the gateway. Set by
   // the gateway on create; the driver materialises it via its native
   // secret mechanism (Docker/Podman/VM bind-mount a per-sandbox file;
@@ -96,13 +94,20 @@ message DriverSandboxSpec {
   string sandbox_token = 11;
 }
 
-// Driver-native GPU request details.
-message GpuRequestSpec {
-  // Optional number of GPUs requested. Mutually exclusive with device_id.
+// Driver-owned resource requirements for the sandbox workload.
+message DriverSandboxResourceRequirements {
+  // GPU requirement for the sandbox. Presence indicates a GPU request.
+  DriverGpuResourceRequirement gpu = 1;
+}
+
+// Driver-owned GPU resource requirement. Device identifiers are interpreted by
+// the selected compute driver and are an interim compatibility surface.
+message DriverGpuResourceRequirement {
+  // Optional number of GPUs requested. Mutually exclusive with device_ids.
   optional uint32 count = 1;
   // Optional driver-native device identifiers. Mutually exclusive with count.
   // Empty means the driver chooses its default GPU assignment behavior.
-  repeated string device_id = 2;
+  repeated string device_ids = 2;
 }
 
 // Driver-owned runtime template consumed by the compute platform.
diff --git a/proto/openshell.proto b/proto/openshell.proto
index b15001586..6be740409 100644
--- a/proto/openshell.proto
+++ b/proto/openshell.proto
@@ -307,9 +307,6 @@ message Sandbox {
 
 // Desired sandbox configuration provided through the public API.
 message SandboxSpec {
-  reserved 10, 11;
-  reserved "gpu_device", "proposal_approval_mode";
-
   // Log level exposed to processes running inside the sandbox.
   string log_level = 1;
   // Environment variables injected into the sandbox runtime.
@@ -320,18 +317,24 @@ message SandboxSpec {
   openshell.sandbox.v1.SandboxPolicy policy = 7;
   // Provider names to attach to this sandbox.
   repeated string providers = 8;
-  // Request GPU resources for this sandbox. Presence indicates a GPU request.
-  GpuRequestSpec gpu = 9;
+  // Portable resource requirements for this sandbox.
+  SandboxResourceRequirements resource_requirements = 9;
+}
+
+// Public resource requirements for the sandbox workload.
+message SandboxResourceRequirements {
+  // GPU requirement for the sandbox. Presence indicates a GPU request.
+  GpuResourceRequirement gpu = 1;
 }
 
-// Public GPU request details. Device identifiers are interpreted by the
-// selected compute driver.
-message GpuRequestSpec {
-  // Optional number of GPUs requested. Mutually exclusive with device_id.
+// Public GPU resource requirement. Device identifiers are interpreted by the
+// selected compute driver and are an interim compatibility surface.
+message GpuResourceRequirement {
+  // Optional number of GPUs requested. Mutually exclusive with device_ids.
   optional uint32 count = 1;
   // Optional driver-native device identifiers. Mutually exclusive with count.
   // Empty means the driver chooses its default GPU assignment behavior.
-  repeated string device_id = 2;
+  repeated string device_ids = 2;
 }
 
 // Public sandbox template mapped onto compute-driver template inputs.