Enable CDI in runtime if CDI_ENABLED is set

This change also enables CDI in the configured runtime when the toolkit
is installed with CDI enabled.

Signed-off-by: Evan Lezar <elezar@nvidia.com>
This commit is contained in:
Evan Lezar 2025-01-29 11:03:10 +01:00
parent b71bb87d91
commit eb48d2d5fd
No known key found for this signature in database
4 changed files with 32 additions and 22 deletions

View File

@ -163,7 +163,7 @@ func (m command) build() *cli.Command {
}, },
&cli.BoolFlag{ &cli.BoolFlag{
Name: "cdi.enabled", Name: "cdi.enabled",
Aliases: []string{"cdi.enable"}, Aliases: []string{"cdi.enable", "enable-cdi"},
Usage: "Enable CDI in the configured runtime", Usage: "Enable CDI in the configured runtime",
Destination: &config.cdi.enabled, Destination: &config.cdi.enabled,
}, },

View File

@ -129,14 +129,14 @@ func main() {
log.Infof("Completed %v", c.Name) log.Infof("Completed %v", c.Name)
} }
func validateFlags(_ *cli.Context, o *options) error { func validateFlags(c *cli.Context, o *options) error {
if filepath.Base(o.pidFile) != toolkitPidFilename { if filepath.Base(o.pidFile) != toolkitPidFilename {
return fmt.Errorf("invalid toolkit.pid path %v", o.pidFile) return fmt.Errorf("invalid toolkit.pid path %v", o.pidFile)
} }
if err := toolkit.ValidateOptions(&o.toolkitOptions, o.toolkitRoot()); err != nil { if err := toolkit.ValidateOptions(&o.toolkitOptions, o.toolkitRoot()); err != nil {
return err return err
} }
if err := runtime.ValidateOptions(&o.runtimeOptions, o.runtime, o.toolkitRoot()); err != nil { if err := runtime.ValidateOptions(c, &o.runtimeOptions, o.runtime, o.toolkitRoot(), &o.toolkitOptions); err != nil {
return err return err
} }
return nil return nil

View File

@ -25,6 +25,7 @@ import (
"github.com/NVIDIA/nvidia-container-toolkit/tools/container/runtime/containerd" "github.com/NVIDIA/nvidia-container-toolkit/tools/container/runtime/containerd"
"github.com/NVIDIA/nvidia-container-toolkit/tools/container/runtime/crio" "github.com/NVIDIA/nvidia-container-toolkit/tools/container/runtime/crio"
"github.com/NVIDIA/nvidia-container-toolkit/tools/container/runtime/docker" "github.com/NVIDIA/nvidia-container-toolkit/tools/container/runtime/docker"
"github.com/NVIDIA/nvidia-container-toolkit/tools/container/toolkit"
) )
const ( const (
@ -104,10 +105,14 @@ func Flags(opts *Options) []cli.Flag {
} }
// ValidateOptions checks whether the specified options are valid // ValidateOptions checks whether the specified options are valid
func ValidateOptions(opts *Options, runtime string, toolkitRoot string) error { func ValidateOptions(c *cli.Context, opts *Options, runtime string, toolkitRoot string, to *toolkit.Options) error {
// We set this option here to ensure that it is available in future calls. // We set this option here to ensure that it is available in future calls.
opts.RuntimeDir = toolkitRoot opts.RuntimeDir = toolkitRoot
if !c.IsSet("enable-cdi-in-runtime") {
opts.EnableCDI = to.CDI.Enabled
}
// Apply the runtime-specific config changes. // Apply the runtime-specific config changes.
switch runtime { switch runtime {
case containerd.Name: case containerd.Name:

View File

@ -48,6 +48,14 @@ const (
toolkitPidFilename = "toolkit.pid" toolkitPidFilename = "toolkit.pid"
) )
// cdiOptions groups the CDI-related settings of the toolkit so that they can
// be accessed through a single Options.CDI field.
type cdiOptions struct {
// Enabled is the destination of the cdi-enabled flag. It is exported because
// the runtime package reads it to default its own EnableCDI option.
// ValidateOptions resets it to false when outputDir is empty, and
// generateCDISpec returns early when it is false.
Enabled bool
// outputDir is the destination of the cdi-output-dir flag; the generated
// CDI spec is saved under this directory.
outputDir string
// kind is the destination of the cdi-kind flag. ValidateOptions parses it
// into vendor and class.
kind string
// vendor and class are populated by ValidateOptions from kind and are later
// passed to the CDI library when generating the spec.
vendor string
class string
}
type Options struct { type Options struct {
DriverRoot string DriverRoot string
DevRoot string DevRoot string
@ -67,11 +75,8 @@ type Options struct {
ContainerCLIDebug string ContainerCLIDebug string
cdiEnabled bool // CDI stores the CDI options for the toolkit.
cdiOutputDir string CDI cdiOptions
cdiKind string
cdiVendor string
cdiClass string
createDeviceNodes cli.StringSlice createDeviceNodes cli.StringSlice
@ -174,21 +179,21 @@ func Flags(opts *Options) []cli.Flag {
Name: "cdi-enabled", Name: "cdi-enabled",
Aliases: []string{"enable-cdi"}, Aliases: []string{"enable-cdi"},
Usage: "enable the generation of a CDI specification", Usage: "enable the generation of a CDI specification",
Destination: &opts.cdiEnabled, Destination: &opts.CDI.Enabled,
EnvVars: []string{"CDI_ENABLED", "ENABLE_CDI"}, EnvVars: []string{"CDI_ENABLED", "ENABLE_CDI"},
}, },
&cli.StringFlag{ &cli.StringFlag{
Name: "cdi-output-dir", Name: "cdi-output-dir",
Usage: "the directory where the CDI output files are to be written. If this is set to '', no CDI specification is generated.", Usage: "the directory where the CDI output files are to be written. If this is set to '', no CDI specification is generated.",
Value: "/var/run/cdi", Value: "/var/run/cdi",
Destination: &opts.cdiOutputDir, Destination: &opts.CDI.outputDir,
EnvVars: []string{"CDI_OUTPUT_DIR"}, EnvVars: []string{"CDI_OUTPUT_DIR"},
}, },
&cli.StringFlag{ &cli.StringFlag{
Name: "cdi-kind", Name: "cdi-kind",
Usage: "the vendor string to use for the generated CDI specification", Usage: "the vendor string to use for the generated CDI specification",
Value: "management.nvidia.com/gpu", Value: "management.nvidia.com/gpu",
Destination: &opts.cdiKind, Destination: &opts.CDI.kind,
EnvVars: []string{"CDI_KIND"}, EnvVars: []string{"CDI_KIND"},
}, },
&cli.BoolFlag{ &cli.BoolFlag{
@ -221,19 +226,19 @@ func ValidateOptions(opts *Options, toolkitRoot string) error {
return fmt.Errorf("invalid --toolkit-root option: %v", toolkitRoot) return fmt.Errorf("invalid --toolkit-root option: %v", toolkitRoot)
} }
vendor, class := parser.ParseQualifier(opts.cdiKind) vendor, class := parser.ParseQualifier(opts.CDI.kind)
if err := parser.ValidateVendorName(vendor); err != nil { if err := parser.ValidateVendorName(vendor); err != nil {
return fmt.Errorf("invalid CDI vendor name: %v", err) return fmt.Errorf("invalid CDI vendor name: %v", err)
} }
if err := parser.ValidateClassName(class); err != nil { if err := parser.ValidateClassName(class); err != nil {
return fmt.Errorf("invalid CDI class name: %v", err) return fmt.Errorf("invalid CDI class name: %v", err)
} }
opts.cdiVendor = vendor opts.CDI.vendor = vendor
opts.cdiClass = class opts.CDI.class = class
if opts.cdiEnabled && opts.cdiOutputDir == "" { if opts.CDI.Enabled && opts.CDI.outputDir == "" {
log.Warning("Skipping CDI spec generation (no output directory specified)") log.Warning("Skipping CDI spec generation (no output directory specified)")
opts.cdiEnabled = false opts.CDI.Enabled = false
} }
isDisabled := false isDisabled := false
@ -246,7 +251,7 @@ func ValidateOptions(opts *Options, toolkitRoot string) error {
break break
} }
} }
if !opts.cdiEnabled && !isDisabled { if !opts.CDI.Enabled && !isDisabled {
log.Info("disabling device node creation since --cdi-enabled=false") log.Info("disabling device node creation since --cdi-enabled=false")
isDisabled = true isDisabled = true
} }
@ -761,7 +766,7 @@ func createDeviceNodes(opts *Options) error {
// generateCDISpec generates a CDI spec for use in management containers // generateCDISpec generates a CDI spec for use in management containers
func generateCDISpec(opts *Options, nvidiaCDIHookPath string) error { func generateCDISpec(opts *Options, nvidiaCDIHookPath string) error {
if !opts.cdiEnabled { if !opts.CDI.Enabled {
return nil return nil
} }
log.Info("Generating CDI spec for management containers") log.Info("Generating CDI spec for management containers")
@ -770,8 +775,8 @@ func generateCDISpec(opts *Options, nvidiaCDIHookPath string) error {
nvcdi.WithDriverRoot(opts.DriverRootCtrPath), nvcdi.WithDriverRoot(opts.DriverRootCtrPath),
nvcdi.WithDevRoot(opts.DevRootCtrPath), nvcdi.WithDevRoot(opts.DevRootCtrPath),
nvcdi.WithNVIDIACDIHookPath(nvidiaCDIHookPath), nvcdi.WithNVIDIACDIHookPath(nvidiaCDIHookPath),
nvcdi.WithVendor(opts.cdiVendor), nvcdi.WithVendor(opts.CDI.vendor),
nvcdi.WithClass(opts.cdiClass), nvcdi.WithClass(opts.CDI.class),
) )
if err != nil { if err != nil {
return fmt.Errorf("failed to create CDI library for management containers: %v", err) return fmt.Errorf("failed to create CDI library for management containers: %v", err)
@ -796,7 +801,7 @@ func generateCDISpec(opts *Options, nvidiaCDIHookPath string) error {
if err != nil { if err != nil {
return fmt.Errorf("failed to generate CDI name for management containers: %v", err) return fmt.Errorf("failed to generate CDI name for management containers: %v", err)
} }
err = spec.Save(filepath.Join(opts.cdiOutputDir, name)) err = spec.Save(filepath.Join(opts.CDI.outputDir, name))
if err != nil { if err != nil {
return fmt.Errorf("failed to save CDI spec for management containers: %v", err) return fmt.Errorf("failed to save CDI spec for management containers: %v", err)
} }