2022-06-20 11:53:16 +00:00
/**
# Copyright (c) 2022, NVIDIA CORPORATION.  All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
**/
2022-11-01 19:05:23 +00:00
package generate
2022-06-20 11:53:16 +00:00
import (
"fmt"
"io"
"os"
"path/filepath"
"strings"
2023-02-17 09:11:18 +00:00
"github.com/NVIDIA/nvidia-container-toolkit/internal/discover"
2022-11-23 15:29:18 +00:00
"github.com/NVIDIA/nvidia-container-toolkit/internal/edits"
2022-12-02 13:17:52 +00:00
"github.com/NVIDIA/nvidia-container-toolkit/pkg/nvcdi"
2022-10-21 11:29:21 +00:00
"github.com/container-orchestrated-devices/container-device-interface/pkg/cdi"
2022-06-20 11:53:16 +00:00
specs "github.com/container-orchestrated-devices/container-device-interface/specs-go"
"github.com/sirupsen/logrus"
"github.com/urfave/cli/v2"
"gitlab.com/nvidia/cloud-native/go-nvlib/pkg/nvlib/device"
"gitlab.com/nvidia/cloud-native/go-nvlib/pkg/nvml"
"sigs.k8s.io/yaml"
)
// Accepted values for the discovery-mode flag.
const (
	discoveryModeAuto = "auto"
	discoveryModeNVML = "nvml"
	discoveryModeWSL  = "wsl"
)

// Accepted values for the format flag.
const (
	formatJSON = "json"
	formatYAML = "yaml"
)

// allDeviceName is the name of the device whose edits combine those of every
// other device in the generated specification.
const allDeviceName = "all"
// command carries the dependencies shared by the handlers of the generate
// command.
type command struct {
	// logger receives the diagnostic output produced while generating a spec.
	logger *logrus.Logger
}
// config holds the values of the command line flags of the generate command.
type config struct {
	// output is the file the specification is written to; empty means STDOUT.
	output string
	// format is the requested output format (json or yaml).
	format string
	// deviceNameStrategy selects how device names are generated.
	deviceNameStrategy string
	// driverRoot is the NVIDIA GPU driver root used during discovery.
	driverRoot string
	// nvidiaCTKPath is the nvidia-ctk path recorded in the generated spec.
	nvidiaCTKPath string
	// discoveryMode is the mode used to discover entities (auto, nvml or wsl).
	discoveryMode string
}
// NewCommand returns the CLI command for generating CDI specifications. The
// supplied logger is used for all output produced by the command.
func NewCommand(logger *logrus.Logger) *cli.Command {
	return command{logger: logger}.build()
}
// build creates the CLI command
func ( m command ) build ( ) * cli . Command {
cfg := config { }
// Create the 'generate-cdi' command
c := cli . Command {
2022-11-01 19:05:23 +00:00
Name : "generate" ,
2022-06-20 11:53:16 +00:00
Usage : "Generate CDI specifications for use with CDI-enabled runtimes" ,
2022-11-23 20:39:06 +00:00
Before : func ( c * cli . Context ) error {
return m . validateFlags ( c , & cfg )
} ,
2022-06-20 11:53:16 +00:00
Action : func ( c * cli . Context ) error {
return m . run ( c , & cfg )
} ,
}
c . Flags = [ ] cli . Flag {
& cli . StringFlag {
Name : "output" ,
2022-11-23 20:39:06 +00:00
Usage : "Specify the file to output the generated CDI specification to. If this is '' the specification is output to STDOUT" ,
2022-06-20 11:53:16 +00:00
Destination : & cfg . output ,
} ,
2022-11-23 20:39:06 +00:00
& cli . StringFlag {
Name : "format" ,
Usage : "The output format for the generated spec [json | yaml]. This overrides the format defined by the output file extension (if specified)." ,
Value : formatYAML ,
Destination : & cfg . format ,
2022-06-20 11:53:16 +00:00
} ,
2023-02-08 14:29:35 +00:00
& cli . StringFlag {
Name : "discovery-mode" ,
2023-02-13 15:04:30 +00:00
Usage : "The mode to use when discovering the available entities. One of [auto | nvml | wsl]. I mode is set to 'auto' the mode will be determined based on the system configuration." ,
Value : discoveryModeAuto ,
2023-02-08 14:29:35 +00:00
Destination : & cfg . discoveryMode ,
} ,
2023-01-20 14:58:04 +00:00
& cli . StringFlag {
Name : "device-name-strategy" ,
2023-01-30 12:36:11 +00:00
Usage : "Specify the strategy for generating device names. One of [index | uuid | type-index]" ,
2022-12-02 13:17:52 +00:00
Value : nvcdi . DeviceNameStrategyIndex ,
2023-01-20 14:58:04 +00:00
Destination : & cfg . deviceNameStrategy ,
} ,
2022-12-01 16:21:35 +00:00
& cli . StringFlag {
2023-02-02 14:42:01 +00:00
Name : "driver-root" ,
Usage : "Specify the NVIDIA GPU driver root to use when discovering the entities that should be included in the CDI specification." ,
Destination : & cfg . driverRoot ,
2022-12-01 16:21:35 +00:00
} ,
2022-12-12 14:26:21 +00:00
& cli . StringFlag {
Name : "nvidia-ctk-path" ,
Usage : "Specify the path to use for the nvidia-ctk in the generated CDI specification. If this is left empty, the path will be searched." ,
Destination : & cfg . nvidiaCTKPath ,
} ,
2022-06-20 11:53:16 +00:00
}
return & c
}
2022-11-23 20:39:06 +00:00
func ( m command ) validateFlags ( r * cli . Context , cfg * config ) error {
cfg . format = strings . ToLower ( cfg . format )
switch cfg . format {
case formatJSON :
case formatYAML :
default :
return fmt . Errorf ( "invalid output format: %v" , cfg . format )
}
2023-02-08 14:29:35 +00:00
cfg . discoveryMode = strings . ToLower ( cfg . discoveryMode )
switch cfg . discoveryMode {
2023-02-13 15:04:30 +00:00
case discoveryModeAuto :
2023-02-08 14:29:35 +00:00
case discoveryModeNVML :
2023-02-06 17:53:24 +00:00
case discoveryModeWSL :
2023-02-08 14:29:35 +00:00
default :
return fmt . Errorf ( "invalid discovery mode: %v" , cfg . discoveryMode )
}
2022-12-02 13:17:52 +00:00
_ , err := nvcdi . NewDeviceNamer ( cfg . deviceNameStrategy )
2023-01-20 14:58:04 +00:00
if err != nil {
return err
}
2023-02-17 09:11:18 +00:00
cfg . nvidiaCTKPath = discover . FindNvidiaCTK ( m . logger , cfg . nvidiaCTKPath )
2022-11-23 20:39:06 +00:00
return nil
}
2022-06-20 11:53:16 +00:00
func ( m command ) run ( c * cli . Context , cfg * config ) error {
2022-12-02 13:17:52 +00:00
spec , err := m . generateSpec ( cfg )
2022-06-20 11:53:16 +00:00
if err != nil {
return fmt . Errorf ( "failed to generate CDI spec: %v" , err )
}
var outputTo io . Writer
2022-11-23 20:39:06 +00:00
if cfg . output == "" {
2022-06-20 11:53:16 +00:00
outputTo = os . Stdout
} else {
2022-11-24 09:13:21 +00:00
err := createParentDirsIfRequired ( cfg . output )
if err != nil {
return fmt . Errorf ( "failed to create parent folders for output file: %v" , err )
}
2022-06-20 11:53:16 +00:00
outputFile , err := os . Create ( cfg . output )
if err != nil {
return fmt . Errorf ( "failed to create output file: %v" , err )
}
defer outputFile . Close ( )
outputTo = outputFile
}
2022-11-23 20:39:06 +00:00
if outputFileFormat := formatFromFilename ( cfg . output ) ; outputFileFormat != "" {
m . logger . Debugf ( "Inferred output format as %q from output file name" , outputFileFormat )
if ! c . IsSet ( "format" ) {
cfg . format = outputFileFormat
} else if outputFileFormat != cfg . format {
m . logger . Warningf ( "Requested output format %q does not match format implied by output file name: %q" , cfg . format , outputFileFormat )
}
2022-06-20 11:53:16 +00:00
}
data , err := yaml . Marshal ( spec )
if err != nil {
return fmt . Errorf ( "failed to marshal CDI spec: %v" , err )
}
2022-11-23 20:39:06 +00:00
if strings . ToLower ( cfg . format ) == formatJSON {
2022-06-20 11:53:16 +00:00
data , err = yaml . YAMLToJSONStrict ( data )
if err != nil {
return fmt . Errorf ( "failed to convert CDI spec from YAML to JSON: %v" , err )
}
}
2022-12-01 15:21:50 +00:00
err = writeToOutput ( cfg . format , data , outputTo )
2022-06-20 11:53:16 +00:00
if err != nil {
return fmt . Errorf ( "failed to write output: %v" , err )
}
return nil
}
2022-11-23 20:39:06 +00:00
// formatFromFilename returns the output format implied by the extension of
// filename, compared case-insensitively: formatJSON for ".json" and formatYAML
// for ".yaml" or ".yml". Any other extension, or none, yields "".
func formatFromFilename(filename string) string {
	switch extension := strings.ToLower(filepath.Ext(filename)); extension {
	case ".json":
		return formatJSON
	case ".yaml", ".yml":
		return formatYAML
	default:
		return ""
	}
}
2022-12-01 15:21:50 +00:00
func writeToOutput ( format string , data [ ] byte , output io . Writer ) error {
if format == formatYAML {
2022-11-02 13:59:04 +00:00
_ , err := output . Write ( [ ] byte ( "---\n" ) )
if err != nil {
return fmt . Errorf ( "failed to write YAML separator: %v" , err )
}
}
_ , err := output . Write ( data )
if err != nil {
return fmt . Errorf ( "failed to write data: %v" , err )
}
return nil
}
2022-12-02 13:17:52 +00:00
func ( m command ) generateSpec ( cfg * config ) ( * specs . Spec , error ) {
deviceNamer , err := nvcdi . NewDeviceNamer ( cfg . deviceNameStrategy )
if err != nil {
return nil , fmt . Errorf ( "failed to create device namer: %v" , err )
}
2022-06-20 11:53:16 +00:00
nvmllib := nvml . New ( )
if r := nvmllib . Init ( ) ; r != nvml . SUCCESS {
return nil , r
}
defer nvmllib . Shutdown ( )
devicelib := device . New ( device . WithNvml ( nvmllib ) )
2022-12-02 13:17:52 +00:00
cdilib := nvcdi . New (
nvcdi . WithLogger ( m . logger ) ,
nvcdi . WithDriverRoot ( cfg . driverRoot ) ,
nvcdi . WithNVIDIACTKPath ( cfg . nvidiaCTKPath ) ,
nvcdi . WithDeviceNamer ( deviceNamer ) ,
nvcdi . WithDeviceLib ( devicelib ) ,
nvcdi . WithNvmlLib ( nvmllib ) ,
2023-02-08 14:29:35 +00:00
nvcdi . WithMode ( string ( cfg . discoveryMode ) ) ,
2022-12-02 13:17:52 +00:00
)
deviceSpecs , err := cdilib . GetAllDeviceSpecs ( )
2022-06-20 11:53:16 +00:00
if err != nil {
2022-11-23 15:29:18 +00:00
return nil , fmt . Errorf ( "failed to create device CDI specs: %v" , err )
2022-06-20 11:53:16 +00:00
}
2023-02-06 17:53:24 +00:00
var hasAll bool
for _ , deviceSpec := range deviceSpecs {
if deviceSpec . Name == allDeviceName {
hasAll = true
break
}
}
if ! hasAll {
allDevice , err := MergeDeviceSpecs ( deviceSpecs , allDeviceName )
if err != nil {
return nil , fmt . Errorf ( "failed to create CDI specification for %q device: %v" , allDeviceName , err )
}
deviceSpecs = append ( deviceSpecs , allDevice )
}
2022-10-10 08:19:08 +00:00
2022-12-02 13:17:52 +00:00
commonEdits , err := cdilib . GetCommonEdits ( )
2022-11-23 15:29:18 +00:00
if err != nil {
2022-12-02 13:17:52 +00:00
return nil , fmt . Errorf ( "failed to create edits common for entities: %v" , err )
2022-10-21 13:28:45 +00:00
}
2022-12-02 13:17:52 +00:00
deviceFolderPermissionEdits , err := GetDeviceFolderPermissionHookEdits ( m . logger , cfg . driverRoot , cfg . nvidiaCTKPath , deviceSpecs )
2022-10-21 11:29:21 +00:00
if err != nil {
2022-12-02 13:17:52 +00:00
return nil , fmt . Errorf ( "failed to generated edits for device folder permissions: %v" , err )
2022-10-21 11:29:21 +00:00
}
2022-12-02 13:17:52 +00:00
commonEdits . Append ( deviceFolderPermissionEdits )
2022-10-07 14:23:18 +00:00
2023-01-19 10:48:36 +00:00
// We construct the spec and determine the minimum required version based on the specification.
2022-11-23 15:29:18 +00:00
spec := specs . Spec {
2023-01-19 10:48:36 +00:00
Version : "NOT_SET" ,
2022-11-23 15:29:18 +00:00
Kind : "nvidia.com/gpu" ,
Devices : deviceSpecs ,
2023-02-07 11:16:58 +00:00
ContainerEdits : * commonEdits . ContainerEdits ,
2022-06-20 11:53:16 +00:00
}
2023-01-19 10:48:36 +00:00
minVersion , err := cdi . MinimumRequiredVersion ( & spec )
if err != nil {
return nil , fmt . Errorf ( "failed to get minumum required CDI spec version: %v" , err )
}
2023-01-30 12:39:08 +00:00
m . logger . Infof ( "Using minimum required CDI spec version: %s" , minVersion )
2023-01-19 10:48:36 +00:00
spec . Version = minVersion
2022-11-23 15:29:18 +00:00
return & spec , nil
2022-06-20 11:53:16 +00:00
}
2023-02-06 17:53:24 +00:00
// MergeDeviceSpecs creates a device with the specified name which combines the edits from the previous devices.
// If a device of the specified name already exists, an error is returned.
func MergeDeviceSpecs ( deviceSpecs [ ] specs . Device , mergedDeviceName string ) ( specs . Device , error ) {
if err := cdi . ValidateDeviceName ( mergedDeviceName ) ; err != nil {
return specs . Device { } , fmt . Errorf ( "invalid device name %q: %v" , mergedDeviceName , err )
}
for _ , d := range deviceSpecs {
if d . Name == mergedDeviceName {
return specs . Device { } , fmt . Errorf ( "device %q already exists" , mergedDeviceName )
}
}
mergedEdits := edits . NewContainerEdits ( )
2022-10-21 11:29:21 +00:00
2022-11-23 15:29:18 +00:00
for _ , d := range deviceSpecs {
edit := cdi . ContainerEdits {
ContainerEdits : & d . ContainerEdits ,
2022-10-21 11:29:21 +00:00
}
2023-02-06 17:53:24 +00:00
mergedEdits . Append ( & edit )
2022-10-21 11:29:21 +00:00
}
2023-02-06 17:53:24 +00:00
merged := specs . Device {
Name : mergedDeviceName ,
ContainerEdits : * mergedEdits . ContainerEdits ,
2022-10-21 11:29:21 +00:00
}
2023-02-06 17:53:24 +00:00
return merged , nil
2022-10-21 11:29:21 +00:00
}
2022-11-24 09:13:21 +00:00
// createParentDirsIfRequired creates the parent folders of the specified path if required.
// Note that filepath.Dir never returns an empty string: for a filename without
// a directory component (a file in the current folder) it returns ".". In that
// case there is nothing to create and MkdirAll is not called.
func createParentDirsIfRequired(filename string) error {
	dir := filepath.Dir(filename)
	if dir == "" || dir == "." {
		return nil
	}
	return os.MkdirAll(dir, 0755)
}