mirror of
https://github.com/NVIDIA/nvidia-container-toolkit
synced 2025-01-24 11:37:09 +00:00
35df24d63a
This change adds an --nvidia-ctk-path to the nvidia-ctk cdi generate command. This ensures that the executable path for the generated hooks can be specified consistently. Since the NVIDIA Container Runtime already allows for the executable path to be specified in the config the utility code to update the LDCache and create other nvidia-ctk hooks are also updated. Signed-off-by: Evan Lezar <elezar@nvidia.com>
169 lines
4.8 KiB
Go
169 lines
4.8 KiB
Go
/**
|
|
# Copyright (c) NVIDIA CORPORATION. All rights reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
**/
|
|
|
|
package generate
|
|
|
|
import (
|
|
"fmt"
|
|
"path/filepath"
|
|
"strings"
|
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/discover"
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/ldcache"
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/lookup"
|
|
"github.com/sirupsen/logrus"
|
|
"gitlab.com/nvidia/cloud-native/go-nvlib/pkg/nvml"
|
|
)
|
|
|
|
type driverLibraries struct {
|
|
logger *logrus.Logger
|
|
root string
|
|
nvidiaCTKPath string
|
|
libraries []string
|
|
}
|
|
|
|
var _ discover.Discover = (*driverLibraries)(nil)
|
|
|
|
// NewDriverDiscoverer creates a discoverer for the libraries and binaries associated with a driver installation.
|
|
// The supplied NVML Library is used to query the expected driver version.
|
|
func NewDriverDiscoverer(logger *logrus.Logger, root string, nvidiaCTKPath string, nvmllib nvml.Interface) (discover.Discover, error) {
|
|
version, r := nvmllib.SystemGetDriverVersion()
|
|
if r != nvml.SUCCESS {
|
|
return nil, fmt.Errorf("failed to determine driver version: %v", r)
|
|
}
|
|
|
|
libraries, err := NewDriverLibraryDiscoverer(logger, root, nvidiaCTKPath, version)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to create discoverer for driver libraries: %v", err)
|
|
}
|
|
|
|
firmwares := NewDriverFirmwareDiscoverer(logger, root, version)
|
|
|
|
binaries := NewDriverBinariesDiscoverer(logger, root)
|
|
|
|
d := discover.Merge(
|
|
libraries,
|
|
firmwares,
|
|
binaries,
|
|
)
|
|
|
|
return d, nil
|
|
}
|
|
|
|
// NewDriverLibraryDiscoverer creates a discoverer for the libraries associated with the specified driver version.
|
|
func NewDriverLibraryDiscoverer(logger *logrus.Logger, root string, nvidiaCTKPath, version string) (discover.Discover, error) {
|
|
libraries, err := findVersionLibs(logger, root, version)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to get libraries for driver version: %v", err)
|
|
}
|
|
|
|
d := driverLibraries{
|
|
logger: logger,
|
|
root: root,
|
|
nvidiaCTKPath: nvidiaCTKPath,
|
|
libraries: libraries,
|
|
}
|
|
|
|
return &d, nil
|
|
}
|
|
|
|
// NewDriverFirmwareDiscoverer creates a discoverer for GSP firmware associated with the specified driver version.
|
|
func NewDriverFirmwareDiscoverer(logger *logrus.Logger, root string, version string) discover.Discover {
|
|
gspFirmwarePath := filepath.Join("/lib/firmware/nvidia", version, "gsp.bin")
|
|
return discover.NewMounts(
|
|
logger,
|
|
lookup.NewFileLocator(
|
|
lookup.WithLogger(logger),
|
|
lookup.WithRoot(root),
|
|
),
|
|
root,
|
|
[]string{gspFirmwarePath},
|
|
)
|
|
}
|
|
|
|
// NewDriverBinariesDiscoverer creates a discoverer for GSP firmware associated with the GPU driver.
|
|
func NewDriverBinariesDiscoverer(logger *logrus.Logger, root string) discover.Discover {
|
|
return discover.NewMounts(
|
|
logger,
|
|
lookup.NewExecutableLocator(logger, root),
|
|
root,
|
|
[]string{
|
|
"nvidia-smi", /* System management interface */
|
|
"nvidia-debugdump", /* GPU coredump utility */
|
|
"nvidia-persistenced", /* Persistence mode utility */
|
|
"nvidia-cuda-mps-control", /* Multi process service CLI */
|
|
"nvidia-cuda-mps-server", /* Multi process service server */
|
|
},
|
|
)
|
|
}
|
|
|
|
// Devices are empty for this discoverer
|
|
func (d *driverLibraries) Devices() ([]discover.Device, error) {
|
|
return nil, nil
|
|
}
|
|
|
|
// Mounts returns the mounts for the driver libraries
|
|
func (d *driverLibraries) Mounts() ([]discover.Mount, error) {
|
|
var mounts []discover.Mount
|
|
for _, d := range d.libraries {
|
|
mount := discover.Mount{
|
|
HostPath: d,
|
|
Path: d,
|
|
}
|
|
mounts = append(mounts, mount)
|
|
}
|
|
|
|
return mounts, nil
|
|
}
|
|
|
|
// Hooks returns a hook that updates the LDCache for the specified driver library paths.
|
|
func (d *driverLibraries) Hooks() ([]discover.Hook, error) {
|
|
hook := discover.CreateLDCacheUpdateHook(
|
|
d.nvidiaCTKPath,
|
|
d.libraries,
|
|
)
|
|
|
|
return []discover.Hook{hook}, nil
|
|
}
|
|
|
|
func findVersionLibs(logger *logrus.Logger, root string, version string) ([]string, error) {
|
|
logger.Infof("Using driver version %v", version)
|
|
|
|
cache, err := ldcache.New(logger, root)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to load ldcache: %v", err)
|
|
}
|
|
|
|
libs32, libs64 := cache.List()
|
|
|
|
var libs []string
|
|
for _, l := range libs64 {
|
|
if strings.HasSuffix(l, version) {
|
|
logger.Infof("found 64-bit driver lib: %v", l)
|
|
libs = append(libs, l)
|
|
}
|
|
}
|
|
|
|
for _, l := range libs32 {
|
|
if strings.HasSuffix(l, version) {
|
|
logger.Infof("found 32-bit driver lib: %v", l)
|
|
libs = append(libs, l)
|
|
}
|
|
}
|
|
|
|
return libs, nil
|
|
}
|