mirror of
https://github.com/NVIDIA/nvidia-container-toolkit
synced 2024-12-02 00:54:48 +00:00
a77331f8f0
This change implements the discovery of versioned driver libraries by reusing the mounts and update-ldcache discoverers that are also used for, for example, CSV file discovery. This allows the container paths to be correctly generated without requiring specific manipulation. Signed-off-by: Evan Lezar <elezar@nvidia.com>
157 lines
4.7 KiB
Go
157 lines
4.7 KiB
Go
/**
|
|
# Copyright (c) NVIDIA CORPORATION. All rights reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
**/
|
|
|
|
package generate
|
|
|
|
import (
|
|
"fmt"
|
|
"path/filepath"
|
|
"strings"
|
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/discover"
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/ldcache"
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/lookup"
|
|
"github.com/sirupsen/logrus"
|
|
"gitlab.com/nvidia/cloud-native/go-nvlib/pkg/nvml"
|
|
)
|
|
|
|
// NewDriverDiscoverer creates a discoverer for the libraries and binaries associated with a driver installation.
|
|
// The supplied NVML Library is used to query the expected driver version.
|
|
func NewDriverDiscoverer(logger *logrus.Logger, root string, nvidiaCTKPath string, nvmllib nvml.Interface) (discover.Discover, error) {
|
|
version, r := nvmllib.SystemGetDriverVersion()
|
|
if r != nvml.SUCCESS {
|
|
return nil, fmt.Errorf("failed to determine driver version: %v", r)
|
|
}
|
|
|
|
libraries, err := NewDriverLibraryDiscoverer(logger, root, nvidiaCTKPath, version)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to create discoverer for driver libraries: %v", err)
|
|
}
|
|
|
|
firmwares := NewDriverFirmwareDiscoverer(logger, root, version)
|
|
|
|
binaries := NewDriverBinariesDiscoverer(logger, root)
|
|
|
|
d := discover.Merge(
|
|
libraries,
|
|
firmwares,
|
|
binaries,
|
|
)
|
|
|
|
return d, nil
|
|
}
|
|
|
|
// NewDriverLibraryDiscoverer creates a discoverer for the libraries associated with the specified driver version.
|
|
func NewDriverLibraryDiscoverer(logger *logrus.Logger, root string, nvidiaCTKPath string, version string) (discover.Discover, error) {
|
|
libraryPaths, err := getVersionLibs(logger, root, version)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to get libraries for driver version: %v", err)
|
|
}
|
|
|
|
libraries := discover.NewMounts(
|
|
logger,
|
|
lookup.NewFileLocator(
|
|
lookup.WithLogger(logger),
|
|
lookup.WithRoot(root),
|
|
),
|
|
root,
|
|
libraryPaths,
|
|
)
|
|
|
|
cfg := &discover.Config{
|
|
Root: root,
|
|
NvidiaCTKPath: nvidiaCTKPath,
|
|
}
|
|
hooks, _ := discover.NewLDCacheUpdateHook(logger, libraries, cfg)
|
|
|
|
d := discover.Merge(
|
|
libraries,
|
|
hooks,
|
|
)
|
|
|
|
return d, nil
|
|
}
|
|
|
|
// NewDriverFirmwareDiscoverer creates a discoverer for GSP firmware associated with the specified driver version.
|
|
func NewDriverFirmwareDiscoverer(logger *logrus.Logger, root string, version string) discover.Discover {
|
|
gspFirmwarePath := filepath.Join("/lib/firmware/nvidia", version, "gsp.bin")
|
|
return discover.NewMounts(
|
|
logger,
|
|
lookup.NewFileLocator(
|
|
lookup.WithLogger(logger),
|
|
lookup.WithRoot(root),
|
|
),
|
|
root,
|
|
[]string{gspFirmwarePath},
|
|
)
|
|
}
|
|
|
|
// NewDriverBinariesDiscoverer creates a discoverer for GSP firmware associated with the GPU driver.
|
|
func NewDriverBinariesDiscoverer(logger *logrus.Logger, root string) discover.Discover {
|
|
return discover.NewMounts(
|
|
logger,
|
|
lookup.NewExecutableLocator(logger, root),
|
|
root,
|
|
[]string{
|
|
"nvidia-smi", /* System management interface */
|
|
"nvidia-debugdump", /* GPU coredump utility */
|
|
"nvidia-persistenced", /* Persistence mode utility */
|
|
"nvidia-cuda-mps-control", /* Multi process service CLI */
|
|
"nvidia-cuda-mps-server", /* Multi process service server */
|
|
},
|
|
)
|
|
}
|
|
|
|
// getVersionLibs checks the LDCache for libraries ending in the specified driver version.
|
|
// Although the ldcache at the specified root is queried, the paths are returned relative to this root.
|
|
// This allows the standard mount location logic to be used for resolving the mounts.
|
|
func getVersionLibs(logger *logrus.Logger, root string, version string) ([]string, error) {
|
|
logger.Infof("Using driver version %v", version)
|
|
|
|
cache, err := ldcache.New(logger, root)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to load ldcache: %v", err)
|
|
}
|
|
|
|
libs32, libs64 := cache.List()
|
|
|
|
var libs []string
|
|
for _, l := range libs64 {
|
|
if strings.HasSuffix(l, version) {
|
|
logger.Infof("found 64-bit driver lib: %v", l)
|
|
libs = append(libs, l)
|
|
}
|
|
}
|
|
|
|
for _, l := range libs32 {
|
|
if strings.HasSuffix(l, version) {
|
|
logger.Infof("found 32-bit driver lib: %v", l)
|
|
libs = append(libs, l)
|
|
}
|
|
}
|
|
|
|
if root == "/" || root == "" {
|
|
return libs, nil
|
|
}
|
|
|
|
var relative []string
|
|
for _, l := range libs {
|
|
relative = append(relative, strings.TrimPrefix(l, root))
|
|
}
|
|
|
|
return relative, nil
|
|
}
|