2022-07-20 08:52:43 +00:00
/ * *
# Copyright ( c ) 2022 , NVIDIA CORPORATION . All rights reserved .
#
# Licensed under the Apache License , Version 2.0 ( the "License" ) ;
# you may not use this file except in compliance with the License .
# You may obtain a copy of the License at
#
# http : //www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing , software
# distributed under the License is distributed on an "AS IS" BASIS ,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND , either express or implied .
# See the License for the specific language governing permissions and
# limitations under the License .
* * /
package discover
import (
"fmt"
2022-09-29 12:47:04 +00:00
"os"
"path/filepath"
2023-03-07 19:57:24 +00:00
"strings"
2022-07-20 08:52:43 +00:00
2022-09-29 12:47:04 +00:00
"github.com/NVIDIA/nvidia-container-toolkit/internal/config/image"
"github.com/NVIDIA/nvidia-container-toolkit/internal/info/drm"
"github.com/NVIDIA/nvidia-container-toolkit/internal/info/proc"
2023-03-22 12:27:43 +00:00
"github.com/NVIDIA/nvidia-container-toolkit/internal/logger"
2022-07-20 08:52:43 +00:00
"github.com/NVIDIA/nvidia-container-toolkit/internal/lookup"
2023-03-07 19:57:24 +00:00
"github.com/NVIDIA/nvidia-container-toolkit/internal/lookup/cuda"
2023-11-21 15:08:16 +00:00
"github.com/NVIDIA/nvidia-container-toolkit/internal/lookup/root"
2022-07-20 08:52:43 +00:00
)
2024-01-23 00:48:11 +00:00
// NewDRMNodesDiscoverer returns a discoverer for the DRM device nodes associated with the specified visible devices.
2023-11-20 21:32:46 +00:00
//
// TODO: The logic for creating DRM devices should be consolidated between this
// and the logic for generating CDI specs for a single device. This is only used
// when applying OCI spec modifications to an incoming spec in "legacy" mode.
func NewDRMNodesDiscoverer ( logger logger . Interface , devices image . VisibleDevices , devRoot string , nvidiaCTKPath string ) ( Discover , error ) {
2023-11-14 15:57:37 +00:00
drmDeviceNodes , err := newDRMDeviceDiscoverer ( logger , devices , devRoot )
2022-11-23 15:26:30 +00:00
if err != nil {
return nil , fmt . Errorf ( "failed to create DRM device discoverer: %v" , err )
}
2023-11-14 15:57:37 +00:00
drmByPathSymlinks := newCreateDRMByPathSymlinks ( logger , drmDeviceNodes , devRoot , nvidiaCTKPath )
2022-11-23 15:26:30 +00:00
2023-11-20 21:32:46 +00:00
discover := Merge ( drmDeviceNodes , drmByPathSymlinks )
2022-11-23 15:26:30 +00:00
return discover , nil
}
// NewGraphicsMountsDiscoverer creates a discoverer for the mounts required by graphics tools such as vulkan.
2023-11-21 15:08:16 +00:00
func NewGraphicsMountsDiscoverer ( logger logger . Interface , driver * root . Driver , nvidiaCTKPath string ) ( Discover , error ) {
2022-07-20 08:52:43 +00:00
libraries := NewMounts (
logger ,
2023-11-21 15:08:16 +00:00
driver . Libraries ( ) ,
driver . Root ,
2022-07-20 08:52:43 +00:00
[ ] string {
2023-11-22 18:50:03 +00:00
"libnvidia-egl-gbm.so.*" ,
2024-05-10 14:12:49 +00:00
"gbm/nvidia-drm_gbm.so" ,
"libnvidia-egl-wayland.so.*" ,
"libnvidia-vulkan-producer.so*" ,
2022-07-20 08:52:43 +00:00
} ,
)
jsonMounts := NewMounts (
logger ,
2023-11-22 20:57:03 +00:00
driver . Configs ( ) ,
2023-11-21 15:08:16 +00:00
driver . Root ,
2022-07-20 08:52:43 +00:00
[ ] string {
2022-11-25 13:19:59 +00:00
"glvnd/egl_vendor.d/10_nvidia.json" ,
"vulkan/icd.d/nvidia_icd.json" ,
2023-11-22 12:48:58 +00:00
"vulkan/icd.d/nvidia_layers.json" ,
2022-11-25 13:19:59 +00:00
"vulkan/implicit_layer.d/nvidia_layers.json" ,
"egl/egl_external_platform.d/15_nvidia_gbm.json" ,
"egl/egl_external_platform.d/10_nvidia_wayland.json" ,
2023-11-22 12:48:11 +00:00
"nvidia/nvoptix.bin" ,
2022-07-20 08:52:43 +00:00
} ,
)
2023-11-21 15:08:16 +00:00
xorg := optionalXorgDiscoverer ( logger , driver , nvidiaCTKPath )
2023-05-10 14:53:10 +00:00
2022-07-20 08:52:43 +00:00
discover := Merge (
libraries ,
jsonMounts ,
2023-05-10 14:53:10 +00:00
xorg ,
2022-07-20 08:52:43 +00:00
)
return discover , nil
}
2022-09-29 12:47:04 +00:00
type drmDevicesByPath struct {
None
2023-03-22 12:27:43 +00:00
logger logger . Interface
2023-01-18 10:43:05 +00:00
nvidiaCTKPath string
2023-11-14 15:57:37 +00:00
devRoot string
2023-01-18 10:43:05 +00:00
devicesFrom Discover
2022-09-29 12:47:04 +00:00
}
// newCreateDRMByPathSymlinks creates a discoverer for a hook to create the by-path symlinks for DRM devices discovered by the specified devices discoverer
2023-11-14 15:57:37 +00:00
func newCreateDRMByPathSymlinks ( logger logger . Interface , devices Discover , devRoot string , nvidiaCTKPath string ) Discover {
2022-09-29 12:47:04 +00:00
d := drmDevicesByPath {
2023-01-18 10:43:05 +00:00
logger : logger ,
2023-05-10 12:49:59 +00:00
nvidiaCTKPath : nvidiaCTKPath ,
2023-11-14 15:57:37 +00:00
devRoot : devRoot ,
2023-01-18 10:43:05 +00:00
devicesFrom : devices ,
2022-09-29 12:47:04 +00:00
}
return & d
}
// Hooks returns a hook to create the symlinks from the required CSV files
func ( d drmDevicesByPath ) Hooks ( ) ( [ ] Hook , error ) {
devices , err := d . devicesFrom . Devices ( )
if err != nil {
return nil , fmt . Errorf ( "failed to discover devices for by-path symlinks: %v" , err )
}
if len ( devices ) == 0 {
return nil , nil
}
2022-11-23 20:49:02 +00:00
links , err := d . getSpecificLinkArgs ( devices )
if err != nil {
return nil , fmt . Errorf ( "failed to determine specific links: %v" , err )
}
if len ( links ) == 0 {
return nil , nil
}
2022-09-29 12:47:04 +00:00
2023-01-19 09:37:10 +00:00
var args [ ] string
2022-09-29 12:47:04 +00:00
for _ , l := range links {
args = append ( args , "--link" , l )
}
2023-01-19 09:37:10 +00:00
hook := CreateNvidiaCTKHook (
d . nvidiaCTKPath ,
"create-symlinks" ,
args ... ,
)
2022-09-29 12:47:04 +00:00
2023-01-19 09:37:10 +00:00
return [ ] Hook { hook } , nil
2022-09-29 12:47:04 +00:00
}
2024-01-23 00:48:11 +00:00
// getSpecificLinkArgs returns the required specific links that need to be created
2022-09-29 12:47:04 +00:00
func ( d drmDevicesByPath ) getSpecificLinkArgs ( devices [ ] Device ) ( [ ] string , error ) {
selectedDevices := make ( map [ string ] bool )
for _ , d := range devices {
selectedDevices [ filepath . Base ( d . HostPath ) ] = true
}
2022-12-02 10:38:40 +00:00
linkLocator := lookup . NewFileLocator (
lookup . WithLogger ( d . logger ) ,
2023-11-14 15:57:37 +00:00
lookup . WithRoot ( d . devRoot ) ,
2022-12-02 10:38:40 +00:00
)
2022-09-29 12:47:04 +00:00
candidates , err := linkLocator . Locate ( "/dev/dri/by-path/pci-*-*" )
if err != nil {
2022-11-23 20:49:02 +00:00
d . logger . Warningf ( "Failed to locate by-path links: %v; ignoring" , err )
return nil , nil
2022-09-29 12:47:04 +00:00
}
var links [ ] string
for _ , c := range candidates {
device , err := os . Readlink ( c )
if err != nil {
d . logger . Warningf ( "Failed to evaluate symlink %v; ignoring" , c )
continue
}
if selectedDevices [ filepath . Base ( device ) ] {
d . logger . Debugf ( "adding device symlink %v -> %v" , c , device )
links = append ( links , fmt . Sprintf ( "%v::%v" , device , c ) )
}
}
return links , nil
}
// newDRMDeviceDiscoverer creates a discoverer for the DRM devices associated with the requested devices.
2023-11-14 15:57:37 +00:00
func newDRMDeviceDiscoverer ( logger logger . Interface , devices image . VisibleDevices , devRoot string ) ( Discover , error ) {
2023-11-20 14:03:36 +00:00
allDevices := NewCharDeviceDiscoverer (
2022-09-29 12:47:04 +00:00
logger ,
2023-11-14 15:57:37 +00:00
devRoot ,
2022-09-29 12:47:04 +00:00
[ ] string {
"/dev/dri/card*" ,
"/dev/dri/renderD*" ,
} ,
)
2024-01-23 00:48:11 +00:00
filter , err := newDRMDeviceFilter ( devices , devRoot )
2022-09-29 12:47:04 +00:00
if err != nil {
return nil , fmt . Errorf ( "failed to construct DRM device filter: %v" , err )
}
// We return a discoverer that applies the DRM device filter created above to all discovered DRM device nodes.
2024-01-23 00:48:11 +00:00
d := newFilteredDiscoverer (
2022-09-29 12:47:04 +00:00
logger ,
allDevices ,
filter ,
)
return d , err
}
// newDRMDeviceFilter creates a filter that matches DRM devices nodes for the visible devices.
2024-01-23 00:48:11 +00:00
func newDRMDeviceFilter ( devices image . VisibleDevices , devRoot string ) ( Filter , error ) {
2023-11-14 15:57:37 +00:00
gpuInformationPaths , err := proc . GetInformationFilePaths ( devRoot )
2022-09-29 12:47:04 +00:00
if err != nil {
return nil , fmt . Errorf ( "failed to read GPU information: %v" , err )
}
var selectedBusIds [ ] string
for _ , f := range gpuInformationPaths {
info , err := proc . ParseGPUInformationFile ( f )
if err != nil {
return nil , fmt . Errorf ( "failed to parse %v: %v" , f , err )
}
uuid := info [ proc . GPUInfoGPUUUID ]
busID := info [ proc . GPUInfoBusLocation ]
minor := info [ proc . GPUInfoDeviceMinor ]
if devices . Has ( minor ) || devices . Has ( uuid ) || devices . Has ( busID ) {
selectedBusIds = append ( selectedBusIds , busID )
}
}
filter := make ( selectDeviceByPath )
for _ , busID := range selectedBusIds {
drmDeviceNodes , err := drm . GetDeviceNodesByBusID ( busID )
if err != nil {
return nil , fmt . Errorf ( "failed to determine DRM devices for %v: %v" , busID , err )
}
for _ , drmDeviceNode := range drmDeviceNodes {
2023-08-25 14:55:04 +00:00
filter [ drmDeviceNode ] = true
2022-09-29 12:47:04 +00:00
}
}
return filter , nil
}
2023-03-07 19:57:24 +00:00
type xorgHooks struct {
libraries Discover
driverVersion string
nvidiaCTKPath string
}
var _ Discover = ( * xorgHooks ) ( nil )
2023-04-13 12:21:57 +00:00
// optionalXorgDiscoverer creates a discoverer for Xorg libraries.
// If the creation of the discoverer fails, a None discoverer is returned.
2023-11-21 15:08:16 +00:00
func optionalXorgDiscoverer ( logger logger . Interface , driver * root . Driver , nvidiaCTKPath string ) Discover {
xorg , err := newXorgDiscoverer ( logger , driver , nvidiaCTKPath )
2023-04-13 12:21:57 +00:00
if err != nil {
2023-06-06 19:46:38 +00:00
logger . Warningf ( "Failed to create Xorg discoverer: %v; skipping xorg libraries" , err )
2023-04-13 12:21:57 +00:00
return None { }
}
return xorg
}
2023-11-21 15:08:16 +00:00
func newXorgDiscoverer ( logger logger . Interface , driver * root . Driver , nvidiaCTKPath string ) ( Discover , error ) {
2023-03-07 19:57:24 +00:00
libCudaPaths , err := cuda . New (
2023-11-21 15:08:16 +00:00
driver . Libraries ( ) ,
2023-05-22 11:53:19 +00:00
) . Locate ( ".*.*" )
2023-03-07 19:57:24 +00:00
if err != nil {
return nil , fmt . Errorf ( "failed to locate libcuda.so: %v" , err )
}
libcudaPath := libCudaPaths [ 0 ]
version := strings . TrimPrefix ( filepath . Base ( libcudaPath ) , "libcuda.so." )
if version == "" {
return nil , fmt . Errorf ( "failed to determine libcuda.so version from path: %q" , libcudaPath )
}
libRoot := filepath . Dir ( libcudaPath )
xorgLibs := NewMounts (
logger ,
lookup . NewFileLocator (
lookup . WithLogger ( logger ) ,
2023-11-21 15:08:16 +00:00
lookup . WithRoot ( driver . Root ) ,
2024-05-10 14:12:49 +00:00
lookup . WithSearchPaths ( [ ] string {
libRoot + "/nvidia/xorg" ,
libRoot + "/xorg/modules/extensions" ,
libRoot + "/xorg/modules/drivers" ,
"/usr/lib/xorg/modules/extensions" ,
"/usr/lib/xorg/modules/drivers" ,
"/usr/X11R6/modules/extensions" ,
"/usr/X11R6/modules/drivers" ,
"/usr/lib64/xorg/modules/extensions" ,
"/usr/lib64/xorg/modules/drivers" ,
} ) ,
2023-03-07 19:57:24 +00:00
lookup . WithCount ( 1 ) ,
) ,
2023-11-21 15:08:16 +00:00
driver . Root ,
2023-03-07 19:57:24 +00:00
[ ] string {
2024-05-10 14:12:49 +00:00
"nvidia_drv.so" ,
fmt . Sprintf ( "libglxserver_nvidia.so.%s" , version ) ,
2023-03-07 19:57:24 +00:00
} ,
)
xorgHooks := xorgHooks {
libraries : xorgLibs ,
driverVersion : version ,
2023-05-10 12:49:59 +00:00
nvidiaCTKPath : nvidiaCTKPath ,
2023-03-07 19:57:24 +00:00
}
2024-01-23 00:48:11 +00:00
xorgConfig := NewMounts (
2023-03-07 19:57:24 +00:00
logger ,
2023-11-22 20:57:03 +00:00
driver . Configs ( ) ,
2023-11-21 15:08:16 +00:00
driver . Root ,
2024-05-10 14:12:49 +00:00
[ ] string {
"X11/xorg.conf.d/10-nvidia.conf" ,
"X11/xorg.conf.d/nvidia-drm-outputclass.conf" ,
} ,
2023-03-07 19:57:24 +00:00
)
d := Merge (
xorgLibs ,
2024-01-23 00:48:11 +00:00
xorgConfig ,
2023-03-07 19:57:24 +00:00
xorgHooks ,
)
return d , nil
}
// Devices returns no devices for Xorg
func ( m xorgHooks ) Devices ( ) ( [ ] Device , error ) {
return nil , nil
}
// Hooks returns a hook to create symlinks for Xorg libraries
func ( m xorgHooks ) Hooks ( ) ( [ ] Hook , error ) {
mounts , err := m . libraries . Mounts ( )
if err != nil {
return nil , fmt . Errorf ( "failed to get mounts: %v" , err )
}
if len ( mounts ) == 0 {
return nil , nil
}
var target string
for _ , mount := range mounts {
filename := filepath . Base ( mount . HostPath )
if filename == "libglxserver_nvidia.so." + m . driverVersion {
target = mount . Path
}
}
if target == "" {
return nil , nil
}
link := strings . TrimSuffix ( target , "." + m . driverVersion )
links := [ ] string { fmt . Sprintf ( "%s::%s" , filepath . Base ( target ) , link ) }
symlinkHook := CreateCreateSymlinkHook (
m . nvidiaCTKPath ,
links ,
)
return symlinkHook . Hooks ( )
}
// Mounts returns the libraries required for Xorg
func ( m xorgHooks ) Mounts ( ) ( [ ] Mount , error ) {
return nil , nil
}
2022-09-29 12:47:04 +00:00
// selectDeviceByPath is a filter that allows devices to be selected by the path
type selectDeviceByPath map [ string ] bool
var _ Filter = ( * selectDeviceByPath ) ( nil )
// DeviceIsSelected determines whether the device's path has been selected
func ( s selectDeviceByPath ) DeviceIsSelected ( device Device ) bool {
return s [ device . Path ]
}
// MountIsSelected is always true
func ( s selectDeviceByPath ) MountIsSelected ( Mount ) bool {
return true
}
// HookIsSelected is always true
func ( s selectDeviceByPath ) HookIsSelected ( Hook ) bool {
return true
}