mirror of
https://github.com/NVIDIA/nvidia-container-toolkit
synced 2024-11-25 05:21:33 +00:00
155 lines
4.2 KiB
Go
155 lines
4.2 KiB
Go
|
/**
|
||
|
# Copyright (c) NVIDIA CORPORATIOm. All rights reserved.
|
||
|
#
|
||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
# you may not use this file except in compliance with the License.
|
||
|
# You may obtain a copy of the License at
|
||
|
#
|
||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||
|
#
|
||
|
# Unless required by applicable law or agreed to in writing, software
|
||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
# See the License for the specific language governing permissions and
|
||
|
# limitations under the License.
|
||
|
**/
|
||
|
|
||
|
package nvdevices
|
||
|
|
||
|
import (
|
||
|
"errors"
|
||
|
"fmt"
|
||
|
"os"
|
||
|
"path/filepath"
|
||
|
"strings"
|
||
|
|
||
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/info/proc/devices"
|
||
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/logger"
|
||
|
)
|
||
|
|
||
|
var errInvalidDeviceNode = errors.New("invalid device node")
|
||
|
|
||
|
// Interface provides a set of utilities for interacting with NVIDIA devices on the system.
|
||
|
type Interface struct {
|
||
|
devices.Devices
|
||
|
|
||
|
logger logger.Interface
|
||
|
|
||
|
dryRun bool
|
||
|
// devRoot is the root directory where device nodes are expected to exist.
|
||
|
devRoot string
|
||
|
|
||
|
mknoder
|
||
|
}
|
||
|
|
||
|
// New constructs a new Interface struct with the specified options.
|
||
|
func New(opts ...Option) (*Interface, error) {
|
||
|
i := &Interface{}
|
||
|
for _, opt := range opts {
|
||
|
opt(i)
|
||
|
}
|
||
|
|
||
|
if i.logger == nil {
|
||
|
i.logger = logger.New()
|
||
|
}
|
||
|
if i.devRoot == "" {
|
||
|
i.devRoot = "/"
|
||
|
}
|
||
|
if i.Devices == nil {
|
||
|
devices, err := devices.GetNVIDIADevices()
|
||
|
if err != nil {
|
||
|
return nil, fmt.Errorf("failed to create devices info: %v", err)
|
||
|
}
|
||
|
i.Devices = devices
|
||
|
}
|
||
|
|
||
|
if i.dryRun {
|
||
|
i.mknoder = &mknodLogger{i.logger}
|
||
|
} else {
|
||
|
i.mknoder = &mknodUnix{}
|
||
|
}
|
||
|
return i, nil
|
||
|
}
|
||
|
|
||
|
// CreateNVIDIAControlDevices creates the NVIDIA control device nodes at the configured devRoot.
|
||
|
func (m *Interface) CreateNVIDIAControlDevices() error {
|
||
|
controlNodes := []string{"nvidiactl", "nvidia-modeset", "nvidia-uvm", "nvidia-uvm-tools"}
|
||
|
for _, node := range controlNodes {
|
||
|
err := m.CreateNVIDIADevice(node)
|
||
|
if err != nil {
|
||
|
return fmt.Errorf("failed to create device node %s: %w", node, err)
|
||
|
}
|
||
|
}
|
||
|
return nil
|
||
|
}
|
||
|
|
||
|
// CreateNVIDIADevice creates the specified NVIDIA device node at the configured devRoot.
|
||
|
func (m *Interface) CreateNVIDIADevice(node string) error {
|
||
|
node = filepath.Base(node)
|
||
|
if !strings.HasPrefix(node, "nvidia") {
|
||
|
return fmt.Errorf("invalid device node %q: %w", node, errInvalidDeviceNode)
|
||
|
}
|
||
|
|
||
|
major, err := m.Major(node)
|
||
|
if err != nil {
|
||
|
return fmt.Errorf("failed to determine major: %w", err)
|
||
|
}
|
||
|
|
||
|
minor, err := m.Minor(node)
|
||
|
if err != nil {
|
||
|
return fmt.Errorf("failed to determine minor: %w", err)
|
||
|
}
|
||
|
|
||
|
return m.createDeviceNode(filepath.Join("dev", node), int(major), int(minor))
|
||
|
}
|
||
|
|
||
|
// createDeviceNode creates the specified device node with the require major and minor numbers.
|
||
|
// If a devRoot is configured, this is prepended to the path.
|
||
|
func (m *Interface) createDeviceNode(path string, major int, minor int) error {
|
||
|
path = filepath.Join(m.devRoot, path)
|
||
|
if _, err := os.Stat(path); err == nil {
|
||
|
m.logger.Infof("Skipping: %s already exists", path)
|
||
|
return nil
|
||
|
} else if !os.IsNotExist(err) {
|
||
|
return fmt.Errorf("failed to stat %s: %v", path, err)
|
||
|
}
|
||
|
|
||
|
return m.Mknode(path, major, minor)
|
||
|
}
|
||
|
|
||
|
// Major returns the major number for the specified NVIDIA device node.
|
||
|
// If the device node is not supported, an error is returned.
|
||
|
func (m *Interface) Major(node string) (int64, error) {
|
||
|
var valid bool
|
||
|
var major devices.Major
|
||
|
switch node {
|
||
|
case "nvidia-uvm", "nvidia-uvm-tools":
|
||
|
major, valid = m.Get(devices.NVIDIAUVM)
|
||
|
case "nvidia-modeset", "nvidiactl":
|
||
|
major, valid = m.Get(devices.NVIDIAGPU)
|
||
|
}
|
||
|
|
||
|
if valid {
|
||
|
return int64(major), nil
|
||
|
}
|
||
|
|
||
|
return 0, errInvalidDeviceNode
|
||
|
}
|
||
|
|
||
|
// Minor returns the minor number for the specified NVIDIA device node.
|
||
|
// If the device node is not supported, an error is returned.
|
||
|
func (m *Interface) Minor(node string) (int64, error) {
|
||
|
switch node {
|
||
|
case "nvidia-modeset":
|
||
|
return devices.NVIDIAModesetMinor, nil
|
||
|
case "nvidia-uvm-tools":
|
||
|
return devices.NVIDIAUVMToolsMinor, nil
|
||
|
case "nvidia-uvm":
|
||
|
return devices.NVIDIAUVMMinor, nil
|
||
|
case "nvidiactl":
|
||
|
return devices.NVIDIACTLMinor, nil
|
||
|
}
|
||
|
|
||
|
return 0, errInvalidDeviceNode
|
||
|
}
|