2022-03-15 12:29:14 +00:00
|
|
|
/**
|
|
|
|
# Copyright (c) 2022, NVIDIA CORPORATION. All rights reserved.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
**/
|
|
|
|
|
|
|
|
package modifier
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
|
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/config"
|
2022-05-02 08:28:25 +00:00
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/config/image"
|
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/cuda"
|
2023-03-22 12:27:43 +00:00
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/logger"
|
2023-06-22 13:42:26 +00:00
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/modifier/cdi"
|
2022-03-15 12:29:14 +00:00
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/oci"
|
2023-06-22 13:49:27 +00:00
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/platform-support/tegra/csv"
|
2022-05-02 08:28:25 +00:00
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/internal/requirements"
|
2023-06-22 13:42:26 +00:00
|
|
|
"github.com/NVIDIA/nvidia-container-toolkit/pkg/nvcdi"
|
2022-03-15 12:29:14 +00:00
|
|
|
)
|
|
|
|
|
2022-05-09 13:42:59 +00:00
|
|
|
// NewCSVModifier creates a modifier that applies modications to an OCI spec if required by the runtime wrapper.
|
|
|
|
// The modifications are defined by CSV MountSpecs.
|
2024-10-14 13:06:06 +00:00
|
|
|
func NewCSVModifier(logger logger.Interface, cfg *config.Config, container image.CUDA) (oci.SpecModifier, error) {
|
|
|
|
if devices := container.VisibleDevicesFromEnvVar(); len(devices) == 0 {
|
2022-06-29 15:33:57 +00:00
|
|
|
logger.Infof("No modification required; no devices requested")
|
2022-02-25 08:54:04 +00:00
|
|
|
return nil, nil
|
|
|
|
}
|
2022-05-05 15:27:36 +00:00
|
|
|
logger.Infof("Constructing modifier from config: %+v", *cfg)
|
2022-03-15 12:29:14 +00:00
|
|
|
|
2024-10-14 13:06:06 +00:00
|
|
|
if err := checkRequirements(logger, container); err != nil {
|
2022-05-09 13:42:59 +00:00
|
|
|
return nil, fmt.Errorf("requirements not met: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
csvFiles, err := csv.GetFileList(cfg.NVIDIAContainerRuntimeConfig.Modes.CSV.MountSpecPath)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to get list of CSV files: %v", err)
|
|
|
|
}
|
|
|
|
|
2024-10-14 13:06:06 +00:00
|
|
|
if container.Getenv(image.EnvVarNvidiaRequireJetpack) != "csv-mounts=all" {
|
2022-05-09 13:42:59 +00:00
|
|
|
csvFiles = csv.BaseFilesOnly(csvFiles)
|
|
|
|
}
|
|
|
|
|
2023-06-22 13:42:26 +00:00
|
|
|
cdilib, err := nvcdi.New(
|
|
|
|
nvcdi.WithLogger(logger),
|
|
|
|
nvcdi.WithDriverRoot(cfg.NVIDIAContainerCLIConfig.Root),
|
2024-04-24 08:47:45 +00:00
|
|
|
nvcdi.WithNVIDIACDIHookPath(cfg.NVIDIACTKConfig.Path),
|
2023-06-22 13:42:26 +00:00
|
|
|
nvcdi.WithMode(nvcdi.ModeCSV),
|
|
|
|
nvcdi.WithCSVFiles(csvFiles),
|
2022-07-15 10:18:36 +00:00
|
|
|
)
|
2023-05-23 19:14:02 +00:00
|
|
|
if err != nil {
|
2023-06-22 13:42:26 +00:00
|
|
|
return nil, fmt.Errorf("failed to construct CDI library: %v", err)
|
2023-05-23 19:14:02 +00:00
|
|
|
}
|
2022-05-09 13:42:59 +00:00
|
|
|
|
2023-06-22 13:42:26 +00:00
|
|
|
spec, err := cdilib.GetSpec()
|
2022-03-15 12:29:14 +00:00
|
|
|
if err != nil {
|
2023-06-22 13:42:26 +00:00
|
|
|
return nil, fmt.Errorf("failed to get CDI spec: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
cdiModifier, err := cdi.New(
|
|
|
|
cdi.WithLogger(logger),
|
|
|
|
cdi.WithSpec(spec.Raw()),
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to construct CDI modifier: %v", err)
|
2022-03-15 12:29:14 +00:00
|
|
|
}
|
|
|
|
|
2022-06-15 12:12:17 +00:00
|
|
|
modifiers := Merge(
|
2022-06-02 15:10:31 +00:00
|
|
|
nvidiaContainerRuntimeHookRemover{logger},
|
2023-06-22 13:42:26 +00:00
|
|
|
cdiModifier,
|
2022-06-02 15:10:31 +00:00
|
|
|
)
|
2022-03-15 12:29:14 +00:00
|
|
|
|
2022-06-02 15:10:31 +00:00
|
|
|
return modifiers, nil
|
2022-03-15 12:29:14 +00:00
|
|
|
}
|
2022-04-06 12:30:49 +00:00
|
|
|
|
2023-03-22 12:27:43 +00:00
|
|
|
func checkRequirements(logger logger.Interface, image image.CUDA) error {
|
2022-05-02 08:28:25 +00:00
|
|
|
if image.HasDisableRequire() {
|
|
|
|
// TODO: We could print the real value here instead
|
|
|
|
logger.Debugf("NVIDIA_DISABLE_REQUIRE=%v; skipping requirement checks", true)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
imageRequirements, err := image.GetRequirements()
|
|
|
|
if err != nil {
|
|
|
|
// TODO: Should we treat this as a failure, or just issue a warning?
|
|
|
|
return fmt.Errorf("failed to get image requirements: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
r := requirements.New(logger, imageRequirements)
|
|
|
|
|
|
|
|
cudaVersion, err := cuda.Version()
|
|
|
|
if err != nil {
|
2023-06-06 19:46:38 +00:00
|
|
|
logger.Warningf("Failed to get CUDA version: %v", err)
|
2022-05-02 08:28:25 +00:00
|
|
|
} else {
|
|
|
|
r.AddVersionProperty(requirements.CUDA, cudaVersion)
|
|
|
|
}
|
|
|
|
|
2022-05-05 12:11:30 +00:00
|
|
|
compteCapability, err := cuda.ComputeCapability(0)
|
|
|
|
if err != nil {
|
2023-06-06 19:46:38 +00:00
|
|
|
logger.Warningf("Failed to get CUDA Compute Capability: %v", err)
|
2022-05-05 12:11:30 +00:00
|
|
|
} else {
|
|
|
|
r.AddVersionProperty(requirements.ARCH, compteCapability)
|
|
|
|
}
|
|
|
|
|
2022-05-02 08:28:25 +00:00
|
|
|
return r.Assert()
|
|
|
|
}
|