// Copyright 2017 Intel Corporation. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. package main import ( "flag" "fmt" "io/ioutil" "os" "path" "regexp" "strings" "time" "github.com/pkg/errors" "k8s.io/klog" pluginapi "k8s.io/kubelet/pkg/apis/deviceplugin/v1beta1" dpapi "github.com/intel/intel-device-plugins-for-kubernetes/pkg/deviceplugin" ) const ( sysfsDrmDirectory = "/sys/class/drm" devfsDriDirectory = "/dev/dri" gpuDeviceRE = `^card[0-9]+$` controlDeviceRE = `^controlD[0-9]+$` vendorString = "0x8086" // Device plugin settings. namespace = "gpu.intel.com" deviceType = "i915" // Period of device scans. scanPeriod = 5 * time.Second ) type devicePlugin struct { sysfsDir string devfsDir string sharedDevNum int gpuDeviceReg *regexp.Regexp controlDeviceReg *regexp.Regexp scanTicker *time.Ticker scanDone chan bool } func newDevicePlugin(sysfsDir, devfsDir string, sharedDevNum int) *devicePlugin { return &devicePlugin{ sysfsDir: sysfsDir, devfsDir: devfsDir, sharedDevNum: sharedDevNum, gpuDeviceReg: regexp.MustCompile(gpuDeviceRE), controlDeviceReg: regexp.MustCompile(controlDeviceRE), scanTicker: time.NewTicker(scanPeriod), scanDone: make(chan bool, 1), // buffered as we may send to it before Scan starts receiving from it } } func (dp *devicePlugin) Scan(notifier dpapi.Notifier) error { defer dp.scanTicker.Stop() var previouslyFound int = -1 for { devTree, err := dp.scan() if err != nil { klog.Warning("Failed to scan: ", err) } found := len(devTree) if found != previouslyFound { klog.V(1).Info("GPU scan update: devices found: ", found) previouslyFound = found } notifier.Notify(devTree) select { case <-dp.scanDone: return nil case <-dp.scanTicker.C: } } } func (dp *devicePlugin) scan() (dpapi.DeviceTree, error) { files, err := ioutil.ReadDir(dp.sysfsDir) if err != nil { return nil, errors.Wrap(err, "Can't read sysfs folder") } devTree := dpapi.NewDeviceTree() for _, f := range files { var nodes []pluginapi.DeviceSpec if !dp.gpuDeviceReg.MatchString(f.Name()) { klog.V(4).Info("Not compatible device", f.Name()) continue } dat, err := ioutil.ReadFile(path.Join(dp.sysfsDir, f.Name(), "device/vendor")) if err != nil { klog.Warning("Skipping. Can't read vendor file: ", err) continue } if strings.TrimSpace(string(dat)) != vendorString { klog.V(4).Info("Non-Intel GPU", f.Name()) continue } drmFiles, err := ioutil.ReadDir(path.Join(dp.sysfsDir, f.Name(), "device/drm")) if err != nil { return nil, errors.Wrap(err, "Can't read device folder") } for _, drmFile := range drmFiles { if dp.controlDeviceReg.MatchString(drmFile.Name()) { //Skipping possible drm control node continue } devPath := path.Join(dp.devfsDir, drmFile.Name()) if _, err := os.Stat(devPath); err != nil { continue } klog.V(4).Infof("Adding %s to GPU %s", devPath, f.Name()) nodes = append(nodes, pluginapi.DeviceSpec{ HostPath: devPath, ContainerPath: devPath, Permissions: "rw", }) } if len(nodes) > 0 { for i := 0; i < dp.sharedDevNum; i++ { devID := fmt.Sprintf("%s-%d", f.Name(), i) // Currently only one device type (i915) is supported. // TODO: check model ID to differentiate device models. devTree.AddDevice(deviceType, devID, dpapi.NewDeviceInfo(pluginapi.Healthy, nodes, nil, nil)) } } } return devTree, nil } func main() { var sharedDevNum int flag.IntVar(&sharedDevNum, "shared-dev-num", 1, "number of containers sharing the same GPU device") flag.Parse() if sharedDevNum < 1 { klog.Warning("The number of containers sharing the same GPU must greater than zero") os.Exit(1) } klog.V(1).Info("GPU device plugin started") plugin := newDevicePlugin(sysfsDrmDirectory, devfsDriDirectory, sharedDevNum) manager := dpapi.NewManager(namespace, plugin) manager.Run() }