mirror of
https://github.com/intel/intel-device-plugins-for-kubernetes.git
synced 2025-06-03 03:59:37 +00:00

The plugin sets the container annotation com.intel.fpga.mode to intel.com/fpga-region in region mode. This should make it possible to configure CRI-O to run reprogramming hooks only when the annotation is set.
198 lines
6.0 KiB
Go
198 lines
6.0 KiB
Go
// Copyright 2017 Intel Corporation. All Rights Reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package main
|
|
|
|
import (
|
|
"flag"
|
|
"fmt"
|
|
"os"
|
|
|
|
"github.com/golang/glog"
|
|
"golang.org/x/net/context"
|
|
|
|
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
|
|
"k8s.io/client-go/kubernetes"
|
|
"k8s.io/client-go/rest"
|
|
"k8s.io/client-go/tools/clientcmd"
|
|
pluginapi "k8s.io/kubernetes/pkg/kubelet/apis/deviceplugin/v1beta1"
|
|
utilnode "k8s.io/kubernetes/pkg/util/node"
|
|
|
|
"github.com/intel/intel-device-plugins-for-kubernetes/cmd/fpga_plugin/devicecache"
|
|
"github.com/intel/intel-device-plugins-for-kubernetes/internal/deviceplugin"
|
|
)
|
|
|
|
// Filesystem roots handed to devicecache.NewCache in main.
const (
	sysfsDirectory = "/sys/class/fpga"
	devfsDirectory = "/dev"
)

// Device plugin settings.
const (
	// pluginEndpointPrefix is joined with "-<fpgaID>" in handleUpdate to form
	// the plugin prefix passed to the device manager's start function.
	pluginEndpointPrefix = "intel-fpga"

	// resourceNamePrefix is joined with "-<fpgaID>" to form the resource name
	// and with "-<mode>" to form the annotation value set in Allocate.
	resourceNamePrefix = "intel.com/fpga"

	// annotationName is the container annotation key set in Allocate when the
	// plugin runs in region mode.
	annotationName = "com.intel.fpga.mode"
)
|
|
|
|
// deviceManager manages Intel FPGA devices.
|
|
type deviceManager struct {
|
|
srv deviceplugin.Server
|
|
fpgaID string
|
|
name string
|
|
mode string
|
|
ch chan map[string]deviceplugin.DeviceInfo
|
|
devices map[string]deviceplugin.DeviceInfo
|
|
}
|
|
|
|
func newDeviceManager(resourceName string, fpgaID string, mode string, ch chan map[string]deviceplugin.DeviceInfo) *deviceManager {
|
|
return &deviceManager{
|
|
fpgaID: fpgaID,
|
|
name: resourceName,
|
|
mode: mode,
|
|
ch: ch,
|
|
devices: make(map[string]deviceplugin.DeviceInfo),
|
|
}
|
|
}
|
|
|
|
func (dm *deviceManager) GetDevicePluginOptions(ctx context.Context, empty *pluginapi.Empty) (*pluginapi.DevicePluginOptions, error) {
|
|
fmt.Println("GetDevicePluginOptions: return empty options")
|
|
return new(pluginapi.DevicePluginOptions), nil
|
|
}
|
|
|
|
// ListAndWatch returns a list of devices
|
|
// Whenever a device state change or a device disappears, ListAndWatch returns the new list
|
|
func (dm *deviceManager) ListAndWatch(empty *pluginapi.Empty, stream pluginapi.DevicePlugin_ListAndWatchServer) error {
|
|
glog.V(2).Info("Started ListAndWatch for ", dm.fpgaID)
|
|
|
|
for dm.devices = range dm.ch {
|
|
resp := new(pluginapi.ListAndWatchResponse)
|
|
for id, device := range dm.devices {
|
|
resp.Devices = append(resp.Devices, &pluginapi.Device{id, device.State})
|
|
}
|
|
glog.V(2).Info("Sending to kubelet ", resp.Devices)
|
|
if err := stream.Send(resp); err != nil {
|
|
dm.srv.Stop()
|
|
return fmt.Errorf("device-plugin: cannot update device list: %v", err)
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func (dm *deviceManager) Allocate(ctx context.Context, rqt *pluginapi.AllocateRequest) (*pluginapi.AllocateResponse, error) {
|
|
response, err := deviceplugin.MakeAllocateResponse(rqt, dm.devices)
|
|
// Set container annotations when programming is allowed
|
|
if dm.mode == devicecache.RegionMode {
|
|
for _, containerResponse := range response.GetContainerResponses() {
|
|
containerResponse.Annotations = map[string]string{
|
|
annotationName: fmt.Sprintf("%s-%s", resourceNamePrefix, dm.mode),
|
|
}
|
|
}
|
|
}
|
|
return response, err
|
|
}
|
|
|
|
func (dm *deviceManager) PreStartContainer(ctx context.Context, rqt *pluginapi.PreStartContainerRequest) (*pluginapi.PreStartContainerResponse, error) {
|
|
glog.Warning("PreStartContainer() should not be called")
|
|
return new(pluginapi.PreStartContainerResponse), nil
|
|
}
|
|
|
|
func startDeviceManager(dm *deviceManager, pluginPrefix string) {
|
|
err := dm.srv.Serve(dm, dm.name, pluginPrefix)
|
|
if err != nil {
|
|
glog.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func handleUpdate(dms map[string]*deviceManager, updateInfo devicecache.UpdateInfo, start func(*deviceManager, string), mode string) {
|
|
glog.V(2).Info("Received dev updates: ", updateInfo)
|
|
for fpgaID, devices := range updateInfo.Added {
|
|
devCh := make(chan map[string]deviceplugin.DeviceInfo, 1)
|
|
resourceName := resourceNamePrefix + "-" + fpgaID
|
|
pPrefix := pluginEndpointPrefix + "-" + fpgaID
|
|
dms[fpgaID] = newDeviceManager(resourceName, fpgaID, mode, devCh)
|
|
go start(dms[fpgaID], pPrefix)
|
|
devCh <- devices
|
|
}
|
|
for fpgaID, devices := range updateInfo.Updated {
|
|
dms[fpgaID].ch <- devices
|
|
}
|
|
for fpgaID := range updateInfo.Removed {
|
|
dms[fpgaID].srv.Stop()
|
|
close(dms[fpgaID].ch)
|
|
delete(dms, fpgaID)
|
|
}
|
|
}
|
|
|
|
func main() {
|
|
var mode string
|
|
var kubeconfig string
|
|
var master string
|
|
var config *rest.Config
|
|
var err error
|
|
|
|
flag.StringVar(&kubeconfig, "kubeconfig", "", "absolute path to the kubeconfig file")
|
|
flag.StringVar(&master, "master", "", "master url")
|
|
flag.StringVar(&mode, "mode", string(devicecache.AfMode),
|
|
fmt.Sprintf("device plugin mode: '%s' (default), '%s' or '%s'", devicecache.AfMode, devicecache.RegionMode, devicecache.RegionDevelMode))
|
|
flag.Parse()
|
|
|
|
if kubeconfig == "" {
|
|
config, err = rest.InClusterConfig()
|
|
} else {
|
|
config, err = clientcmd.BuildConfigFromFlags(master, kubeconfig)
|
|
}
|
|
if err != nil {
|
|
glog.Fatal(err)
|
|
}
|
|
|
|
// if NODE_NAME is not set then try to use hostname
|
|
nodeName := utilnode.GetHostname(os.Getenv("NODE_NAME"))
|
|
|
|
clientset, err := kubernetes.NewForConfig(config)
|
|
if err != nil {
|
|
glog.Fatal(err)
|
|
}
|
|
|
|
node, err := clientset.CoreV1().Nodes().Get(nodeName, metav1.GetOptions{})
|
|
if err != nil {
|
|
glog.Fatal(err)
|
|
}
|
|
|
|
if nodeMode, ok := node.ObjectMeta.Annotations["fpga.intel.com/device-plugin-mode"]; ok {
|
|
glog.Info("Overriding mode to ", nodeMode)
|
|
mode = nodeMode
|
|
}
|
|
|
|
updatesCh := make(chan devicecache.UpdateInfo)
|
|
|
|
cache, err := devicecache.NewCache(sysfsDirectory, devfsDirectory, mode, updatesCh)
|
|
if err != nil {
|
|
glog.Error(err)
|
|
os.Exit(1)
|
|
}
|
|
|
|
glog.Info("FPGA device plugin started in ", mode, " mode")
|
|
|
|
go func() {
|
|
err := cache.Run()
|
|
if err != nil {
|
|
glog.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
dms := make(map[string]*deviceManager)
|
|
for updateInfo := range updatesCh {
|
|
handleUpdate(dms, updateInfo, startDeviceManager, mode)
|
|
}
|
|
}
|