| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188 |
- // Copyright 2019 Yunion
- //
- // Licensed under the Apache License, Version 2.0 (the "License");
- // you may not use this file except in compliance with the License.
- // You may obtain a copy of the License at
- //
- // http://www.apache.org/licenses/LICENSE-2.0
- //
- // Unless required by applicable law or agreed to in writing, software
- // distributed under the License is distributed on an "AS IS" BASIS,
- // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- // See the License for the specific language governing permissions and
- // limitations under the License.
- package predicates
- import (
- "context"
- "fmt"
- "yunion.io/x/onecloud/pkg/apis/compute"
- "yunion.io/x/onecloud/pkg/scheduler/core"
- )
- // IsolatedDevicePredicate check mode, and number of scheduled
- // device configurations and current resources.
- type IsolatedDevicePredicate struct {
- BasePredicate
- }
- func (f *IsolatedDevicePredicate) Name() string {
- return "host_isolated_device"
- }
- func (f *IsolatedDevicePredicate) Clone() core.FitPredicate {
- return &IsolatedDevicePredicate{}
- }
- func (f *IsolatedDevicePredicate) PreExecute(ctx context.Context, u *core.Unit, cs []core.Candidater) (bool, error) {
- data := u.SchedData()
- if data.ResetCpuNumaPin {
- return false, nil
- }
- if len(data.IsolatedDevices) > 0 {
- return true, nil
- }
- networks := data.Networks
- for i := 0; i < len(networks); i++ {
- if networks[i].SriovDevice != nil {
- return true, nil
- }
- }
- disks := data.Disks
- for i := 0; i < len(disks); i++ {
- if disks[i].NVMEDevice != nil {
- return true, nil
- }
- }
- return false, nil
- }
- func (f *IsolatedDevicePredicate) getIsolatedDeviceCountByType(getter core.CandidatePropertyGetter, devType string) int {
- devs := getter.UnusedIsolatedDevicesByType(devType)
- if devType != compute.CONTAINER_DEV_NVIDIA_MPS && devType != compute.CONTAINER_DEV_NVIDIA_GPU_SHARE {
- return len(devs)
- } else {
- devMap := map[string]struct{}{}
- for _, dev := range devs {
- devMap[dev.DevicePath] = struct{}{}
- }
- return len(devMap)
- }
- }
- func (f *IsolatedDevicePredicate) Execute(ctx context.Context, u *core.Unit, c core.Candidater) (bool, []core.PredicateFailureReason, error) {
- h := NewPredicateHelper(f, u, c)
- reqIsoDevs := u.SchedData().IsolatedDevices
- if reqIsoDevs == nil {
- reqIsoDevs = []*compute.IsolatedDeviceConfig{}
- }
- networks := u.SchedData().Networks
- for i := 0; i < len(networks); i++ {
- if networks[i].SriovDevice != nil {
- reqIsoDevs = append(reqIsoDevs, networks[i].SriovDevice)
- }
- }
- disks := u.SchedData().Disks
- for i := 0; i < len(disks); i++ {
- if disks[i].NVMEDevice != nil {
- reqIsoDevs = append(reqIsoDevs, disks[i].NVMEDevice)
- }
- }
- getter := c.Getter()
- minCapacity := int64(0xFFFFFFFF)
- // check by specify device id
- for _, dev := range reqIsoDevs {
- if len(dev.Id) == 0 {
- continue
- }
- if fDev := getter.GetIsolatedDevice(dev.Id); fDev != nil {
- if len(fDev.GuestID) != 0 {
- h.Exclude(fmt.Sprintf("IsolatedDevice %q already used by guest %q", dev.Id, fDev.GuestID))
- return h.GetResult()
- }
- } else {
- h.Exclude(fmt.Sprintf("Not found IsolatedDevice %q", dev.Id))
- return h.GetResult()
- }
- minCapacity = 1
- }
- reqCount := len(reqIsoDevs)
- freeCount := len(getter.UnusedIsolatedDevices()) - getter.GetPendingUsage().IsolatedDevice
- totalCount := len(getter.GetIsolatedDevices())
- // check host isolated device count
- if freeCount < reqCount {
- h.AppendInsufficientResourceError(int64(reqCount), int64(totalCount), int64(freeCount))
- h.Exclude(fmt.Sprintf(
- "IsolatedDevice count not enough, request: %d, hostTotal: %d, hostFree: %d",
- reqCount, totalCount, freeCount))
- return h.GetResult()
- }
- // check host device by type
- devTypeRequest := make(map[string]int, 0)
- for _, dev := range reqIsoDevs {
- if len(dev.DevType) != 0 {
- devTypeRequest[dev.DevType] += 1
- }
- }
- for devType, reqCount := range devTypeRequest {
- freeCount := f.getIsolatedDeviceCountByType(getter, devType)
- if freeCount < reqCount {
- h.Exclude(fmt.Sprintf("IsolatedDevice type %q not enough, request: %d, hostFree: %d", devType, reqCount, freeCount))
- return h.GetResult()
- }
- cap := freeCount / reqCount
- if int64(cap) < minCapacity {
- minCapacity = int64(cap)
- }
- }
- // check host device by model
- devVendorModelRequest := make(map[string]int, 0)
- for _, dev := range reqIsoDevs {
- if len(dev.Model) != 0 {
- devVendorModelRequest[fmt.Sprintf("%s:%s", dev.Vendor, dev.Model)] += 1
- }
- }
- for vendorModel, reqCount := range devVendorModelRequest {
- freeCount := len(getter.UnusedIsolatedDevicesByVendorModel(vendorModel))
- if freeCount < reqCount {
- h.Exclude(fmt.Sprintf("IsolatedDevice vendor:model %q not enough, request: %d, hostFree: %d", vendorModel, reqCount, freeCount))
- return h.GetResult()
- }
- cap := freeCount / reqCount
- if int64(cap) < minCapacity {
- minCapacity = int64(cap)
- }
- }
- // check host device by device_path
- devicePathReq := make(map[string]int, 0)
- for _, dev := range reqIsoDevs {
- if len(dev.DevicePath) != 0 {
- devicePathReq[dev.DevicePath] += 1
- }
- }
- for devPath, reqCnt := range devicePathReq {
- freeCount := len(getter.UnusedIsolatedDevicesByDevicePath(devPath))
- if freeCount < reqCount {
- h.Exclude(fmt.Sprintf("IsolatedDevice device_path %q not enough, request: %d, hostFree: %d", devPath, reqCount, freeCount))
- return h.GetResult()
- }
- cap := freeCount / reqCnt
- if int64(cap) < minCapacity {
- minCapacity = int64(cap)
- }
- }
- h.SetCapacity(minCapacity)
- return h.GetResult()
- }
|