Skip to content

Commit

Permalink
Merge pull request #702 from luomingmeng/dev/refine-qrm-plugin-state
Browse files Browse the repository at this point in the history
Refactor the QRM plugin state
  • Loading branch information
luomingmeng authored Oct 11, 2024
2 parents f6623f4 + 8f8f24e commit 56ba904
Show file tree
Hide file tree
Showing 58 changed files with 4,596 additions and 4,326 deletions.
10 changes: 5 additions & 5 deletions cmd/katalyst-agent/app/options/qrm/cpu_plugin.go
Original file line number Diff line number Diff line change
Expand Up @@ -19,8 +19,8 @@ package qrm
import (
cliflag "k8s.io/component-base/cli/flag"

"github.com/kubewharf/katalyst-core/pkg/agent/qrm-plugins/commonstate"
cpuconsts "github.com/kubewharf/katalyst-core/pkg/agent/qrm-plugins/cpu/consts"
"github.com/kubewharf/katalyst-core/pkg/agent/qrm-plugins/cpu/dynamicpolicy/state"
qrmconfig "github.com/kubewharf/katalyst-core/pkg/config/agent/qrm"
)

Expand Down Expand Up @@ -60,10 +60,10 @@ func NewCPUOptions() *CPUOptions {
EnableCPUIdle: false,
CPUNUMAHintPreferPolicy: cpuconsts.CPUNUMAHintPreferPolicySpreading,
LoadPressureEvictionSkipPools: []string{
state.PoolNameReclaim,
state.PoolNameDedicated,
state.PoolNameFallback,
state.PoolNameReserve,
commonstate.PoolNameReclaim,
commonstate.PoolNameDedicated,
commonstate.PoolNameFallback,
commonstate.PoolNameReserve,
},
},
CPUNativePolicyOptions: CPUNativePolicyOptions{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -20,7 +20,7 @@ import (
"github.com/spf13/pflag"

"github.com/kubewharf/katalyst-core/cmd/katalyst-agent/app/options/util"
"github.com/kubewharf/katalyst-core/pkg/agent/qrm-plugins/cpu/dynamicpolicy/state"
"github.com/kubewharf/katalyst-core/pkg/agent/qrm-plugins/commonstate"
"github.com/kubewharf/katalyst-core/pkg/config/agent/sysadvisor/qosaware/resource/memory/plugins"
"github.com/kubewharf/katalyst-core/pkg/consts"
)
Expand Down Expand Up @@ -80,7 +80,7 @@ func NewNumaBalancerOptions() *NumaBalancerOptions {

BalancedReclaimedPodsSingleRoundTotalRSSThreshold: 3 * 1024 * 1024 * 1024,

SupportedPools: []string{state.PoolNameShare},
SupportedPools: []string{commonstate.PoolNameShare},
}
}

Expand Down
90 changes: 90 additions & 0 deletions pkg/agent/qrm-plugins/commonstate/pool.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,90 @@
/*
Copyright 2022 The Katalyst Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package commonstate

import (
"strings"

apiconsts "github.com/kubewharf/katalyst-api/pkg/consts"
)

// notice that pool-name may not have direct mapping relations with qos-level, for instance
// - both isolated_shared_cores and dedicated_cores fall into PoolNameDedicated
const (
PoolNameShare = "share"
PoolNameReclaim = "reclaim"
PoolNameDedicated = "dedicated"
PoolNameReserve = "reserve"
PoolNamePrefixIsolation = "isolation"
PoolNamePrefixSystem = "system"

EmptyOwnerPoolName = ""

// PoolNameFallback is not a real pool, and is a union of
// all none-reclaimed pools to put pod should have been isolated
PoolNameFallback = "fallback"
)

// FakedContainerName represents a placeholder since pool entry has no container-level
// FakedNUMAID represents a placeholder since pools like shared/reclaimed will not contain a specific numa
const (
FakedContainerName = ""
FakedNUMAID = -1
NameSeparator = "#"
NUMAPoolInfix = "-NUMA"
)

func IsIsolationPool(poolName string) bool {
return strings.HasPrefix(poolName, PoolNamePrefixIsolation)
}

func IsSystemPool(poolName string) bool {
return strings.HasPrefix(poolName, PoolNamePrefixSystem)
}

func GetPoolType(poolName string) string {
if IsIsolationPool(poolName) {
return PoolNamePrefixIsolation
} else if IsSystemPool(poolName) {
return PoolNamePrefixSystem
}
switch poolName {
case PoolNameReclaim, PoolNameDedicated, PoolNameReserve, PoolNameFallback:
return poolName
default:
return PoolNameShare
}
}

// GetSpecifiedPoolName todo: this function (along with pool-name consts) should be moved to generic qos conf
func GetSpecifiedPoolName(qosLevel, cpusetEnhancementValue string) string {
switch qosLevel {
case apiconsts.PodAnnotationQoSLevelSharedCores:
if cpusetEnhancementValue != EmptyOwnerPoolName {
return cpusetEnhancementValue
}
return PoolNameShare
case apiconsts.PodAnnotationQoSLevelSystemCores:
return cpusetEnhancementValue
case apiconsts.PodAnnotationQoSLevelReclaimedCores:
return PoolNameReclaim
case apiconsts.PodAnnotationQoSLevelDedicatedCores:
return PoolNameDedicated
default:
return EmptyOwnerPoolName
}
}
232 changes: 232 additions & 0 deletions pkg/agent/qrm-plugins/commonstate/state.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,232 @@
/*
Copyright 2022 The Katalyst Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package commonstate

import (
"fmt"

pluginapi "k8s.io/kubelet/pkg/apis/resourceplugin/v1alpha1"

"github.com/kubewharf/katalyst-api/pkg/consts"
cpuconsts "github.com/kubewharf/katalyst-core/pkg/agent/qrm-plugins/cpu/consts"
"github.com/kubewharf/katalyst-core/pkg/util/general"
"github.com/kubewharf/katalyst-core/pkg/util/machine"
)

type AllocationMeta struct {
PodUid string `json:"pod_uid,omitempty"`
PodNamespace string `json:"pod_namespace,omitempty"`
PodName string `json:"pod_name,omitempty"`
ContainerName string `json:"container_name,omitempty"`
ContainerType string `json:"container_type,omitempty"`
ContainerIndex uint64 `json:"container_index,omitempty"`
OwnerPoolName string `json:"owner_pool_name,omitempty"`
PodRole string `json:"pod_role,omitempty"`
PodType string `json:"pod_type,omitempty"`

Labels map[string]string `json:"labels"`
Annotations map[string]string `json:"annotations"`
QoSLevel string `json:"qosLevel"`
}

func (am *AllocationMeta) Clone() *AllocationMeta {
clone := &AllocationMeta{
PodUid: am.PodUid,
PodNamespace: am.PodNamespace,
PodName: am.PodName,
ContainerName: am.ContainerName,
ContainerType: am.ContainerType,
ContainerIndex: am.ContainerIndex,
OwnerPoolName: am.OwnerPoolName,
PodRole: am.PodRole,
PodType: am.PodType,
QoSLevel: am.QoSLevel,
Labels: general.DeepCopyMap(am.Labels),
Annotations: general.DeepCopyMap(am.Annotations),
}

return clone
}

// GetPoolName parses the owner pool name for AllocationInfo
// if owner exists, just return; otherwise, parse from qos-level
func (am *AllocationMeta) GetPoolName() string {
if am == nil {
return EmptyOwnerPoolName
}

if ownerPoolName := am.GetOwnerPoolName(); ownerPoolName != EmptyOwnerPoolName {
return ownerPoolName
}
return am.GetSpecifiedPoolName()
}

// GetOwnerPoolName parses the owner pool name for AllocationInfo
func (am *AllocationMeta) GetOwnerPoolName() string {
if am == nil {
return EmptyOwnerPoolName
}
return am.OwnerPoolName
}

// GetSpecifiedPoolName parses the owner pool name for AllocationInfo from qos-level
func (am *AllocationMeta) GetSpecifiedPoolName() string {
if am == nil {
return EmptyOwnerPoolName
}

return GetSpecifiedPoolName(am.QoSLevel, am.Annotations[consts.PodAnnotationCPUEnhancementCPUSet])
}

// GetSpecifiedNUMABindingPoolName get numa_binding pool name
// for numa_binding shared_cores according to enhancements and NUMA hint
func (am *AllocationMeta) GetSpecifiedNUMABindingPoolName() (string, error) {
if !am.CheckSharedNUMABinding() {
return EmptyOwnerPoolName, fmt.Errorf("GetSpecifiedNUMABindingPoolName only for numa_binding shared_cores")
}

numaSet, pErr := machine.Parse(am.Annotations[cpuconsts.CPUStateAnnotationKeyNUMAHint])
if pErr != nil {
return EmptyOwnerPoolName, fmt.Errorf("parse numaHintStr: %s failed with error: %v",
am.Annotations[cpuconsts.CPUStateAnnotationKeyNUMAHint], pErr)
} else if numaSet.Size() != 1 {
return EmptyOwnerPoolName, fmt.Errorf("parse numaHintStr: %s with invalid size", numaSet.String())
}

specifiedPoolName := am.GetSpecifiedPoolName()

if specifiedPoolName == EmptyOwnerPoolName {
return EmptyOwnerPoolName, fmt.Errorf("empty specifiedPoolName")
}

return GetNUMAPoolName(specifiedPoolName, numaSet.ToSliceNoSortUInt64()[0]), nil
}

func GetNUMAPoolName(candidateSpecifiedPoolName string, targetNUMANode uint64) string {
return fmt.Sprintf("%s%s%d", candidateSpecifiedPoolName, NUMAPoolInfix, targetNUMANode)
}

// CheckMainContainer returns true if the AllocationInfo is for main container
func (am *AllocationMeta) CheckMainContainer() bool {
if am == nil {
return false
}

return am.ContainerType == pluginapi.ContainerType_MAIN.String()
}

// CheckSideCar returns true if the AllocationInfo is for side-car container
func (am *AllocationMeta) CheckSideCar() bool {
if am == nil {
return false
}

return am.ContainerType == pluginapi.ContainerType_SIDECAR.String()
}

func (am *AllocationMeta) GetSpecifiedSystemPoolName() (string, error) {
if !am.CheckSystem() {
return EmptyOwnerPoolName, fmt.Errorf("GetSpecifiedSystemPoolName only for system_cores")
}

specifiedPoolName := am.GetSpecifiedPoolName()
if specifiedPoolName == EmptyOwnerPoolName {
return specifiedPoolName, nil
}

return fmt.Sprintf("%s%s%s", PoolNamePrefixSystem, "-", specifiedPoolName), nil
}

func (am *AllocationMeta) CheckSystem() bool {
if am == nil {
return false
}
return am.QoSLevel == consts.PodAnnotationQoSLevelSystemCores
}

// CheckDedicated returns true if the AllocationInfo is for pod with dedicated-qos
func (am *AllocationMeta) CheckDedicated() bool {
if am == nil {
return false
}
return am.QoSLevel == consts.PodAnnotationQoSLevelDedicatedCores
}

// CheckShared returns true if the AllocationInfo is for pod with shared-qos
func (am *AllocationMeta) CheckShared() bool {
if am == nil {
return false
}
return am.QoSLevel == consts.PodAnnotationQoSLevelSharedCores
}

// CheckReclaimed returns true if the AllocationInfo is for pod with reclaimed-qos
func (am *AllocationMeta) CheckReclaimed() bool {
if am == nil {
return false
}
return am.QoSLevel == consts.PodAnnotationQoSLevelReclaimedCores
}

// CheckNUMABinding returns true if the AllocationInfo is for pod with numa-binding enhancement
func (am *AllocationMeta) CheckNUMABinding() bool {
if am == nil {
return false
}
return am.Annotations[consts.PodAnnotationMemoryEnhancementNumaBinding] ==
consts.PodAnnotationMemoryEnhancementNumaBindingEnable
}

// CheckDedicatedNUMABinding returns true if the AllocationInfo is for pod with
// dedicated-qos and numa-binding enhancement
func (am *AllocationMeta) CheckDedicatedNUMABinding() bool {
return am.CheckDedicated() && am.CheckNUMABinding()
}

// CheckSharedNUMABinding returns true if the AllocationInfo is for pod with
// shared-qos and numa-binding enhancement
func (am *AllocationMeta) CheckSharedNUMABinding() bool {
return am.CheckShared() && am.CheckNUMABinding()
}

// CheckSharedOrDedicatedNUMABinding returns true if the AllocationInfo is for pod with
// shared-qos or dedicated-qos and numa-binding enhancement
func (am *AllocationMeta) CheckSharedOrDedicatedNUMABinding() bool {
if am == nil {
return false
}

return am.CheckSharedNUMABinding() || am.CheckDedicatedNUMABinding()
}

// CheckNumaExclusive returns true if the AllocationInfo is for pod with numa-exclusive enhancement
func (am *AllocationMeta) CheckNumaExclusive() bool {
if am == nil {
return false
}

return am.Annotations[consts.PodAnnotationMemoryEnhancementNumaExclusive] ==
consts.PodAnnotationMemoryEnhancementNumaExclusiveEnable
}

// CheckDedicatedPool returns true if the AllocationInfo is for a container in the dedicated pool
func (am *AllocationMeta) CheckDedicatedPool() bool {
if am == nil {
return false
}
return am.OwnerPoolName == PoolNameDedicated
}
Loading

0 comments on commit 56ba904

Please sign in to comment.