diff --git a/cluster-autoscaler/proposals/plugable-provider-grpc.md b/cluster-autoscaler/proposals/plugable-provider-grpc.md index 75d684482a69..66aca4767432 100644 --- a/cluster-autoscaler/proposals/plugable-provider-grpc.md +++ b/cluster-autoscaler/proposals/plugable-provider-grpc.md @@ -118,8 +118,6 @@ option go_package = "clusterautoscaler.cloudprovider"; service CloudProvider { // CloudProvider specific RPC functions - rpc Name(NameRequest) - returns (NameResponse) {} rpc NodeGroups(NodeGroupsRequest) returns (GetNameResponse) {} @@ -127,18 +125,15 @@ service CloudProvider { rpc NodeGroupForNode(NodeGroupForNodeRequest) returns (NodeGroupForNodeResponse) {} - rpc PricingNodePrice(PricingNodePriceRequest) + rpc PricingNodePrice(PricingNodePriceRequest) // Optional returns (PricingNodePriceResponse) {} - rpc PricingPodPrice(PricingPodPriceRequest) + rpc PricingPodPrice(PricingPodPriceRequest) // Optional returns (PricingPodPriceResponse) rpc NewNodeGroup(NewNodeGroupRequest) returns (NewNodeGroupResponse) {} - rpc GetResourceLimiter(GetResourceLimiterRequest) - returns (GetResourceLimiterResponse) {} - rpc GPULabel(GPULabelRequest) returns (GPULabelResponse) {} @@ -165,13 +160,7 @@ service CloudProvider { returns (NodeGroupDecreaseTargetSizeResponse) {} rpc NodeGroupNodes(NodeGroupNodesRequest) - returns (NodeGroupNodesResponse) {} - - rpc NodeGroupDelete(NodeGroupDeleteRequest) - returns (NodeGroupDeleteResponse) {} - - rpc NodeGroupCreate(NodeGroupCreateRequest) - returns (NodeGroupCreateResponse) {} + returns (NodeGroupNodesResponse) {} rpc NodeGroupTemplateNodeInfo(NodeGroupDTemplateNodeInfoRequest) returns (NodeGroupTemplateNodeInfoResponse) {} @@ -180,6 +169,12 @@ service CloudProvider { Note that, the rest of message used in these calls are detailed in the [Appendix](#appendix) section. +Among all the operations, the CA calls in many places the function `NodeGroupForNode`. +As a consequence this operation might impact the overall performance of the CA when calling it via a remote external cloud provider. +A solution is to cache the rpc responses of this operation to avoid causing a performance degradation. +Another proposed alternative could be to move the entire logic of this function to the CA source code. +Initially this proposal assumes the rpc responses for this operation are cached to avoid any performance degradation. + In order to talk to the custom cloud provider server, this new cloud provider has to be registered when bootstrapping the CA. Consequently, the CA needs to expose new flags to specify the cloud provider and all the required properties @@ -231,39 +226,58 @@ message NodeGroupsResponse { } ``` +### ExternalGrpcNode + +ExternalGrpcNode is a custom type. This object defines the minimum required properties of a given Kubernetes node for a node group. +This new type reduces the amount of data transferred in all the operations instead of +sending the whole `k8s.io.api.core.v1.Node` rpc message. + +```protobuf +message ExternalGrpcNode{ + // ID of the node assigned by the cloud provider in the format: :// + // +optional + optional string providerID = 1; + + // Name of the node assigned by the cloud provider + optional string name = 2; + + // labels is a map of {key,value} pairs with the node's labels. + map labels = 3; + + + // If specified, the node's annotations. + map annotations = 4; +} +``` + +Initially, we defined a list of 4 properties, but this list could increase during the implementation phase. + ### NodeGroupForNode NodeGroupForNode returns the node group for the given node, nil if the node should not be processed by cluster autoscaler, or non-nil error if such occurred. Must be implemented. +**IMPORTANT:** Please note, this operation is extensively used by CA and can cause some performance degradations on large clusters. +The initial proposal assumes the rpc responses are cached. There is another alternative solution that consists on +moving the whole logic to the CA instead of being implemented in a rpc service. + ```protobuf message NodeGroupForNodeRequest { // Node group for the given node - k8s.io.api.core.v1.Node node = 1; + ExternalGrpcNode node = 1; } message NodeGroupForNodeResponse { // The node group for the given node. repeated NodeGroup nodeGroup = 1; } -``` - -### GetResourceLimiter -GetResourceLimiter types store struct containing limits (max, min) for resources (cores, memory etc.). - -```protobuf -message GetResourceLimiterRequest { - // Intentionally empty. +message NodeGroupForNodeRequest { + // Node group for the given node + ExternalGrpcNode node = 1; } -message GetResourceLimiterResponse { - // All the machine types that the cloud provider service supports. This - // field is OPTIONAL. - repeated string machineTypes = 1; -} ``` - ### GetAvailableGPUTypes GetAvailableGPUTypes handles all available GPU types cloud provider supports. @@ -297,10 +311,11 @@ message GPULabelResponse { ### PricingNodePrice NodePrice handles an operation that returns a price of running the given node for a given period of time. +PricingNodePrice is an optional operation that is not implemented by all the providers. ```protobuf message PricingNodePriceRequest { - k8s.io.api.core.v1.Node node = 1;, + ExternalGrpcNode node = 1;, k8s.io.apimachinery.pkg.apis.meta.v1.Time startTime = 2; @@ -316,6 +331,8 @@ message PricingNodePriceResponse { ### PricingPodPrice PodPrice handles an operation that returns a theoretical minimum price of running a pod for a given period of time on a perfectly matching machine. +PricingPodPrice is an optional operation that is not implemented by all the providers. + ```protobuf message PricingPodPriceRequest { @@ -360,24 +377,6 @@ message NewNodeGroupResponse { } ``` -### GetResourceLimiter - -GetResourceLimiter holds a struct containing limits (max, min) for resources (cores, memory etc.). - -```protobuf -message GetResourceLimiterRequest { - // Intentionally empty. -} - -message GetResourceLimiterResponse { - // Contains the minimum limits for resources (cores, memory etc.). - map minLimits = 1; - - // Contains the maximum limits for resources (cores, memory etc.). - map maxLimits = 2; -} -``` - ### Refresh Refresh is called before every main loop and can be used to dynamically update cloud provider state. @@ -407,28 +406,10 @@ message CleanupResponse { } ``` -### Name - -Name stores the name of the cloud provider. - -```protobuf -message NameRequest { - // Intentionally empty. -} - -message NameResponse { - // Name of the node group - string name = 1; -} -``` - ### NodeGroup ```protobuf message NodeGroup { - // Name of the node group on the cloud provider - string name = 1; - // ID of the node group on the cloud provider string id = 1; @@ -438,14 +419,8 @@ message NodeGroup { // MaxSize of the node group on the cloud provider int32 maxSize = 3; - // Exist reports if the node group really exists on the cloud provider - bool exist = 4; - - // Autoprovisioned returns true if the node group is autoprovisioned - bool autoProvisioned = 5; - // Debug returns a string containing all information regarding this node group. - string debug = 6; + string debug = 4; } ``` @@ -488,7 +463,7 @@ NodeGroupDeleteNodes deletes nodes from this node group. ```protobuf message NodeGroupDeleteNodesRequest { - repeated k8s.io.api.core.v1.Node nodes = 1; + repeated ExternalGrpcNode nodes = 1; // ID of the group node on the cloud provider string id = 2; @@ -539,8 +514,15 @@ message Instance { // InstanceStatus represents instance status. message InstanceStatus { - // State tells if instance is running, being created or being deleted - int state = 1; + // InstanceState tells if instance is running, being created or being deleted + enum InstanceState { + // InstanceRunning means instance is running + InstanceRunning = 1 + // InstanceCreating means instance is being created + InstanceCreating = 2 + // InstanceDeleting means instance is being deleted + InstanceDeleting = 3; + } // ErrorInfo is not nil if there is error condition related to instance. InstanceErrorInfo errorInfo = 2; } @@ -556,40 +538,13 @@ message InstanceErrorInfo { } ``` -### NodeGroupDelete - -NodeGroupDelete deletes the node group on the cloud provider side. - -```protobuf -message NodeGroupDeleteRequest { - // ID of the group node on the cloud provider - string id = 1; -} - -message NodeGroupDeleteResponse { - // Intentionally empty. -} -``` - -### NodeGroupCreate - -NodeGroupCreate creates the node group on the cloud provider side. - -```protobuf -message NodeGroupCreateRequest { - // NodeGroup to be created on the cloud provider - NodeGroup nodeGroup = 1; -} - -message NodeGroupCreateResponse { - // NodeGroup that was created on the cloud provider - NodeGroup nodeGroup = 1; -} -``` - ### NodeGroupTemplateNodeInfo -TemplateNodeInfo returns a NodeInfo structure of an empty (as if just started) node. +TemplateNodeInfo returns a NodeInfo as a structure of an empty (as if just started) node. +The definition of a generic `NodeInfo` for each potential provider is a pretty complex approach and does not cover all the scenarios. +For the sake of simplicity, the `nodeInfo` is defined as a Kubernetes `k8s.io.api.core.v1.Node` type +where the system could still extract certain info about the node. + ```protobuf message NodeGroupTemplateNodeInfoRequest { @@ -598,7 +553,7 @@ message NodeGroupTemplateNodeInfoRequest { } message NodeGroupTemplateNodeInfoResponse { - // nodeInfo extracted of the template node on the cloud provider - NodeInfo nodeInfo = 1; + // nodeInfo extracted data from the cloud provider node using a primitive Kubernetes Node type. + k8s.io.api.core.v1.Node nodeInfo = 1; } ```