zouy414
diff --git a/‎api/openapi-spec/swagger.json‎
Lines changed: 1 addition & 1 deletion b/‎api/openapi-spec/swagger.json‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎staging/src/k8s.io/apiserver/BUILD‎
Lines changed: 1 addition & 0 deletions b/‎staging/src/k8s.io/apiserver/BUILD‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/BUILD‎
Lines changed: 1 addition & 4 deletions b/‎staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/BUILD‎
Lines changed: 1 addition & 4 deletions
diff --git a/‎staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/interface.go‎
Lines changed: 13 additions & 11 deletions b/‎staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/interface.go‎
Lines changed: 13 additions & 11 deletions
diff --git a/‎staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/queueset/BUILD‎
Lines changed: 8 additions & 1 deletion b/‎staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/queueset/BUILD‎
Lines changed: 8 additions & 1 deletion
diff --git a/‎staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/queueset/doc.go‎
Lines changed: 120 additions & 0 deletions b/‎staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/queueset/doc.go‎
Lines changed: 120 additions & 0 deletions
@@ -47,6 +47,7 @@ filegroup(
         "//staging/src/k8s.io/apiserver/pkg/util/flowcontrol/metrics:all-srcs",
         "//staging/src/k8s.io/apiserver/pkg/util/flushwriter:all-srcs",
         "//staging/src/k8s.io/apiserver/pkg/util/openapi:all-srcs",
+        "//staging/src/k8s.io/apiserver/pkg/util/promise:all-srcs",
         "//staging/src/k8s.io/apiserver/pkg/util/proxy:all-srcs",
         "//staging/src/k8s.io/apiserver/pkg/util/shufflesharding:all-srcs",
         "//staging/src/k8s.io/apiserver/pkg/util/term:all-srcs",
 
@@ -2,10 +2,7 @@ load("@io_bazel_rules_go//go:def.bzl", "go_library")
 
 go_library(
     name = "go_default_library",
-    srcs = [
-        "interface.go",
-        "types.go",
-    ],
+    srcs = ["interface.go"],
     importmap = "k8s.io/kubernetes/vendor/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing",
     importpath = "k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing",
     visibility = ["//visibility:public"],
 
@@ -49,17 +49,19 @@ type QueueSet interface {
 	// triggering state and the required call).
 	Quiesce(EmptyHandler)
 
-	// Wait uses the given hashValue as the source of entropy
-	// as it shuffle-shards a request into a queue and waits for
-	// a decision on what to do with that request.  If tryAnother==true
-	// at return then the QueueSet has become undesirable and the client
-	// should try to find a different QueueSet to use; execute and
-	// afterExecution are irrelevant in this case.  Otherwise, if execute
-	// then the client should start executing the request and, once the
-	// request finishes execution or is canceled, call afterExecution().
-	// Otherwise the client should not execute the
-	// request and afterExecution is irrelevant.
-	Wait(ctx context.Context, hashValue uint64) (tryAnother, execute bool, afterExecution func())
+	// Wait uses the given hashValue as the source of entropy as it
+	// shuffle-shards a request into a queue and waits for a decision
+	// on what to do with that request.  The descr1 and descr2 values
+	// play no role in the logic but appear in log messages.  If
+	// tryAnother==true at return then the QueueSet has become
+	// undesirable and the client should try to find a different
+	// QueueSet to use; execute and afterExecution are irrelevant in
+	// this case.  Otherwise, if execute then the client should start
+	// executing the request and, once the request finishes execution
+	// or is canceled, call afterExecution().  Otherwise the client
+	// should not execute the request and afterExecution is
+	// irrelevant.
+	Wait(ctx context.Context, hashValue uint64, descr1, descr2 interface{}) (tryAnother, execute bool, afterExecution func())
 }
 
 // QueueSetConfig defines the configuration of a QueueSet.
 
@@ -2,7 +2,11 @@ load("@io_bazel_rules_go//go:def.bzl", "go_library", "go_test")
 
 go_library(
     name = "go_default_library",
-    srcs = ["queueset.go"],
+    srcs = [
+        "doc.go",
+        "queueset.go",
+        "types.go",
+    ],
     importmap = "k8s.io/kubernetes/vendor/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/queueset",
     importpath = "k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/queueset",
     visibility = ["//visibility:public"],
@@ -12,6 +16,8 @@ go_library(
         "//staging/src/k8s.io/apiserver/pkg/util/flowcontrol/counter:go_default_library",
         "//staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing:go_default_library",
         "//staging/src/k8s.io/apiserver/pkg/util/flowcontrol/metrics:go_default_library",
+        "//staging/src/k8s.io/apiserver/pkg/util/promise:go_default_library",
+        "//staging/src/k8s.io/apiserver/pkg/util/promise/lockingpromise:go_default_library",
         "//staging/src/k8s.io/apiserver/pkg/util/shufflesharding:go_default_library",
         "//vendor/github.com/pkg/errors:go_default_library",
         "//vendor/k8s.io/klog:go_default_library",
@@ -27,6 +33,7 @@ go_test(
         "//staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing:go_default_library",
         "//staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/testing:go_default_library",
         "//staging/src/k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing/testing/clock:go_default_library",
+        "//vendor/k8s.io/klog:go_default_library",
     ],
 )
 
 
@@ -0,0 +1,120 @@
+/*
+Copyright 2019 The Kubernetes Authors.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+package queueset
+
+// This package implements a technique called "fair queuing for server
+// requests".  One QueueSet is a set of queues operating according to
+// this technique.
+
+// Fair queuing for server requests is inspired by the fair queuing
+// technique from the world of networking.  You can find a good paper
+// on that at https://dl.acm.org/citation.cfm?doid=75247.75248 or
+// http://people.csail.mit.edu/imcgraw/links/research/pubs/networks/WFQ.pdf
+// and there is an implementation outline in the Wikipedia article at
+// https://en.wikipedia.org/wiki/Fair_queuing .
+
+// Fair queuing for server requests differs from traditional fair
+// queuing in three ways: (1) we are dispatching requests to be
+// executed within a process rather than transmitting packets on a
+// network link, (2) multiple requests can be executing at once, and
+// (3) the service time (execution duration) is not known until the
+// execution completes.
+
+// The first two differences can easily be handled by straightforward
+// adaptation of the concept called "R(t)" in the original paper and
+// "virtual time" in the implementation outline. In that
+// implementation outline, the notation now() is used to mean reading
+// the virtual clock. In the original paper’s terms, "R(t)" is the
+// number of "rounds" that have been completed at real time t, where a
+// round consists of virtually transmitting one bit from every
+// non-empty queue in the router (regardless of which queue holds the
+// packet that is really being transmitted at the moment); in this
+// conception, a packet is considered to be "in" its queue until the
+// packet’s transmission is finished. For our problem, we can define a
+// round to be giving one nanosecond of CPU to every non-empty queue
+// in the apiserver (where emptiness is judged based on both queued
+// and executing requests from that queue), and define R(t) = (server
+// start time) + (1 ns) * (number of rounds since server start). Let
+// us write NEQ(t) for that number of non-empty queues in the
+// apiserver at time t.  Let us also write C for the concurrency
+// limit.  In the original paper, the partial derivative of R(t) with
+// respect to t is
+//
+//                 1 / NEQ(t) .
+
+// To generalize from transmitting one packet at a time to executing C
+// requests at a time, that derivative becomes
+//
+//                C / NEQ(t) .
+
+// However, sometimes there are fewer than C requests available to
+// execute.  For a given queue "q", let us also write "reqs(q, t)" for
+// the number of requests of that queue that are executing at that
+// time.  The total number of requests executing is sum[over q]
+// reqs(q, t) and if that is less than C then virtual time is not
+// advancing as fast as it would if all C seats were occupied; in this
+// case the numerator of the quotient in that derivative should be
+// adjusted proportionally.  Putting it all together for fair queing
+// for server requests: at a particular time t, the partial derivative
+// of R(t) with respect to t is
+//
+//      min( C, sum[over q] reqs(q, t) ) / NEQ(t) .
+//
+// In terms of the implementation outline, this is the rate at which
+// virtual time is advancing at time t (in virtual nanoseconds per
+// real nanosecond). Where the networking implementation outline adds
+// packet size to a virtual time, in our version this corresponds to
+// adding a service time (i.e., duration) to virtual time.
+
+// The third difference is handled by modifying the algorithm to
+// dispatch based on an initial guess at the request’s service time
+// (duration) and then make the corresponding adjustments once the
+// request’s actual service time is known. This is similar, although
+// not exactly isomorphic, to the original paper’s adjustment by
+// `$delta` for the sake of promptness.
+
+// For implementation simplicity (see below), let us use the same
+// initial service time guess for every request; call that duration
+// G. A good choice might be the service time limit (1
+// minute). Different guesses will give slightly different dynamics,
+// but any positive number can be used for G without ruining the
+// long-term behavior.
+
+// As in ordinary fair queuing, there is a bound on divergence from
+// the ideal. In plain fair queuing the bound is one packet; in our
+// version it is C requests.
+
+// To support efficiently making the necessary adjustments once a
+// request’s actual service time is known, the virtual finish time of
+// a request and the last virtual finish time of a queue are not
+// represented directly but instead computed from queue length,
+// request position in the queue, and an alternate state variable that
+// holds the queue’s virtual start time. While the queue is empty and
+// has no requests executing: the value of its virtual start time
+// variable is ignored and its last virtual finish time is considered
+// to be in the virtual past. When a request arrives to an empty queue
+// with no requests executing, the queue’s virtual start time is set
+// to the current virtual time. The virtual finish time of request
+// number J in the queue (counting from J=1 for the head) is J * G +
+// (queue's virtual start time). While the queue is non-empty: the
+// last virtual finish time of the queue is the virtual finish time of
+// the last request in the queue. While the queue is empty and has a
+// request executing: the last virtual finish time is the queue’s
+// virtual start time. When a request is dequeued for service the
+// queue’s virtual start time is advanced by G. When a request
+// finishes being served, and the actual service time was S, the
+// queue’s virtual start time is decremented by G - S.