Add least_connections load balancing algorithm. #9025

Open · wants to merge 4 commits into base: main

Changes from 2 commits
5 changes: 5 additions & 0 deletions docs/user-guide/nginx-configuration/configmap.md
@@ -773,6 +773,11 @@ The value can either be:

- round_robin: to use the default round robin loadbalancer
- ewma: to use the Peak EWMA method for routing ([implementation](https://github.com/kubernetes/ingress-nginx/blob/main/rootfs/etc/nginx/lua/balancer/ewma.lua))
- least_connections: to route incoming connections to the upstream with the fewest open connections at the time. This is
recommended for evenly-resourced upstream servers when requests have a broad distribution of processing times, for
example if some requests require the upstream server to make a connection to a slow external service. If all requests
take a fairly similar time to process, or the upstream servers serve at different speeds, then ewma or round_robin are
likely more appropriate. A ConfigMap sketch follows below.

The default is `round_robin`.
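For reference, a minimal ConfigMap sketch for selecting this balancer via the `load-balance` key. The ConfigMap name and namespace are assumptions here (they depend on how the controller is installed; `ingress-nginx-controller` in `ingress-nginx` is shown):

    apiVersion: v1
    kind: ConfigMap
    metadata:
      name: ingress-nginx-controller
      namespace: ingress-nginx
    data:
      load-balance: "least_connections"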

1 change: 1 addition & 0 deletions internal/ingress/controller/template/configmap.go
@@ -78,6 +78,7 @@ var (
"balancer_ewma": 10240,
"balancer_ewma_last_touched_at": 10240,
"balancer_ewma_locks": 1024,
"balancer_leastconn": 5120,
"certificate_servers": 5120,
"ocsp_response_cache": 5120, // keep this same as certificate_servers
"global_throttle_cache": 10240,
2 changes: 2 additions & 0 deletions rootfs/etc/nginx/lua/balancer.lua
@@ -9,6 +9,7 @@ local chashsubset = require("balancer.chashsubset")
local sticky_balanced = require("balancer.sticky_balanced")
local sticky_persistent = require("balancer.sticky_persistent")
local ewma = require("balancer.ewma")
local leastconn = require("balancer.leastconn")
local string = string
local ipairs = ipairs
local table = table
@@ -32,6 +33,7 @@ local IMPLEMENTATIONS = {
sticky_balanced = sticky_balanced,
sticky_persistent = sticky_persistent,
ewma = ewma,
least_connections = leastconn,
}

local PROHIBITED_LOCALHOST_PORT = configuration.prohibited_localhost_port or '10246'
115 changes: 115 additions & 0 deletions rootfs/etc/nginx/lua/balancer/leastconn.lua
@@ -0,0 +1,115 @@
local util = require("util")
local split = require("util.split")
require("resty.core")

local ngx = ngx
local ipairs = ipairs
local tostring = tostring
local string = string
local tonumber = tonumber
local setmetatable = setmetatable
local string_format = string.format
local ngx_log = ngx.log
local INFO = ngx.INFO
local WARN = ngx.WARN


local _M = { name = "leastconn" }

function _M.new(self, backend)
local o = {
peers = backend.endpoints
}
setmetatable(o, self)
self.__index = self
return o
end

function _M.is_affinitized()
return false
end


local function get_upstream_name(upstream)
return upstream.address .. ":" .. upstream.port
end


function _M.balance(self)
local peers = self.peers
local endpoint = peers[1]
Reviewer: How do we behave when peers is empty?

Author: I believe that if we reached this line it would cause a Lua exception and Nginx would return an internal server error response, but I'm checking the actual behaviour with some more tests.

Reviewer: I haven't come across a test for this yet. Worth adding one?
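A guard along these lines (a hypothetical sketch, not part of this diff) would avoid indexing an empty peer list and could back the test the reviewer asks about:

    -- sketch: bail out early when the backend has no endpoints at all
    if not peers or #peers == 0 then
      ngx_log(WARN, "no peers available for backend")
      return nil
    end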

local endpoints = ngx.shared.balancer_leastconn
local feasible_endpoints = {}

if #peers ~= 1 then
local lowestconns = 9999
Reviewer: Should we set this to max int or something higher? There very well could be peers with more than 9999 connections, which would mess up this calculation, right?

Author: I'm not certain what max int is in this case due to the various ways Lua could be compiled, but it's definitely higher than 9999 :). As a safe balance I've changed it to maximum signed 32 bit int, which should still be more connections than we're likely to support in other places.

Reviewer: This thread is marked as resolved, but I still see this set to 9999. Once we have a pod w/ more than 10,000 connections, this will behave unexpectedly, right?
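For reference, a sketch of the change the author describes, starting the minimum at the largest signed 32-bit integer (hypothetical; not what this commit contains):

    local lowestconns = 2147483647 -- 2^31 - 1, higher than any realistic connection count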

-- find the lowest connection count
for _, peer in pairs(peers) do
local conns = endpoints:get(get_upstream_name(peer))
if conns == nil then
endpoints:set(get_upstream_name(peer),0,600)
Reviewer: Why do we set an expire time on this? If we go 600 seconds without a peer's connection state changing at all, won't we then think the peer has 0 connections? I guess this helps with garbage collecting the dict, but I thought that was handled in the sync method. If so, should we make this value configurable?

Author: My concern with depending on the sync method to handle garbage collection is trusting that the sync method will be reliably called with updates, and that we won't lose the list of peers between updates. With that said, the main reason I was thinking to distrust sync was in case of nginx restarts - but then in that case the shared dict would be reset anyway. I think we should set the expiration time to infinite.

Reviewer: I also agree the expiration time should be infinite. Do you have a reason to be suspicious of the sync method not being called reliably? I hope it is something we can depend on.

Author: No specific reason to be suspicious, call it a generalised sense of professional paranoia :). Will fix the expiration time shortly.
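A sketch of the "infinite expiration" change being agreed on here, assuming ngx.shared.DICT:set is called with the exptime argument omitted (it defaults to 0, meaning the entry never expires):

    endpoints:set(get_upstream_name(peer), 0)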

conns = 0
end
ngx_log(WARN, "Found ", conns, " conns for peer ", get_upstream_name(peer))
if conns <= lowestconns then
lowestconns = conns
end
end

-- get peers with lowest connections
for _, peer in pairs(peers) do
Reviewer: Looks like we have two for loops over pairs(peers). I think we can get away with just one by tracking lowestconns and feasible_endpoints together. If conns == lowestconns, we just append to feasible_endpoints, but if conns < lowestconns, we set feasible_endpoints to a new list with just the one peer in it.

Author: Done
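For illustration, a rough sketch of the single-pass selection the reviewer describes (hypothetical; not the code in this commit):

    local lowestconns = 2147483647
    local feasible_endpoints = {}
    for _, peer in ipairs(peers) do
      local conns = endpoints:get(get_upstream_name(peer)) or 0
      if conns < lowestconns then
        -- new minimum: restart the candidate list with this peer only
        lowestconns = conns
        feasible_endpoints = { peer }
      elseif conns == lowestconns then
        -- tie with the current minimum: add this peer as a candidate
        feasible_endpoints[#feasible_endpoints + 1] = peer
      end
    end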

local conns = endpoints:get(get_upstream_name(peer))
if conns ~= nil and conns == lowestconns then
feasible_endpoints[#feasible_endpoints+1] = peer
end
end
ngx_log(WARN, "got ", #feasible_endpoints, " feasible endpoints")

endpoint = feasible_endpoints[math.random(1,#feasible_endpoints)]
end


ngx_log(WARN, "chose endpoint ", get_upstream_name(endpoint))
-- Update the endpoint connection count with a TTL of 10 minutes
endpoints:incr(get_upstream_name(endpoint),1,1,600)

return get_upstream_name(endpoint)
end

function _M.after_balance(_)
local endpoints = ngx.shared.balancer_leastconn
local upstream = split.get_last_value(ngx.var.upstream_addr)

ngx_log(WARN, "decrement conn count for upstream ", upstream)

if util.is_blank(upstream) then
return
end
ngx_log(WARN, "decrement endpoints", upstream)
ngx_log(WARN, endpoints:incr(upstream,-1,0,600))
end

function _M.sync(self, backend)
local normalized_endpoints_added, normalized_endpoints_removed =
util.diff_endpoints(self.peers, backend.endpoints)

if #normalized_endpoints_added == 0 and #normalized_endpoints_removed == 0 then
ngx_log(WARN, "endpoints did not change for backend " .. tostring(backend.name))
return
end

ngx_log(WARN, string_format("[%s] peers have changed for backend %s", self.name, backend.name))

self.peers = backend.endpoints

for _, endpoint_string in ipairs(normalized_endpoints_removed) do
ngx.shared.balancer_leastconn:delete(endpoint_string)
Reviewer: Removing these endpoints here may not have the desired effect. If a pod has a bunch of connections, briefly fails its readiness probe (causing it to no longer be included as a backend), we will remove it from being tracked here. But if the pod becomes ready again, it may still be handling a bunch of connections, and we will initialize its value to 0 again. Maybe this is OK, but it is worth calling out.

Author: Yeah, that's not ideal behaviour. I think it would be safe to instead set the expiration time to (say) 30 minutes. This would ensure we still track connection count for connections up to that time while not allowing the shared dict to grow indefinitely.

Reviewer: Setting it to expire asynchronously makes some sense, though it will be difficult to choose the TTL. It makes sense that this least conn load balancer would still track pods that are handling connections, even if the pod is not ready. It should decrement the number of connections on a backend that finishes a request, even if that pod is not ready, for example. Is there a way we can tell the difference between a pod that is not ready now (but therefore may become ready soon) versus a pod that is being killed (and therefore will never become ready again, and would be safe to fully delete)?

Author: Not to the best of my knowledge, and that's the heart of the issue - all we know is that an upstream address has disappeared from the list of endpoints for that service. We could find out more by querying the API server, but that introduces substantially more complexity that I think the ingress-nginx team would not want to take on.

Reviewer: This thread is still a bit concerning to me. It is unintuitive to me that a pod that becomes unready will result in ingress-nginx thinking it has 0 connections. Maybe setting the TTL to 2 days and just letting the entry in the map expire if we don't see it again in 2 days makes sense? (2 days is chosen somewhat arbitrarily.)

Reviewer: I've noticed some oddities here while working with pods that had their readiness checks interrupted (because the checks hit the same port/endpoint as the incoming requests), causing them to receive extra connections for a while. See the graphs below. [graph image]

Reviewer: Some more correlation to this effect: [graph image]

Reviewer: Update: all of these effects were due to removing nodes from the table when they "go missing", plus there was an off-by-one error that has now been fixed on my fork; see the other thread.

end

for _, endpoint_string in ipairs(normalized_endpoints_added) do
ngx.shared.balancer_leastconn:set(endpoint_string,0,600)
end

end

return _M
160 changes: 160 additions & 0 deletions rootfs/etc/nginx/lua/test/balancer/leastconn_test.lua
@@ -0,0 +1,160 @@
local util = require("util")
local say = require("say")

local original_ngx = ngx
local function reset_ngx()
_G.ngx = original_ngx
end

local function included_in(state, arguments)
if type(arguments[1]) ~= "table" or #arguments ~= 2 then
return false
end

local table = arguments[1]
for _, value in pairs(table) do
if value == arguments[2] then
return true
end
end
return false
end
assert:register("assertion", "included_in", included_in, "assertion.has_property.positive", "assertion.has_property.negative")

local function mock_ngx(mock)
local _ngx = mock
setmetatable(_ngx, { __index = ngx })
_G.ngx = _ngx
end

local function flush_connection_count()
ngx.shared.balancer_leastconn:flush_all()
end

local function set_backend_count(endpoint_string, count)
ngx.shared.balancer_leastconn:set(endpoint_string, count)
end

describe("Balancer leastconn", function()
local balancer_leastconn = require("balancer.leastconn")
local ngx_now = 1543238266
local backend, instance

before_each(function()
package.loaded["balancer.leastconn"] = nil
balancer_leastconn = require("balancer.leastconn")

backend = {
name = "namespace-service-port",
["load-balance"] = "least_connections",
endpoints = {
{ address = "10.10.10.1", port = "8080" },
{ address = "10.10.10.2", port = "8080" },
{ address = "10.10.10.3", port = "8080" },
}
}
set_backend_count("10.10.10.1:8080", 0)
set_backend_count("10.10.10.2:8080", 1)
set_backend_count("10.10.10.3:8080", 5)

instance = balancer_leastconn:new(backend)
end)

after_each(function()
reset_ngx()
flush_connection_count()
end)

describe("after_balance()", function()
it("updates connection count", function()
ngx.var = { upstream_addr = "10.10.10.2:8080" }

local count_before = ngx.shared.balancer_leastconn:get(ngx.var.upstream_addr)
instance:after_balance()
local count_after = ngx.shared.balancer_leastconn:get(ngx.var.upstream_addr)

assert.are.equals(count_before - 1, count_after)
end)
end)

describe("balance()", function()
it("increments connection count on selected peer", function()
local single_endpoint_backend = util.deepcopy(backend)
table.remove(single_endpoint_backend.endpoints, 3)
table.remove(single_endpoint_backend.endpoints, 2)
local single_endpoint_instance = balancer_leastconn:new(single_endpoint_backend)

local upstream = single_endpoint_backend.endpoints[1]
local upstream_name = upstream.address .. ":" .. upstream.port

set_backend_count(upstream_name, 0)
single_endpoint_instance:balance()
local count_after = ngx.shared.balancer_leastconn:get(upstream_name)

assert.are.equals(1, count_after)
end)

it("returns single endpoint when the given backend has only one endpoint", function()
local single_endpoint_backend = util.deepcopy(backend)
table.remove(single_endpoint_backend.endpoints, 3)
table.remove(single_endpoint_backend.endpoints, 2)
local single_endpoint_instance = balancer_leastconn:new(single_endpoint_backend)

local peer = single_endpoint_instance:balance()

assert.are.equals("10.10.10.1:8080", peer)
end)

it("picks the endpoint with lowest connection count", function()
local two_endpoints_backend = util.deepcopy(backend)
table.remove(two_endpoints_backend.endpoints, 2)
local two_endpoints_instance = balancer_leastconn:new(two_endpoints_backend)

local peer = two_endpoints_instance:balance()

assert.equal("10.10.10.1:8080", peer)
end)

it("picks one of the endpoints with tied lowest connection count", function()
set_backend_count("10.10.10.1:8080", 8)
set_backend_count("10.10.10.2:8080", 5)
set_backend_count("10.10.10.3:8080", 5)

local peer = instance:balance()
assert.included_in({"10.10.10.2:8080", "10.10.10.3:8080"}, peer)
end)

end)

describe("sync()", function()
it("does not reset stats when endpoints do not change", function()
local new_backend = util.deepcopy(backend)

instance:sync(new_backend)

assert.are.same(new_backend.endpoints, instance.peers)
assert.are.same(new_backend.endpoints, backend.endpoints)
end)

it("updates peers, deletes stats for old endpoints and sets connection count to zero for new ones", function()
local new_backend = util.deepcopy(backend)

-- existing endpoint 10.10.10.2 got deleted
-- and replaced with 10.10.10.4
new_backend.endpoints[2].address = "10.10.10.4"
-- and there's one new extra endpoint
table.insert(new_backend.endpoints, { address = "10.10.10.5", port = "8080" })

instance:sync(new_backend)

assert.are.same(new_backend.endpoints, instance.peers)

assert.are.equals(ngx.shared.balancer_leastconn:get("10.10.10.1:8080"), 0)
assert.are.equals(ngx.shared.balancer_leastconn:get("10.10.10.2:8080"), nil)
assert.are.equals(ngx.shared.balancer_leastconn:get("10.10.10.3:8080"), 5)
assert.are.equals(ngx.shared.balancer_leastconn:get("10.10.10.4:8080"), 0)
assert.are.equals(ngx.shared.balancer_leastconn:get("10.10.10.5:8080"), 0)
end)
end)

end)
7 changes: 6 additions & 1 deletion rootfs/etc/nginx/lua/test/balancer_test.lua
@@ -37,7 +37,8 @@ local function reset_expected_implementations()
["my-dummy-app-3"] = package.loaded["balancer.sticky_persistent"],
["my-dummy-app-4"] = package.loaded["balancer.ewma"],
["my-dummy-app-5"] = package.loaded["balancer.sticky_balanced"],
["my-dummy-app-6"] = package.loaded["balancer.chashsubset"]
["my-dummy-app-6"] = package.loaded["balancer.chashsubset"],
["my-dummy-app-7"] = package.loaded["balancer.leastconn"]
}
end

@@ -88,6 +89,10 @@ local function reset_backends()
["load-balance"] = "ewma", -- upstreamHashByConfig will take priority.
upstreamHashByConfig = { ["upstream-hash-by"] = "$request_uri", ["upstream-hash-by-subset"] = "true", }
},
{
name = "my-dummy-app-7",
["load-balance"] = "least_connections",
},
}
end

1 change: 1 addition & 0 deletions test/data/cleanConf.expected.conf
@@ -23,6 +23,7 @@ http {
lua_shared_dict balancer_ewma 10M;
lua_shared_dict balancer_ewma_last_touched_at 10M;
lua_shared_dict balancer_ewma_locks 1M;
lua_shared_dict balancer_leastconn 5M;
lua_shared_dict certificate_data 20M;
lua_shared_dict certificate_servers 5M;
lua_shared_dict configuration_data 20M;
1 change: 1 addition & 0 deletions test/data/cleanConf.src.conf
@@ -40,6 +40,7 @@ http {
lua_shared_dict balancer_ewma 10M;
lua_shared_dict balancer_ewma_last_touched_at 10M;
lua_shared_dict balancer_ewma_locks 1M;
lua_shared_dict balancer_leastconn 5M;
lua_shared_dict certificate_data 20M;
lua_shared_dict certificate_servers 5M;
lua_shared_dict configuration_data 20M;