From 8d5973d29d60c0c615838c534ee27f93377cf5af Mon Sep 17 00:00:00 2001 From: Chi Wang Date: Tue, 16 Nov 2021 07:39:45 -0800 Subject: [PATCH] Remote: Limit max number of gRPC connections by --remote_max_connections. `--remote_max_connections` is only applied to HTTP remote cache. This PR makes it apply to gRPC cache/executor as well. Note that `--remote_max_connections` limits the number of concurrent connections. For HTTP remote cache, one connection could handle one request at one time. For gRPC remote cache/executor, one connection could handle 100+ concurrent requests. So the default value `100` means we could make up to `100` concurrent requests for HTTP remote cache or `10000+` concurrent requests for gRPC remote cache/executor. Fixes: #14178. Closes #14202. PiperOrigin-RevId: 410249542 --- .../lib/remote/ReferenceCountedChannel.java | 11 ++++-- .../build/lib/remote/RemoteModule.java | 13 +++++-- .../remote/grpc/DynamicConnectionPool.java | 39 +++++++++++++------ .../lib/remote/options/RemoteOptions.java | 10 +++-- 4 files changed, 52 insertions(+), 21 deletions(-) diff --git a/src/main/java/com/google/devtools/build/lib/remote/ReferenceCountedChannel.java b/src/main/java/com/google/devtools/build/lib/remote/ReferenceCountedChannel.java index 5c5af7e013400a..36df5e77a1a78f 100644 --- a/src/main/java/com/google/devtools/build/lib/remote/ReferenceCountedChannel.java +++ b/src/main/java/com/google/devtools/build/lib/remote/ReferenceCountedChannel.java @@ -62,8 +62,13 @@ public ReferenceCounted touch(Object o) { private final AtomicReference authorityRef = new AtomicReference<>(); public ReferenceCountedChannel(ChannelConnectionFactory connectionFactory) { + this(connectionFactory, /*maxConnections=*/ 0); + } + + public ReferenceCountedChannel(ChannelConnectionFactory connectionFactory, int maxConnections) { this.dynamicConnectionPool = - new DynamicConnectionPool(connectionFactory, connectionFactory.maxConcurrency()); + new DynamicConnectionPool( + connectionFactory, connectionFactory.maxConcurrency(), maxConnections); } public boolean isShutdown() { @@ -87,12 +92,12 @@ public void start(Listener responseListener, Metadata headers) { responseListener) { @Override public void onClose(Status status, Metadata trailers) { - super.onClose(status, trailers); - try { connection.close(); } catch (IOException e) { throw new AssertionError(e.getMessage(), e); + } finally { + super.onClose(status, trailers); } } }, diff --git a/src/main/java/com/google/devtools/build/lib/remote/RemoteModule.java b/src/main/java/com/google/devtools/build/lib/remote/RemoteModule.java index 6ad97fb2a1ece2..5b857ca0eaced4 100644 --- a/src/main/java/com/google/devtools/build/lib/remote/RemoteModule.java +++ b/src/main/java/com/google/devtools/build/lib/remote/RemoteModule.java @@ -352,6 +352,10 @@ public void beforeCommand(CommandEnvironment env) throws AbruptExitException { // based on the resolved IPs of that server. We assume servers normally have 2 IPs. So the // max concurrency per connection is 100. int maxConcurrencyPerConnection = 100; + int maxConnections = 0; + if (remoteOptions.remoteMaxConnections > 0) { + maxConnections = remoteOptions.remoteMaxConnections; + } if (enableRemoteExecution) { ImmutableList.Builder interceptors = ImmutableList.builder(); @@ -367,7 +371,8 @@ public void beforeCommand(CommandEnvironment env) throws AbruptExitException { remoteOptions.remoteProxy, authAndTlsOptions, interceptors.build(), - maxConcurrencyPerConnection)); + maxConcurrencyPerConnection), + maxConnections); // Create a separate channel if --remote_executor and --remote_cache point to different // endpoints. @@ -390,7 +395,8 @@ public void beforeCommand(CommandEnvironment env) throws AbruptExitException { remoteOptions.remoteProxy, authAndTlsOptions, interceptors.build(), - maxConcurrencyPerConnection)); + maxConcurrencyPerConnection), + maxConnections); } if (enableRemoteDownloader) { @@ -411,7 +417,8 @@ public void beforeCommand(CommandEnvironment env) throws AbruptExitException { remoteOptions.remoteProxy, authAndTlsOptions, interceptors.build(), - maxConcurrencyPerConnection)); + maxConcurrencyPerConnection), + maxConnections); } } diff --git a/src/main/java/com/google/devtools/build/lib/remote/grpc/DynamicConnectionPool.java b/src/main/java/com/google/devtools/build/lib/remote/grpc/DynamicConnectionPool.java index 6824563d737a38..39b17c6c2e30a9 100644 --- a/src/main/java/com/google/devtools/build/lib/remote/grpc/DynamicConnectionPool.java +++ b/src/main/java/com/google/devtools/build/lib/remote/grpc/DynamicConnectionPool.java @@ -30,6 +30,7 @@ public class DynamicConnectionPool implements ConnectionPool { private final ConnectionFactory connectionFactory; private final int maxConcurrencyPerConnection; + private final int maxConnections; private final AtomicBoolean closed = new AtomicBoolean(false); @GuardedBy("this") @@ -40,8 +41,14 @@ public class DynamicConnectionPool implements ConnectionPool { public DynamicConnectionPool( ConnectionFactory connectionFactory, int maxConcurrencyPerConnection) { + this(connectionFactory, maxConcurrencyPerConnection, /*maxConnections=*/ 0); + } + + public DynamicConnectionPool( + ConnectionFactory connectionFactory, int maxConcurrencyPerConnection, int maxConnections) { this.connectionFactory = connectionFactory; this.maxConcurrencyPerConnection = maxConcurrencyPerConnection; + this.maxConnections = maxConnections; this.factories = new ArrayList<>(); } @@ -61,12 +68,19 @@ public void close() throws IOException { } } + @GuardedBy("this") + private SharedConnectionFactory nextFactory() { + int index = Math.abs(indexTicker % factories.size()); + indexTicker += 1; + return factories.get(index); + } + /** - * Performs a simple round robin on the list of {@link SharedConnectionFactory} and return one - * having available connections at this moment. + * Performs a simple round robin on the list of {@link SharedConnectionFactory}. * - *

If no factory has available connections, it will create a new {@link - * SharedConnectionFactory}. + *

This will try to find a factory that has available connections at this moment. If no factory + * has available connections, and the number of factories is less than {@link #maxConnections}, it + * will create a new {@link SharedConnectionFactory}. */ private SharedConnectionFactory nextAvailableFactory() { if (closed.get()) { @@ -75,19 +89,20 @@ private SharedConnectionFactory nextAvailableFactory() { synchronized (this) { for (int times = 0; times < factories.size(); ++times) { - int index = Math.abs(indexTicker % factories.size()); - indexTicker += 1; - - SharedConnectionFactory factory = factories.get(index); + SharedConnectionFactory factory = nextFactory(); if (factory.numAvailableConnections() > 0) { return factory; } } - SharedConnectionFactory factory = - new SharedConnectionFactory(connectionFactory, maxConcurrencyPerConnection); - factories.add(factory); - return factory; + if (maxConnections <= 0 || factories.size() < maxConnections) { + SharedConnectionFactory factory = + new SharedConnectionFactory(connectionFactory, maxConcurrencyPerConnection); + factories.add(factory); + return factory; + } else { + return nextFactory(); + } } } diff --git a/src/main/java/com/google/devtools/build/lib/remote/options/RemoteOptions.java b/src/main/java/com/google/devtools/build/lib/remote/options/RemoteOptions.java index 1d2586af78df5e..0c7f5812b8c155 100644 --- a/src/main/java/com/google/devtools/build/lib/remote/options/RemoteOptions.java +++ b/src/main/java/com/google/devtools/build/lib/remote/options/RemoteOptions.java @@ -63,9 +63,13 @@ public final class RemoteOptions extends OptionsBase { documentationCategory = OptionDocumentationCategory.REMOTE, effectTags = {OptionEffectTag.HOST_MACHINE_RESOURCE_OPTIMIZATIONS}, help = - "The max. number of concurrent network connections to the remote cache/executor. By " - + "default Bazel limits the number of TCP connections to 100. Setting this flag to " - + "0 will make Bazel choose the number of connections automatically.") + "Limit the max number of concurrent connections to remote cache/executor. By default the" + + " value is 100. Setting this to 0 means no limitation.\n" + + "For HTTP remote cache, one TCP connection could handle one request at one time, so" + + " Bazel could make up to --remote_max_connections concurrent requests.\n" + + "For gRPC remote cache/executor, one gRPC channel could usually handle 100+" + + " concurrent requests, so Bazel could make around `--remote_max_connections * 100`" + + " concurrent requests.") public int remoteMaxConnections; @Option(