Skip to content

Commit 71f9e75

Browse files
authored
[FSSDK-10095] fix events dropped on staled connections. (#545)
Events can be discarded for staled connections with httpclient connection pooling. This PR fixs it with - - reduce the time for connection validation from 5 to 1sec. - enable retries (x3) for event POST.
1 parent 8fdbfbf commit 71f9e75

File tree

8 files changed

+147
-33
lines changed

8 files changed

+147
-33
lines changed

core-api/src/test/java/com/optimizely/ab/odp/ODPEventManagerTest.java

-5
Original file line numberDiff line numberDiff line change
@@ -51,11 +51,6 @@ public class ODPEventManagerTest {
5151
@Captor
5252
ArgumentCaptor<String> payloadCaptor;
5353

54-
@Before
55-
public void setup() {
56-
mockApiManager = mock(ODPApiManager.class);
57-
}
58-
5954
@Test
6055
public void logAndDiscardEventWhenEventManagerIsNotRunning() {
6156
ODPConfig odpConfig = new ODPConfig("key", "host", null);

core-httpclient-impl/README.md

+5-5
Original file line numberDiff line numberDiff line change
@@ -107,23 +107,23 @@ The number of workers determines the number of threads the thread pool uses.
107107
The following builder methods can be used to custom configure the `AsyncEventHandler`.
108108

109109
|Method Name|Default Value|Description|
110-
|---|---|---|
110+
|---|---|-----------------------------------------------|
111111
|`withQueueCapacity(int)`|10000|Queue size for pending logEvents|
112112
|`withNumWorkers(int)`|2|Number of worker threads|
113113
|`withMaxTotalConnections(int)`|200|Maximum number of connections|
114114
|`withMaxPerRoute(int)`|20|Maximum number of connections per route|
115-
|`withValidateAfterInactivity(int)`|5000|Time to maintain idol connections (in milliseconds)|
115+
|`withValidateAfterInactivity(int)`|1000|Time to maintain idle connections (in milliseconds)|
116116

117117
### Advanced configuration
118118
The following properties can be set to override the default configuration.
119119

120120
|Property Name|Default Value|Description|
121-
|---|---|---|
121+
|---|---|-----------------------------------------------|
122122
|**async.event.handler.queue.capacity**|10000|Queue size for pending logEvents|
123123
|**async.event.handler.num.workers**|2|Number of worker threads|
124124
|**async.event.handler.max.connections**|200|Maximum number of connections|
125125
|**async.event.handler.event.max.per.route**|20|Maximum number of connections per route|
126-
|**async.event.handler.validate.after**|5000|Time to maintain idol connections (in milliseconds)|
126+
|**async.event.handler.validate.after**|1000|Time to maintain idle connections (in milliseconds)|
127127

128128
## HttpProjectConfigManager
129129

@@ -243,4 +243,4 @@ Optimizely optimizely = OptimizelyFactory.newDefaultInstance();
243243
to enable request batching to the Optimizely logging endpoint. By default, a maximum of 10 events are included in each batch
244244
for a maximum interval of 30 seconds. These parameters are configurable via systems properties or through the
245245
`OptimizelyFactory#setMaxEventBatchSize` and `OptimizelyFactory#setMaxEventBatchInterval` methods.
246-
246+

core-httpclient-impl/build.gradle

+1-2
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,8 @@
11
dependencies {
22
compile project(':core-api')
3-
43
compileOnly group: 'com.google.code.gson', name: 'gson', version: gsonVersion
5-
64
compile group: 'org.apache.httpcomponents', name: 'httpclient', version: httpClientVersion
5+
testCompile 'org.mock-server:mockserver-netty:5.1.1'
76
}
87

98
task exhaustiveTest {

core-httpclient-impl/src/main/java/com/optimizely/ab/HttpClientUtils.java

+3-1
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,9 @@ public final class HttpClientUtils {
2626
public static final int CONNECTION_TIMEOUT_MS = 10000;
2727
public static final int CONNECTION_REQUEST_TIMEOUT_MS = 5000;
2828
public static final int SOCKET_TIMEOUT_MS = 10000;
29-
29+
public static final int DEFAULT_VALIDATE_AFTER_INACTIVITY = 1000;
30+
public static final int DEFAULT_MAX_CONNECTIONS = 200;
31+
public static final int DEFAULT_MAX_PER_ROUTE = 20;
3032
private static RequestConfig requestConfigWithTimeout;
3133

3234
private HttpClientUtils() {

core-httpclient-impl/src/main/java/com/optimizely/ab/OptimizelyHttpClient.java

+20-3
Original file line numberDiff line numberDiff line change
@@ -17,11 +17,15 @@
1717
package com.optimizely.ab;
1818

1919
import com.optimizely.ab.annotations.VisibleForTesting;
20+
import com.optimizely.ab.HttpClientUtils;
21+
2022
import org.apache.http.client.HttpClient;
23+
import org.apache.http.client.HttpRequestRetryHandler;
2124
import org.apache.http.client.ResponseHandler;
2225
import org.apache.http.client.methods.CloseableHttpResponse;
2326
import org.apache.http.client.methods.HttpUriRequest;
2427
import org.apache.http.impl.client.CloseableHttpClient;
28+
import org.apache.http.impl.client.DefaultHttpRequestRetryHandler;
2529
import org.apache.http.impl.client.HttpClientBuilder;
2630
import org.apache.http.impl.client.HttpClients;
2731
import org.apache.http.impl.conn.PoolingHttpClientConnectionManager;
@@ -73,16 +77,20 @@ public static class Builder {
7377
// The following static values are public so that they can be tweaked if necessary.
7478
// These are the recommended settings for http protocol. https://hc.apache.org/httpcomponents-client-ga/tutorial/html/connmgmt.html
7579
// The maximum number of connections allowed across all routes.
76-
private int maxTotalConnections = 200;
80+
int maxTotalConnections = HttpClientUtils.DEFAULT_MAX_CONNECTIONS;
7781
// The maximum number of connections allowed for a route
78-
private int maxPerRoute = 20;
82+
int maxPerRoute = HttpClientUtils.DEFAULT_MAX_PER_ROUTE;
7983
// Defines period of inactivity in milliseconds after which persistent connections must be re-validated prior to being leased to the consumer.
80-
private int validateAfterInactivity = 5000;
84+
// If this is too long, it's expected to see more requests dropped on staled connections (dropped by the server or networks).
85+
// We can configure retries (POST for AsyncEventDispatcher) to cover the staled connections.
86+
int validateAfterInactivity = HttpClientUtils.DEFAULT_VALIDATE_AFTER_INACTIVITY;
8187
// force-close the connection after this idle time (with 0, eviction is disabled by default)
8288
long evictConnectionIdleTimePeriod = 0;
89+
HttpRequestRetryHandler customRetryHandler = null;
8390
TimeUnit evictConnectionIdleTimeUnit = TimeUnit.MILLISECONDS;
8491
private int timeoutMillis = HttpClientUtils.CONNECTION_TIMEOUT_MS;
8592

93+
8694
private Builder() {
8795

8896
}
@@ -107,6 +115,12 @@ public Builder withEvictIdleConnections(long maxIdleTime, TimeUnit maxIdleTimeUn
107115
this.evictConnectionIdleTimeUnit = maxIdleTimeUnit;
108116
return this;
109117
}
118+
119+
// customize retryHandler (DefaultHttpRequestRetryHandler will be used by default)
120+
public Builder withRetryHandler(HttpRequestRetryHandler retryHandler) {
121+
this.customRetryHandler = retryHandler;
122+
return this;
123+
}
110124

111125
public Builder setTimeoutMillis(int timeoutMillis) {
112126
this.timeoutMillis = timeoutMillis;
@@ -124,6 +138,9 @@ public OptimizelyHttpClient build() {
124138
.setConnectionManager(poolingHttpClientConnectionManager)
125139
.disableCookieManagement()
126140
.useSystemProperties();
141+
if (customRetryHandler != null) {
142+
builder.setRetryHandler(customRetryHandler);
143+
}
127144

128145
logger.debug("Creating HttpClient with timeout: " + timeoutMillis);
129146

core-httpclient-impl/src/main/java/com/optimizely/ab/event/AsyncEventHandler.java

+11-10
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@
1616
*/
1717
package com.optimizely.ab.event;
1818

19+
import com.optimizely.ab.HttpClientUtils;
1920
import com.optimizely.ab.NamedThreadFactory;
2021
import com.optimizely.ab.OptimizelyHttpClient;
2122
import com.optimizely.ab.annotations.VisibleForTesting;
@@ -31,6 +32,7 @@
3132
import org.apache.http.client.methods.HttpRequestBase;
3233
import org.apache.http.client.utils.URIBuilder;
3334
import org.apache.http.entity.StringEntity;
35+
import org.apache.http.impl.client.DefaultHttpRequestRetryHandler;
3436
import org.slf4j.Logger;
3537
import org.slf4j.LoggerFactory;
3638

@@ -45,7 +47,6 @@
4547
import java.util.concurrent.TimeUnit;
4648

4749
import javax.annotation.CheckForNull;
48-
import javax.annotation.Nullable;
4950

5051
/**
5152
* {@link EventHandler} implementation that queues events and has a separate pool of threads responsible
@@ -61,9 +62,7 @@ public class AsyncEventHandler implements EventHandler, AutoCloseable {
6162

6263
public static final int DEFAULT_QUEUE_CAPACITY = 10000;
6364
public static final int DEFAULT_NUM_WORKERS = 2;
64-
public static final int DEFAULT_MAX_CONNECTIONS = 200;
65-
public static final int DEFAULT_MAX_PER_ROUTE = 20;
66-
public static final int DEFAULT_VALIDATE_AFTER_INACTIVITY = 5000;
65+
6766

6867
private static final Logger logger = LoggerFactory.getLogger(AsyncEventHandler.class);
6968
private static final ProjectConfigResponseHandler EVENT_RESPONSE_HANDLER = new ProjectConfigResponseHandler();
@@ -135,15 +134,17 @@ public AsyncEventHandler(int queueCapacity,
135134
if (httpClient != null) {
136135
this.httpClient = httpClient;
137136
} else {
138-
maxConnections = validateInput("maxConnections", maxConnections, DEFAULT_MAX_CONNECTIONS);
139-
connectionsPerRoute = validateInput("connectionsPerRoute", connectionsPerRoute, DEFAULT_MAX_PER_ROUTE);
140-
validateAfter = validateInput("validateAfter", validateAfter, DEFAULT_VALIDATE_AFTER_INACTIVITY);
137+
maxConnections = validateInput("maxConnections", maxConnections, HttpClientUtils.DEFAULT_MAX_CONNECTIONS);
138+
connectionsPerRoute = validateInput("connectionsPerRoute", connectionsPerRoute, HttpClientUtils.DEFAULT_MAX_PER_ROUTE);
139+
validateAfter = validateInput("validateAfter", validateAfter, HttpClientUtils.DEFAULT_VALIDATE_AFTER_INACTIVITY);
141140
this.httpClient = OptimizelyHttpClient.builder()
142141
.withMaxTotalConnections(maxConnections)
143142
.withMaxPerRoute(connectionsPerRoute)
144143
.withValidateAfterInactivity(validateAfter)
145144
// infrequent event discards observed. staled connections force-closed after a long idle time.
146145
.withEvictIdleConnections(1L, TimeUnit.MINUTES)
146+
// enable retry on event POST (default: retry on GET only)
147+
.withRetryHandler(new DefaultHttpRequestRetryHandler(3, true))
147148
.build();
148149
}
149150

@@ -310,9 +311,9 @@ public static class Builder {
310311

311312
int queueCapacity = PropertyUtils.getInteger(CONFIG_QUEUE_CAPACITY, DEFAULT_QUEUE_CAPACITY);
312313
int numWorkers = PropertyUtils.getInteger(CONFIG_NUM_WORKERS, DEFAULT_NUM_WORKERS);
313-
int maxTotalConnections = PropertyUtils.getInteger(CONFIG_MAX_CONNECTIONS, DEFAULT_MAX_CONNECTIONS);
314-
int maxPerRoute = PropertyUtils.getInteger(CONFIG_MAX_PER_ROUTE, DEFAULT_MAX_PER_ROUTE);
315-
int validateAfterInactivity = PropertyUtils.getInteger(CONFIG_VALIDATE_AFTER_INACTIVITY, DEFAULT_VALIDATE_AFTER_INACTIVITY);
314+
int maxTotalConnections = PropertyUtils.getInteger(CONFIG_MAX_CONNECTIONS, HttpClientUtils.DEFAULT_MAX_CONNECTIONS);
315+
int maxPerRoute = PropertyUtils.getInteger(CONFIG_MAX_PER_ROUTE, HttpClientUtils.DEFAULT_MAX_PER_ROUTE);
316+
int validateAfterInactivity = PropertyUtils.getInteger(CONFIG_VALIDATE_AFTER_INACTIVITY, HttpClientUtils.DEFAULT_VALIDATE_AFTER_INACTIVITY);
316317
private long closeTimeout = Long.MAX_VALUE;
317318
private TimeUnit closeTimeoutUnit = TimeUnit.MILLISECONDS;
318319
private OptimizelyHttpClient httpClient;

core-httpclient-impl/src/test/java/com/optimizely/ab/OptimizelyHttpClientTest.java

+95-7
Original file line numberDiff line numberDiff line change
@@ -16,27 +16,39 @@
1616
*/
1717
package com.optimizely.ab;
1818

19+
import org.apache.http.HttpException;
20+
import org.apache.http.client.HttpRequestRetryHandler;
1921
import org.apache.http.client.ResponseHandler;
22+
import org.apache.http.client.methods.CloseableHttpResponse;
2023
import org.apache.http.client.methods.HttpGet;
2124
import org.apache.http.client.methods.HttpUriRequest;
2225
import org.apache.http.client.methods.RequestBuilder;
2326
import org.apache.http.conn.HttpHostConnectException;
2427
import org.apache.http.impl.client.CloseableHttpClient;
25-
import org.junit.After;
26-
import org.junit.Before;
27-
import org.junit.Test;
28+
import org.apache.http.impl.client.DefaultHttpRequestRetryHandler;
29+
import org.apache.http.protocol.HttpContext;
30+
import org.junit.*;
31+
import org.mockserver.integration.ClientAndServer;
32+
import org.mockserver.model.ConnectionOptions;
33+
import org.mockserver.model.HttpError;
34+
import org.mockserver.model.HttpRequest;
35+
import org.mockserver.model.HttpResponse;
2836

2937
import java.io.IOException;
38+
import java.util.concurrent.ExecutionException;
3039
import java.util.concurrent.TimeUnit;
3140

3241
import static com.optimizely.ab.OptimizelyHttpClient.builder;
3342
import static java.util.concurrent.TimeUnit.*;
3443
import static org.junit.Assert.*;
35-
import static org.mockito.Mockito.mock;
36-
import static org.mockito.Mockito.when;
44+
import static org.mockito.Mockito.*;
45+
import static org.mockserver.model.HttpForward.forward;
46+
import static org.mockserver.model.HttpRequest.request;
47+
import static org.mockserver.model.HttpResponse.*;
48+
import static org.mockserver.model.HttpResponse.response;
49+
import static org.mockserver.verify.VerificationTimes.exactly;
3750

3851
public class OptimizelyHttpClientTest {
39-
4052
@Before
4153
public void setUp() {
4254
System.setProperty("https.proxyHost", "localhost");
@@ -51,7 +63,13 @@ public void tearDown() {
5163

5264
@Test
5365
public void testDefaultConfiguration() {
54-
OptimizelyHttpClient optimizelyHttpClient = builder().build();
66+
OptimizelyHttpClient.Builder builder = builder();
67+
assertEquals(builder.validateAfterInactivity, 1000);
68+
assertEquals(builder.maxTotalConnections, 200);
69+
assertEquals(builder.maxPerRoute, 20);
70+
assertNull(builder.customRetryHandler);
71+
72+
OptimizelyHttpClient optimizelyHttpClient = builder.build();
5573
assertTrue(optimizelyHttpClient.getHttpClient() instanceof CloseableHttpClient);
5674
}
5775

@@ -101,4 +119,74 @@ public void testExecute() throws IOException {
101119
OptimizelyHttpClient optimizelyHttpClient = new OptimizelyHttpClient(mockHttpClient);
102120
assertTrue(optimizelyHttpClient.execute(httpUriRequest, responseHandler));
103121
}
122+
123+
@Test
124+
public void testRetriesWithCustomRetryHandler() throws IOException {
125+
126+
// [NOTE] Request retries are all handled inside HttpClient. Not easy for unit test.
127+
// - "DefaultHttpRetryHandler" in HttpClient retries only with special types of Exceptions
128+
// like "NoHttpResponseException", etc.
129+
// Other exceptions (SocketTimeout, ProtocolException, etc.) all ignored.
130+
// - Not easy to force the specific exception type in the low-level.
131+
// - This test just validates custom retry handler injected ok by validating the number of retries.
132+
133+
class CustomRetryHandler implements HttpRequestRetryHandler {
134+
private final int maxRetries;
135+
136+
public CustomRetryHandler(int maxRetries) {
137+
this.maxRetries = maxRetries;
138+
}
139+
140+
@Override
141+
public boolean retryRequest(IOException exception, int executionCount, HttpContext context) {
142+
// override to retry for any type of exceptions
143+
return executionCount < maxRetries;
144+
}
145+
}
146+
147+
int port = 9999;
148+
ClientAndServer mockServer;
149+
int retryCount;
150+
151+
// default httpclient (retries enabled by default, but no retry for timeout connection)
152+
153+
mockServer = ClientAndServer.startClientAndServer(port);
154+
mockServer
155+
.when(request().withMethod("GET").withPath("/"))
156+
.error(HttpError.error());
157+
158+
OptimizelyHttpClient clientDefault = OptimizelyHttpClient.builder()
159+
.setTimeoutMillis(100)
160+
.build();
161+
162+
try {
163+
clientDefault.execute(new HttpGet("http://localhost:" + port));
164+
fail();
165+
} catch (Exception e) {
166+
retryCount = mockServer.retrieveRecordedRequests(request()).length;
167+
assertEquals(1, retryCount);
168+
}
169+
mockServer.stop();
170+
171+
// httpclient with custom retry handler (5 times retries for any request)
172+
173+
mockServer = ClientAndServer.startClientAndServer(port);
174+
mockServer
175+
.when(request().withMethod("GET").withPath("/"))
176+
.error(HttpError.error());
177+
178+
OptimizelyHttpClient clientWithRetries = OptimizelyHttpClient.builder()
179+
.withRetryHandler(new CustomRetryHandler(5))
180+
.setTimeoutMillis(100)
181+
.build();
182+
183+
try {
184+
clientWithRetries.execute(new HttpGet("http://localhost:" + port));
185+
fail();
186+
} catch (Exception e) {
187+
retryCount = mockServer.retrieveRecordedRequests(request()).length;
188+
assertEquals(5, retryCount);
189+
}
190+
mockServer.stop();
191+
}
104192
}

core-httpclient-impl/src/test/java/com/optimizely/ab/event/AsyncEventHandlerTest.java

+12
Original file line numberDiff line numberDiff line change
@@ -124,6 +124,7 @@ public void testBuilderWithCustomHttpClient() {
124124

125125
AsyncEventHandler eventHandler = builder()
126126
.withOptimizelyHttpClient(customHttpClient)
127+
// these params will be ignored when customHttpClient is injected
127128
.withMaxTotalConnections(1)
128129
.withMaxPerRoute(2)
129130
.withCloseTimeout(10, TimeUnit.SECONDS)
@@ -134,6 +135,17 @@ public void testBuilderWithCustomHttpClient() {
134135

135136
@Test
136137
public void testBuilderWithDefaultHttpClient() {
138+
AsyncEventHandler.Builder builder = builder();
139+
assertEquals(builder.validateAfterInactivity, 1000);
140+
assertEquals(builder.maxTotalConnections, 200);
141+
assertEquals(builder.maxPerRoute, 20);
142+
143+
AsyncEventHandler eventHandler = builder.build();
144+
assert(eventHandler.httpClient != null);
145+
}
146+
147+
@Test
148+
public void testBuilderWithDefaultHttpClientAndCustomParams() {
137149
AsyncEventHandler eventHandler = builder()
138150
.withMaxTotalConnections(3)
139151
.withMaxPerRoute(4)

0 commit comments

Comments
 (0)