package com.lucidworks.storm.fusion; import com.codahale.metrics.Meter; import com.codahale.metrics.MetricRegistry; import org.apache.http.HttpEntity; import org.apache.http.HttpException; import org.apache.http.HttpRequest; import org.apache.http.HttpRequestInterceptor; import org.apache.http.HttpResponse; import org.apache.http.auth.UsernamePasswordCredentials; import org.apache.http.client.CookieStore; import org.apache.http.client.HttpClient; import org.apache.http.client.methods.HttpPost; import org.apache.http.conn.ssl.NoopHostnameVerifier; import org.apache.http.cookie.Cookie; import org.apache.http.entity.ContentProducer; import org.apache.http.entity.ContentType; import org.apache.http.entity.EntityTemplate; import org.apache.http.entity.StringEntity; import org.apache.http.impl.auth.BasicScheme; import org.apache.http.impl.client.*; import org.apache.http.impl.cookie.BasicClientCookie; import org.apache.http.protocol.HttpContext; import org.apache.http.util.EntityUtils; import com.fasterxml.jackson.databind.ObjectMapper; import org.apache.http.client.config.CookieSpecs; import org.apache.http.client.config.RequestConfig; import org.apache.http.client.protocol.HttpClientContext; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import java.io.BufferedReader; import java.io.IOException; import java.io.InputStreamReader; import java.io.OutputStream; import java.net.URL; import java.nio.charset.StandardCharsets; import java.net.MalformedURLException; import java.util.ArrayList; import java.util.Arrays; import java.util.Date; import java.util.HashMap; import java.util.List; import java.util.Map; import java.util.Random; import java.util.concurrent.TimeUnit; import java.util.concurrent.atomic.AtomicInteger; public class FusionPipelineClient { public static Logger log = LoggerFactory.getLogger(FusionPipelineClient.class); // for basic auth to the pipeline service private static final class PreEmptiveBasicAuthenticator implements HttpRequestInterceptor { private final UsernamePasswordCredentials credentials; public PreEmptiveBasicAuthenticator(String user, String pass) { credentials = new UsernamePasswordCredentials(user, pass); } public void process(HttpRequest request, HttpContext context) throws HttpException, IOException { request.addHeader(BasicScheme.authenticate(credentials, "US-ASCII", false)); } } // holds a context and a client object static class FusionSession { long sessionEstablishedAt = -1; Meter docsSentMeter = null; } List<String> originalEndpoints; RequestConfig globalConfig; CookieStore cookieStore; CloseableHttpClient httpClient; Map<String,FusionSession> sessions; Random random; ObjectMapper jsonObjectMapper; String fusionUser = null; byte[] fusionPass = null; String fusionRealm = null; AtomicInteger requestCounter = null; Map<String,Meter> metersByHost = new HashMap<>(); boolean isKerberos = false; public static MetricRegistry metrics = null; static long maxNanosOfInactivity = TimeUnit.NANOSECONDS.convert(599, TimeUnit.SECONDS); public FusionPipelineClient(String endpointUrl) throws MalformedURLException { this(endpointUrl, null, null, null); } public FusionPipelineClient(String endpointUrl, String fusionUser, String fusionPass, String fusionRealm) throws MalformedURLException { String fusionLoginConf = System.getProperty(FusionKrb5HttpClientConfigurer.LOGIN_CONFIG_PROP); if (fusionLoginConf != null && !fusionLoginConf.isEmpty()) { httpClient = FusionKrb5HttpClientConfigurer.createClient(fusionUser); isKerberos = true; } else { globalConfig = RequestConfig.custom().setCookieSpec(CookieSpecs.BEST_MATCH).build(); cookieStore = new BasicCookieStore(); this.fusionUser = fusionUser; this.fusionPass = fusionPass.getBytes(StandardCharsets.UTF_8); this.fusionRealm = fusionRealm; // build the HttpClient to be used for all requests HttpClientBuilder httpClientBuilder = HttpClientBuilder.create(); httpClientBuilder.setDefaultRequestConfig(globalConfig).setDefaultCookieStore(cookieStore); httpClientBuilder.setMaxConnPerRoute(100); httpClientBuilder.setMaxConnTotal(500); httpClientBuilder.setSSLHostnameVerifier(new NoopHostnameVerifier()); if (fusionUser != null && fusionRealm == null) httpClientBuilder.addInterceptorFirst(new PreEmptiveBasicAuthenticator(fusionUser, fusionPass)); httpClient = httpClientBuilder.build(); } originalEndpoints = Arrays.asList(endpointUrl.split(",")); try { sessions = establishSessions(originalEndpoints); } catch (Exception exc) { if (exc instanceof RuntimeException) { throw (RuntimeException)exc; } else { throw new RuntimeException(exc); } } random = new Random(); jsonObjectMapper = new ObjectMapper(); requestCounter = new AtomicInteger(0); } protected Meter getMeterByHost(String meterName, String host) { if (metrics == null) return null; String key = meterName+" ("+host+")"; Meter meter = metersByHost.get(key); if (meter == null) { meter = metrics.meter(meterName + "-" + host); metersByHost.put(key, meter); } return meter; } protected Map<String,FusionSession> establishSessions(List<String> endpoints) throws Exception { Exception lastError = null; Map<String,FusionSession> map = new HashMap<String, FusionSession>(); for (String url : endpoints) { try { map.put(url, establishSession(url)); } catch (Exception exc) { // just log this ... so long as there is at least one good endpoint we can use it lastError = exc; log.warn("Failed to establish session with Fusion at " + url+" due to: "+exc); } } if (map.isEmpty()) { if (lastError != null) { throw lastError; } else { throw new Exception("Failed to establish session with Fusion endpoint(s): "+endpoints); } } log.info("Established sessions with "+map.size()+" of "+endpoints.size()+ " Fusion endpoints for user "+fusionUser+" in realm "+fusionRealm); return map; } protected FusionSession establishSession(String url) throws Exception { FusionSession fusionSession = new FusionSession(); if (!isKerberos && fusionRealm != null) { int at = url.indexOf("/api"); String proxyUrl = url.substring(0, at); String sessionApi = proxyUrl + "/api/session?realmName=" + fusionRealm; String jsonString = "{\"username\":\"" + fusionUser + "\", \"password\":\"" + new String(fusionPass, StandardCharsets.UTF_8) + "\"}"; // TODO: ugly! URL sessionApiUrl = new URL(sessionApi); String sessionHost = sessionApiUrl.getHost(); try { clearCookieForHost(sessionHost); } catch (Exception exc) { log.warn("Failed to clear session cookie for "+sessionHost+" due to: "+exc); } HttpPost postRequest = new HttpPost(sessionApiUrl.toURI()); postRequest.setEntity(new StringEntity(jsonString, ContentType.create("application/json", StandardCharsets.UTF_8))); HttpClientContext context = HttpClientContext.create(); context.setCookieStore(cookieStore); HttpResponse response = httpClient.execute(postRequest, context); HttpEntity entity = response.getEntity(); try { int statusCode = response.getStatusLine().getStatusCode(); if (statusCode != 200 && statusCode != 201 && statusCode != 204) { String body = extractResponseBodyText(entity); throw new IOException( "POST credentials to Fusion Session API [" + sessionApi + "] failed due to: " + response.getStatusLine() + ": " + body); } else if (statusCode == 401) { // retry in case this is an expired error String body = extractResponseBodyText(entity); if (body != null && body.indexOf("session-idle-timeout") != -1) { EntityUtils.consume(entity); // have to consume the previous entity before re-trying the request log.warn("Received session-idle-timeout error from Fusion Session API, re-trying to establish a new session to " + url); try { clearCookieForHost(sessionHost); } catch (Exception exc) { log.warn("Failed to clear session cookie for "+sessionHost+" due to: "+exc); } response = httpClient.execute(postRequest, context); entity = response.getEntity(); statusCode = response.getStatusLine().getStatusCode(); if (statusCode != 200 && statusCode != 201 && statusCode != 204) { body = extractResponseBodyText(entity); throw new IOException( "POST credentials to Fusion Session API [" + sessionApi + "] failed due to: " + response.getStatusLine() + ": " + body); } } } } finally { if (entity != null) EntityUtils.consume(entity); } log.info("Established secure session with Fusion Session API on " + url + " for user " + fusionUser + " in fusionRealm " + fusionRealm); } fusionSession.sessionEstablishedAt = System.nanoTime(); URL fusionUrl = new URL(url); String hostAndPort = fusionUrl.getHost()+":"+fusionUrl.getPort(); fusionSession.docsSentMeter = getMeterByHost("Docs Sent to Fusion", hostAndPort); return fusionSession; } protected synchronized void clearCookieForHost(String sessionHost) throws Exception { Cookie sessionCookie = null; for (Cookie cookie : cookieStore.getCookies()) { String cookieDomain = cookie.getDomain(); if (cookieDomain != null) { if (sessionHost.equals(cookieDomain) || sessionHost.indexOf(cookieDomain) != -1 || cookieDomain.indexOf(sessionHost) != -1) { sessionCookie = cookie; break; } } } if (sessionCookie != null) { BasicClientCookie httpCookie = new BasicClientCookie(sessionCookie.getName(),sessionCookie.getValue()); httpCookie.setExpiryDate(new Date(0)); httpCookie.setVersion(1); httpCookie.setPath(sessionCookie.getPath()); httpCookie.setDomain(sessionCookie.getDomain()); cookieStore.addCookie(httpCookie); } cookieStore.clearExpired(new Date()); // this should clear the cookie } protected synchronized FusionSession resetSession(String endpoint) throws Exception { // reset the "context" object for the HttpContext for this endpoint FusionSession fusionSession = null; try { fusionSession = establishSession(endpoint); sessions.put(endpoint, fusionSession); } catch (Exception exc) { log.error("Failed to re-establish session with Fusion at " + endpoint + " due to: " + exc); sessions.remove(endpoint); fusionSession = null; } return fusionSession; } public HttpClient getHttpClient() { return httpClient; } protected String getLbEndpoint(List<String> list) { int num = list.size(); if (num == 0) return null; return list.get((num > 1) ? random.nextInt(num) : 0); } public void postBatchToPipeline(List docs) throws Exception { int numDocs = docs.size(); int requestId = requestCounter.incrementAndGet(); ArrayList<String> mutable = null; synchronized (this) { mutable = new ArrayList<String>(sessions.keySet()); } if (mutable.isEmpty()) { // completely hosed ... try to re-establish all sessions synchronized (this) { try { Thread.sleep(2000); } catch (InterruptedException ie) { Thread.interrupted(); } sessions = establishSessions(originalEndpoints); mutable = new ArrayList<String>(sessions.keySet()); } if (mutable.isEmpty()) throw new IllegalStateException("No available endpoints! " + "Check log for previous errors as to why there are no more endpoints available. This is a fatal error."); } if (mutable.size() > 1) { Exception lastExc = null; // try all the endpoints until success is reached ... or we run out of endpoints to try ... while (!mutable.isEmpty()) { String endpoint = getLbEndpoint(mutable); if (endpoint == null) { // no more endpoints available ... fail if (lastExc != null) { log.error("No more endpoints available to retry failed request ("+requestId+")! raising last seen error: "+lastExc); throw lastExc; } else { throw new RuntimeException("No Fusion pipeline endpoints available to process request "+ requestId+"! Check logs for previous errors."); } } if (log.isDebugEnabled()) log.debug("POSTing batch of "+numDocs+" input docs to "+endpoint+" as request "+requestId); Exception retryAfterException = postJsonToPipelineWithRetry(endpoint, docs, mutable, lastExc, requestId); if (retryAfterException == null) { lastExc = null; break; // request succeeded ... } lastExc = retryAfterException; // try next endpoint (if available) after seeing an exception } if (lastExc != null) { // request failed and we exhausted the list of endpoints to try ... log.error("Failing request " + requestId + " due to: " + lastExc); throw lastExc; } } else { String endpoint = getLbEndpoint(mutable); if (log.isDebugEnabled()) log.debug("POSTing batch of "+numDocs+" input docs to "+endpoint+" as request "+requestId); Exception exc = postJsonToPipelineWithRetry(endpoint, docs, mutable, null, requestId); if (exc != null) throw exc; } } protected synchronized Exception postJsonToPipelineWithRetry( String endpoint, List docs, ArrayList<String> mutable, Exception lastExc, int requestId) throws Exception { Exception retryAfterException = null; try { postJsonToPipeline(endpoint, docs, requestId); if (lastExc != null) log.info("Re-try request "+requestId+" to "+endpoint+" succeeded after seeing a "+lastExc.getMessage()); } catch (Exception exc) { log.warn("Failed to send request "+requestId+" to '"+endpoint+"' due to: "+exc); if (mutable.size() > 1) { // try another endpoint but update the cloned list to avoid re-hitting the one having an error if (log.isDebugEnabled()) log.debug("Will re-try failed request " + requestId + " on next endpoint in the list"); mutable.remove(endpoint); retryAfterException = exc; } else { // no other endpoints to try ... brief wait and then retry log.warn("No more endpoints available to try ... will retry to send request "+ requestId+" to "+endpoint+" after waiting 1 sec"); try { Thread.sleep(1000); } catch (InterruptedException ignore) { Thread.interrupted(); } // note we want the exception to propagate from here up the stack since we re-tried and it didn't work postJsonToPipeline(endpoint, docs, requestId); log.info("Re-try request " + requestId + " to " + endpoint + " succeeded"); retryAfterException = null; // return success condition } } return retryAfterException; } private class JacksonContentProducer implements ContentProducer { ObjectMapper mapper; Object jsonObj; JacksonContentProducer(ObjectMapper mapper, Object jsonObj) { this.mapper = mapper; this.jsonObj = jsonObj; } public void writeTo(OutputStream outputStream) throws IOException { mapper.writeValue(outputStream, jsonObj); } } public void postJsonToPipeline(String endpoint, List docs, int requestId) throws Exception { FusionSession fusionSession = null; long currTime = System.nanoTime(); synchronized (this) { fusionSession = sessions.get(endpoint); // ensure last request within the session timeout period, else reset the session if (fusionSession == null || (currTime - fusionSession.sessionEstablishedAt) > maxNanosOfInactivity) { log.info("Fusion session is likely expired (or soon will be) for endpoint "+endpoint+", " + "pre-emptively re-setting this session before processing request "+requestId); fusionSession = resetSession(endpoint); if (fusionSession == null) throw new IllegalStateException("Failed to re-connect to "+endpoint+ " after session loss when processing request "+requestId); } } HttpEntity entity = null; try { HttpPost postRequest = new HttpPost(endpoint); // stream the json directly to the HTTP output EntityTemplate et = new EntityTemplate(new JacksonContentProducer(jsonObjectMapper, docs)); et.setContentType("application/json"); et.setContentEncoding(StandardCharsets.UTF_8.name()); postRequest.setEntity(et); // new BufferedHttpEntity(et)); HttpResponse response = null; HttpClientContext context = null; if (isKerberos) { httpClient = FusionKrb5HttpClientConfigurer.createClient(fusionUser); response = httpClient.execute(postRequest); } else { context = HttpClientContext.create(); if (cookieStore != null) { context.setCookieStore(cookieStore); } response = httpClient.execute(postRequest, context); } entity = response.getEntity(); int statusCode = response.getStatusLine().getStatusCode(); if (statusCode == 401) { // unauth'd - session probably expired? retry to establish log.warn("Unauthorized error (401) when trying to send request " + requestId + " to Fusion at " + endpoint + ", will re-try to establish session"); // re-establish the session and re-try the request try { EntityUtils.consume(entity); } catch (Exception ignore) { log.warn("Failed to consume entity due to: "+ignore); } finally { entity = null; } synchronized (this) { fusionSession = resetSession(endpoint); if (fusionSession == null) throw new IllegalStateException("After re-establishing session when processing request "+ requestId+", endpoint "+endpoint+" is no longer active! Try another endpoint."); } log.info("Going to re-try request "+requestId+" after session re-established with "+endpoint); if (isKerberos) { httpClient = FusionKrb5HttpClientConfigurer.createClient(fusionUser); response = httpClient.execute(postRequest); } else { response = httpClient.execute(postRequest, context); } entity = response.getEntity(); statusCode = response.getStatusLine().getStatusCode(); if (statusCode == 200 || statusCode == 204) { log.info("Re-try request "+requestId+" after session timeout succeeded for: " + endpoint); } else { raiseFusionServerException(endpoint, entity, statusCode, response, requestId); } } else if (statusCode != 200 && statusCode != 204) { raiseFusionServerException(endpoint, entity, statusCode, response, requestId); } else { // OK! if (fusionSession != null && fusionSession.docsSentMeter != null) fusionSession.docsSentMeter.mark(docs.size()); } } finally { if (entity != null) { try { EntityUtils.consume(entity); } catch (Exception ignore) { log.warn("Failed to consume entity due to: "+ignore); } finally { entity = null; } } } } protected void raiseFusionServerException(String endpoint, HttpEntity entity, int statusCode, HttpResponse response, int requestId) { String body = extractResponseBodyText(entity); throw new RuntimeException( "POST request "+requestId+" to [" + endpoint + "] failed due to: ("+statusCode+")" + response.getStatusLine() + ": " + body); } static String extractResponseBodyText(HttpEntity entity) { StringBuilder body = new StringBuilder(); if (entity != null) { BufferedReader reader = null; String line = null; try { reader = new BufferedReader(new InputStreamReader(entity.getContent())); while ((line = reader.readLine()) != null) body.append(line); } catch (Exception ignore) { // squelch it - just trying to compose an error message here log.warn("Failed to read response body due to: "+ignore); } finally { if (reader != null) { try { reader.close(); } catch (Exception ignore){} } } } return body.toString(); } public synchronized void shutdown() { if (sessions != null) { sessions.clear(); sessions = null; } if (httpClient != null) { try { httpClient.close(); } catch (IOException e) { log.warn("Failed to close httpClient object due to: " + e); } finally { httpClient = null; } } else { log.error("Already shutdown."); } } }