/* * Licensed to Elasticsearch under one or more contributor * license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright * ownership. Elasticsearch licenses this file to you under * the Apache License, Version 2.0 (the "License"); you may * not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * KIND, either express or implied. See the License for the * specific language governing permissions and limitations * under the License. */ package org.elasticsearch.index.reindex; import org.elasticsearch.ElasticsearchException; import org.elasticsearch.Version; import org.elasticsearch.action.ActionRequest; import org.elasticsearch.action.ActionRequestValidationException; import org.elasticsearch.action.WriteConsistencyLevel; import org.elasticsearch.action.search.SearchRequest; import org.elasticsearch.action.support.replication.ReplicationRequest; import org.elasticsearch.common.bytes.BytesReference; import org.elasticsearch.common.collect.Tuple; import org.elasticsearch.common.io.stream.StreamInput; import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.common.unit.TimeValue; import org.elasticsearch.common.xcontent.XContentBuilder; import org.elasticsearch.common.xcontent.XContentFactory; import org.elasticsearch.common.xcontent.XContentHelper; import org.elasticsearch.common.xcontent.XContentType; import org.elasticsearch.search.builder.SearchSourceBuilder; import org.elasticsearch.tasks.Task; import java.io.IOException; import java.util.Arrays; import java.util.Map; import static org.elasticsearch.action.ValidateActions.addValidationError; import static org.elasticsearch.common.unit.TimeValue.timeValueMillis; import static org.elasticsearch.common.unit.TimeValue.timeValueMinutes; import static org.elasticsearch.search.sort.SortBuilders.fieldSort; public abstract class AbstractBulkByScrollRequest<Self extends AbstractBulkByScrollRequest<Self>> extends ActionRequest<Self> { public static final int SIZE_ALL_MATCHES = -1; private static final TimeValue DEFAULT_SCROLL_TIMEOUT = timeValueMinutes(5); private static final int DEFAULT_SCROLL_SIZE = 1000; /** * Default search source. */ private static final BytesReference DEFAULT_SOURCE = new SearchSourceBuilder().version(true) .size(AbstractBulkByScrollRequest.DEFAULT_SCROLL_SIZE).sort(fieldSort("_doc")).buildAsBytes(); /** * The search to be executed. */ private SearchRequest searchRequest; /** * Maximum number of processed documents. Defaults to -1 meaning process all * documents. */ private int size = SIZE_ALL_MATCHES; /** * Should version conflicts cause aborts? Defaults to true. */ private boolean abortOnVersionConflict = true; /** * Call refresh on the indexes we've written to after the request ends? */ private boolean refresh = false; /** * Timeout to wait for the shards on to be available for each bulk request? */ private TimeValue timeout = ReplicationRequest.DEFAULT_TIMEOUT; /** * Consistency level for write requests. */ private WriteConsistencyLevel consistency = WriteConsistencyLevel.DEFAULT; /** * Initial delay after a rejection before retrying a bulk request. With the default maxRetries the total backoff for retrying rejections * is about one minute per bulk request. Once the entire bulk request is successful the retry counter resets. */ private TimeValue retryBackoffInitialTime = timeValueMillis(500); /** * Total number of retries attempted for rejections. There is no way to ask for unlimited retries. */ private int maxRetries = 11; /** * The throttle for this request in sub-requests per second. {@link Float#POSITIVE_INFINITY} means set no throttle and that is the * default. Throttling is done between batches, as we start the next scroll requests. That way we can increase the scroll's timeout to * make sure that it contains any time that we might wait. */ private float requestsPerSecond = Float.POSITIVE_INFINITY; public AbstractBulkByScrollRequest() { } public AbstractBulkByScrollRequest(SearchRequest source) { this.searchRequest = source; source.scroll(DEFAULT_SCROLL_TIMEOUT); } /** * `this` cast to Self. Used for building fluent methods without cast * warnings. */ protected abstract Self self(); /** * Applies the defaults to the request that cannot be applied during construction. This is super inefficient because it must deserialize * and reserialize the request's source but this is the only way to do it in 2.x. */ void applyDefaults() { if (searchRequest.source() == null) { searchRequest.source(DEFAULT_SOURCE); } try { Map<String, Object> newSource = XContentHelper.convertToMap(DEFAULT_SOURCE, true).v2(); Tuple<XContentType, Map<String, Object>> sourceAndContent = XContentHelper.convertToMap(searchRequest.source(), true); XContentHelper.update(newSource, sourceAndContent.v2(), false); XContentBuilder builder = XContentFactory.contentBuilder(sourceAndContent.v1()); builder.map(newSource); searchRequest.source(builder.bytes()); } catch (IOException e) { throw new ElasticsearchException("Strange IOException while apply default source", e); } } @Override public ActionRequestValidationException validate() { ActionRequestValidationException e = searchRequest.validate(); if (maxRetries < 0) { e = addValidationError("retries cannnot be negative", e); } if (false == (size == -1 || size > 0)) { e = addValidationError( "size should be greater than 0 if the request is limited to some number of documents or -1 if it isn't but it was [" + size + "]", e); } return e; } /** * Maximum number of processed documents. Defaults to -1 meaning process all * documents. */ public int getSize() { return size; } /** * Maximum number of processed documents. Defaults to -1 meaning process all * documents. */ public Self setSize(int size) { this.size = size; return self(); } /** * Should version conflicts cause aborts? Defaults to false. */ public boolean isAbortOnVersionConflict() { return abortOnVersionConflict; } /** * Should version conflicts cause aborts? Defaults to false. */ public Self setAbortOnVersionConflict(boolean abortOnVersionConflict) { this.abortOnVersionConflict = abortOnVersionConflict; return self(); } /** * Sets abortOnVersionConflict based on REST-friendly names. */ public void setConflicts(String conflicts) { switch (conflicts) { case "proceed": setAbortOnVersionConflict(false); return; case "abort": setAbortOnVersionConflict(true); return; default: throw new IllegalArgumentException("conflicts may only be \"proceed\" or \"abort\" but was [" + conflicts + "]"); } } /** * The search request that matches the documents to process. */ public SearchRequest getSearchRequest() { return searchRequest; } /** * Call refresh on the indexes we've written to after the request ends? */ public boolean isRefresh() { return refresh; } /** * Call refresh on the indexes we've written to after the request ends? */ public Self setRefresh(boolean refresh) { this.refresh = refresh; return self(); } /** * Timeout to wait for the shards on to be available for each bulk request? */ public TimeValue getTimeout() { return timeout; } /** * Timeout to wait for the shards on to be available for each bulk request? */ public Self setTimeout(TimeValue timeout) { this.timeout = timeout; return self(); } /** * Consistency level for write requests. */ public WriteConsistencyLevel getConsistency() { return consistency; } /** * Consistency level for write requests. */ public Self setConsistency(WriteConsistencyLevel consistency) { this.consistency = consistency; return self(); } /** * Initial delay after a rejection before retrying request. */ public TimeValue getRetryBackoffInitialTime() { return retryBackoffInitialTime; } /** * Set the initial delay after a rejection before retrying request. */ public Self setRetryBackoffInitialTime(TimeValue retryBackoffInitialTime) { this.retryBackoffInitialTime = retryBackoffInitialTime; return self(); } /** * Total number of retries attempted for rejections. */ public int getMaxRetries() { return maxRetries; } /** * Set the total number of retries attempted for rejections. There is no way to ask for unlimited retries. */ public Self setMaxRetries(int maxRetries) { this.maxRetries = maxRetries; return self(); } /** * The throttle for this request in sub-requests per second. {@link Float#POSITIVE_INFINITY} means set no throttle and that is the * default. Throttling is done between batches, as we start the next scroll requests. That way we can increase the scroll's timeout to * make sure that it contains any time that we might wait. */ public float getRequestsPerSecond() { return requestsPerSecond; } /** * Set the throttle for this request in sub-requests per second. {@link Float#POSITIVE_INFINITY} means set no throttle and that is the * default. Throttling is done between batches, as we start the next scroll requests. That way we can increase the scroll's timeout to * make sure that it contains any time that we might wait. */ public Self setRequestsPerSecond(float requestsPerSecond) { if (requestsPerSecond <= 0) { throw new IllegalArgumentException( "[requests_per_second] must be greater than 0. Use Float.POSITIVE_INFINITY to disable throttling."); } this.requestsPerSecond = requestsPerSecond; return self(); } @Override public Task createTask(long id, String type, String action) { return new BulkByScrollTask(id, type, action, getDescription(), requestsPerSecond); } @Override public void readFrom(StreamInput in) throws IOException { super.readFrom(in); searchRequest = new SearchRequest(); searchRequest.readFrom(in); abortOnVersionConflict = in.readBoolean(); size = in.readVInt(); refresh = in.readBoolean(); timeout = TimeValue.readTimeValue(in); consistency = WriteConsistencyLevel.fromId(in.readByte()); retryBackoffInitialTime = TimeValue.readTimeValue(in); maxRetries = in.readVInt(); if (in.getVersion().onOrAfter(Version.V_2_4_0)) { requestsPerSecond = in.readFloat(); } } @Override public void writeTo(StreamOutput out) throws IOException { super.writeTo(out); searchRequest.writeTo(out); out.writeBoolean(abortOnVersionConflict); out.writeVInt(size); out.writeBoolean(refresh); timeout.writeTo(out); out.writeByte(consistency.id()); retryBackoffInitialTime.writeTo(out); out.writeVInt(maxRetries); if (out.getVersion().onOrAfter(Version.V_2_4_0)) { out.writeFloat(requestsPerSecond); } } /** * Append a short description of the search request to a StringBuilder. Used * to make toString. */ protected void searchToString(StringBuilder b) { if (searchRequest.indices() != null && searchRequest.indices().length != 0) { b.append(Arrays.toString(searchRequest.indices())); } else { b.append("[all indices]"); } if (searchRequest.types() != null && searchRequest.types().length != 0) { b.append(Arrays.toString(searchRequest.types())); } } }