Search in sources :

Example 1 with ClusterAllocationExplanation

use of org.opensearch.action.admin.cluster.allocation.ClusterAllocationExplanation in project OpenSearch by opensearch-project.

In the class AllocationIdIT, method checkNoValidShardCopy:

/**
 * Asserts, via {@code assertBusy}, that the cluster allocation explain API reports
 * {@link AllocationDecision#NO_VALID_SHARD_COPY} for the primary of the given shard.
 *
 * @param indexName name of the index passed to the allocation explain request
 * @param shardId   shard whose numeric id is passed to the allocation explain request
 * @throws Exception propagated from {@code assertBusy}
 */
private void checkNoValidShardCopy(String indexName, ShardId shardId) throws Exception {
    assertBusy(() -> {
        // Ask the cluster to explain the allocation of the primary copy of this shard.
        final ShardAllocationDecision decision = client().admin()
            .cluster()
            .prepareAllocationExplain()
            .setIndex(indexName)
            .setShard(shardId.id())
            .setPrimary(true)
            .get()
            .getExplanation()
            .getShardAllocationDecision();
        // A decision must have been taken before its outcome can be inspected.
        assertThat(decision.isDecisionTaken(), equalTo(true));
        final AllocationDecision outcome = decision.getAllocateDecision().getAllocationDecision();
        assertThat(outcome, equalTo(AllocationDecision.NO_VALID_SHARD_COPY));
    });
}
Also used : ClusterAllocationExplanation(org.opensearch.action.admin.cluster.allocation.ClusterAllocationExplanation) ShardAllocationDecision(org.opensearch.cluster.routing.allocation.ShardAllocationDecision)

Example 2 with ClusterAllocationExplanation

use of org.opensearch.action.admin.cluster.allocation.ClusterAllocationExplanation in project OpenSearch by opensearch-project.

In the class RemoveCorruptedShardDataCommandIT, method testCorruptTranslogTruncation:

/**
 * Integration test for {@code RemoveCorruptedShardDataCommand} run against a corrupted translog.
 * <p>
 * Outline of what the test does:
 * <ol>
 *   <li>starts two nodes and creates a one-shard, one-replica index with flush-on-close disabled;</li>
 *   <li>indexes and flushes {@code numDocsToKeep} documents, then indexes {@code numDocsToTruncate}
 *       more without flushing them through this test's own calls;</li>
 *   <li>stops the second node, corrupts a random translog file while the remaining data node is
 *       restarting, and asserts the primary is unassigned with a {@code TranslogCorruptedException};</li>
 *   <li>runs the command with {@code -d <translogDir>} while the first node is stopped;</li>
 *   <li>asserts the command output mentions {@code allocate_stale_primary} and the node id, issues
 *       the stale-primary reroute, and checks that exactly {@code numDocsToKeep} documents are searchable;</li>
 *   <li>restarts the replica node and verifies file-based recovery and that global and local
 *       checkpoints equal the max sequence number.</li>
 * </ol>
 *
 * @throws Exception if any step of the test fails
 */
public void testCorruptTranslogTruncation() throws Exception {
    internalCluster().startNodes(2);
    final String node1 = internalCluster().getNodeNames()[0];
    final String node2 = internalCluster().getNodeNames()[1];
    final String indexName = "test";
    // One shard with one replica; node2 is excluded from allocation at creation time,
    // refresh interval is set to "-1" and flush-on-close is disabled.
    assertAcked(prepareCreate(indexName).setSettings(Settings.builder().put(IndexMetadata.SETTING_NUMBER_OF_SHARDS, 1).put(IndexMetadata.SETTING_NUMBER_OF_REPLICAS, 1).put(IndexSettings.INDEX_REFRESH_INTERVAL_SETTING.getKey(), "-1").put(MockEngineSupport.DISABLE_FLUSH_ON_CLOSE.getKey(), // never flush - always recover from translog
    true).put("index.routing.allocation.exclude._name", node2)));
    ensureYellow();
    // Clear the allocation exclusion again and wait for the index to go green.
    assertAcked(client().admin().indices().prepareUpdateSettings(indexName).setSettings(Settings.builder().putNull("index.routing.allocation.exclude._name")));
    ensureGreen();
    // Index some documents
    int numDocsToKeep = randomIntBetween(10, 100);
    logger.info("--> indexing [{}] docs to be kept", numDocsToKeep);
    IndexRequestBuilder[] builders = new IndexRequestBuilder[numDocsToKeep];
    for (int i = 0; i < builders.length; i++) {
        builders[i] = client().prepareIndex(indexName).setSource("foo", "bar");
    }
    indexRandom(false, false, false, Arrays.asList(builders));
    // Flush the documents that must be kept, then call disableTranslogFlush for the index
    // before indexing the documents that are expected to be truncated.
    flush(indexName);
    disableTranslogFlush(indexName);
    // having no extra docs is an interesting case for seq no based recoveries - test it more often
    int numDocsToTruncate = randomBoolean() ? 0 : randomIntBetween(0, 100);
    logger.info("--> indexing [{}] more doc to be truncated", numDocsToTruncate);
    builders = new IndexRequestBuilder[numDocsToTruncate];
    for (int i = 0; i < builders.length; i++) {
        builders[i] = client().prepareIndex(indexName).setSource("foo", "bar");
    }
    indexRandom(false, false, false, Arrays.asList(builders));
    // Command, terminal and parser are created up front; they are used later inside the
    // restart callback for node1.
    RemoveCorruptedShardDataCommand command = new RemoveCorruptedShardDataCommand();
    MockTerminal terminal = new MockTerminal();
    OptionParser parser = command.getParser();
    if (randomBoolean() && numDocsToTruncate > 0) {
        // flush the replica, so it will have more docs than what the primary will have
        Index index = resolveIndex(indexName);
        IndexShard replica = internalCluster().getInstance(IndicesService.class, node2).getShardOrNull(new ShardId(index, 0));
        replica.flush(new FlushRequest());
        logger.info("--> performed extra flushing on replica");
    }
    // Capture the data path settings of both nodes: node1's are used to build the command
    // environment, node2's to start the replica node again later.
    final Settings node1PathSettings = internalCluster().dataPathSettings(node1);
    final Settings node2PathSettings = internalCluster().dataPathSettings(node2);
    // shut down the replica node to be tested later
    internalCluster().stopRandomNode(InternalTestCluster.nameFilter(node2));
    // NOTE(review): resolved after node2 was stopped, so these presumably point at node1's
    // shard data - confirm against getPathToShardData.
    final Path translogDir = getPathToShardData(indexName, ShardPath.TRANSLOG_FOLDER_NAME);
    final Path indexDir = getPathToShardData(indexName, ShardPath.INDEX_FOLDER_NAME);
    // Restart the single node
    logger.info("--> restarting node");
    internalCluster().restartRandomDataNode(new InternalTestCluster.RestartCallback() {

        @Override
        public Settings onNodeStopped(String nodeName) throws Exception {
            // Corrupt a randomly chosen translog file while the node is down.
            logger.info("--> corrupting translog on node {}", nodeName);
            TestTranslog.corruptRandomTranslogFile(logger, random(), translogDir);
            return super.onNodeStopped(nodeName);
        }
    });
    // all shards should be failed due to a corrupted translog
    assertBusy(() -> {
        final UnassignedInfo unassignedInfo = client().admin().cluster().prepareAllocationExplain().setIndex(indexName).setShard(0).setPrimary(true).get().getExplanation().getUnassignedInfo();
        assertThat(unassignedInfo.getReason(), equalTo(UnassignedInfo.Reason.ALLOCATION_FAILED));
        assertThat(ExceptionsHelper.unwrap(unassignedInfo.getFailure(), TranslogCorruptedException.class), not(nullValue()));
    });
    // have to shut down primary node - otherwise node lock is present
    internalCluster().restartNode(node1, new InternalTestCluster.RestartCallback() {

        @Override
        public Settings onNodeStopped(String nodeName) throws Exception {
            assertBusy(() -> {
                logger.info("--> checking that lock has been released for {}", indexDir);
                // noinspection EmptyTryBlock since we're just trying to obtain the lock
                try (Directory dir = FSDirectory.open(indexDir, NativeFSLockFactory.INSTANCE);
                    Lock ignored = dir.obtainLock(IndexWriter.WRITE_LOCK_NAME)) {
                } catch (LockObtainFailedException lofe) {
                    // Converted to AssertionError so that assertBusy sees an assertion failure.
                    logger.info("--> failed acquiring lock for {}", indexDir);
                    throw new AssertionError("still waiting for lock release at [" + indexDir + "]", lofe);
                } catch (IOException ioe) {
                    throw new AssertionError("unexpected IOException [" + indexDir + "]", ioe);
                }
            });
            // Build an environment from the cluster defaults plus node1's data paths and run the
            // command against the translog directory, answering the prompt with "y".
            final Environment environment = TestEnvironment.newEnvironment(Settings.builder().put(internalCluster().getDefaultSettings()).put(node1PathSettings).build());
            terminal.addTextInput("y");
            OptionSet options = parser.parse("-d", translogDir.toAbsolutePath().toString());
            logger.info("--> running command for [{}]", translogDir.toAbsolutePath());
            command.execute(terminal, options, environment);
            logger.info("--> output:\n{}", terminal.getOutput());
            return super.onNodeStopped(nodeName);
        }
    });
    // Find the node id that belongs to node1 by scanning the cluster state's nodes by name.
    String primaryNodeId = null;
    final ClusterState state = client().admin().cluster().prepareState().get().getState();
    final DiscoveryNodes nodes = state.nodes();
    for (ObjectObjectCursor<String, DiscoveryNode> cursor : nodes.getNodes()) {
        final String name = cursor.value.getName();
        if (name.equals(node1)) {
            primaryNodeId = cursor.key;
            break;
        }
    }
    assertThat(primaryNodeId, notNullValue());
    // The command output must contain the allocate_stale_primary hint and reference node1's id.
    assertThat(terminal.getOutput(), containsString("allocate_stale_primary"));
    assertThat(terminal.getOutput(), containsString("\"node\" : \"" + primaryNodeId + "\""));
    // there is only _stale_ primary (due to new allocation id)
    assertBusy(() -> {
        final ClusterAllocationExplanation explanation = client().admin().cluster().prepareAllocationExplain().setIndex(indexName).setShard(0).setPrimary(true).get().getExplanation();
        final ShardAllocationDecision shardAllocationDecision = explanation.getShardAllocationDecision();
        assertThat(shardAllocationDecision.isDecisionTaken(), equalTo(true));
        assertThat(shardAllocationDecision.getAllocateDecision().getAllocationDecision(), equalTo(AllocationDecision.NO_VALID_SHARD_COPY));
    });
    // Explicitly allocate the stale primary on node1.
    // NOTE(review): the trailing 'true' is presumably the accept-data-loss flag - confirm.
    client().admin().cluster().prepareReroute().add(new AllocateStalePrimaryAllocationCommand(indexName, 0, primaryNodeId, true)).get();
    assertBusy(() -> {
        final ClusterAllocationExplanation explanation = client().admin().cluster().prepareAllocationExplain().setIndex(indexName).setShard(0).setPrimary(true).get().getExplanation();
        assertThat(explanation.getCurrentNode(), notNullValue());
        assertThat(explanation.getShardState(), equalTo(ShardRoutingState.STARTED));
    });
    ensureYellow(indexName);
    // Run a search and make sure it succeeds
    assertHitCount(client().prepareSearch(indexName).setQuery(matchAllQuery()).get(), numDocsToKeep);
    logger.info("--> starting the replica node to test recovery");
    internalCluster().startNode(node2PathSettings);
    ensureGreen(indexName);
    // Every node holding the index must return exactly the kept documents.
    for (String node : internalCluster().nodesInclude(indexName)) {
        SearchRequestBuilder q = client().prepareSearch(indexName).setPreference("_only_nodes:" + node).setQuery(matchAllQuery());
        assertHitCount(q.get(), numDocsToKeep);
    }
    // The non-primary shard copy must have recovered at least one file.
    final RecoveryResponse recoveryResponse = client().admin().indices().prepareRecoveries(indexName).setActiveOnly(false).get();
    final RecoveryState replicaRecoveryState = recoveryResponse.shardRecoveryStates().get(indexName).stream().filter(recoveryState -> recoveryState.getPrimary() == false).findFirst().get();
    assertThat(replicaRecoveryState.getIndex().toString(), replicaRecoveryState.getIndex().recoveredFileCount(), greaterThan(0));
    // Ensure that the global checkpoint and local checkpoint are restored from the max seqno of the last commit.
    final SeqNoStats seqNoStats = getSeqNoStats(indexName, 0);
    assertThat(seqNoStats.getGlobalCheckpoint(), equalTo(seqNoStats.getMaxSeqNo()));
    assertThat(seqNoStats.getLocalCheckpoint(), equalTo(seqNoStats.getMaxSeqNo()));
}
Also used : DiscoveryNode(org.opensearch.cluster.node.DiscoveryNode) UnassignedInfo(org.opensearch.cluster.routing.UnassignedInfo) AllocateStalePrimaryAllocationCommand(org.opensearch.cluster.routing.allocation.command.AllocateStalePrimaryAllocationCommand) Index(org.opensearch.index.Index) InternalTestCluster(org.opensearch.test.InternalTestCluster) Matchers.containsString(org.hamcrest.Matchers.containsString) MockTerminal(org.opensearch.cli.MockTerminal) OptionParser(joptsimple.OptionParser) RecoveryResponse(org.opensearch.action.admin.indices.recovery.RecoveryResponse) SeqNoStats(org.opensearch.index.seqno.SeqNoStats) FlushRequest(org.opensearch.action.admin.indices.flush.FlushRequest) LockObtainFailedException(org.apache.lucene.store.LockObtainFailedException) ShardAllocationDecision(org.opensearch.cluster.routing.allocation.ShardAllocationDecision) RecoveryState(org.opensearch.indices.recovery.RecoveryState) Settings(org.opensearch.common.settings.Settings) IndexSettings(org.opensearch.index.IndexSettings) DiscoveryNodes(org.opensearch.cluster.node.DiscoveryNodes) Directory(org.apache.lucene.store.Directory) FSDirectory(org.apache.lucene.store.FSDirectory) Path(java.nio.file.Path) ClusterState(org.opensearch.cluster.ClusterState) ClusterAllocationExplanation(org.opensearch.action.admin.cluster.allocation.ClusterAllocationExplanation) SearchRequestBuilder(org.opensearch.action.search.SearchRequestBuilder) IndicesService(org.opensearch.indices.IndicesService) IOException(java.io.IOException) TranslogCorruptedException(org.opensearch.index.translog.TranslogCorruptedException) LockObtainFailedException(org.apache.lucene.store.LockObtainFailedException) IOException(java.io.IOException) Lock(org.apache.lucene.store.Lock) IndexRequestBuilder(org.opensearch.action.index.IndexRequestBuilder) TranslogCorruptedException(org.opensearch.index.translog.TranslogCorruptedException) NodeEnvironment(org.opensearch.env.NodeEnvironment) 
TestEnvironment(org.opensearch.env.TestEnvironment) Environment(org.opensearch.env.Environment) OptionSet(joptsimple.OptionSet)

Example 3 with ClusterAllocationExplanation

use of org.opensearch.action.admin.cluster.allocation.ClusterAllocationExplanation in project OpenSearch by opensearch-project.

In the class RemoveCorruptedShardDataCommandIT, method testCorruptIndex:

/**
 * Integration test for {@code RemoveCorruptedShardDataCommand} run against a corrupted Lucene index.
 * <p>
 * Outline of what the test does:
 * <ol>
 *   <li>starts a single node and creates a one-shard, zero-replica index with merges disabled and
 *       {@code checksum} check-on-startup;</li>
 *   <li>indexes documents in several flushed batches;</li>
 *   <li>verifies the command fails while the node is running (node directory locked) and fails
 *       while the node is stopped but the shard is not yet corrupted;</li>
 *   <li>corrupts the index directory, restarts the node and asserts the primary has no valid shard copy;</li>
 *   <li>runs the command while the node is stopped, checks its output, allocates the stale primary
 *       and verifies the hit count equals the indexed documents minus the number the command
 *       reported as lost.</li>
 * </ol>
 *
 * @throws Exception if any step of the test fails
 */
public void testCorruptIndex() throws Exception {
    final String node = internalCluster().startNode();
    final String indexName = "index42";
    assertAcked(prepareCreate(indexName).setSettings(Settings.builder().put(IndexMetadata.SETTING_NUMBER_OF_SHARDS, 1).put(IndexMetadata.SETTING_NUMBER_OF_REPLICAS, 0).put(MergePolicyConfig.INDEX_MERGE_ENABLED, false).put(IndexSettings.INDEX_REFRESH_INTERVAL_SETTING.getKey(), "-1").put(MockEngineSupport.DISABLE_FLUSH_ON_CLOSE.getKey(), true).put(IndexSettings.INDEX_CHECK_ON_STARTUP.getKey(), "checksum")));
    // index some docs in several segments
    int numDocs = 0;
    for (int k = 0, attempts = randomIntBetween(5, 10); k < attempts; k++) {
        final int numExtraDocs = between(10, 100);
        IndexRequestBuilder[] builders = new IndexRequestBuilder[numExtraDocs];
        for (int i = 0; i < builders.length; i++) {
            builders[i] = client().prepareIndex(indexName).setSource("foo", "bar");
        }
        numDocs += numExtraDocs;
        indexRandom(false, false, false, Arrays.asList(builders));
        // Flush after every batch.
        flush(indexName);
    }
    logger.info("--> indexed {} docs", numDocs);
    // Command, terminal, environment and options are shared by all command invocations below.
    final RemoveCorruptedShardDataCommand command = new RemoveCorruptedShardDataCommand();
    final MockTerminal terminal = new MockTerminal();
    final OptionParser parser = command.getParser();
    final Settings nodePathSettings = internalCluster().dataPathSettings(node);
    final Environment environment = TestEnvironment.newEnvironment(Settings.builder().put(internalCluster().getDefaultSettings()).put(nodePathSettings).build());
    final OptionSet options = parser.parse("-index", indexName, "-shard-id", "0");
    // Try running it before the node is stopped (and shard is closed)
    try {
        command.execute(terminal, options, environment);
        fail("expected the command to fail as node is locked");
    } catch (Exception e) {
        assertThat(e.getMessage(), allOf(containsString("failed to lock node's directory"), containsString("is OpenSearch still running?")));
    }
    final Path indexDir = getPathToShardData(indexName, ShardPath.INDEX_FOLDER_NAME);
    internalCluster().restartNode(node, new InternalTestCluster.RestartCallback() {

        @Override
        public Settings onNodeStopped(String nodeName) throws Exception {
            // Try running it before the shard is corrupted, it should flip out because there is no corruption file marker
            try {
                command.execute(terminal, options, environment);
                fail("expected the command to fail as there is no corruption file marker");
            } catch (Exception e) {
                assertThat(e.getMessage(), startsWith("Shard does not seem to be corrupted at"));
            }
            // Now corrupt the index directory while the node is still stopped.
            CorruptionUtils.corruptIndex(random(), indexDir, false);
            return super.onNodeStopped(nodeName);
        }
    });
    // shard should be failed due to a corrupted index
    assertBusy(() -> {
        final ClusterAllocationExplanation explanation = client().admin().cluster().prepareAllocationExplain().setIndex(indexName).setShard(0).setPrimary(true).get().getExplanation();
        final ShardAllocationDecision shardAllocationDecision = explanation.getShardAllocationDecision();
        assertThat(shardAllocationDecision.isDecisionTaken(), equalTo(true));
        assertThat(shardAllocationDecision.getAllocateDecision().getAllocationDecision(), equalTo(AllocationDecision.NO_VALID_SHARD_COPY));
    });
    // Second restart: run the command while the node is stopped, answering the prompt with "y".
    internalCluster().restartNode(node, new InternalTestCluster.RestartCallback() {

        @Override
        public Settings onNodeStopped(String nodeName) throws Exception {
            terminal.addTextInput("y");
            command.execute(terminal, options, environment);
            return super.onNodeStopped(nodeName);
        }
    });
    waitNoPendingTasksOnAll();
    // Find the id of the node by scanning the cluster state's nodes by name.
    String nodeId = null;
    final ClusterState state = client().admin().cluster().prepareState().get().getState();
    final DiscoveryNodes nodes = state.nodes();
    for (ObjectObjectCursor<String, DiscoveryNode> cursor : nodes.getNodes()) {
        final String name = cursor.value.getName();
        if (name.equals(node)) {
            nodeId = cursor.key;
            break;
        }
    }
    assertThat(nodeId, notNullValue());
    logger.info("--> output:\n{}", terminal.getOutput());
    // The command output must contain the allocate_stale_primary hint and reference the node's id.
    assertThat(terminal.getOutput(), containsString("allocate_stale_primary"));
    assertThat(terminal.getOutput(), containsString("\"node\" : \"" + nodeId + "\""));
    // there is only _stale_ primary (due to new allocation id)
    assertBusy(() -> {
        final ClusterAllocationExplanation explanation = client().admin().cluster().prepareAllocationExplain().setIndex(indexName).setShard(0).setPrimary(true).get().getExplanation();
        final ShardAllocationDecision shardAllocationDecision = explanation.getShardAllocationDecision();
        assertThat(shardAllocationDecision.isDecisionTaken(), equalTo(true));
        assertThat(shardAllocationDecision.getAllocateDecision().getAllocationDecision(), equalTo(AllocationDecision.NO_VALID_SHARD_COPY));
    });
    // Explicitly allocate the stale primary on the node.
    // NOTE(review): the trailing 'true' is presumably the accept-data-loss flag - confirm.
    client().admin().cluster().prepareReroute().add(new AllocateStalePrimaryAllocationCommand(indexName, 0, nodeId, true)).get();
    assertBusy(() -> {
        final ClusterAllocationExplanation explanation = client().admin().cluster().prepareAllocationExplain().setIndex(indexName).setShard(0).setPrimary(true).get().getExplanation();
        assertThat(explanation.getCurrentNode(), notNullValue());
        assertThat(explanation.getShardState(), equalTo(ShardRoutingState.STARTED));
    });
    // Extract the number of lost documents from the command output; the expected hit count is
    // the number of indexed documents minus that value.
    final Pattern pattern = Pattern.compile("Corrupted Lucene index segments found -\\s+(?<docs>\\d+) documents will be lost.");
    final Matcher matcher = pattern.matcher(terminal.getOutput());
    assertThat(matcher.find(), equalTo(true));
    final int expectedNumDocs = numDocs - Integer.parseInt(matcher.group("docs"));
    ensureGreen(indexName);
    assertHitCount(client().prepareSearch(indexName).setQuery(matchAllQuery()).get(), expectedNumDocs);
}
Also used : Path(java.nio.file.Path) ClusterAllocationExplanation(org.opensearch.action.admin.cluster.allocation.ClusterAllocationExplanation) ClusterState(org.opensearch.cluster.ClusterState) Pattern(java.util.regex.Pattern) DiscoveryNode(org.opensearch.cluster.node.DiscoveryNode) Matcher(java.util.regex.Matcher) AllocateStalePrimaryAllocationCommand(org.opensearch.cluster.routing.allocation.command.AllocateStalePrimaryAllocationCommand) InternalTestCluster(org.opensearch.test.InternalTestCluster) Matchers.containsString(org.hamcrest.Matchers.containsString) MockTerminal(org.opensearch.cli.MockTerminal) OptionParser(joptsimple.OptionParser) TranslogCorruptedException(org.opensearch.index.translog.TranslogCorruptedException) LockObtainFailedException(org.apache.lucene.store.LockObtainFailedException) IOException(java.io.IOException) IndexRequestBuilder(org.opensearch.action.index.IndexRequestBuilder) NodeEnvironment(org.opensearch.env.NodeEnvironment) TestEnvironment(org.opensearch.env.TestEnvironment) Environment(org.opensearch.env.Environment) OptionSet(joptsimple.OptionSet) ShardAllocationDecision(org.opensearch.cluster.routing.allocation.ShardAllocationDecision) Settings(org.opensearch.common.settings.Settings) IndexSettings(org.opensearch.index.IndexSettings) DiscoveryNodes(org.opensearch.cluster.node.DiscoveryNodes)

Aggregations

ClusterAllocationExplanation (org.opensearch.action.admin.cluster.allocation.ClusterAllocationExplanation)3 ShardAllocationDecision (org.opensearch.cluster.routing.allocation.ShardAllocationDecision)3 IOException (java.io.IOException)2 Path (java.nio.file.Path)2 OptionParser (joptsimple.OptionParser)2 OptionSet (joptsimple.OptionSet)2 LockObtainFailedException (org.apache.lucene.store.LockObtainFailedException)2 Matchers.containsString (org.hamcrest.Matchers.containsString)2 IndexRequestBuilder (org.opensearch.action.index.IndexRequestBuilder)2 MockTerminal (org.opensearch.cli.MockTerminal)2 ClusterState (org.opensearch.cluster.ClusterState)2 DiscoveryNode (org.opensearch.cluster.node.DiscoveryNode)2 DiscoveryNodes (org.opensearch.cluster.node.DiscoveryNodes)2 AllocateStalePrimaryAllocationCommand (org.opensearch.cluster.routing.allocation.command.AllocateStalePrimaryAllocationCommand)2 Settings (org.opensearch.common.settings.Settings)2 Environment (org.opensearch.env.Environment)2 NodeEnvironment (org.opensearch.env.NodeEnvironment)2 TestEnvironment (org.opensearch.env.TestEnvironment)2 IndexSettings (org.opensearch.index.IndexSettings)2 TranslogCorruptedException (org.opensearch.index.translog.TranslogCorruptedException)2