|  | @@ -0,0 +1,198 @@
 | 
	
		
			
				|  |  | +/*
 | 
	
		
			
				|  |  | + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
 | 
	
		
			
				|  |  | + * or more contributor license agreements. Licensed under the Elastic License
 | 
	
		
			
				|  |  | + * 2.0 and the Server Side Public License, v 1; you may not use this file except
 | 
	
		
			
				|  |  | + * in compliance with, at your election, the Elastic License 2.0 or the Server
 | 
	
		
			
				|  |  | + * Side Public License, v 1.
 | 
	
		
			
				|  |  | + */
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +package org.elasticsearch.index.store;
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +import org.apache.lucene.codecs.CodecUtil;
 | 
	
		
			
				|  |  | +import org.apache.lucene.index.CorruptIndexException;
 | 
	
		
			
				|  |  | +import org.apache.lucene.store.Directory;
 | 
	
		
			
				|  |  | +import org.apache.lucene.store.IOContext;
 | 
	
		
			
				|  |  | +import org.apache.lucene.util.Version;
 | 
	
		
			
				|  |  | +import org.elasticsearch.common.Numbers;
 | 
	
		
			
				|  |  | +import org.elasticsearch.index.IndexVersion;
 | 
	
		
			
				|  |  | +import org.elasticsearch.test.ESTestCase;
 | 
	
		
			
				|  |  | +import org.hamcrest.Matcher;
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +import java.io.IOException;
 | 
	
		
			
				|  |  | +import java.nio.ByteBuffer;
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +import static org.hamcrest.Matchers.allOf;
 | 
	
		
			
				|  |  | +import static org.hamcrest.Matchers.containsString;
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +public class VerifyingIndexOutputTests extends ESTestCase {
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +    private static final int CHECKSUM_LENGTH = 8;
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +    private static final Version MIN_SUPPORTED_LUCENE_VERSION = IndexVersion.MINIMUM_COMPATIBLE.luceneVersion();
 | 
	
		
			
				|  |  | +    private static final Matcher<String> VERIFICATION_FAILURE = containsString("verification failed (hardware problem?)");
 | 
	
		
			
				|  |  | +    private static final Matcher<String> FOOTER_NOT_CHECKED = allOf(VERIFICATION_FAILURE, containsString("footer=<not checked>"));
 | 
	
		
			
				|  |  | +    private static final Matcher<String> INVALID_LENGTH = allOf(VERIFICATION_FAILURE, containsString("footer=<invalid length>"));
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +    public void testVerifyingIndexOutput() throws IOException {
 | 
	
		
			
				|  |  | +        try (var directory = newDirectory()) {
 | 
	
		
			
				|  |  | +            final StoreFileMetadata metadata = createFileWithChecksum(directory);
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +            try (var verifyingOutput = new VerifyingIndexOutput(metadata, directory.createOutput("rewritten.dat", IOContext.DEFAULT))) {
 | 
	
		
			
				|  |  | +                try (var indexInput = directory.openInput(metadata.name(), IOContext.DEFAULT)) {
 | 
	
		
			
				|  |  | +                    final byte[] buffer = new byte[1024];
 | 
	
		
			
				|  |  | +                    int length = Math.toIntExact(metadata.length());
 | 
	
		
			
				|  |  | +                    while (length > 0) {
 | 
	
		
			
				|  |  | +                        if (random().nextInt(10) == 0) {
 | 
	
		
			
				|  |  | +                            verifyingOutput.writeByte(indexInput.readByte());
 | 
	
		
			
				|  |  | +                            length--;
 | 
	
		
			
				|  |  | +                        } else {
 | 
	
		
			
				|  |  | +                            int offset = between(0, buffer.length - 1);
 | 
	
		
			
				|  |  | +                            int len = between(1, Math.min(length, buffer.length - offset));
 | 
	
		
			
				|  |  | +                            indexInput.readBytes(buffer, offset, len);
 | 
	
		
			
				|  |  | +                            verifyingOutput.writeBytes(buffer, offset, len);
 | 
	
		
			
				|  |  | +                            length -= len;
 | 
	
		
			
				|  |  | +                        }
 | 
	
		
			
				|  |  | +                    }
 | 
	
		
			
				|  |  | +                }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                for (int i = 0; i < 2; i++) {
 | 
	
		
			
				|  |  | +                    // check twice to make sure the first call doesn't leave things in a broken state
 | 
	
		
			
				|  |  | +                    verifyingOutput.verify(); // should not throw
 | 
	
		
			
				|  |  | +                }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                ensureCorruptAfterRandomWrite(verifyingOutput);
 | 
	
		
			
				|  |  | +            }
 | 
	
		
			
				|  |  | +        }
 | 
	
		
			
				|  |  | +    }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +    public void testVerifyingIndexOutputOnTooShortFile() throws IOException {
 | 
	
		
			
				|  |  | +        final var metadata = new StoreFileMetadata(
 | 
	
		
			
				|  |  | +            "foo.bar",
 | 
	
		
			
				|  |  | +            between(0, CHECKSUM_LENGTH - 1),
 | 
	
		
			
				|  |  | +            randomAlphaOfLength(5),
 | 
	
		
			
				|  |  | +            MIN_SUPPORTED_LUCENE_VERSION.toString()
 | 
	
		
			
				|  |  | +        );
 | 
	
		
			
				|  |  | +        try (
 | 
	
		
			
				|  |  | +            var dir = newDirectory();
 | 
	
		
			
				|  |  | +            var verifyingOutput = new VerifyingIndexOutput(metadata, dir.createOutput("rewritten.dat", IOContext.DEFAULT))
 | 
	
		
			
				|  |  | +        ) {
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +            int length = Math.toIntExact(metadata.length());
 | 
	
		
			
				|  |  | +            final ByteBuffer buffer = ByteBuffer.wrap(randomByteArrayOfLength(length));
 | 
	
		
			
				|  |  | +            while (buffer.remaining() > 0) {
 | 
	
		
			
				|  |  | +                // verify should fail on truncated file
 | 
	
		
			
				|  |  | +                assertThat(expectThrows(CorruptIndexException.class, verifyingOutput::verify).getMessage(), INVALID_LENGTH);
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                if (randomBoolean()) {
 | 
	
		
			
				|  |  | +                    verifyingOutput.writeByte(buffer.get());
 | 
	
		
			
				|  |  | +                } else {
 | 
	
		
			
				|  |  | +                    var lenToWrite = between(1, buffer.remaining());
 | 
	
		
			
				|  |  | +                    verifyingOutput.writeBytes(buffer.array(), buffer.arrayOffset() + buffer.position(), lenToWrite);
 | 
	
		
			
				|  |  | +                    buffer.position(buffer.position() + lenToWrite);
 | 
	
		
			
				|  |  | +                }
 | 
	
		
			
				|  |  | +            }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +            for (int i = 0; i < 2; i++) {
 | 
	
		
			
				|  |  | +                // check twice to make sure the first call doesn't leave things in a broken state
 | 
	
		
			
				|  |  | +                assertThat(
 | 
	
		
			
				|  |  | +                    expectThrows(CorruptIndexException.class, verifyingOutput::verify).getMessage(),
 | 
	
		
			
				|  |  | +                    allOf(VERIFICATION_FAILURE, containsString("actual=<too short>"))
 | 
	
		
			
				|  |  | +                );
 | 
	
		
			
				|  |  | +            }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +            ensureCorruptAfterRandomWrite(verifyingOutput);
 | 
	
		
			
				|  |  | +        }
 | 
	
		
			
				|  |  | +    }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +    public void testVerifyingIndexOutputOnCorruptFile() throws IOException {
 | 
	
		
			
				|  |  | +        try (var dir = newDirectory()) {
 | 
	
		
			
				|  |  | +            final StoreFileMetadata metadata = createFileWithChecksum(dir);
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +            int length = Math.toIntExact(metadata.length());
 | 
	
		
			
				|  |  | +            final var byteToCorrupt = between(0, length - 1);
 | 
	
		
			
				|  |  | +            final var isExpectedMessage = byteToCorrupt < length - CHECKSUM_LENGTH ? FOOTER_NOT_CHECKED : VERIFICATION_FAILURE;
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +            try (var verifyingOutput = new VerifyingIndexOutput(metadata, dir.createOutput("rewritten.dat", IOContext.DEFAULT))) {
 | 
	
		
			
				|  |  | +                try (var indexInput = dir.openInput(metadata.name(), IOContext.DEFAULT)) {
 | 
	
		
			
				|  |  | +                    final byte[] buffer = new byte[1024];
 | 
	
		
			
				|  |  | +                    while (length > 0) {
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                        // verify should fail on truncated file
 | 
	
		
			
				|  |  | +                        assertThat(expectThrows(CorruptIndexException.class, verifyingOutput::verify).getMessage(), INVALID_LENGTH);
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                        int offset = between(0, buffer.length - 1);
 | 
	
		
			
				|  |  | +                        var singleByte = randomInt(10) == 0;
 | 
	
		
			
				|  |  | +                        var len = singleByte ? 1 : between(1, Math.min(length, buffer.length - offset));
 | 
	
		
			
				|  |  | +                        indexInput.readBytes(buffer, offset, len);
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                        if (verifyingOutput.getFilePointer() <= byteToCorrupt && byteToCorrupt < indexInput.getFilePointer()) {
 | 
	
		
			
				|  |  | +                            // CRC32 will always detect single-bit errors
 | 
	
		
			
				|  |  | +                            final byte oneBit = (byte) (1 << between(0, Byte.SIZE - 1));
 | 
	
		
			
				|  |  | +                            buffer[offset + byteToCorrupt - Math.toIntExact(verifyingOutput.getFilePointer())] ^= oneBit;
 | 
	
		
			
				|  |  | +                        }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                        if (singleByte) {
 | 
	
		
			
				|  |  | +                            verifyingOutput.writeByte(buffer[offset]);
 | 
	
		
			
				|  |  | +                        } else {
 | 
	
		
			
				|  |  | +                            verifyingOutput.writeBytes(buffer, offset, len);
 | 
	
		
			
				|  |  | +                        }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                        length -= len;
 | 
	
		
			
				|  |  | +                    }
 | 
	
		
			
				|  |  | +                }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                assertEquals(metadata.length(), verifyingOutput.getFilePointer());
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                for (int i = 0; i < 2; i++) {
 | 
	
		
			
				|  |  | +                    // check twice to make sure the first call doesn't leave things in a broken state
 | 
	
		
			
				|  |  | +                    assertThat(expectThrows(CorruptIndexException.class, verifyingOutput::verify).getMessage(), isExpectedMessage);
 | 
	
		
			
				|  |  | +                }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +                ensureCorruptAfterRandomWrite(verifyingOutput);
 | 
	
		
			
				|  |  | +            }
 | 
	
		
			
				|  |  | +        }
 | 
	
		
			
				|  |  | +    }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +    private static StoreFileMetadata createFileWithChecksum(Directory directory) throws IOException {
 | 
	
		
			
				|  |  | +        final var filename = randomAlphaOfLength(10);
 | 
	
		
			
				|  |  | +        final var bytes = randomByteArrayOfLength(scaledRandomIntBetween(0, 2048));
 | 
	
		
			
				|  |  | +        try (var output = directory.createOutput(filename, IOContext.DEFAULT)) {
 | 
	
		
			
				|  |  | +            output.writeBytes(bytes, bytes.length);
 | 
	
		
			
				|  |  | +            if (rarely()) {
 | 
	
		
			
				|  |  | +                // in practice there's always a complete 16-byte footer, but this ensures that we only care about the checksum
 | 
	
		
			
				|  |  | +                final var checksum = output.getChecksum();
 | 
	
		
			
				|  |  | +                final var metadata = new StoreFileMetadata(
 | 
	
		
			
				|  |  | +                    filename,
 | 
	
		
			
				|  |  | +                    bytes.length + Long.BYTES,
 | 
	
		
			
				|  |  | +                    Store.digestToString(checksum),
 | 
	
		
			
				|  |  | +                    MIN_SUPPORTED_LUCENE_VERSION.toString()
 | 
	
		
			
				|  |  | +                );
 | 
	
		
			
				|  |  | +                output.writeBytes(Numbers.longToBytes(checksum), Long.BYTES);
 | 
	
		
			
				|  |  | +                return metadata;
 | 
	
		
			
				|  |  | +            } else {
 | 
	
		
			
				|  |  | +                CodecUtil.writeFooter(output);
 | 
	
		
			
				|  |  | +                // fall through and obtain the checksum using an IndexInput
 | 
	
		
			
				|  |  | +            }
 | 
	
		
			
				|  |  | +        }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +        try (var indexInput = directory.openInput(filename, IOContext.DEFAULT)) {
 | 
	
		
			
				|  |  | +            assertEquals(bytes.length + CodecUtil.footerLength(), indexInput.length());
 | 
	
		
			
				|  |  | +            return new StoreFileMetadata(
 | 
	
		
			
				|  |  | +                filename,
 | 
	
		
			
				|  |  | +                indexInput.length(),
 | 
	
		
			
				|  |  | +                Store.digestToString(CodecUtil.retrieveChecksum(indexInput)),
 | 
	
		
			
				|  |  | +                MIN_SUPPORTED_LUCENE_VERSION.toString()
 | 
	
		
			
				|  |  | +            );
 | 
	
		
			
				|  |  | +        }
 | 
	
		
			
				|  |  | +    }
 | 
	
		
			
				|  |  | +
 | 
	
		
			
				|  |  | +    private static void ensureCorruptAfterRandomWrite(VerifyingIndexOutput verifyingOutput) throws IOException {
 | 
	
		
			
				|  |  | +        if (randomBoolean()) {
 | 
	
		
			
				|  |  | +            verifyingOutput.writeByte(randomByte());
 | 
	
		
			
				|  |  | +        } else {
 | 
	
		
			
				|  |  | +            final var len = between(1, 10);
 | 
	
		
			
				|  |  | +            verifyingOutput.writeBytes(randomByteArrayOfLength(len), 0, len);
 | 
	
		
			
				|  |  | +        }
 | 
	
		
			
				|  |  | +        assertThat(expectThrows(CorruptIndexException.class, verifyingOutput::verify).getMessage(), INVALID_LENGTH);
 | 
	
		
			
				|  |  | +    }
 | 
	
		
			
				|  |  | +}
 |