Java tutorial
/* * Licensed to Elasticsearch under one or more contributor * license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright * ownership. Elasticsearch licenses this file to you under * the Apache License, Version 2.0 (the "License"); you may * not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * KIND, either express or implied. See the License for the * specific language governing permissions and limitations * under the License. */ package org.elasticsearch.smoketest; import org.apache.http.HttpHost; import org.apache.lucene.util.BytesRef; import com.carrotsearch.randomizedtesting.annotations.Name; import com.carrotsearch.randomizedtesting.annotations.ParametersFactory; import org.elasticsearch.Version; import org.elasticsearch.client.RestClient; import org.elasticsearch.common.ParseField; import org.elasticsearch.common.xcontent.ConstructingObjectParser; import org.elasticsearch.common.xcontent.NamedXContentRegistry; import org.elasticsearch.common.xcontent.XContentLocation; import org.elasticsearch.common.xcontent.XContentParser; import org.elasticsearch.common.xcontent.XContentParser.Token; import org.elasticsearch.test.rest.yaml.ClientYamlDocsTestClient; import org.elasticsearch.test.rest.yaml.ClientYamlTestCandidate; import org.elasticsearch.test.rest.yaml.ClientYamlTestClient; import org.elasticsearch.test.rest.yaml.ClientYamlTestExecutionContext; import org.elasticsearch.test.rest.yaml.ClientYamlTestResponse; import org.elasticsearch.test.rest.yaml.ESClientYamlSuiteTestCase; import org.elasticsearch.test.rest.yaml.restspec.ClientYamlSuiteRestSpec; import org.elasticsearch.test.rest.yaml.section.ExecutableSection; import java.io.IOException; import java.util.ArrayList; import java.util.HashMap; import java.util.Iterator; import java.util.List; import java.util.Map; import static org.elasticsearch.common.xcontent.ConstructingObjectParser.constructorArg; import static java.util.Collections.emptyMap; import static java.util.Collections.singletonList; import static java.util.Collections.singletonMap; public class DocsClientYamlTestSuiteIT extends ESClientYamlSuiteTestCase { public DocsClientYamlTestSuiteIT(@Name("yaml") ClientYamlTestCandidate testCandidate) { super(testCandidate); } @ParametersFactory public static Iterable<Object[]> parameters() throws Exception { List<NamedXContentRegistry.Entry> entries = new ArrayList<>( ExecutableSection.DEFAULT_EXECUTABLE_CONTEXTS.size() + 1); entries.addAll(ExecutableSection.DEFAULT_EXECUTABLE_CONTEXTS); entries.add(new NamedXContentRegistry.Entry(ExecutableSection.class, new ParseField("compare_analyzers"), CompareAnalyzers::parse)); NamedXContentRegistry executeableSectionRegistry = new NamedXContentRegistry(entries); return ESClientYamlSuiteTestCase.createParameters(executeableSectionRegistry); } @Override protected void afterIfFailed(List<Throwable> errors) { super.afterIfFailed(errors); String name = getTestName().split("=")[1]; name = name.substring(0, name.length() - 1); name = name.replaceAll("/([^/]+)$", ".asciidoc:$1"); logger.error( "This failing test was generated by documentation starting at {}. It may include many snippets. " + "See docs/README.asciidoc for an explanation of test generation.", name); } @Override protected boolean randomizeContentType() { return false; } @Override protected ClientYamlTestClient initClientYamlTestClient(final ClientYamlSuiteRestSpec restSpec, final RestClient restClient, final List<HttpHost> hosts, final Version esVersion, final Version masterVersion) throws IOException { return new ClientYamlDocsTestClient(restSpec, restClient, hosts, esVersion, masterVersion); } /** * Compares the the results of running two analyzers against many random * strings. The goal is to figure out if two anlayzers are "the same" by * comparing their results. This is far from perfect but should be fairly * accurate, especially for gross things like missing {@code decimal_digit} * token filters, and should be fairly fast because it compares a fairly * small number of tokens. */ private static class CompareAnalyzers implements ExecutableSection { private static ConstructingObjectParser<CompareAnalyzers, XContentLocation> PARSER = new ConstructingObjectParser<>( "test_analyzer", false, (a, location) -> { String index = (String) a[0]; String first = (String) a[1]; String second = (String) a[2]; return new CompareAnalyzers(location, index, first, second); }); static { PARSER.declareString(constructorArg(), new ParseField("index")); PARSER.declareString(constructorArg(), new ParseField("first")); PARSER.declareString(constructorArg(), new ParseField("second")); } private static CompareAnalyzers parse(XContentParser parser) throws IOException { XContentLocation location = parser.getTokenLocation(); CompareAnalyzers section = PARSER.parse(parser, location); assert parser.currentToken() == Token.END_OBJECT : "End of object required"; parser.nextToken(); // throw out the END_OBJECT to conform with other ExecutableSections return section; } private final XContentLocation location; private final String index; private final String first; private final String second; private CompareAnalyzers(XContentLocation location, String index, String first, String second) { this.location = location; this.index = index; this.first = first; this.second = second; } @Override public XContentLocation getLocation() { return location; } @Override public void execute(ClientYamlTestExecutionContext executionContext) throws IOException { int size = 100; int maxLength = 15; List<String> testText = new ArrayList<>(size); for (int i = 0; i < size; i++) { /** * Build a string with a few unicode sequences separated by * spaces. The unicode sequences aren't going to be of the same * code page which is a shame because it makes the entire * string less realistic. But this still provides a fairly * nice string to compare. */ int spaces = between(0, 5); StringBuilder b = new StringBuilder((spaces + 1) * maxLength); b.append(randomRealisticUnicodeOfCodepointLengthBetween(1, maxLength)); for (int t = 0; t < spaces; t++) { b.append(' '); b.append(randomRealisticUnicodeOfCodepointLengthBetween(1, maxLength)); } testText.add(b.toString() // Don't look up stashed values .replace("$", "\\$")); } Map<String, Object> body = new HashMap<>(2); body.put("analyzer", first); body.put("text", testText); ClientYamlTestResponse response = executionContext.callApi("indices.analyze", singletonMap("index", index), singletonList(body), emptyMap()); Iterator<?> firstTokens = ((List<?>) response.evaluate("tokens")).iterator(); body.put("analyzer", second); response = executionContext.callApi("indices.analyze", singletonMap("index", index), singletonList(body), emptyMap()); Iterator<?> secondTokens = ((List<?>) response.evaluate("tokens")).iterator(); Object previousFirst = null; Object previousSecond = null; while (firstTokens.hasNext()) { if (false == secondTokens.hasNext()) { fail(second + " has fewer tokens than " + first + ". " + first + " has [" + firstTokens.next() + "] but " + second + " is out of tokens. " + first + "'s last token was [" + previousFirst + "] and " + second + "'s last token was' [" + previousSecond + "]"); } Map<?, ?> firstToken = (Map<?, ?>) firstTokens.next(); Map<?, ?> secondToken = (Map<?, ?>) secondTokens.next(); String firstText = (String) firstToken.get("token"); String secondText = (String) secondToken.get("token"); // Check the text and produce an error message with the utf8 sequence if they don't match. if (false == secondText.equals(firstText)) { fail("text differs: " + first + " was [" + firstText + "] but " + second + " was [" + secondText + "]. In utf8 those are\n" + new BytesRef(firstText) + " and\n" + new BytesRef(secondText)); } // Now check the whole map just in case the text matches but something else differs assertEquals(firstToken, secondToken); previousFirst = firstToken; previousSecond = secondToken; } if (secondTokens.hasNext()) { fail(second + " has more tokens than " + first + ". " + second + " has [" + secondTokens.next() + "] but " + first + " is out of tokens. " + first + "'s last token was [" + previousFirst + "] and " + second + "'s last token was' [" + previousSecond + "]"); } } } }