com.facebook.presto.verifier.Validator.java Source code

Java tutorial

Introduction

Here is the source code for com.facebook.presto.verifier.Validator.java

Source

/*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.facebook.presto.verifier;

import com.facebook.presto.jdbc.PrestoConnection;
import com.facebook.presto.spi.type.SqlVarbinary;
import com.facebook.presto.verifier.Validator.ChangedRow.Changed;
import com.google.common.base.Joiner;
import com.google.common.base.Stopwatch;
import com.google.common.base.Throwables;
import com.google.common.collect.ComparisonChain;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableSortedMultiset;
import com.google.common.collect.Iterables;
import com.google.common.collect.Multiset;
import com.google.common.collect.Multisets;
import com.google.common.collect.Ordering;
import com.google.common.collect.SortedMultiset;
import com.google.common.util.concurrent.SimpleTimeLimiter;
import com.google.common.util.concurrent.TimeLimiter;
import com.google.common.util.concurrent.UncheckedTimeoutException;
import io.airlift.units.Duration;

import java.math.BigDecimal;
import java.math.MathContext;
import java.sql.Array;
import java.sql.Connection;
import java.sql.DriverManager;
import java.sql.ResultSet;
import java.sql.SQLClientInfoException;
import java.sql.SQLException;
import java.sql.Statement;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Comparator;
import java.util.List;
import java.util.Map;
import java.util.concurrent.Callable;
import java.util.concurrent.TimeUnit;
import java.util.function.Function;
import java.util.regex.Pattern;

import static com.facebook.presto.verifier.QueryResult.State;
import static com.google.common.base.Preconditions.checkArgument;
import static com.google.common.base.Strings.nullToEmpty;
import static com.google.common.primitives.Doubles.isFinite;
import static io.airlift.units.Duration.nanosSince;
import static java.lang.String.format;
import static java.util.Collections.unmodifiableList;
import static java.util.Objects.requireNonNull;

public class Validator {
    private final String testUsername;
    private final String controlUsername;
    private final String testPassword;
    private final String controlPassword;
    private final String controlGateway;
    private final String testGateway;
    private final Duration controlTimeout;
    private final Duration testTimeout;
    private final int maxRowCount;
    private final boolean checkCorrectness;
    private final boolean verboseResultsComparison;
    private final QueryPair queryPair;
    private final boolean explainOnly;
    private final Map<String, String> sessionProperties;
    private final int precision;

    private Boolean valid;

    private QueryResult controlResult;
    private QueryResult testResult;

    private boolean deterministic = true;

    public Validator(VerifierConfig config, QueryPair queryPair) {
        requireNonNull(config, "config is null");
        this.testUsername = requireNonNull(queryPair.getTest().getUsername(), "test username is null");
        this.controlUsername = requireNonNull(queryPair.getControl().getUsername(), "control username is null");
        this.testPassword = queryPair.getTest().getPassword();
        this.controlPassword = queryPair.getControl().getPassword();
        this.controlGateway = requireNonNull(config.getControlGateway(), "controlGateway is null");
        this.testGateway = requireNonNull(config.getTestGateway(), "testGateway is null");
        this.controlTimeout = config.getControlTimeout();
        this.testTimeout = config.getTestTimeout();
        this.maxRowCount = config.getMaxRowCount();
        this.explainOnly = config.isExplainOnly();
        this.precision = config.getDoublePrecision();
        // Check if either the control query or the test query matches the regex
        if (Pattern.matches(config.getSkipCorrectnessRegex(), queryPair.getTest().getQuery())
                || Pattern.matches(config.getSkipCorrectnessRegex(), queryPair.getControl().getQuery())) {
            // If so disable correctness checking
            this.checkCorrectness = false;
        } else {
            this.checkCorrectness = config.isCheckCorrectnessEnabled();
        }
        this.verboseResultsComparison = config.isVerboseResultsComparison();

        this.queryPair = requireNonNull(queryPair, "queryPair is null");
        // Test and Control always have the same session properties.
        this.sessionProperties = queryPair.getTest().getSessionProperties();
    }

    public boolean isSkipped() {
        if (queryPair.getControl().getQuery().isEmpty() || queryPair.getTest().getQuery().isEmpty()) {
            return true;
        }

        if (getControlResult().getState() != State.SUCCESS) {
            return true;
        }

        if (!isDeterministic()) {
            return true;
        }

        if (getTestResult().getState() == State.TIMEOUT) {
            return true;
        }

        return false;
    }

    public String getSkippedMessage() {
        StringBuilder sb = new StringBuilder();
        if (getControlResult().getState() == State.TOO_MANY_ROWS) {
            sb.append("----------\n");
            sb.append("Name: " + queryPair.getName() + "\n");
            sb.append("Schema (control): " + queryPair.getControl().getSchema() + "\n");
            sb.append("Too many rows.\n");
        } else if (!isDeterministic()) {
            sb.append("----------\n");
            sb.append("Name: " + queryPair.getName() + "\n");
            sb.append("Schema (control): " + queryPair.getControl().getSchema() + "\n");
            sb.append("NON DETERMINISTIC\n");
        } else if (getControlResult().getState() == State.TIMEOUT || getTestResult().getState() == State.TIMEOUT) {
            sb.append("----------\n");
            sb.append("Name: " + queryPair.getName() + "\n");
            sb.append("Schema (control): " + queryPair.getControl().getSchema() + "\n");
            sb.append("TIMEOUT\n");
        } else {
            sb.append("SKIPPED: ");
            if (getControlResult().getException() != null) {
                sb.append(getControlResult().getException().getMessage());
            }
        }
        return sb.toString();
    }

    public boolean valid() {
        if (valid == null) {
            valid = validate();
        }
        return valid;
    }

    public boolean isDeterministic() {
        if (valid == null) {
            valid = validate();
        }
        return deterministic;
    }

    private boolean validate() {
        controlResult = executeQueryControl();

        // query has too many rows. Consider blacklisting.
        if (controlResult.getState() == State.TOO_MANY_ROWS) {
            testResult = new QueryResult(State.INVALID, null, null, ImmutableList.<List<Object>>of());
            return false;
        }
        // query failed in the control
        if (controlResult.getState() != State.SUCCESS) {
            testResult = new QueryResult(State.INVALID, null, null, ImmutableList.<List<Object>>of());
            return true;
        }

        testResult = executeQueryTest();

        if (controlResult.getState() != State.SUCCESS || testResult.getState() != State.SUCCESS) {
            return false;
        }

        if (!checkCorrectness) {
            return true;
        }

        return resultsMatch(controlResult, testResult, precision)
                || checkForDeterministicAndRerunTestQueriesIfNeeded();
    }

    private QueryResult tearDown(Query query, Function<String, QueryResult> executor) {
        for (String postqueryString : query.getPostQueries()) {
            QueryResult queryResult = executor.apply(postqueryString);
            if (queryResult.getState() != State.SUCCESS) {
                return new QueryResult(State.FAILED_TO_TEARDOWN, queryResult.getException(),
                        queryResult.getDuration(), ImmutableList.<List<Object>>of());
            }
        }

        return new QueryResult(State.SUCCESS, null, null, ImmutableList.of());
    }

    private QueryResult setup(Query query, Function<String, QueryResult> executor) {
        for (String prequeryString : query.getPreQueries()) {
            QueryResult queryResult = executor.apply(prequeryString);
            if (queryResult.getState() != State.SUCCESS) {
                return new QueryResult(State.FAILED_TO_SETUP, queryResult.getException(), queryResult.getDuration(),
                        ImmutableList.<List<Object>>of());
            }
        }

        return new QueryResult(State.SUCCESS, null, null, ImmutableList.of());
    }

    private boolean checkForDeterministicAndRerunTestQueriesIfNeeded() {
        // check if the control query is deterministic
        for (int i = 0; i < 3; i++) {
            QueryResult results = executeQueryControl();
            if (results.getState() != State.SUCCESS) {
                return false;
            }

            if (!resultsMatch(controlResult, results, precision)) {
                deterministic = false;
                return false;
            }
        }

        // Re-run the test query to confirm that the results don't match, in case there was caching on the test tier,
        // but require that it matches 3 times in a row to rule out a non-deterministic correctness bug.
        for (int i = 0; i < 3; i++) {
            testResult = executeQueryTest();
            if (testResult.getState() != State.SUCCESS) {
                return false;
            }
            if (!resultsMatch(controlResult, testResult, precision)) {
                return false;
            }
        }

        // test result agrees with control result 3 times in a row although the first test result didn't agree
        return true;
    }

    private QueryResult executeQueryTest() {
        Query query = queryPair.getTest();
        QueryResult queryResult = new QueryResult(State.INVALID, null, null, ImmutableList.<List<Object>>of());
        try {
            // startup
            queryResult = setup(query, testPrequery -> executeQuery(testGateway, testUsername, testPassword,
                    queryPair.getTest(), testPrequery, testTimeout, sessionProperties));

            // if startup is successful -> execute query
            if (queryResult.getState() == State.SUCCESS) {
                queryResult = executeQuery(testGateway, testUsername, testPassword, queryPair.getTest(),
                        query.getQuery(), testTimeout, sessionProperties);
            }
        } finally {
            // teardown no matter what
            QueryResult tearDownResult = tearDown(query, testPostquery -> executeQuery(testGateway, testUsername,
                    testPassword, queryPair.getTest(), testPostquery, testTimeout, sessionProperties));

            // if teardown is not successful the query fails
            queryResult = tearDownResult.getState() == State.SUCCESS ? queryResult : tearDownResult;
        }
        return queryResult;
    }

    private QueryResult executeQueryControl() {
        Query query = queryPair.getControl();
        QueryResult queryResult = new QueryResult(State.INVALID, null, null, ImmutableList.<List<Object>>of());
        try {
            // startup
            queryResult = setup(query, controlPrequery -> executeQuery(controlGateway, controlUsername,
                    controlPassword, queryPair.getControl(), controlPrequery, controlTimeout, sessionProperties));

            // if startup is successful -> execute query
            if (queryResult.getState() == State.SUCCESS) {
                queryResult = executeQuery(controlGateway, controlUsername, controlPassword, queryPair.getControl(),
                        query.getQuery(), controlTimeout, sessionProperties);
            }
        } finally {
            // teardown no matter what
            QueryResult tearDownResult = tearDown(query,
                    controlPostquery -> executeQuery(controlGateway, controlUsername, controlPassword,
                            queryPair.getControl(), controlPostquery, controlTimeout, sessionProperties));

            // if teardown is not successful the query fails
            queryResult = tearDownResult.getState() == State.SUCCESS ? queryResult : tearDownResult;
        }
        return queryResult;
    }

    public QueryPair getQueryPair() {
        return queryPair;
    }

    public QueryResult getControlResult() {
        return controlResult;
    }

    public QueryResult getTestResult() {
        return testResult;
    }

    private QueryResult executeQuery(String url, String username, String password, Query query, String sql,
            Duration timeout, Map<String, String> sessionProperties) {
        try (Connection connection = DriverManager.getConnection(url, username, password)) {
            trySetConnectionProperties(query, connection);
            for (Map.Entry<String, String> entry : sessionProperties.entrySet()) {
                connection.unwrap(PrestoConnection.class).setSessionProperty(entry.getKey(), entry.getValue());
            }
            long start = System.nanoTime();

            try (Statement statement = connection.createStatement()) {
                TimeLimiter limiter = new SimpleTimeLimiter();
                Stopwatch stopwatch = Stopwatch.createStarted();
                Statement limitedStatement = limiter.newProxy(statement, Statement.class, timeout.toMillis(),
                        TimeUnit.MILLISECONDS);
                if (explainOnly) {
                    sql = "EXPLAIN " + sql;
                }
                try (final ResultSet resultSet = limitedStatement.executeQuery(sql)) {
                    List<List<Object>> results = limiter.callWithTimeout(getResultSetConverter(resultSet),
                            timeout.toMillis() - stopwatch.elapsed(TimeUnit.MILLISECONDS), TimeUnit.MILLISECONDS,
                            true);
                    return new QueryResult(State.SUCCESS, null, nanosSince(start), results);
                } catch (AssertionError e) {
                    if (e.getMessage().startsWith("unimplemented type:")) {
                        return new QueryResult(State.INVALID, null, null, ImmutableList.<List<Object>>of());
                    }
                    throw e;
                } catch (SQLException | VerifierException e) {
                    throw e;
                } catch (UncheckedTimeoutException e) {
                    return new QueryResult(State.TIMEOUT, null, null, ImmutableList.<List<Object>>of());
                } catch (InterruptedException e) {
                    Thread.currentThread().interrupt();
                    throw Throwables.propagate(e);
                } catch (Exception e) {
                    throw Throwables.propagate(e);
                }
            }
        } catch (SQLException e) {
            Exception exception = e;
            if (("Error executing query".equals(e.getMessage()) || "Error fetching results".equals(e.getMessage()))
                    && (e.getCause() instanceof Exception)) {
                exception = (Exception) e.getCause();
            }
            State state = isPrestoQueryInvalid(e) ? State.INVALID : State.FAILED;
            return new QueryResult(state, exception, null, null);
        } catch (VerifierException e) {
            return new QueryResult(State.TOO_MANY_ROWS, e, null, null);
        }
    }

    private void trySetConnectionProperties(Query query, Connection connection) throws SQLException {
        // Required for jdbc drivers that do not implement all/some of these functions (eg. impala jdbc driver)
        // For these drivers, set the database default values in the query database
        try {
            connection.setClientInfo("ApplicationName", "verifier-test:" + queryPair.getName());
            connection.setCatalog(query.getCatalog());
            connection.setSchema(query.getSchema());
        } catch (SQLClientInfoException ignored) {
            // Do nothing
        }
    }

    private Callable<List<List<Object>>> getResultSetConverter(final ResultSet resultSet) {
        return new Callable<List<List<Object>>>() {
            @Override
            public List<List<Object>> call() throws Exception {
                return convertJdbcResultSet(resultSet);
            }
        };
    }

    private static boolean isPrestoQueryInvalid(SQLException e) {
        for (Throwable t = e.getCause(); t != null; t = t.getCause()) {
            if (t.toString().contains(".SemanticException:")) {
                return true;
            }
            if (t.toString().contains(".ParsingException:")) {
                return true;
            }
            if (nullToEmpty(t.getMessage()).matches("Function .* not registered")) {
                return true;
            }
        }
        return false;
    }

    private List<List<Object>> convertJdbcResultSet(ResultSet resultSet) throws SQLException, VerifierException {
        int rowCount = 0;
        int columnCount = resultSet.getMetaData().getColumnCount();

        ImmutableList.Builder<List<Object>> rows = ImmutableList.builder();
        while (resultSet.next()) {
            List<Object> row = new ArrayList<>();
            for (int i = 1; i <= columnCount; i++) {
                Object object = resultSet.getObject(i);
                if (object instanceof BigDecimal) {
                    if (((BigDecimal) object).scale() <= 0) {
                        object = ((BigDecimal) object).longValueExact();
                    } else {
                        object = ((BigDecimal) object).doubleValue();
                    }
                }
                if (object instanceof Array) {
                    object = ((Array) object).getArray();
                }
                if (object instanceof byte[]) {
                    object = new SqlVarbinary((byte[]) object);
                }
                row.add(object);
            }
            rows.add(unmodifiableList(row));
            rowCount++;
            if (rowCount > maxRowCount) {
                throw new VerifierException("More than '" + maxRowCount + "' rows, failing query");
            }
        }
        return rows.build();
    }

    private static boolean resultsMatch(QueryResult controlResult, QueryResult testResult, int precision) {
        SortedMultiset<List<Object>> control = ImmutableSortedMultiset.copyOf(rowComparator(precision),
                controlResult.getResults());
        SortedMultiset<List<Object>> test = ImmutableSortedMultiset.copyOf(rowComparator(precision),
                testResult.getResults());
        try {
            return control.equals(test);
        } catch (TypesDoNotMatchException e) {
            return false;
        }
    }

    public String getResultsComparison(int precision) {
        List<List<Object>> controlResults = controlResult.getResults();
        List<List<Object>> testResults = testResult.getResults();

        if (valid() || (controlResults == null) || (testResults == null)) {
            return "";
        }

        Multiset<List<Object>> control = ImmutableSortedMultiset.copyOf(rowComparator(precision), controlResults);
        Multiset<List<Object>> test = ImmutableSortedMultiset.copyOf(rowComparator(precision), testResults);

        try {
            Iterable<ChangedRow> diff = ImmutableSortedMultiset.<ChangedRow>naturalOrder()
                    .addAll(Iterables.transform(Multisets.difference(control, test),
                            row -> new ChangedRow(Changed.REMOVED, row, precision)))
                    .addAll(Iterables.transform(Multisets.difference(test, control),
                            row -> new ChangedRow(Changed.ADDED, row, precision)))
                    .build();
            diff = Iterables.limit(diff, 100);

            StringBuilder sb = new StringBuilder();

            sb.append(format("Control %s rows, Test %s rows%n", control.size(), test.size()));
            if (verboseResultsComparison) {
                Joiner.on("\n").appendTo(sb, diff);
            } else {
                sb.append("RESULTS DO NOT MATCH\n");
            }

            return sb.toString();
        } catch (TypesDoNotMatchException e) {
            return e.getMessage();
        }
    }

    private static Comparator<List<Object>> rowComparator(int precision) {
        final Comparator<Object> comparator = Ordering.from(columnComparator(precision)).nullsFirst();
        return new Comparator<List<Object>>() {
            @Override
            public int compare(List<Object> a, List<Object> b) {
                if (a.size() != b.size()) {
                    return Integer.compare(a.size(), b.size());
                }
                for (int i = 0; i < a.size(); i++) {
                    int r = comparator.compare(a.get(i), b.get(i));
                    if (r != 0) {
                        return r;
                    }
                }
                return 0;
            }
        };
    }

    private static Comparator<Object> columnComparator(int precision) {
        return new Comparator<Object>() {
            @SuppressWarnings("unchecked")
            @Override
            public int compare(Object a, Object b) {
                if (a instanceof Number && b instanceof Number) {
                    Number x = (Number) a;
                    Number y = (Number) b;
                    boolean bothReal = isReal(x) && isReal(y);
                    boolean bothIntegral = isIntegral(x) && isIntegral(y);
                    if (!(bothReal || bothIntegral)) {
                        throw new TypesDoNotMatchException(format("item types do not match: %s vs %s",
                                a.getClass().getName(), b.getClass().getName()));
                    }
                    if (isIntegral(x)) {
                        return Long.compare(x.longValue(), y.longValue());
                    }
                    return precisionCompare(x.doubleValue(), y.doubleValue(), precision);
                }
                if (a.getClass() != b.getClass()) {
                    throw new TypesDoNotMatchException(format("item types do not match: %s vs %s",
                            a.getClass().getName(), b.getClass().getName()));
                }
                if ((a.getClass().isArray() && b.getClass().isArray())) {
                    if (Arrays.deepEquals((Object[]) a, (Object[]) b)) {
                        return 0;
                    }
                    return Arrays.hashCode((Object[]) a) < Arrays.hashCode((Object[]) b) ? -1 : 1;
                }
                if ((a instanceof Map && b instanceof Map)) {
                    if (a.equals(b)) {
                        return 0;
                    }
                    return a.hashCode() < b.hashCode() ? -1 : 1;
                }
                checkArgument(a instanceof Comparable, "item is not Comparable: %s", a.getClass().getName());
                return ((Comparable<Object>) a).compareTo(b);
            }
        };
    }

    private static boolean isReal(Number x) {
        return x instanceof Float || x instanceof Double;
    }

    private static boolean isIntegral(Number x) {
        return x instanceof Byte || x instanceof Short || x instanceof Integer || x instanceof Long;
    }

    private static int precisionCompare(double a, double b, int precision) {
        if (!isFinite(a) || !isFinite(b)) {
            return Double.compare(a, b);
        }

        MathContext context = new MathContext(precision);
        BigDecimal x = new BigDecimal(a).round(context);
        BigDecimal y = new BigDecimal(b).round(context);
        return x.compareTo(y);
    }

    public static class ChangedRow implements Comparable<ChangedRow> {
        public enum Changed {
            ADDED, REMOVED
        }

        private final Changed changed;
        private final List<Object> row;
        private final int precision;

        private ChangedRow(Changed changed, List<Object> row, int precision) {
            this.changed = changed;
            this.row = row;
            this.precision = precision;
        }

        @Override
        public String toString() {
            if (changed == Changed.ADDED) {
                return "+ " + row;
            } else {
                return "- " + row;
            }
        }

        @Override
        public int compareTo(ChangedRow that) {
            return ComparisonChain.start().compare(this.row, that.row, rowComparator(precision))
                    .compareFalseFirst(this.changed == Changed.ADDED, that.changed == Changed.ADDED).result();
        }
    }
}