com.fullcontact.cassandra.io.sstable.Descriptor.java Source code

Java tutorial

Introduction

Here is the source code for com.fullcontact.cassandra.io.sstable.Descriptor.java

Source

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.fullcontact.cassandra.io.sstable;

import com.google.common.base.Objects;
import org.apache.cassandra.utils.FilterFactory;
import org.apache.cassandra.utils.Pair;
import org.apache.hadoop.fs.Path;

import java.io.File;
import java.util.StringTokenizer;

import static org.apache.cassandra.io.sstable.Component.separator;

/**
 * Cassandra Descriptor ported to work with HDFS.
 * <p/>
 * A SSTable is described by the keyspace and column family it contains data
 * for, a generation (where higher generations contain more recent data) and
 * an alphabetic version string.
 * <p/>
 * A descriptor can be marked as temporary, which influences generated filenames.
 */
public class Descriptor {
    // versions are denoted as [major][minor].  Minor versions must be forward-compatible:
    // new fields are allowed in e.g. the metadata component, but fields can't be removed
    // or have their size changed.
    //
    // Minor versions were introduced with version "hb" for Cassandra 1.0.3; prior to that,
    // we always incremented the major version.  In particular, versions g and h are
    // forwards-compatible with version f, so if the above convention had been followed,
    // we would have labeled them fb and fc.
    public static class Version {
        // This needs to be at the begining for initialization sake
        public static final String current_version = "ic";

        public static final Version LEGACY = new Version("a"); // "pre-history"
        // b (0.7.0): added version to sstable filenames
        // c (0.7.0): bloom filter component computes hashes over raw key bytes instead of strings
        // d (0.7.0): row size in data component becomes a long instead of int
        // e (0.7.0): stores undecorated keys in data and index components
        // f (0.7.0): switched bloom filter implementations in data component
        // g (0.8): tracks flushed-at context in metadata component
        // h (1.0): tracks max client timestamp in metadata component
        // hb (1.0.3): records compression ration in metadata component
        // hc (1.0.4): records partitioner in metadata component
        // hd (1.0.10): includes row tombstones in maxtimestamp
        // he (1.1.3): includes ancestors generation in metadata component
        // hf (1.1.6): marker that replay position corresponds to 1.1.5+ millis-based id (see CASSANDRA-4782)
        // ia (1.2.0): column indexes are promoted to the index file
        //             records estimated histogram of deletion times in tombstones
        //             bloom filter (keys and columns) upgraded to Murmur3
        // ib (1.2.1): tracks min client timestamp in metadata component
        // ic (1.2.5): omits per-row bloom filter of column names

        public static final Version CURRENT = new Version(current_version);

        private final String version;

        public final boolean hasStringsInBloomFilter;
        public final boolean hasIntRowSize;
        public final boolean hasEncodedKeys;
        public final boolean isLatestVersion;
        public final boolean metadataIncludesReplayPosition;
        public final boolean metadataIncludesModernReplayPosition;
        public final boolean tracksMaxTimestamp;
        public final boolean tracksMinTimestamp;
        public final boolean hasCompressionRatio;
        public final boolean hasPartitioner;
        public final boolean tracksTombstones;
        public final boolean hasPromotedIndexes;
        public final FilterFactory.Type filterType;
        public final boolean hasAncestors;
        public final boolean hasRowLevelBF;

        public Version(String version) {
            this.version = version;
            hasStringsInBloomFilter = version.compareTo("c") < 0;
            hasIntRowSize = version.compareTo("d") < 0;
            hasEncodedKeys = version.compareTo("e") < 0;
            metadataIncludesReplayPosition = version.compareTo("g") >= 0;
            hasCompressionRatio = version.compareTo("hb") >= 0;
            hasPartitioner = version.compareTo("hc") >= 0;
            tracksMaxTimestamp = version.compareTo("hd") >= 0;
            tracksMinTimestamp = version.compareTo("ib") >= 0;
            hasAncestors = version.compareTo("he") >= 0;
            metadataIncludesModernReplayPosition = version.compareTo("hf") >= 0;
            tracksTombstones = version.compareTo("ia") >= 0;
            hasPromotedIndexes = version.compareTo("ia") >= 0;
            isLatestVersion = version.compareTo(current_version) == 0;
            if (version.compareTo("f") < 0)
                filterType = FilterFactory.Type.SHA;
            else if (version.compareTo("ia") < 0)
                filterType = FilterFactory.Type.MURMUR2;
            else
                filterType = FilterFactory.Type.MURMUR3;
            hasRowLevelBF = version.compareTo("ic") < 0;
        }

        /**
         * @param ver SSTable version
         * @return True if the given version string matches the format.
         * @see #version
         */
        static boolean validate(String ver) {
            return ver != null && ver.matches("[a-z]+");
        }

        public boolean isCompatible() {
            return version.charAt(0) <= CURRENT.version.charAt(0);
        }

        public boolean isStreamCompatible() {
            // we could add compatibility for earlier versions with the new single-pass streaming
            // (see SSTableWriter.appendFromStream) but versions earlier than 0.7.1 don't have the
            // MessagingService version awareness anyway so there's no point.
            return isCompatible() && version.charAt(0) >= 'i';
        }

        /**
         * Versions [h..hc] contained a timestamp value that was computed incorrectly, ignoring row tombstones.
         * containsTimestamp returns true if there is a timestamp value in the metadata file; to know if it
         * actually contains a *correct* timestamp, see tracksMaxTimestamp.
         */
        public boolean containsTimestamp() {
            return version.compareTo("h") >= 0;
        }

        @Override
        public String toString() {
            return version;
        }

        @Override
        public boolean equals(Object o) {
            if (o == this)
                return true;
            if (!(o instanceof Version))
                return false;
            return version.equals(((Version) o).version);
        }

        @Override
        public int hashCode() {
            return version.hashCode();
        }
    }

    public final Path directory;
    /**
     * version has the following format: <code>[a-z]+</code>
     */
    public final Version version;
    public final String ksname;
    public final String cfname;
    public final int generation;
    public final boolean temporary;
    private final int hashCode;

    /**
     * A descriptor that assumes CURRENT_VERSION.
     */
    public Descriptor(Path directory, String ksname, String cfname, int generation, boolean temp) {
        this(Version.CURRENT, directory, ksname, cfname, generation, temp);
    }

    public Descriptor(String version, Path directory, String ksname, String cfname, int generation, boolean temp) {
        this(new Version(version), directory, ksname, cfname, generation, temp);
    }

    public Descriptor(Version version, Path directory, String ksname, String cfname, int generation, boolean temp) {
        assert version != null && directory != null && ksname != null && cfname != null;
        this.version = version;
        this.directory = directory;
        this.ksname = ksname;
        this.cfname = cfname;
        this.generation = generation;
        temporary = temp;
        hashCode = Objects.hashCode(directory, generation, ksname, cfname, temp);
    }

    public Descriptor withGeneration(int newGeneration) {
        return new Descriptor(version, directory, ksname, cfname, newGeneration, temporary);
    }

    public String filenameFor(Component component) {
        return filenameFor(component.name());
    }

    public String baseFilename() {
        StringBuilder buff = new StringBuilder();
        buff.append(directory).append(File.separatorChar);
        buff.append(ksname).append(separator);
        buff.append(cfname).append(separator);
        if (temporary)
            buff.append(SSTable.TEMPFILE_MARKER).append(separator);
        if (!Version.LEGACY.equals(version))
            buff.append(version).append(separator);
        buff.append(generation);
        return buff.toString();
    }

    /**
     * @param suffix A component suffix, such as 'Data.db'/'Index.db'/etc
     * @return A filename for this descriptor with the given suffix.
     */
    public String filenameFor(String suffix) {
        return baseFilename() + separator + suffix;
    }

    /**
     * @param filename The SSTable filename
     * @return Descriptor of the SSTable initialized from filename
     * @see #fromFilename(org.apache.hadoop.fs.Path, String) (File directory, String name)
     */
    public static Descriptor fromFilename(String filename) {
        Path file = new Path(filename);
        return fromFilename(file.getParent(), file.getName()).left;
    }

    /**
     * Filename of the form "<ksname>-<cfname>-[tmp-][<version>-]<gen>-<component>"
     *
     * @param directory The directory of the SSTable files
     * @param name      The name of the SSTable file
     * @return A Descriptor for the SSTable, and the Component remainder.
     */
    public static Pair<Descriptor, String> fromFilename(Path directory, String name) {
        // tokenize the filename
        StringTokenizer st = new StringTokenizer(name, String.valueOf(separator));
        String nexttok;

        // all filenames must start with keyspace and column family
        String ksname = st.nextToken();
        String cfname = st.nextToken();

        // optional temporary marker
        nexttok = st.nextToken();
        boolean temporary = false;
        if (nexttok.equals(SSTable.TEMPFILE_MARKER)) {
            temporary = true;
            nexttok = st.nextToken();
        }

        // optional version string
        Version version = Version.LEGACY;
        if (Version.validate(nexttok)) {
            version = new Version(nexttok);
            nexttok = st.nextToken();
        }
        int generation = Integer.parseInt(nexttok);

        // component suffix
        String component = st.nextToken();
        directory = directory != null ? directory : new Path(".");
        return Pair.create(new Descriptor(version, directory, ksname, cfname, generation, temporary), component);
    }

    /**
     * @param temporary temporary flag
     * @return A clone of this descriptor with the given 'temporary' status.
     */
    public Descriptor asTemporary(boolean temporary) {
        return new Descriptor(version, directory, ksname, cfname, generation, temporary);
    }

    /**
     * @return true if the current Cassandra version can read the given sstable version
     */
    public boolean isCompatible() {
        return version.isCompatible();
    }

    /**
     * @return true if the current Cassandra version can stream the given sstable version
     *         from another node.  This is stricter than opening it locally [isCompatible] because
     *         streaming needs to rebuild all the non-data components, and it only knows how to write
     *         the latest version.
     */
    public boolean isStreamCompatible() {
        return version.isStreamCompatible();
    }

    @Override
    public String toString() {
        return baseFilename();
    }

    @Override
    public boolean equals(Object o) {
        if (o == this)
            return true;
        if (!(o instanceof Descriptor))
            return false;
        Descriptor that = (Descriptor) o;
        return that.directory.equals(this.directory) && that.generation == this.generation
                && that.ksname.equals(this.ksname) && that.cfname.equals(this.cfname)
                && that.temporary == this.temporary;
    }

    @Override
    public int hashCode() {
        return hashCode;
    }
}