Executable.Input.java Source code

Java tutorial

Introduction

Here is the source code for Executable.Input.java

Source

/*
 * This file is part of LinkImputeR.
 * 
 * LinkImputeR is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * LinkImputeR is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with LinkImpute.  If not, see <http://www.gnu.org/licenses/>.
 */

package Executable;

import Exceptions.OutputException;
import VCF.Changers.GenotypeChanger;
import VCF.Changers.MaxDepthNoReadsChanger;
import VCF.Changers.PositionChanger;
import VCF.Changers.RenameFormatChanger;
import VCF.Changers.StandardizeCountsFormatChanger;
import VCF.Exceptions.VCFException;
import VCF.Filters.BiallelicFilter;
import VCF.Filters.HasDepthFilter;
import VCF.Filters.PositionFilter;
import VCF.Filters.VCFFilter;
import VCF.VCF;
import java.io.File;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import org.apache.commons.configuration2.HierarchicalConfiguration;
import org.apache.commons.configuration2.tree.ImmutableNode;

/**
 * Represents the input to LinkImputeR
 * @author Daniel Money
 * @version 1.1.3
 */
public class Input {

    /**
     * Constructor
     * @param in The input VCF file
     * @param filters The filters to apply to the VCF as it is read in
     * @param out The file to output the VCF to IMMEDIATELY after the VCF has
     * been read in and the input parameters applied.  Input filters are applied
     * in all cases so it can save time in the final imputation step to save a VCF
     * with the filters applied rather than read it in from scratch and reapply
     * the filters.
     * @param maxdepth The maximum read depth for a genotype.  Genotypes with
     * a higher read depth are set to have no reads and a missing genotype.
     * @param readsformat The formats to read read depths from.  If a single
     * value then assumes the format contains comma separated data for reference
     * alt read depths.  If readsformat is itself comma seperated then assumes
     * the first item is the format containing the reference allele depth, the
     * second the alt allele depth.  If null defaults to the current VCF standard
     * (AD).
     */
    public Input(File in, List<PositionFilter> filters, File out, int maxdepth, String readsformat) {
        this.in = in;
        this.filters = new ArrayList<>();
        this.filters.add(new BiallelicFilter());
        this.filters.addAll(filters);
        this.out = out;
        this.maxdepth = maxdepth;
        this.readsformat = readsformat;
    }

    /**
     * Constructor from a config (read in from a XML file)
     * @param params The config
     */
    public Input(HierarchicalConfiguration<ImmutableNode> params) {
        in = new File(params.getString("filename"));
        filters = new ArrayList<>();
        filters.add(new BiallelicFilter());

        for (HierarchicalConfiguration<ImmutableNode> filter : params.configurationsAt("filter")) {
            filters.add(Available.getPositionFilter(filter));
        }

        String prettyString = params.getString("save", null);
        out = (prettyString == null) ? null : new File(prettyString);

        String readsformatString = params.getString("readsformat", null);
        readsformat = readsformatString;

        maxdepth = params.getInt("maxdepth", 100);
    }

    /**
     * Get the VCF data
     * @return The VCF data
     * @throws VCF.Exceptions.VCFException If there is a problem with VCF file
     * or the data in it.
     * @throws OutputException If there is a problem writing out the immediate
     * output file (see constructor)
     */
    public VCF getVCF() throws VCFException, OutputException {
        List<GenotypeChanger> genotypechangers = new ArrayList<>();
        genotypechangers.add(new MaxDepthNoReadsChanger(maxdepth));
        List<PositionFilter> prefilters = new ArrayList<>();
        prefilters.add(new HasDepthFilter());
        ArrayList<String> requiredFields = new ArrayList<>();
        requiredFields.add("GT");
        requiredFields.add("DP");
        if (readsformat == null) {
            requiredFields.add("AD");
        } else {
            requiredFields.addAll(Arrays.asList(readsformat.split(",")));
        }
        ArrayList<PositionChanger> positionchangers = new ArrayList<>();
        if (readsformat != null) {
            String[] formats = readsformat.split(",");
            if (formats.length == 1) {
                positionchangers.add(new RenameFormatChanger(formats[0], "AD"));
            }
            if (formats.length == 2) {
                positionchangers.add(new StandardizeCountsFormatChanger(formats[0], formats[1]));
            }
        }

        VCF vcf = new VCF(in, prefilters, positionchangers, genotypechangers, filters, requiredFields);
        if (readsformat != null) {
            for (String f : readsformat.split(",")) {
                vcf.getMeta().removeFormat(f);
            }
            vcf.getMeta().addFormat("AD", "##FORMAT=<ID=AD,Number=.,Type=Integer,Description=\"Allelic"
                    + " depths for the reference and alternate alleles" + " in the order listed\">");
        }

        if (out != null) {
            try {
                vcf.writeFile(out);
            } catch (IOException ex) {
                throw new OutputException("Problem writing filtered VCF", ex);
            }
        }
        return vcf;
    }

    /**
     * Get the input config
     * @return The config
     */
    public ImmutableNode getConfig() {
        ImmutableNode Iin = new ImmutableNode.Builder().name("filename").value(in).create();

        ImmutableNode.Builder config = new ImmutableNode.Builder().name("input").addChild(Iin);

        for (VCFFilter filter : filters) {
            config.addChild(filter.getConfig());
        }

        if (out != null) {
            ImmutableNode Iout = new ImmutableNode.Builder().name("save").value(out).create();
            config.addChild(Iout);
        }

        if (readsformat != null) {
            ImmutableNode Ireadformat = new ImmutableNode.Builder().name("readsformat").value(readsformat).create();
            config.addChild(Ireadformat);
        }

        ImmutableNode Imax = new ImmutableNode.Builder().name("maxdepth").value(maxdepth).create();
        config.addChild(Imax);

        return config.create();
    }

    /**
     * Get the input config for the final imputation step
     * @return The config
     */
    public ImmutableNode getImputeConfig() {
        if (out != null) {
            ImmutableNode Iin = new ImmutableNode.Builder().name("filename").value(out).create();
            return new ImmutableNode.Builder().name("input").addChild(Iin).create();
        } else {
            ImmutableNode Iin = new ImmutableNode.Builder().name("filename").value(in).create();

            ImmutableNode.Builder config = new ImmutableNode.Builder().name("input").addChild(Iin);

            for (VCFFilter filter : filters) {
                config.addChild(filter.getConfig());
            }

            return config.create();
        }
    }

    private final int maxdepth;
    private final File in;
    private final List<PositionFilter> filters;
    private final File out;
    private final String readsformat;
}