moa.classifiers.featureselection.OFSP.java Source code

Introduction

Here is the source code for moa.classifiers.featureselection.OFSP.java
Source

/*
 *    OFSP.java
 *    Copyright (C) 2015 Drexel University, Philadelphia, PA
 *    @author Gregory Ditzler (gregory{[dot]}ditzler{[at]}gmail{[dot]}com)
 *
 *    This program is free software; you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation; either version 3 of the License, or
 *    (at your option) any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program. If not, see <http://www.gnu.org/licenses/>.
 *    
 */
package moa.classifiers.featureselection;

import weka.core.Instance;
import moa.classifiers.AbstractClassifier;
import moa.core.Measurement;
import moa.options.FloatOption;
import moa.options.IntOption;
import moa.options.MultiChoiceOption;

import java.util.Random;

<<<<<<<HEAD

public class OFSP extends AbstractClassifier {

    /** Serialization version id. */
    private static final long serialVersionUID = 1L;
    /**
     * Number of features to select. Passed to {@code truncate} and used as the
     * size of the selected-index set in {@code trainOnInstanceImpl}.
     */
    public IntOption numSelectOption = new IntOption("numSelect", 'n', "The number of features to select.", 10, 0,
            Integer.MAX_VALUE);
    /** Step size; multiplies the label in the mistake-driven update of {@code trainOnInstanceImpl}. */
    public FloatOption stepSizeOption = new FloatOption("stepSize", 's', "The step size.", 0.2, 0.00,
            Integer.MAX_VALUE);
    /**
     * Exploration parameter. In {@code trainOnInstanceImpl} a uniform draw below this
     * value selects a random feature subset; otherwise the subset comes from the
     * weight magnitudes.
     * NOTE(review): the declared upper bound is Integer.MAX_VALUE although the value is
     * compared against a draw in [0, 1) -- confirm the intended range.
     */
    public FloatOption searchOption = new FloatOption("search", 'e', "Exploration parameter.", 0.2, 0.00,
            Integer.MAX_VALUE);
    /** Bound handed to {@code l2_projection} as its {@code R} argument. */
    public FloatOption boundOption = new FloatOption("bound", 'b', "Bound on the l2-norm.", 10, 0.00,
            Integer.MAX_VALUE);
    /**
     * Evaluation mode read by {@code getVotesForInstance}: index 0 ("full") scores with
     * the full weight vector, index 1 ("partial") takes the other branch.
     */
    public MultiChoiceOption evalOption = new MultiChoiceOption("evaluation", 'p',
            "Evaluate on a full or partial information instance.", new String[] { "full", "partial" },
            new String[] { "full", "partial" }, 0);
    /** Parameter vector for prediction; {@code null} until the first training instance arrives. */
    protected double[] weights;
    /** Bias (intercept) term added to the linear score. */
    protected double bias;
    /** Random number generator; re-created in {@code resetLearningImpl}. */
    protected Random rand;

    /**
     * Report whether this learner is randomizable.
     *
     * @return always {@code false}
     */
    @Override
    public boolean isRandomizable() {
        // NOTE(review): this class draws from its own java.util.Random (created in
        // resetLearningImpl) while reporting false here -- confirm that is intended.
        return false;
    }

    /**
     * Score an instance with the current linear model and convert the score to votes.
     *
     * <p>In "full" mode (option index 0) every attribute except the class attribute
     * contributes to the score. In "partial" mode only a random sample of attributes
     * (at most {@code numSelect} draws) contributes. The bias is added in both modes.
     *
     * @param inst the instance to score
     * @return for a numeric class a one-element array holding the raw score; for a
     *         nominal class a two-element array with a single 1 at index 0 when the
     *         score is {@code <= 0} and at index 1 otherwise; all zeros if the model
     *         has not been trained yet
     */
    @Override
    public double[] getVotesForInstance(Instance inst) {
        double[] result = (inst.classAttribute().isNominal()) ? new double[2] : new double[1];
        if (this.weights == null) {
            return result; // untrained model: no opinion
        }

        double[] x = inst.toDoubleArray();
        // toDoubleArray() also contains the class value; it must never act as a feature.
        int classIndex = inst.classIndex();
        // Guard against a length mismatch between the instance and the learned weights.
        int d = Math.min(x.length, this.weights.length);
        double f_t = this.bias;

        if (this.evalOption.getChosenIndex() == 0) {
            for (int i = 0; i < d; i++) {
                if (i != classIndex) {
                    f_t += this.weights[i] * x[i];
                }
            }
        } else {
            // Partial information: only a random subset of the attributes is observed.
            // NOTE(review): the original sampled indices here but never used them, so the
            // score stayed 0; the sampled attributes are now actually scored.
            boolean[] used = new boolean[d];
            int draws = this.numSelectOption.getValue();
            for (int k = 0; k < draws && d > 0; k++) {
                int i = this.rand.nextInt(d);
                if (i != classIndex && !used[i]) { // do not count a repeated draw twice
                    used[i] = true;
                    f_t += this.weights[i] * x[i];
                }
            }
        }

        if (inst.classAttribute().isNumeric()) {
            result[0] = f_t;
            return result;
        }

        if (f_t <= 0) {
            result[0] = 1;
        } else {
            result[1] = 1;
        }
        return result;
    }

    /**
     * Discard the learned model: fresh random generator, zero bias, and no weight
     * vector (it is allocated lazily by the first training instance).
     */
    @Override
    public void resetLearningImpl() {
        this.rand = new Random();
        this.bias = 0.0;
        // left null on purpose; trainOnInstanceImpl sizes it from the first instance
        this.weights = null;
    }

    /**
     * Update the linear model from one labelled instance using a partial-information
     * online feature selection step.
     *
     * <p>With probability {@code search} a random subset of {@code numSelect} attributes
     * is observed; otherwise the attributes with non-zero weight are observed. The
     * instance is scored on the observed attributes only. When the score has the wrong
     * sign, the observed values are re-weighted by their observation probability, a
     * gradient step of size {@code stepSize} is taken on weights and bias, the result
     * is projected with {@code l2_projection}, and the weights are truncated to the
     * {@code numSelect} largest magnitudes (the bias is never truncated).
     *
     * <p>The class attribute contained in {@code inst.toDoubleArray()} is excluded from
     * the features.
     *
     * @param inst the labelled training instance
     */
    @Override
    public void trainOnInstanceImpl(Instance inst) {
        final double[] x_t = inst.toDoubleArray();
        final int d = x_t.length;
        final int classIndex = inst.classIndex();
        final boolean hasClassSlot = classIndex >= 0 && classIndex < d;
        final int numFeatures = hasClassSlot ? d - 1 : d;
        if (numFeatures <= 0) {
            return; // no usable attributes
        }
        if (hasClassSlot) {
            x_t[classIndex] = 0.0; // the label must not leak into the features
        }

        // Never ask for more features than exist; keep the exploration rate a probability.
        final int budget = Math.max(0, Math.min(this.numSelectOption.getValue(), numFeatures));
        final double epsilon = Math.max(0.0, Math.min(1.0, this.searchOption.getValue()));
        final double eta = this.stepSizeOption.getValue();

        if (this.weights == null) {
            // One weight per attribute (toDoubleArray length), not per stored value.
            this.weights = new double[d];
            for (int i = 0; i < d; i++) {
                this.weights[i] = this.rand.nextGaussian();
            }
            if (hasClassSlot) {
                this.weights[classIndex] = 0.0;
            }
            this.bias = 0.0;
            keepLargestMagnitudes(this.weights, budget);
        }

        final double y_t;
        if (inst.classAttribute().isNominal()) {
            y_t = (inst.classValue() == 0) ? -1 : 1;
        } else {
            y_t = inst.classValue();
        }

        // Decide which attributes are observed for this instance.
        final boolean[] observed = new boolean[d];
        if (this.rand.nextDouble() < epsilon) {
            // explore: a uniformly random subset of 'budget' non-class attributes
            int[] order = perm(d);
            int taken = 0;
            for (int k = 0; k < d && taken < budget; k++) {
                if (order[k] != classIndex) {
                    observed[order[k]] = true;
                    taken++;
                }
            }
        } else {
            // exploit: the currently selected attributes are those with non-zero weight
            for (int i = 0; i < d; i++) {
                observed[i] = (i != classIndex) && this.weights[i] != 0;
            }
        }

        double f_t = this.bias;
        for (int i = 0; i < d; i++) {
            if (observed[i]) {
                f_t += this.weights[i] * x_t[i];
            }
        }

        if (f_t * y_t < 0) {
            // Probability mass contributed by exploration; the cast avoids the integer
            // division that made this term 0 in the original code.
            final double exploreShare = ((double) budget / numFeatures) * epsilon;
            double[] x_hat = new double[d];
            for (int i = 0; i < d; i++) {
                if (!observed[i]) {
                    continue; // unobserved attributes contribute nothing
                }
                double denom = exploreShare;
                if (this.weights[i] != 0) {
                    denom += 1.0 - epsilon;
                }
                if (denom > 0) {
                    x_hat[i] = x_t[i] / denom;
                }
            }

            // scalar_vector returns a fresh array, so vector_add does not touch this.weights
            double[] m_weights = vector_add(scalar_vector(y_t * eta, x_hat), this.weights);
            // the bias behaves like the weight of a constant, always-observed input of 1
            double m_bias = this.bias + y_t * eta;

            // l2_projection returns the weights followed by the bias in the last slot
            double[] projected = l2_projection(m_weights, m_bias, this.boundOption.getValue());
            System.arraycopy(projected, 0, this.weights, 0, d);
            this.bias = projected[projected.length - 1];

            keepLargestMagnitudes(this.weights, budget);
        }
    }

    /** Zero, in place, all but the {@code keep} largest-magnitude entries of {@code w}. */
    private void keepLargestMagnitudes(double[] w, int keep) {
        final int n = w.length;
        if (keep >= n) {
            return;
        }
        if (keep <= 0) {
            java.util.Arrays.fill(w, 0.0);
            return;
        }
        double[] magnitudes = new double[n];
        for (int i = 0; i < n; i++) {
            magnitudes[i] = Math.abs(w[i]);
        }
        double[] ordered = magnitudes.clone();
        java.util.Arrays.sort(ordered);
        final double cutoff = ordered[n - keep]; // the keep-th largest magnitude

        int strictlyLarger = 0;
        for (int i = 0; i < n; i++) {
            if (magnitudes[i] > cutoff) {
                strictlyLarger++;
            }
        }
        int tiesToKeep = keep - strictlyLarger; // entries equal to the cutoff that may stay

        for (int i = 0; i < n; i++) {
            if (magnitudes[i] > cutoff) {
                continue;
            }
            if (magnitudes[i] == cutoff && tiesToKeep > 0) {
                tiesToKeep--;
                continue;
            }
            w[i] = 0.0;
        }
    }

    /**
     * Model measurements are not implemented for this learner.
     *
     * @return always {@code null}
     */
    @Override
    protected Measurement[] getModelMeasurementsImpl() {
        // No measurements are reported.
        return null;
    }

    /**
     * Model description is not implemented; nothing is appended to {@code out}.
     *
     * @param out    builder that would receive the description (unused)
     * @param indent indentation level (unused)
     */
    @Override
    public void getModelDescription(StringBuilder out, int indent) {
        // Empty body: no textual description is produced.

    }

    /**
     * Inner product of two vectors, accumulated over the length of {@code x}.
     *
     * @param x first vector; its length drives the iteration
     * @param y second vector; must be at least as long as {@code x}
     * @return sum of {@code x[i] * y[i]}
     */
    public double dot(double[] x, double[] y) {
        double sum = 0.0;
        int k = 0;
        while (k < x.length) {
            sum += x[k] * y[k];
            k++;
        }
        return sum;
    }

    /**
     * Multiply every element of a vector by a scalar.
     *
     * @param a the scalar factor
     * @param x the vector to scale (left untouched)
     * @return a new array holding {@code a * x[i]}
     */
    public double[] scalar_vector(double a, double[] x) {
        final int n = x.length;
        double[] scaled = new double[n];
        for (int k = n - 1; k >= 0; k--) {
            scaled[k] = a * x[k];
        }
        return scaled;
    }

    /**
     * Add {@code y} onto {@code x} element by element, in place.
     *
     * @param x accumulator vector; it is overwritten with the sum
     * @param y vector to add; must be at least as long as {@code x}
     * @return the same array instance as {@code x}
     */
    public double[] vector_add(double[] x, double[] y) {
        int k = 0;
        while (k < x.length) {
            x[k] = x[k] + y[k];
            k++;
        }
        return x;
    }

    /**
     * Append the bias to a weight vector and shrink the combined vector when its
     * Euclidean norm exceeds {@code sqrt(R)}.
     *
     * @param x    weight vector (left untouched)
     * @param bias bias term; stored in the last slot of the result
     * @param R    bound; the scaling ratio is {@code sqrt(R) / norm}
     * @return a new array of length {@code x.length + 1}: the (possibly rescaled)
     *         weights followed by the (possibly rescaled) bias
     */
    public double[] l2_projection(double[] x, double bias, double R) {
        final int n = x.length;

        double sumSquares = 0.0;
        for (double v : x) {
            sumSquares += v * v;
        }
        final double length = Math.sqrt(sumSquares + bias * bias);
        final double ratio = Math.sqrt(R) / length;

        double[] projected = new double[n + 1];
        if (ratio < 1) {
            // outside the ball: pull weights and bias back by the same factor
            for (int k = 0; k < n; k++) {
                projected[k] = ratio * x[k];
            }
            projected[n] = ratio * bias;
        } else {
            // already inside (or ratio is not a number): plain copy
            System.arraycopy(x, 0, projected, 0, n);
            projected[n] = bias;
        }
        return projected;
    }

    /**
     * Keep only the {@code B} largest-magnitude entries of {@code x}; every other
     * entry is set to zero in place. Surviving entries keep their sign and position.
     *
     * <p>The implementation is self-contained so it neither reorders {@code x} nor
     * strips signs, both of which happened when the work was delegated to the
     * in-place sort and absolute-value helpers.
     *
     * @param x vector to truncate (modified in place)
     * @param B number of entries to keep; values {@code <= 0} zero the whole vector,
     *          values {@code >= x.length} leave it unchanged
     * @return the same array instance as {@code x}
     */
    public double[] truncate(double[] x, int B) {
        final int n = x.length;
        if (B >= n) {
            return x; // nothing to drop
        }
        if (B <= 0) {
            java.util.Arrays.fill(x, 0.0);
            return x;
        }

        double[] magnitudes = new double[n];
        for (int i = 0; i < n; i++) {
            magnitudes[i] = Math.abs(x[i]);
        }
        double[] ordered = magnitudes.clone();
        java.util.Arrays.sort(ordered);
        final double cutoff = ordered[n - B]; // the B-th largest magnitude

        int strictlyLarger = 0;
        for (int i = 0; i < n; i++) {
            if (magnitudes[i] > cutoff) {
                strictlyLarger++;
            }
        }
        int tiesToKeep = B - strictlyLarger; // entries equal to the cutoff that may stay

        for (int i = 0; i < n; i++) {
            if (magnitudes[i] > cutoff) {
                continue;
            }
            if (magnitudes[i] == cutoff && tiesToKeep > 0) {
                tiesToKeep--;
                continue;
            }
            x[i] = 0.0;
        }
        return x;
    }

    /**
     * Compute the ordering of a vector's elements without modifying the vector.
     *
     * <p>The result lists positions of {@code x} from the smallest value to the
     * largest, which is the order the callers in this class expect (they treat the
     * leading indices as the smallest entries). Equal values keep their original
     * relative order.
     *
     * @param x values to rank (left untouched)
     * @return indices into {@code x} in ascending order of value
     */
    public int[] bubblesort_index(double[] x) {
        final double[] keys = x;
        Integer[] order = new Integer[keys.length];
        for (int i = 0; i < order.length; i++) {
            order[i] = i;
        }

        // Stable object sort on the indices; the values themselves never move.
        java.util.Arrays.sort(order, new java.util.Comparator<Integer>() {
            @Override
            public int compare(Integer a, Integer b) {
                return Double.compare(keys[a], keys[b]);
            }
        });

        int[] y = new int[order.length];
        for (int i = 0; i < y.length; i++) {
            y[i] = order[i];
        }
        return y;
    }

    /**
     * Compute the element-wise absolute value of a vector.
     *
     * <p>The result is a new array; the argument is not modified. Overwriting the
     * argument would erase the signs of any vector (for example a weight vector)
     * whose magnitudes are only needed temporarily.
     *
     * @param x input vector (left untouched)
     * @return a new array holding {@code |x[i]|}
     */
    public double[] abs_vector(double[] x) {
        double[] magnitudes = new double[x.length];
        for (int i = 0; i < x.length; i++) {
            magnitudes[i] = Math.abs(x[i]);
        }
        return magnitudes;
    }

    /**
     * Create a random permutation of the integers {@code 0 .. length - 1} by
     * swapping each position with a randomly chosen position at or after it.
     *
     * @param length number of elements in the permutation
     * @return a new array containing each of {@code 0 .. length - 1} exactly once
     */
    public int[] perm(int length) {

        // initialize array and fill it with {0,1,2...}
        int[] array = new int[length];
        for (int i = 0; i < array.length; i++)
            array[i] = i;

        for (int i = 0; i < length; i++) {

            // randomly chosen position in the array whose element
            // will be swapped with the element in position i:
            // when i = 0 any position can be chosen (0 through length - 1),
            // when i = 1 only positions 1 through length - 1, and so on.
            // The draw comes from this.rand, a java.util.Random.
            int ran = i + this.rand.nextInt(length - i);

            // perform swap
            int temp = array[i];
            array[i] = array[ran];
            array[ran] = temp;
        }
        return array;
        // NOTE(review): the "=======" fused onto the closing brace below is an
        // unresolved merge-conflict separator, not Java; resolve the conflict.
    }=======

    /**
     * Online Feature Selection with Partial Inputs
     * 
     * @author Gregory Ditzler (gregory{[dot]}ditzler{[at]}gmail{[dot]}com)
     */
    public class OFSP extends AbstractClassifier {

        /**
         * Serialization version id.
         */
        private static final long serialVersionUID = 1L;
        /**
         * Number of features to select. Passed to {@code truncate} and used as the
         * size of the selected-index set in {@code trainOnInstanceImpl}.
         */
        public IntOption numSelectOption = new IntOption("numSelect", 'n', "The number of features to select.", 10,
                0, Integer.MAX_VALUE);
        /**
         * Step size; multiplies the label in the mistake-driven update of
         * {@code trainOnInstanceImpl}.
         */
        public FloatOption stepSizeOption = new FloatOption("stepSize", 's', "The step size.", 0.2, 0.00,
                Integer.MAX_VALUE);
        /**
         * Exploration parameter. In {@code trainOnInstanceImpl} a uniform draw below
         * this value selects a random feature subset; otherwise the subset comes from
         * the weight magnitudes.
         * NOTE(review): the declared upper bound is Integer.MAX_VALUE although the value
         * is compared against a draw in [0, 1) -- confirm the intended range.
         */
        public FloatOption searchOption = new FloatOption("search", 'e', "Exploration parameter.", 0.2, 0.00,
                Integer.MAX_VALUE);
        /**
         * Bound handed to {@code l2_projection} as its {@code R} argument.
         */
        public FloatOption boundOption = new FloatOption("bound", 'b', "Bound on the l2-norm.", 10, 0.00,
                Integer.MAX_VALUE);
        /**
         * Evaluation mode read by {@code getVotesForInstance}: index 0 ("full") scores
         * with the full weight vector, index 1 ("partial") takes the other branch.
         */
        public MultiChoiceOption evalOption = new MultiChoiceOption("evaluation", 'p',
                "Evaluate on a full or partial information instance.", new String[] { "full", "partial" },
                new String[] { "full", "partial" }, 0);
        /**
         * Parameter vector for prediction; {@code null} until the first training
         * instance arrives.
         */
        protected double[] weights;
        /**
         * Bias (intercept) term added to the linear score.
         */
        protected double bias;
        /**
         * Random number generator; re-created in {@code resetLearningImpl}.
         */
        protected Random rand;

        /**
         * Report whether this learner is randomizable.
         *
         * @return always {@code false}
         */
        @Override
        public boolean isRandomizable() {
            // Not randomizable.
            // NOTE(review): this class draws from its own java.util.Random (created in
            // resetLearningImpl) while reporting false here -- confirm that is intended.
            return false;
        }

        /**
         * Score an instance with the current linear model and convert the score to votes.
         *
         * <p>In "full" mode (option index 0) every attribute except the class attribute
         * contributes to the score. In "partial" mode only a random sample of attributes
         * (at most {@code numSelect} draws) contributes. The bias is added in both modes.
         *
         * @param inst the instance to score
         * @return for a numeric class a one-element array holding the raw score; for a
         *         nominal class a two-element array with a single 1 at index 0 when the
         *         score is {@code <= 0} and at index 1 otherwise; all zeros if the model
         *         has not been trained yet
         */
        @Override
        public double[] getVotesForInstance(Instance inst) {
            double[] result = (inst.classAttribute().isNominal()) ? new double[2] : new double[1];
            if (this.weights == null) {
                return result; // untrained model: no opinion
            }

            double[] x = inst.toDoubleArray();
            // toDoubleArray() also contains the class value; it must never act as a feature.
            int classIndex = inst.classIndex();
            // Guard against a length mismatch between the instance and the learned weights.
            int d = Math.min(x.length, this.weights.length);
            double f_t = this.bias;

            if (this.evalOption.getChosenIndex() == 0) {
                for (int i = 0; i < d; i++) {
                    if (i != classIndex) {
                        f_t += this.weights[i] * x[i];
                    }
                }
            } else {
                // Partial information: only a random subset of the attributes is observed.
                // NOTE(review): the original sampled indices here but never used them, so
                // the score stayed 0; the sampled attributes are now actually scored.
                boolean[] used = new boolean[d];
                int draws = this.numSelectOption.getValue();
                for (int k = 0; k < draws && d > 0; k++) {
                    int i = this.rand.nextInt(d);
                    if (i != classIndex && !used[i]) { // do not count a repeated draw twice
                        used[i] = true;
                        f_t += this.weights[i] * x[i];
                    }
                }
            }

            if (inst.classAttribute().isNumeric()) {
                result[0] = f_t;
                return result;
            }

            if (f_t <= 0) {
                result[0] = 1;
            } else {
                result[1] = 1;
            }
            return result;
        }

        /**
         * Discard the learned model: fresh random generator, zero bias, and no weight
         * vector (it is allocated lazily by the first training instance).
         */
        @Override
        public void resetLearningImpl() {
            this.rand = new Random();
            this.bias = 0.0;
            // left null on purpose; trainOnInstanceImpl sizes it from the first instance
            this.weights = null;
        }

        /**
         * Update the linear model from one labelled instance using a partial-information
         * online feature selection step.
         *
         * <p>With probability {@code search} a random subset of {@code numSelect}
         * attributes is observed; otherwise the attributes with non-zero weight are
         * observed. The instance is scored on the observed attributes only. When the
         * score has the wrong sign, the observed values are re-weighted by their
         * observation probability, a gradient step of size {@code stepSize} is taken on
         * weights and bias, the result is projected with {@code l2_projection}, and the
         * weights are truncated to the {@code numSelect} largest magnitudes (the bias is
         * never truncated).
         *
         * <p>The class attribute contained in {@code inst.toDoubleArray()} is excluded
         * from the features.
         *
         * @param inst the labelled training instance
         */
        @Override
        public void trainOnInstanceImpl(Instance inst) {
            final double[] x_t = inst.toDoubleArray();
            final int d = x_t.length;
            final int classIndex = inst.classIndex();
            final boolean hasClassSlot = classIndex >= 0 && classIndex < d;
            final int numFeatures = hasClassSlot ? d - 1 : d;
            if (numFeatures <= 0) {
                return; // no usable attributes
            }
            if (hasClassSlot) {
                x_t[classIndex] = 0.0; // the label must not leak into the features
            }

            // Never ask for more features than exist; keep the exploration rate a probability.
            final int budget = Math.max(0, Math.min(this.numSelectOption.getValue(), numFeatures));
            final double epsilon = Math.max(0.0, Math.min(1.0, this.searchOption.getValue()));
            final double eta = this.stepSizeOption.getValue();

            if (this.weights == null) {
                // One weight per attribute (toDoubleArray length), not per stored value.
                this.weights = new double[d];
                for (int i = 0; i < d; i++) {
                    this.weights[i] = this.rand.nextGaussian();
                }
                if (hasClassSlot) {
                    this.weights[classIndex] = 0.0;
                }
                this.bias = 0.0;
                keepLargestMagnitudes(this.weights, budget);
            }

            final double y_t;
            if (inst.classAttribute().isNominal()) {
                y_t = (inst.classValue() == 0) ? -1 : 1;
            } else {
                y_t = inst.classValue();
            }

            // Decide which attributes are observed for this instance.
            final boolean[] observed = new boolean[d];
            if (this.rand.nextDouble() < epsilon) {
                // explore: a uniformly random subset of 'budget' non-class attributes
                int[] order = perm(d);
                int taken = 0;
                for (int k = 0; k < d && taken < budget; k++) {
                    if (order[k] != classIndex) {
                        observed[order[k]] = true;
                        taken++;
                    }
                }
            } else {
                // exploit: the currently selected attributes are those with non-zero weight
                for (int i = 0; i < d; i++) {
                    observed[i] = (i != classIndex) && this.weights[i] != 0;
                }
            }

            double f_t = this.bias;
            for (int i = 0; i < d; i++) {
                if (observed[i]) {
                    f_t += this.weights[i] * x_t[i];
                }
            }

            if (f_t * y_t < 0) {
                // Probability mass contributed by exploration; the cast avoids the integer
                // division that made this term 0 in the original code.
                final double exploreShare = ((double) budget / numFeatures) * epsilon;
                double[] x_hat = new double[d];
                for (int i = 0; i < d; i++) {
                    if (!observed[i]) {
                        continue; // unobserved attributes contribute nothing
                    }
                    double denom = exploreShare;
                    if (this.weights[i] != 0) {
                        denom += 1.0 - epsilon;
                    }
                    if (denom > 0) {
                        x_hat[i] = x_t[i] / denom;
                    }
                }

                // scalar_vector returns a fresh array, so vector_add does not touch this.weights
                double[] m_weights = vector_add(scalar_vector(y_t * eta, x_hat), this.weights);
                // the bias behaves like the weight of a constant, always-observed input of 1
                double m_bias = this.bias + y_t * eta;

                // l2_projection returns the weights followed by the bias in the last slot
                double[] projected = l2_projection(m_weights, m_bias, this.boundOption.getValue());
                System.arraycopy(projected, 0, this.weights, 0, d);
                this.bias = projected[projected.length - 1];

                keepLargestMagnitudes(this.weights, budget);
            }
        }

        /** Zero, in place, all but the {@code keep} largest-magnitude entries of {@code w}. */
        private void keepLargestMagnitudes(double[] w, int keep) {
            final int n = w.length;
            if (keep >= n) {
                return;
            }
            if (keep <= 0) {
                java.util.Arrays.fill(w, 0.0);
                return;
            }
            double[] magnitudes = new double[n];
            for (int i = 0; i < n; i++) {
                magnitudes[i] = Math.abs(w[i]);
            }
            double[] ordered = magnitudes.clone();
            java.util.Arrays.sort(ordered);
            final double cutoff = ordered[n - keep]; // the keep-th largest magnitude

            int strictlyLarger = 0;
            for (int i = 0; i < n; i++) {
                if (magnitudes[i] > cutoff) {
                    strictlyLarger++;
                }
            }
            int tiesToKeep = keep - strictlyLarger; // entries equal to the cutoff that may stay

            for (int i = 0; i < n; i++) {
                if (magnitudes[i] > cutoff) {
                    continue;
                }
                if (magnitudes[i] == cutoff && tiesToKeep > 0) {
                    tiesToKeep--;
                    continue;
                }
                w[i] = 0.0;
            }
        }

        /**
         * Model measurements are not implemented for this learner.
         *
         * @return always {@code null}
         */
        @Override
        protected Measurement[] getModelMeasurementsImpl() {
            // No measurements are reported.
            return null;
        }

        /**
         * Model description is not implemented; nothing is appended to {@code out}.
         *
         * @param out    builder that would receive the description (unused)
         * @param indent indentation level (unused)
         */
        @Override
        public void getModelDescription(StringBuilder out, int indent) {
            // Empty body: no textual description is produced.

        }

        /**
         * Inner product of two vectors, accumulated over the length of {@code x}.
         *
         * @param x first vector; its length drives the iteration
         * @param y second vector; must be at least as long as {@code x}
         * @return sum of {@code x[i] * y[i]}
         */
        public double dot(double[] x, double[] y) {
            double sum = 0.0;
            int k = 0;
            while (k < x.length) {
                sum += x[k] * y[k];
                k++;
            }
            return sum;
        }

        /**
         * Multiply every element of a vector by a scalar.
         *
         * @param a the scalar factor
         * @param x the vector to scale (left untouched)
         * @return a new array holding {@code a * x[i]}
         */
        public double[] scalar_vector(double a, double[] x) {
            final int n = x.length;
            double[] scaled = new double[n];
            for (int k = n - 1; k >= 0; k--) {
                scaled[k] = a * x[k];
            }
            return scaled;
        }

        /**
         * Add {@code y} onto {@code x} element by element, in place.
         *
         * @param x accumulator vector; it is overwritten with the sum
         * @param y vector to add; must be at least as long as {@code x}
         * @return the same array instance as {@code x}
         */
        public double[] vector_add(double[] x, double[] y) {
            int k = 0;
            while (k < x.length) {
                x[k] = x[k] + y[k];
                k++;
            }
            return x;
        }

        /**
         * Append the bias to a weight vector and shrink the combined vector when its
         * Euclidean norm exceeds {@code sqrt(R)}.
         *
         * @param x    weight vector (left untouched)
         * @param bias bias term; stored in the last slot of the result
         * @param R    bound; the scaling ratio is {@code sqrt(R) / norm}
         * @return a new array of length {@code x.length + 1}: the (possibly rescaled)
         *         weights followed by the (possibly rescaled) bias
         */
        public double[] l2_projection(double[] x, double bias, double R) {
            final int n = x.length;

            double sumSquares = 0.0;
            for (double v : x) {
                sumSquares += v * v;
            }
            final double length = Math.sqrt(sumSquares + bias * bias);
            final double ratio = Math.sqrt(R) / length;

            double[] projected = new double[n + 1];
            if (ratio < 1) {
                // outside the ball: pull weights and bias back by the same factor
                for (int k = 0; k < n; k++) {
                    projected[k] = ratio * x[k];
                }
                projected[n] = ratio * bias;
            } else {
                // already inside (or ratio is not a number): plain copy
                System.arraycopy(x, 0, projected, 0, n);
                projected[n] = bias;
            }
            return projected;
        }

        /**
         * Keep only the {@code B} largest-magnitude entries of {@code x}; every other
         * entry is set to zero in place. Surviving entries keep their sign and position.
         *
         * <p>The implementation is self-contained so it neither reorders {@code x} nor
         * strips signs, both of which happened when the work was delegated to the
         * in-place sort and absolute-value helpers.
         *
         * @param x vector to truncate (modified in place)
         * @param B number of entries to keep; values {@code <= 0} zero the whole vector,
         *          values {@code >= x.length} leave it unchanged
         * @return the same array instance as {@code x}
         */
        public double[] truncate(double[] x, int B) {
            final int n = x.length;
            if (B >= n) {
                return x; // nothing to drop
            }
            if (B <= 0) {
                java.util.Arrays.fill(x, 0.0);
                return x;
            }

            double[] magnitudes = new double[n];
            for (int i = 0; i < n; i++) {
                magnitudes[i] = Math.abs(x[i]);
            }
            double[] ordered = magnitudes.clone();
            java.util.Arrays.sort(ordered);
            final double cutoff = ordered[n - B]; // the B-th largest magnitude

            int strictlyLarger = 0;
            for (int i = 0; i < n; i++) {
                if (magnitudes[i] > cutoff) {
                    strictlyLarger++;
                }
            }
            int tiesToKeep = B - strictlyLarger; // entries equal to the cutoff that may stay

            for (int i = 0; i < n; i++) {
                if (magnitudes[i] > cutoff) {
                    continue;
                }
                if (magnitudes[i] == cutoff && tiesToKeep > 0) {
                    tiesToKeep--;
                    continue;
                }
                x[i] = 0.0;
            }
            return x;
        }

        /**
         * Compute the ordering of a vector's elements without modifying the vector.
         *
         * <p>The result lists positions of {@code x} from the smallest value to the
         * largest, which is the order the callers in this class expect (they treat the
         * leading indices as the smallest entries). Equal values keep their original
         * relative order.
         *
         * @param x values to rank (left untouched)
         * @return indices into {@code x} in ascending order of value
         */
        public int[] bubblesort_index(double[] x) {
            final double[] keys = x;
            Integer[] order = new Integer[keys.length];
            for (int i = 0; i < order.length; i++) {
                order[i] = i;
            }

            // Stable object sort on the indices; the values themselves never move.
            java.util.Arrays.sort(order, new java.util.Comparator<Integer>() {
                @Override
                public int compare(Integer a, Integer b) {
                    return Double.compare(keys[a], keys[b]);
                }
            });

            int[] y = new int[order.length];
            for (int i = 0; i < y.length; i++) {
                y[i] = order[i];
            }
            return y;
        }

        /**
         * Compute the element-wise absolute value of a vector.
         *
         * <p>The result is a new array; the argument is not modified. Overwriting the
         * argument would erase the signs of any vector (for example a weight vector)
         * whose magnitudes are only needed temporarily.
         *
         * @param x input vector (left untouched)
         * @return a new array holding {@code |x[i]|}
         */
        public double[] abs_vector(double[] x) {
            double[] magnitudes = new double[x.length];
            for (int i = 0; i < x.length; i++) {
                magnitudes[i] = Math.abs(x[i]);
            }
            return magnitudes;
        }

/**
 * Create a random permutation of the integers {@code 0 .. length - 1} by
 * swapping each position with a randomly chosen position at or after it.
 *
 * @param length number of elements in the permutation
 * @return a new array containing each of {@code 0 .. length - 1} exactly once
 */
public int[] perm(int length) {

    // initialize array and fill it with {0,1,2...}
    int[] array = new int[length];
    for (int i = 0; i < array.length; i++) {
        array[i] = i;
    }

    for (int i = 0; i < length; i++) {

        // randomly chosen position in the array whose element
        // will be swapped with the element in position i:
        // when i = 0 any position can be chosen (0 through length - 1),
        // when i = 1 only positions 1 through length - 1, and so on.
        // The draw comes from this.rand, a java.util.Random.
        int ran = i + this.rand.nextInt(length - i);

        // perform swap
        int temp = array[i];
        array[i] = array[ran];
        array[ran] = temp;
    }
    return array;
    // NOTE(review): the ">>>>>>>" text fused onto the closing brace below is an
    // unresolved merge-conflict marker, not Java; resolve the conflict.
}>>>>>>>93d 8 b6469d28597a1fc6ba0371d33fd7d02b1856

}