meka.classifiers.multitarget.SCC.java — source code listing

This page shows the full source code for meka.classifiers.multitarget.SCC.java,
the Super Class Classifier (SCC) from the MEKA multi-label / multi-target
classification framework.

Source

/*
 *   This program is free software: you can redistribute it and/or modify
 *   it under the terms of the GNU General Public License as published by
 *   the Free Software Foundation, either version 3 of the License, or
 *   (at your option) any later version.
 *
 *   This program is distributed in the hope that it will be useful,
 *   but WITHOUT ANY WARRANTY; without even the implied warranty of
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *   GNU General Public License for more details.
 *
 *   You should have received a copy of the GNU General Public License
 *   along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

package meka.classifiers.multitarget;

import meka.classifiers.multilabel.Evaluation;
import meka.classifiers.multilabel.ProblemTransformationMethod;
import meka.core.*;
import meka.filters.multilabel.SuperNodeFilter;
import weka.classifiers.Classifier;
import weka.core.*;
import weka.core.TechnicalInformation.Field;
import weka.core.TechnicalInformation.Type;

import java.util.*;

/**
 * SCC.java - Super Class Classifier (aka Super Node Classifier).
 * The output space is manipulated into super classes (based on label dependence), upon which a multi-target base classifier is applied.
 * This is related to the RAkELd-type classifiers for multi-label classification.
 *
 * @author    Jesse Read
 * @version   June 2012
 */
public class SCC extends NSR implements Randomizable, MultiTargetClassifier, TechnicalInformationHandler {

    /** Filter that merges sets of label attributes into single 'super-class' attributes. */
    private SuperNodeFilter f = new SuperNodeFilter();

    /** Number of internal-validation refinement iterations (CLI option -V); 0 skips refinement. */
    private int m_Iv = 0;
    /** Number of simulated-annealing iterations (CLI option -I). */
    private int m_I = 1000;

    /* TODO make external options */
    private static final int i_SPLIT = 67;               // % of data used as the internal training split
    private static final String i_ErrFn = "Exact match"; // internal measurement used to compare partitions

    /** Seeded from m_S in buildClassifier(); drives splitting, partitioning and annealing. */
    private Random rand = null;

    public SCC() {
        // default classifier for GUI
        this.m_Classifier = new CC();
    }

    @Override
    protected String defaultClassifierString() {
        // default classifier for CLI
        return "meka.classifiers.multitarget.CC";
    }

    /**
     * Description to display in the GUI.
     *
     * @return      the description
     */
    @Override
    public String globalInfo() {
        return "Super Class Classifier (SCC).\n"
                + "The output space is manipulated into super classes (based on label dependence; and pruning and nearest-subset-replacement like NSR), upon which a multi-target base classifier is applied.\n"
                + "For example, a super class based on two labels might take values in {[0,3],[0,0],[1,2]}.\n"
                + "For more information see:\n" + getTechnicalInformation().toString();
    }

    @Override
    public TechnicalInformation getTechnicalInformation() {
        TechnicalInformation result;

        // FIX: the cited work is a journal article (the JOURNAL field is set below),
        // so the entry type must be ARTICLE, not INPROCEEDINGS.
        result = new TechnicalInformation(Type.ARTICLE);
        result.setValue(Field.AUTHOR, "Jesse Read, Concha Blieza, Pedro Larranaga");
        result.setValue(Field.TITLE, "Multi-Dimensional Classification with Super-Classes");
        result.setValue(Field.JOURNAL, "IEEE Transactions on Knowledge and Data Engineering");
        result.setValue(Field.YEAR, "2013");

        return result;
    }

    /** Rating with no critical value (CRITICAL = 0). */
    private double rating(int partition[][], double M[][]) {
        return rating(partition, M, 0.0);
    }

    /**
     * Rating - Return a score for the super-class 'partition' using the pairwise info in 'M'.
     * Each pair of labels grouped together contributes (M[j][k] - CRITICAL) positively and
     * each pair kept apart contributes it negatively, so partitions that group strongly
     * dependent label pairs score highest.
     *
     * @param   partition   super-class partition, e.g., [[0,3],[2],[1,4]]
     * @param   M           pairwise information \propto M[j][k]
     * @param   CRITICAL    a critical value to use
     *
     * CRITICAL = 2.706;
     * CRITICAL = 6.251;
     * @Note: For now, assume 3 DOF (multi-label classification)
     * @todo set CRITICAL into M, then this can be a generic function
     */
    private double rating(int partition[][], double M[][], double CRITICAL) {

        int L = M.length;

        // FIX: removed unused local 'double S[][]' (declared but never read or written).
        boolean T[][] = new boolean[L][L]; // T[j][k] == true iff labels j,k share a super class

        double sumTogether = 0.0, sumApart = 0.0;

        // mark every together-pair; indices are sorted first so that j < k,
        // matching the upper triangle of M read below
        for (int i = 0; i < partition.length; i++) {
            Arrays.sort(partition[i]);
            double n = partition[i].length;
            for (int j = 0; j < n; j++) {
                for (int k = j + 1; k < n; k++) {
                    T[partition[i][j]][partition[i][k]] = true;
                }
            }
        }

        // sum the upper triangle of M, split into together / apart pairs
        for (int j = 0; j < L; j++) {
            for (int k = j + 1; k < L; k++) {
                if (T[j][k])
                    sumTogether += (M[j][k] - CRITICAL);
                else
                    sumApart += (M[j][k] - CRITICAL);
            }
        }

        return sumTogether - sumApart;
    }

    /**
     * MutateCombinations - mutate the 'partition': move one randomly-chosen label either
     * into another randomly-chosen super class, or (when to == from) out into a new
     * singleton super class. The array passed in is modified in place; callers pass a
     * deep copy (see buildClassifier).
     */
    private int[][] mutateCombinations(int partition[][], Random r) {

        int from = r.nextInt(partition.length);
        int i = r.nextInt(partition[from].length);

        int to = r.nextInt(partition.length);

        if (to == from) {
            // create a new singleton super class at the end, holding the chosen label
            partition = Arrays.copyOf(partition, partition.length + 1);
            partition[partition.length - 1] = new int[] { partition[from][i] };
            // FIX: removed dead assignment 'to = partition.length + 1;' -- 'to' is never
            // read again in this method, and the value would have been out of range anyway.
            // delete original
            partition[from] = A.delete(partition[from], i);
        } else {
            // copy the label into its new super class
            partition[to] = A.append(partition[to], partition[from][i]);
            // delete original
            partition[from] = A.delete(partition[from], i);
        }
        // if the source super class is now empty, overwrite it with the last one and shrink
        if (partition[from].length <= 0) {
            partition[from] = partition[partition.length - 1];
            partition = Arrays.copyOf(partition, partition.length - 1);
        }

        return partition;
    }

    /**
     * Train classifier <code>h</code>, on dataset <code>D</code>, under super-class partition <code>partition</code>.
     * Labels are merged into super classes by a SuperNodeFilter (pruning value m_P, subsample
     * value m_N; a negative value means 'pick randomly below abs(value)'), then the base
     * classifier is built on the filtered data, which also becomes the instance template.
     * NOTE(review): the parameter <code>h</code> is not actually used -- m_Classifier is
     * built instead; confirm before relying on passing a different classifier here.
     */
    public void trainClassifier(Classifier h, Instances D, int partition[][]) throws Exception {
        f = new SuperNodeFilter();
        f.setIndices(partition);
        f.setP(m_P >= 0 ? m_P : rand.nextInt(Math.abs(m_P)));
        f.setN(m_N >= 0 ? m_N : rand.nextInt(Math.abs(m_N)));
        Instances D_ = f.process(D);
        //int K[] = MLUtils.getK(D_); <-- if some K[j] < 2, this is a problem!
        if (getDebug()) {
            int N = D.numInstances();
            int U = MLUtils.numberOfUniqueCombinations(D);
            System.out.println("PS(" + f.getP() + "," + m_N + ") reduced: " + N + " -> " + D_.numInstances() + " / "
                    + U + " -> " + MLUtils.numberOfUniqueCombinations(D_));
            //System.out.println("E_acc P "+f.getP()+" "+(D_.numInstances()/(double)N) +" "+(MLUtils.numberOfUniqueCombinations(D_)/(double)U));
            //m_Info = "P="+f.getP()+"; %N="+(D_.numInstances()/(double)N) +"; %C"+(MLUtils.numberOfUniqueCombinations(D_)/(double)U)+"; size(partition)="+partition.length;
        }

        m_InstancesTemplate = D_;
        m_Classifier.buildClassifier(D_); // build on the processed batch
    }

    /**
     * Test classifier h, on dataset D, under super-class partition 'partition'.
     * Trains m_Classifier on D_train first (via trainClassifier), then evaluates
     * on D_test and fills in the standard result metadata.
     * <br>
     * TODO should be able to use something out of meka.classifiers.Evaluation instead of all this ...
     */
    public Result testClassifier(Classifier h, Instances D_train, Instances D_test, int partition[][])
            throws Exception {

        trainClassifier(m_Classifier, D_train, partition);

        Result result = Evaluation.testClassifier((ProblemTransformationMethod) h, D_test);

        if (h instanceof MultiTargetClassifier || Evaluation.isMT(D_test)) {
            result.setInfo("Type", "MT");
        } else if (h instanceof ProblemTransformationMethod) {
            // multi-label case needs a threshold to turn rankings into bipartitions
            result.setInfo("Threshold", MLEvalUtils.getThreshold(result.predictions, D_train, "PCut1"));
            result.setInfo("Type", "ML");
        }

        result.setValue("N_train", D_train.numInstances());
        result.setValue("N_test", D_test.numInstances());
        result.setValue("LCard_train", MLUtils.labelCardinality(D_train));
        result.setValue("LCard_test", MLUtils.labelCardinality(D_test));

        //result.setValue("Build_time",(after - before)/1000.0);
        //result.setValue("Test_time",(after_test - before_test)/1000.0);
        //result.setValue("Total_time",(after_test - before)/1000.0);

        result.setInfo("Classifier_name", h.getClass().getName());
        //result.setInfo("Classifier_ops", Arrays.toString(h.getOptions()));
        result.setInfo("Classifier_info", h.toString());
        result.setInfo("Dataset_name", MLUtils.getDatasetName(D_test));

        result.output = Result.getStats(result, "1");
        return result;
    }

    /**
     * Build the SCC model:
     * (0) split D into internal train/validation sets;
     * (1) evaluate a plain BR-style baseline (CR) to get per-label predictions;
     * (2) derive the pairwise conditional-dependence matrix from those predictions;
     * (3) search for a good super-class partition by simulated annealing on that matrix;
     * (4) optionally refine the partition by internal validation (m_Iv iterations);
     * then train the base classifier on the full data under the chosen partition.
     */
    @Override
    public void buildClassifier(Instances D) throws Exception {

        int N = D.numInstances(); // only for printouts
        int U = MLUtils.numberOfUniqueCombinations(D); // only for printouts
        int L = D.classIndex();
        rand = new Random(m_S);

        if (!(m_Classifier instanceof MultiTargetClassifier)) {
            throw new Exception(
                    "[Error] The base classifier must be multi-target capable, i.e., from meka.classifiers.multitarget.");
        }

        // 0. SPLIT INTO TRAIN AND VALIDATION SET/S
        Instances D_r = new Instances(D);
        D_r.randomize(rand);
        Instances D_train = new Instances(D_r, 0, D_r.numInstances() * i_SPLIT / 100);
        Instances D_test = new Instances(D_r, D_train.numInstances(), D_r.numInstances() - D_train.numInstances());

        // 1. BUILD BR or EBR
        if (getDebug())
            System.out.print("1. BUILD & Evaluate BR: ");
        CR cr = new CR();
        cr.setClassifier(((ProblemTransformationMethod) m_Classifier).getClassifier()); // assume PT
        Result result_1 = Evaluation.evaluateModel((ProblemTransformationMethod) cr, D_train, D_test, "PCut1", "5");
        double acc1 = (Double) result_1.getMeasurement(i_ErrFn);
        if (getDebug())
            System.out.println(" " + acc1);

        // start from a random partition of the label indices 0..L-1
        int partition[][] = SuperLabelUtils.generatePartition(A.make_sequence(L), rand);

        // 2. SELECT / MODIFY INDICES (using LEAD technique)
        if (getDebug())
            System.out.println("2. GET ERR-CHI-SQUARED MATRIX: ");
        double MER[][] = StatUtils.condDepMatrix(D_test, result_1);
        if (getDebug())
            System.out.println(MatrixUtils.toString(MER));

        /*
         * 3. SIMULATED ANNEALING
         * Always accept if best, progressively less likely accept otherwise.
         */
        if (getDebug())
            System.out.println("3. COMBINE NODES TO FIND THE BEST COMBINATION ACCORDING TO CHI");
        double w = rating(partition, MER);
        if (getDebug())
            System.out.println("@0 : " + SuperLabelUtils.toString(partition) + "\t(" + w + ")");

        for (int i = 0; i < m_I; i++) {
            int partition_[][] = mutateCombinations(MatrixUtils.deep_copy(partition), rand);
            double w_ = rating(partition_, MER); // this is really p_MER(partition_)
            if (w_ > w) {
                // ACCEPT
                partition = partition_;
                w = w_;
                if (getDebug())
                    System.out.println("@" + i + " : " + SuperLabelUtils.toString(partition) + "\t(" + w + ")");
            } else {
                // MAYBE ACCEPT: probability shrinks with both the score gap and the
                // iteration count i (i.e., the 'temperature' cools over time)
                double diff = Math.abs(w_ - w);
                double p = (2. * (1. - sigma(diff * i / 1000.)));
                if (p > rand.nextDouble()) {
                    // OK, ACCEPT NOW
                    if (getDebug())
                        System.out.println(
                                "@" + i + " : " + SuperLabelUtils.toString(partition_) + "\t(" + w_ + ")*");
                    partition = partition_;
                    w = w_;
                }
            }

        }

        /*
         * METHOD 2
         * refine the set we started with above, with a few iterations.
         * we mutate a set, and accept whenever the classification performance is GREATER
         */
        if (m_Iv > 0) {
            if (getDebug())
                System.out.println("4. REFINING THE INITIAL SET WITH SOME OLD-FASHIONED INTERNAL EVAL");
            // Build & evaluate the classifier with the latest partition
            result_1 = testClassifier((ProblemTransformationMethod) m_Classifier, D_train, D_test, partition);
            w = (Double) result_1.getMeasurement(i_ErrFn);
            if (getDebug())
                System.out.println("@0 : " + SuperLabelUtils.toString(partition) + "\t(" + w + ")");
            for (int i = 0; i < m_Iv; i++) {
                int partition_[][] = mutateCombinations(MatrixUtils.deep_copy(partition), rand);
                // Build & evaluate the classifier with the mutated partition.
                // FIX: removed the redundant 'trainClassifier(m_Classifier, D_train, partition)'
                // call here -- it trained on the OLD partition and its model was immediately
                // discarded, because testClassifier() below already trains with partition_.
                Result result_2 = testClassifier((ProblemTransformationMethod) m_Classifier, D_train, D_test,
                        partition_);
                double w_ = (Double) result_2.getMeasurement(i_ErrFn);
                if (w_ > w) {
                    w = w_;
                    partition = partition_;
                    if (getDebug())
                        System.out.println(
                                "@" + (i + 1) + "' : " + SuperLabelUtils.toString(partition) + "\t(" + w + ")");
                }
            }
        }

        // 4. DECIDE HOW GOOD THEY ARE, COMPARE EACH LABEL TO BR-result?
        if (getDebug())
            System.out.println("4. TRAIN " + SuperLabelUtils.toString(partition));
        trainClassifier(m_Classifier, D, partition);

        if (getDebug()) {
            //System.out.println("E_acc P "+m_P+" "+(mt.m_InstancesTemplate.numInstances()/(double)N) +" "+(MLUtils.numberOfUniqueCombinations(mt.m_InstancesTemplate)/(double)U));
        }
        // 5. MOVE ON ...
    }

    /**
     * Classify instance x: map it into the super-class space, classify with the base
     * (multi-target) classifier, then decode each super-class prediction back into the
     * individual label values and confidences.
     *
     * @return array of length 2*L: [0,L) = predicted value index per label,
     *         [L,2L) = the corresponding confidence P(Y_j = v).
     */
    @Override
    public double[] distributionForInstance(Instance x) throws Exception {

        //return mt.distributionForInstance(x);
        int L = x.classIndex();
        double y[] = new double[L * 2];

        // Convert (x,y) to (x_,y_)
        int L_ = m_InstancesTemplate.classIndex(); // == L-NUM
        Instance x_ = MLUtils.setTemplate(x, f.getTemplate(), m_InstancesTemplate);

        // Get a classification y_ = h(x_)
        double y_[] = null;
        try {
            y_ = ((ProblemTransformationMethod) m_Classifier).distributionForInstance(x_);
        } catch (Exception e) {
            // best-effort: report and return the all-zero prediction rather than crash
            // (note: y_ is still null here, so the message always prints 'null')
            System.err.println("EXCEPTION !!! setting to " + Arrays.toString(y_));
            return y;
            //e.printStackTrace();
            //System.exit(1);
        }

        // For each super node ...
        for (int j = 0; j < L_; j++) {

            int idxs[] = SuperNodeFilter.decodeClasses(m_InstancesTemplate.attribute(j).name()); // 3,4   (partition)
            String vals[] = SuperNodeFilter
                    .decodeValue(m_InstancesTemplate.attribute(j).value((int) Math.round(y_[j]))); // 1,0   (classes)

            for (int i = 0; i < idxs.length; i++) {
                y[idxs[i]] = x.dataset().attribute(idxs[i]).indexOfValue(vals[i]); // y_j = v
                y[idxs[i] + L] = y_[j + L_]; // P(Y_j = v), hence, MUST be a multi-target classifier
            }
        }

        return y;
    }

    /** Set the number of simulated-annealing iterations. */
    public void setI(int i) {
        m_I = i;
    }

    /** Get the number of simulated-annealing iterations. */
    public int getI() {
        return m_I;
    }

    /** Set the number of internal-validation refinement iterations. */
    public void setIv(int v) {
        m_Iv = v;
    }

    /** Get the number of internal-validation refinement iterations. */
    public int getIv() {
        return m_Iv;
    }

    public static void main(String args[]) {
        ProblemTransformationMethod.evaluation(new SCC(), args);
    }

    /**
     * Sigmoid / Logistic function
     */
    public static final double sigma(double a) {
        return 1.0 / (1.0 + Math.exp(-a));
    }

    @Override
    public Enumeration listOptions() {
        Vector result = new Vector();
        result.addElement(new Option("\tSets the number of simulated annealing iterations\n\tdefault: 1000", "I", 1,
                "-I <value>"));
        result.addElement(new Option("\tSets the number of internal-validation iterations\n\tdefault: 0", "V", 1,
                "-V <value>"));
        OptionUtils.add(result, super.listOptions());
        return OptionUtils.toEnumeration(result);
    }

    @Override
    public void setOptions(String[] options) throws Exception {
        setI(OptionUtils.parse(options, 'I', 1000));
        setIv(OptionUtils.parse(options, 'V', 0));
        super.setOptions(options);
    }

    @Override
    public String[] getOptions() {
        List<String> result = new ArrayList<>();
        OptionUtils.add(result, 'I', getI());
        OptionUtils.add(result, 'V', getIv());
        OptionUtils.add(result, super.getOptions());
        return OptionUtils.toArray(result);
    }

}