org.pentaho.di.trans.steps.multimerge.MultiMergeJoinMeta.java Source code

Java tutorial

Introduction

Here is the source code for org.pentaho.di.trans.steps.multimerge.MultiMergeJoinMeta.java

Source

/*! ******************************************************************************
 *
 * Pentaho Data Integration
 *
 * Copyright (C) 2002-2016 by Pentaho : http://www.pentaho.com
 *
 *******************************************************************************
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 ******************************************************************************/

package org.pentaho.di.trans.steps.multimerge;

import java.util.List;

import org.apache.commons.lang.ArrayUtils;
import org.pentaho.di.core.CheckResult;
import org.pentaho.di.core.CheckResultInterface;
import org.pentaho.di.core.Const;
import org.pentaho.di.core.database.DatabaseMeta;
import org.pentaho.di.core.exception.KettleException;
import org.pentaho.di.core.exception.KettleStepException;
import org.pentaho.di.core.exception.KettleXMLException;
import org.pentaho.di.core.injection.Injection;
import org.pentaho.di.core.injection.InjectionSupported;
import org.pentaho.di.core.row.RowMetaInterface;
import org.pentaho.di.core.variables.VariableSpace;
import org.pentaho.di.core.xml.XMLHandler;
import org.pentaho.di.i18n.BaseMessages;
import org.pentaho.di.repository.ObjectId;
import org.pentaho.di.repository.Repository;
import org.pentaho.di.trans.Trans;
import org.pentaho.di.trans.TransMeta;
import org.pentaho.di.trans.step.BaseStepMeta;
import org.pentaho.di.trans.step.StepDataInterface;
import org.pentaho.di.trans.step.StepInterface;
import org.pentaho.di.trans.step.StepMeta;
import org.pentaho.di.trans.step.StepMetaInterface;
import org.pentaho.di.trans.step.errorhandling.Stream;
import org.pentaho.di.trans.step.errorhandling.StreamIcon;
import org.pentaho.di.trans.step.errorhandling.StreamInterface.StreamType;
import org.pentaho.metastore.api.IMetaStore;
import org.w3c.dom.Node;

/**
 * Step metadata for the multi-way merge join step.
 *
 * <p>Holds the join type, the names of the input steps and, per input step, a comma separated
 * list of key fields. The class knows how to persist this configuration to and from XML and a
 * repository, and how to register one info stream per configured input step.
 *
 * <p>{@link #keyFields} and {@link #inputSteps} may be {@code null} (for example before
 * {@link #setDefault()} has run or after a setter was called with {@code null}); the
 * serialization, cloning and stream lookup methods treat {@code null} as an empty array.
 *
 * @author Biswapesh
 * @since 24-nov-2006
 */
@InjectionSupported(localizationPrefix = "MultiMergeJoin.Injection.")
public class MultiMergeJoinMeta extends BaseStepMeta implements StepMetaInterface {
    private static Class<?> PKG = MultiMergeJoinMeta.class; // for i18n purposes, needed by Translator2!!

    /** The join types offered by this step; index 0 is used as the default in {@link #setDefault()}. */
    public static final String[] join_types = { "INNER", "FULL OUTER" };

    /** Flags declared in the same order as {@link #join_types}; not read anywhere inside this class. */
    public static final boolean[] optionals = { false, true };

    /** The selected join type, normally one of {@link #join_types}. */
    @Injection(name = "JOIN_TYPE")
    private String joinType;

    /**
     * comma separated key values for each stream
     */
    @Injection(name = "KEY_FIELDS")
    private String[] keyFields;

    /**
     * input stream names
     */
    @Injection(name = "INPUT_STEPS")
    private String[] inputSteps;

    /**
     * The join types offered by this step are listed in {@link #join_types} (INNER and FULL OUTER).
     *
     * @return The type of join
     */
    public String getJoinType() {
        return joinType;
    }

    /**
     * Sets the type of join
     *
     * @param joinType
     *          The type of join, e.g. INNER/FULL OUTER
     */
    public void setJoinType(String joinType) {
        this.joinType = joinType;
    }

    /**
     * @return Returns the key fields; one entry per input stream, each a comma separated list of field names.
     *         The internal array is returned as-is (no copy) and may be {@code null}.
     */
    public String[] getKeyFields() {
        return keyFields;
    }

    /**
     * @param keyFields
     *          The key fields to set. The array is stored as-is (no copy).
     */
    public void setKeyFields(String[] keyFields) {
        this.keyFields = keyFields;
    }

    /**
     * @return always {@code true}
     */
    @Override
    public boolean excludeFromRowLayoutVerification() {
        return true;
    }

    /**
     * Creates an empty metadata object; fields are left unset until {@link #setDefault()},
     * {@link #loadXML(Node, List, IMetaStore)} or {@link #readRep(Repository, IMetaStore, ObjectId, List)} is called.
     */
    public MultiMergeJoinMeta() {
        super(); // allocate BaseStepMeta
    }

    /**
     * Loads the step configuration from the given XML node.
     *
     * @param stepnode
     *          the XML node holding the step settings
     * @param databases
     *          not used by this step
     * @param metaStore
     *          not used by this step
     * @throws KettleXMLException
     *           if the settings cannot be read from the node
     */
    @Override
    public void loadXML(Node stepnode, List<DatabaseMeta> databases, IMetaStore metaStore)
            throws KettleXMLException {
        readData(stepnode);
    }

    /**
     * Replaces the key fields array with a new, empty-valued array of the given size.
     *
     * @param nrKeys
     *          the number of key field entries to allocate
     */
    public void allocateKeys(int nrKeys) {
        keyFields = new String[nrKeys];
    }

    /**
     * Creates a copy of this metadata whose key field and input step arrays are independent of
     * the originals. A {@code null} array in this object becomes an empty array in the copy.
     *
     * @return the cloned metadata
     */
    @Override
    public Object clone() {
        MultiMergeJoinMeta retval = (MultiMergeJoinMeta) super.clone();
        int nrKeys = keyFields == null ? 0 : keyFields.length;
        int nrSteps = inputSteps == null ? 0 : inputSteps.length;
        // Give the clone its own arrays; super.clone() only copied the references.
        retval.allocateKeys(nrKeys);
        retval.allocateInputSteps(nrSteps);
        // System.arraycopy throws NullPointerException on a null source even for length 0,
        // so only copy when there is something to copy from.
        if (keyFields != null) {
            System.arraycopy(keyFields, 0, retval.keyFields, 0, nrKeys);
        }
        if (inputSteps != null) {
            System.arraycopy(inputSteps, 0, retval.inputSteps, 0, nrSteps);
        }
        return retval;
    }

    /**
     * Serializes the step configuration to XML: the join type, one {@code step<i>} tag per input
     * step, the number of input steps and a {@code keys} element containing one {@code key} tag
     * per key field entry. {@code null} arrays are written as if they were empty.
     *
     * @return the XML fragment describing this step
     */
    @Override
    public String getXML() {
        StringBuilder retval = new StringBuilder();

        String[] inputStepsNames = inputSteps != null ? inputSteps : ArrayUtils.EMPTY_STRING_ARRAY;
        // Same null-tolerance for the keys as for the input steps.
        String[] keys = keyFields != null ? keyFields : ArrayUtils.EMPTY_STRING_ARRAY;

        retval.append("    ").append(XMLHandler.addTagValue("join_type", getJoinType()));
        for (int i = 0; i < inputStepsNames.length; i++) {
            retval.append("    ").append(XMLHandler.addTagValue("step" + i, inputStepsNames[i]));
        }

        retval.append("    ").append(XMLHandler.addTagValue("number_input", inputStepsNames.length));
        retval.append("    ").append(XMLHandler.openTag("keys")).append(Const.CR);
        for (int i = 0; i < keys.length; i++) {
            retval.append("      ").append(XMLHandler.addTagValue("key", keys[i]));
        }
        retval.append("    ").append(XMLHandler.closeTag("keys")).append(Const.CR);

        return retval.toString();
    }

    /**
     * Reads the key fields, the input step names and the join type from the given XML node.
     *
     * @param stepnode
     *          the XML node holding the step settings
     * @throws KettleXMLException
     *           if anything goes wrong while reading, e.g. a missing or non-numeric
     *           {@code number_input} tag; the original exception is kept as the cause
     */
    private void readData(Node stepnode) throws KettleXMLException {
        try {

            Node keysNode = XMLHandler.getSubNode(stepnode, "keys");

            int nrKeys = XMLHandler.countNodes(keysNode, "key");

            allocateKeys(nrKeys);

            for (int i = 0; i < nrKeys; i++) {
                Node keynode = XMLHandler.getSubNodeByNr(keysNode, "key", i);
                keyFields[i] = XMLHandler.getNodeValue(keynode);
            }

            int nInputStreams = Integer.parseInt(XMLHandler.getTagValue(stepnode, "number_input"));

            allocateInputSteps(nInputStreams);

            for (int i = 0; i < nInputStreams; i++) {
                inputSteps[i] = XMLHandler.getTagValue(stepnode, "step" + i);
            }

            joinType = XMLHandler.getTagValue(stepnode, "join_type");
        } catch (Exception e) {
            throw new KettleXMLException(
                    BaseMessages.getString(PKG, "MultiMergeJoinMeta.Exception.UnableToLoadStepInfo"), e);
        }
    }

    /**
     * Resets the step to its defaults: the first entry of {@link #join_types}, no key fields and
     * no input steps.
     */
    @Override
    public void setDefault() {
        joinType = join_types[0];
        allocateKeys(0);
        allocateInputSteps(0);
    }

    /**
     * Reads the step configuration from a repository.
     *
     * @param rep
     *          the repository to read from
     * @param metaStore
     *          not used by this step
     * @param id_step
     *          the id of the step whose attributes are read
     * @param databases
     *          not used by this step
     * @throws KettleException
     *           if any attribute cannot be read; the original exception is kept as the cause
     */
    @Override
    public void readRep(Repository rep, IMetaStore metaStore, ObjectId id_step, List<DatabaseMeta> databases)
            throws KettleException {
        try {
            int nrKeys = rep.countNrStepAttributes(id_step, "keys");

            allocateKeys(nrKeys);

            for (int i = 0; i < nrKeys; i++) {
                keyFields[i] = rep.getStepAttributeString(id_step, i, "keys");
            }

            long nInputStreams = rep.getStepAttributeInteger(id_step, "number_input");

            allocateInputSteps((int) nInputStreams);

            for (int i = 0; i < nInputStreams; i++) {
                inputSteps[i] = rep.getStepAttributeString(id_step, "step" + i);
            }
            // This next bit is completely unnecessary if you just pass the step name into
            // the Stream constructor (see searchInfoAndTargetSteps). That sets the subject to
            // the step name in one pass instead of a second one.
            // MB - 5/2016
            //
            // List<StreamInterface> infoStreams = getStepIOMeta().getInfoStreams();
            // for ( int i = 0; i < infoStreams.size(); i++ ) {
            //   infoStreams.get( i ).setSubject( rep.getStepAttributeString( id_step, "step" + i ) );
            // }

            joinType = rep.getStepAttributeString(id_step, "join_type");
        } catch (Exception e) {
            throw new KettleException(
                    BaseMessages.getString(PKG, "MultiMergeJoinMeta.Exception.UnexpectedErrorReadingStepInfo"), e);
        }
    }

    /**
     * Rebuilds the info streams of this step: the existing info streams are cleared and one INFO
     * stream is added per configured input step, resolved by name against the given steps.
     * When no input steps are configured ({@code null} or empty) the info streams are just cleared.
     *
     * @param steps
     *          the steps in which the input step names are looked up
     */
    @Override
    public void searchInfoAndTargetSteps(List<StepMeta> steps) {
        getStepIOMeta().getInfoStreams().clear();
        if (inputSteps == null) {
            // Nothing configured: leave the (now empty) info stream list as is.
            return;
        }
        for (int i = 0; i < inputSteps.length; i++) {
            String inputStepName = inputSteps[i];
            if (i >= getStepIOMeta().getInfoStreams().size()) {
                // The step name is also passed as the stream subject, so no second pass is needed.
                getStepIOMeta().addStream(new Stream(StreamType.INFO, StepMeta.findStep(steps, inputStepName),
                        BaseMessages.getString(PKG, "MultiMergeJoin.InfoStream.Description"), StreamIcon.INFO,
                        inputStepName));
            }
        }
    }

    /**
     * Saves the step configuration to a repository, using the same attribute names that
     * {@link #readRep(Repository, IMetaStore, ObjectId, List)} reads. {@code null} arrays are
     * saved as if they were empty.
     *
     * @param rep
     *          the repository to write to
     * @param metaStore
     *          not used by this step
     * @param id_transformation
     *          the id of the transformation the step belongs to
     * @param id_step
     *          the id of the step being saved
     * @throws KettleException
     *           if any attribute cannot be saved; the original exception is kept as the cause
     */
    @Override
    public void saveRep(Repository rep, IMetaStore metaStore, ObjectId id_transformation, ObjectId id_step)
            throws KettleException {
        try {
            // Same null-tolerance for the keys as for the input steps below.
            String[] keys = keyFields != null ? keyFields : ArrayUtils.EMPTY_STRING_ARRAY;
            for (int i = 0; i < keys.length; i++) {
                rep.saveStepAttribute(id_transformation, id_step, i, "keys", keys[i]);
            }

            String[] inputStepsNames = inputSteps != null ? inputSteps : ArrayUtils.EMPTY_STRING_ARRAY;
            rep.saveStepAttribute(id_transformation, id_step, "number_input", inputStepsNames.length);
            for (int i = 0; i < inputStepsNames.length; i++) {
                rep.saveStepAttribute(id_transformation, id_step, "step" + i, inputStepsNames[i]);
            }
            //      The following was the old way of persisting this step to the repository. This was inconsistent with
            //      how getXML works, and also fails the load/save tester
            //      List<StreamInterface> infoStreams = getStepIOMeta().getInfoStreams();
            //      rep.saveStepAttribute( id_transformation, id_step, "number_input", infoStreams.size() );
            //      for ( int i = 0; i < infoStreams.size(); i++ ) {
            //        rep.saveStepAttribute( id_transformation, id_step, "step" + i, infoStreams.get( i ).getStepname() );
            //      }
            rep.saveStepAttribute(id_transformation, id_step, "join_type", getJoinType());
        } catch (Exception e) {
            throw new KettleException(
                    BaseMessages.getString(PKG, "MultiMergeJoinMeta.Exception.UnableToSaveStepInfo") + id_step, e);
        }
    }

    /**
     * Adds a single warning remark stating that this step is not verified. No actual validation
     * of the configuration is performed; only {@code remarks} and {@code stepMeta} are used.
     *
     * @param remarks
     *          the list the warning is appended to
     * @param stepMeta
     *          the step the warning is attached to
     */
    @Override
    public void check(List<CheckResultInterface> remarks, TransMeta transMeta, StepMeta stepMeta,
            RowMetaInterface prev, String[] input, String[] output, RowMetaInterface info, VariableSpace space,
            Repository repository, IMetaStore metaStore) {
        /*
         * TODO Need to check for the following: 1) Join type must be one of the entries of join_types
         * 2) The number of input streams is valid (the original note required exactly two, which looks
         * stale for a multi-way join - confirm) 3) The field names of input streams must be unique
         */
        CheckResult cr = new CheckResult(CheckResultInterface.TYPE_RESULT_WARNING,
                BaseMessages.getString(PKG, "MultiMergeJoinMeta.CheckResult.StepNotVerified"), stepMeta);
        remarks.add(cr);
    }

    /**
     * Builds the output row layout by merging every non-null info row layout into {@code r} and
     * then marking every field in {@code r} as originating from this step.
     *
     * @param r
     *          the row layout to extend; modified in place
     * @param name
     *          the origin name set on every field of {@code r}
     * @param info
     *          the row layouts of the info streams; may be {@code null} and may contain {@code null} entries
     * @throws KettleStepException
     *           declared by the interface; not thrown directly by this implementation
     */
    @Override
    public void getFields(RowMetaInterface r, String name, RowMetaInterface[] info, StepMeta nextStep,
            VariableSpace space, Repository repository, IMetaStore metaStore) throws KettleStepException {
        // We don't have any input fields here in "r" as they are all info fields.
        // So we just merge in the info fields.
        //
        if (info != null) {
            for (int i = 0; i < info.length; i++) {
                if (info[i] != null) {
                    r.mergeRowMeta(info[i]);
                }
            }
        }

        for (int i = 0; i < r.size(); i++) {
            r.getValueMeta(i).setOrigin(name);
        }
    }

    /**
     * @return a new {@link MultiMergeJoin} step instance built from the given arguments
     */
    @Override
    public StepInterface getStep(StepMeta stepMeta, StepDataInterface stepDataInterface, int cnr, TransMeta tr,
            Trans trans) {
        return new MultiMergeJoin(stepMeta, stepDataInterface, cnr, tr, trans);
    }

    /**
     * @return a new, empty {@link MultiMergeJoinData} instance
     */
    @Override
    public StepDataInterface getStepData() {
        return new MultiMergeJoinData();
    }

    /**
     * Intentionally does nothing, so the info streams registered by
     * {@link #searchInfoAndTargetSteps(List)} are kept.
     */
    @Override
    public void resetStepIoMeta() {
        // Don't reset!
    }

    /**
     * @param inputSteps
     *          The input step names to set. The array is stored as-is (no copy).
     */
    public void setInputSteps(String[] inputSteps) {
        this.inputSteps = inputSteps;
    }

    /**
     * @return Returns the input step names. The internal array is returned as-is (no copy) and may be {@code null}.
     */
    public String[] getInputSteps() {
        return inputSteps;
    }

    /**
     * Replaces the input steps array with a new, empty-valued array of the given size.
     *
     * @param count
     *          the number of input step entries to allocate
     */
    public void allocateInputSteps(int count) {
        inputSteps = new String[count];
    }
}