org.pentaho.di.job.entries.addresultfilenames.JobEntryAddResultFilenames.java Source code


Introduction

Here is the source code for org.pentaho.di.job.entries.addresultfilenames.JobEntryAddResultFilenames.java. This class implements the 'add result filenames' job entry in Pentaho Data Integration (Kettle): it adds individual files, or the contents of folders filtered by a wildcard mask, to the result file list of the running job. A short usage sketch follows the listing.

Source

/*! ******************************************************************************
 *
 * Pentaho Data Integration
 *
 * Copyright (C) 2002-2013 by Pentaho : http://www.pentaho.com
 *
 *******************************************************************************
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 ******************************************************************************/

package org.pentaho.di.job.entries.addresultfilenames;

import static org.pentaho.di.job.entry.validator.AbstractFileValidator.putVariableSpace;
import static org.pentaho.di.job.entry.validator.AndValidator.putValidators;
import static org.pentaho.di.job.entry.validator.JobEntryValidatorUtils.andValidator;
import static org.pentaho.di.job.entry.validator.JobEntryValidatorUtils.fileExistsValidator;
import static org.pentaho.di.job.entry.validator.JobEntryValidatorUtils.notNullValidator;

import java.io.IOException;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import org.apache.commons.vfs.FileObject;
import org.apache.commons.vfs.FileSelectInfo;
import org.apache.commons.vfs.FileSelector;
import org.apache.commons.vfs.FileType;
import org.pentaho.di.cluster.SlaveServer;
import org.pentaho.di.core.CheckResultInterface;
import org.pentaho.di.core.Const;
import org.pentaho.di.core.Result;
import org.pentaho.di.core.ResultFile;
import org.pentaho.di.core.RowMetaAndData;
import org.pentaho.di.core.database.DatabaseMeta;
import org.pentaho.di.core.exception.KettleDatabaseException;
import org.pentaho.di.core.exception.KettleException;
import org.pentaho.di.core.exception.KettleXMLException;
import org.pentaho.di.core.variables.VariableSpace;
import org.pentaho.di.core.vfs.KettleVFS;
import org.pentaho.di.core.xml.XMLHandler;
import org.pentaho.di.i18n.BaseMessages;
import org.pentaho.di.job.Job;
import org.pentaho.di.job.JobMeta;
import org.pentaho.di.job.entry.JobEntryBase;
import org.pentaho.di.job.entry.JobEntryInterface;
import org.pentaho.di.job.entry.validator.ValidatorContext;
import org.pentaho.di.repository.ObjectId;
import org.pentaho.di.repository.Repository;
import org.pentaho.metastore.api.IMetaStore;
import org.w3c.dom.Node;

/**
 * This defines an 'add result filenames' job entry.
 *
 * @author Samatar Hassan
 * @since 06-05-2007
 */
public class JobEntryAddResultFilenames extends JobEntryBase implements Cloneable, JobEntryInterface {
    private static Class<?> PKG = JobEntryAddResultFilenames.class; // for i18n purposes, needed by Translator2!!

    public boolean argFromPrevious;

    public boolean deleteallbefore;

    public boolean includeSubfolders;

    public String[] arguments;

    public String[] filemasks;

    public JobEntryAddResultFilenames(String n) {
        super(n, "");
        argFromPrevious = false;
        deleteallbefore = false;
        arguments = null;

        includeSubfolders = false;
    }

    public JobEntryAddResultFilenames() {
        this("");
    }

    public Object clone() {
        JobEntryAddResultFilenames je = (JobEntryAddResultFilenames) super.clone();
        return je;
    }

    public String getXML() {
        StringBuffer retval = new StringBuffer(300);

        retval.append(super.getXML());
        retval.append("      ").append(XMLHandler.addTagValue("arg_from_previous", argFromPrevious));
        retval.append("      ").append(XMLHandler.addTagValue("include_subfolders", includeSubfolders));
        retval.append("      ").append(XMLHandler.addTagValue("delete_all_before", deleteallbefore));

        retval.append("      <fields>").append(Const.CR);
        if (arguments != null) {
            for (int i = 0; i < arguments.length; i++) {
                retval.append("        <field>").append(Const.CR);
                retval.append("          ").append(XMLHandler.addTagValue("name", arguments[i]));
                retval.append("          ").append(XMLHandler.addTagValue("filemask", filemasks[i]));
                retval.append("        </field>").append(Const.CR);
            }
        }
        retval.append("      </fields>").append(Const.CR);

        return retval.toString();
    }

    public void loadXML(Node entrynode, List<DatabaseMeta> databases, List<SlaveServer> slaveServers,
            Repository rep, IMetaStore metaStore) throws KettleXMLException {
        try {
            super.loadXML(entrynode, databases, slaveServers);
            argFromPrevious = "Y".equalsIgnoreCase(XMLHandler.getTagValue(entrynode, "arg_from_previous"));
            includeSubfolders = "Y".equalsIgnoreCase(XMLHandler.getTagValue(entrynode, "include_subfolders"));
            deleteallbefore = "Y".equalsIgnoreCase(XMLHandler.getTagValue(entrynode, "delete_all_before"));

            Node fields = XMLHandler.getSubNode(entrynode, "fields");

            // How many field arguments?
            int nrFields = XMLHandler.countNodes(fields, "field");
            arguments = new String[nrFields];
            filemasks = new String[nrFields];

            // Read them all...
            for (int i = 0; i < nrFields; i++) {
                Node fnode = XMLHandler.getSubNodeByNr(fields, "field", i);

                arguments[i] = XMLHandler.getTagValue(fnode, "name");
                filemasks[i] = XMLHandler.getTagValue(fnode, "filemask");
            }
        } catch (KettleXMLException xe) {
            throw new KettleXMLException(
                    BaseMessages.getString(PKG, "JobEntryAddResultFilenames.UnableToLoadFromXml"), xe);
        }
    }

    public void loadRep(Repository rep, IMetaStore metaStore, ObjectId id_jobentry, List<DatabaseMeta> databases,
            List<SlaveServer> slaveServers) throws KettleException {
        try {
            argFromPrevious = rep.getJobEntryAttributeBoolean(id_jobentry, "arg_from_previous");
            includeSubfolders = rep.getJobEntryAttributeBoolean(id_jobentry, "include_subfolders");

            deleteallbefore = rep.getJobEntryAttributeBoolean(id_jobentry, "delete_all_before");

            // How many arguments?
            int argnr = rep.countNrJobEntryAttributes(id_jobentry, "name");
            arguments = new String[argnr];
            filemasks = new String[argnr];

            // Read them all...
            for (int a = 0; a < argnr; a++) {
                arguments[a] = rep.getJobEntryAttributeString(id_jobentry, a, "name");
                filemasks[a] = rep.getJobEntryAttributeString(id_jobentry, a, "filemask");
            }
        } catch (KettleException dbe) {
            throw new KettleException(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.UnableToLoadFromRepo",
                    String.valueOf(id_jobentry)), dbe);
        }
    }

    public void saveRep(Repository rep, IMetaStore metaStore, ObjectId id_job) throws KettleException {
        try {
            rep.saveJobEntryAttribute(id_job, getObjectId(), "arg_from_previous", argFromPrevious);
            rep.saveJobEntryAttribute(id_job, getObjectId(), "include_subfolders", includeSubfolders);
            rep.saveJobEntryAttribute(id_job, getObjectId(), "delete_all_before", deleteallbefore);

            // save the arguments...
            if (arguments != null) {
                for (int i = 0; i < arguments.length; i++) {
                    rep.saveJobEntryAttribute(id_job, getObjectId(), i, "name", arguments[i]);
                    rep.saveJobEntryAttribute(id_job, getObjectId(), i, "filemask", filemasks[i]);
                }
            }
        } catch (KettleDatabaseException dbe) {
            throw new KettleException(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.UnableToSaveToRepo",
                    String.valueOf(id_job)), dbe);
        }
    }

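    /**
     * Executes the job entry: optionally clears the current result file list, then adds the
     * configured file/folder and wildcard pairs (or the pairs coming from the previous result
     * rows) to the result file list of the parent job. Any entry that cannot be processed is
     * counted as an error and the result is flagged as failed.
     */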
    public Result execute(Result result, int nr) throws KettleException {
        List<RowMetaAndData> rows = result.getRows();
        RowMetaAndData resultRow = null;

        int nrErrFiles = 0;
        result.setResult(true);

        if (deleteallbefore) {
            // clear result filenames
            int size = result.getResultFiles().size();
            if (log.isBasic()) {
                logBasic(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.log.FilesFound", "" + size));
            }

            result.getResultFiles().clear();
            if (log.isDetailed()) {
                logDetailed(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.log.DeletedFiles", "" + size));
            }
        }

        if (argFromPrevious) {
            if (log.isDetailed()) {
                logDetailed(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.FoundPreviousRows",
                        String.valueOf((rows != null ? rows.size() : 0))));
            }
        }

        if (argFromPrevious && rows != null) // Copy the input row to the (command line) arguments
        {
            for (int iteration = 0; iteration < rows.size() && !parentJob.isStopped(); iteration++) {
                resultRow = rows.get(iteration);

                // Get values from previous result
                String filefolder_previous = resultRow.getString(0, null);
                String fmasks_previous = resultRow.getString(1, null);

                // ok we can process this file/folder
                if (log.isDetailed()) {
                    logDetailed(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.ProcessingRow",
                            filefolder_previous, fmasks_previous));
                }

                if (!processFile(filefolder_previous, fmasks_previous, parentJob, result)) {
                    nrErrFiles++;
                }

            }
        } else if (arguments != null) {

            for (int i = 0; i < arguments.length && !parentJob.isStopped(); i++) {

                // ok we can process this file/folder
                if (log.isDetailed()) {
                    logDetailed(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.ProcessingArg",
                            arguments[i], filemasks[i]));
                }
                if (!processFile(arguments[i], filemasks[i], parentJob, result)) {
                    nrErrFiles++;
                }
            }
        }

        if (nrErrFiles > 0) {
            result.setResult(false);
            result.setNrErrors(nrErrFiles);
        }

        return result;
    }

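    /**
     * Adds a single file, or the contents of a folder filtered by the given wildcard
     * (a java.util.regex pattern), to the result file list. Returns false if the
     * file/folder does not exist or cannot be processed.
     */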
    private boolean processFile(String filename, String wildcard, Job parentJob, Result result) {

        boolean rcode = true;
        FileObject filefolder = null;
        String realFilefoldername = environmentSubstitute(filename);
        String realwildcard = environmentSubstitute(wildcard);

        try {
            filefolder = KettleVFS.getFileObject(realFilefoldername, this);

            if (filefolder.exists()) {
                // the file or folder exists

                if (filefolder.getType() == FileType.FILE) {
                    // Add filename to Resultfilenames ...
                    if (log.isDetailed()) {
                        logDetailed(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.AddingFileToResult",
                                filefolder.toString()));
                    }
                    ResultFile resultFile = new ResultFile(ResultFile.FILE_TYPE_GENERAL,
                            KettleVFS.getFileObject(filefolder.toString(), this), parentJob.getJobname(),
                            toString());
                    result.getResultFiles().put(resultFile.getFile().toString(), resultFile);
                } else {
                    FileObject[] list = filefolder
                            .findFiles(new TextFileSelector(filefolder.toString(), realwildcard));

                    for (int i = 0; i < list.length && !parentJob.isStopped(); i++) {
                        // Add filename to Resultfilenames ...
                        if (log.isDetailed()) {
                            logDetailed(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.AddingFileToResult",
                                    list[i].toString()));
                        }
                        ResultFile resultFile = new ResultFile(ResultFile.FILE_TYPE_GENERAL,
                                KettleVFS.getFileObject(list[i].toString(), this), parentJob.getJobname(),
                                toString());
                        result.getResultFiles().put(resultFile.getFile().toString(), resultFile);
                    }
                }

            } else {
                // File can not be found
                if (log.isBasic()) {
                    logBasic(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.FileCanNotbeFound",
                            realFilefoldername));
                }
                rcode = false;
            }
        } catch (Exception e) {
            rcode = false;
            logError(BaseMessages.getString(PKG, "JobEntryAddResultFilenames.CouldNotProcess", realFilefoldername,
                    e.getMessage()), e);
        } finally {
            if (filefolder != null) {
                try {
                    filefolder.close();
                    filefolder = null;
                } catch (IOException ex) {
                    // Ignore
                }
            }
        }

        return rcode;
    }

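    /**
     * VFS file selector that accepts regular files whose base name matches the configured
     * wildcard (a regular expression); files located in subfolders are only accepted when
     * includeSubfolders is set.
     */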
    private class TextFileSelector implements FileSelector {
        String fileWildcard = null;
        String sourceFolder = null;

        public TextFileSelector(String sourcefolderin, String filewildcard) {
            if (!Const.isEmpty(sourcefolderin)) {
                sourceFolder = sourcefolderin;
            }

            if (!Const.isEmpty(filewildcard)) {
                fileWildcard = filewildcard;
            }
        }

        public boolean includeFile(FileSelectInfo info) {
            boolean returncode = false;
            try {
                if (!info.getFile().toString().equals(sourceFolder)) {
                    // Pass over the Base folder itself
                    String short_filename = info.getFile().getName().getBaseName();

                    if (info.getFile().getParent().equals(info.getBaseFolder())
                            || (!info.getFile().getParent().equals(info.getBaseFolder()) && includeSubfolders)) {
                        if ((info.getFile().getType() == FileType.FILE && fileWildcard == null)
                                || (info.getFile().getType() == FileType.FILE && fileWildcard != null
                                        && GetFileWildcard(short_filename, fileWildcard))) {
                            returncode = true;
                        }
                    }
                }
            } catch (Exception e) {
                logError("Error while finding files ... in [" + info.getFile().toString() + "]. Exception :"
                        + e.getMessage());
                returncode = false;
            }
            return returncode;
        }

        public boolean traverseDescendents(FileSelectInfo info) {
            return true;
        }
    }

    /**
     * @param selectedfile
     * @param wildcard
     * @return True if the selectedfile matches the wildcard
     */
    private boolean GetFileWildcard(String selectedfile, String wildcard) {
        Pattern pattern = null;
        boolean getIt = true;

        if (!Const.isEmpty(wildcard)) {
            pattern = Pattern.compile(wildcard);
            // First see if the file matches the regular expression!
            if (pattern != null) {
                Matcher matcher = pattern.matcher(selectedfile);
                getIt = matcher.matches();
            }
        }

        return getIt;
    }

    public void setIncludeSubfolders(boolean includeSubfolders) {
        this.includeSubfolders = includeSubfolders;
    }

    public void setArgumentsPrevious(boolean argFromPrevious) {
        this.argFromPrevious = argFromPrevious;
    }

    public void setDeleteAllBefore(boolean deleteallbefore) {
        this.deleteallbefore = deleteallbefore;
    }

    public boolean evaluates() {
        return true;
    }

    public boolean isArgFromPrevious() {
        return argFromPrevious;
    }

    public boolean deleteAllBefore() {
        return deleteallbefore;
    }

    public String[] getArguments() {
        return arguments;
    }

    public String[] getFilemasks() {
        return filemasks;
    }

    public boolean isIncludeSubfolders() {
        return includeSubfolders;
    }

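    /**
     * Design-time validation: checks that the arguments array is not null and that each
     * configured file/folder exists (after variable substitution).
     */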
    public void check(List<CheckResultInterface> remarks, JobMeta jobMeta, VariableSpace space,
            Repository repository, IMetaStore metaStore) {
        boolean res = andValidator().validate(this, "arguments", remarks, putValidators(notNullValidator()));

        if (res == false) {
            return;
        }

        ValidatorContext ctx = new ValidatorContext();
        putVariableSpace(ctx, getVariables());
        putValidators(ctx, notNullValidator(), fileExistsValidator());

        for (int i = 0; i < arguments.length; i++) {
            andValidator().validate(this, "arguments[" + i + "]", remarks, ctx);
        }
    }

}
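
Usage example

A minimal sketch of how this job entry might be configured in code and serialized to XML. It only uses the constructor, public fields, and setters shown in the listing above; the file path and mask are placeholder values, and the KettleEnvironment.init() call is an assumption about how the surrounding PDI runtime is bootstrapped, not something this class requires by itself.

import org.pentaho.di.core.KettleEnvironment;
import org.pentaho.di.job.entries.addresultfilenames.JobEntryAddResultFilenames;

public class AddResultFilenamesExample {

    public static void main(String[] args) throws Exception {
        // Assumption: initialize the Kettle environment (VFS, logging, plugins).
        KettleEnvironment.init();

        JobEntryAddResultFilenames entry = new JobEntryAddResultFilenames("Add files to result");

        // One folder plus a regular-expression file mask (placeholder values).
        entry.arguments = new String[] { "/tmp/output" };
        entry.filemasks = new String[] { ".*\\.csv" };

        entry.setIncludeSubfolders(true);   // also pick up matching files in subfolders
        entry.setDeleteAllBefore(false);    // keep result files added by earlier entries
        entry.setArgumentsPrevious(false);  // use the fields above, not rows from a previous entry

        // Serialize the configuration as it would be stored inside a .kjb job file.
        System.out.println(entry.getXML());
    }
}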