org.pentaho.di.trans.steps.processfiles.ProcessFiles.java Source code

Java tutorial

Introduction

Here is the source code for org.pentaho.di.trans.steps.processfiles.ProcessFiles.java

Source

/*! ******************************************************************************
 *
 * Pentaho Data Integration
 *
 * Copyright (C) 2002-2013 by Pentaho : http://www.pentaho.com
 *
 *******************************************************************************
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 ******************************************************************************/

package org.pentaho.di.trans.steps.processfiles;

import org.apache.commons.vfs.FileObject;
import org.apache.commons.vfs.FileSelectInfo;
import org.apache.commons.vfs.FileSelector;
import org.apache.commons.vfs.FileType;
import org.pentaho.di.core.Const;
import org.pentaho.di.core.ResultFile;
import org.pentaho.di.core.exception.KettleException;
import org.pentaho.di.core.vfs.KettleVFS;
import org.pentaho.di.i18n.BaseMessages;
import org.pentaho.di.trans.Trans;
import org.pentaho.di.trans.TransMeta;
import org.pentaho.di.trans.step.BaseStep;
import org.pentaho.di.trans.step.StepDataInterface;
import org.pentaho.di.trans.step.StepInterface;
import org.pentaho.di.trans.step.StepMeta;
import org.pentaho.di.trans.step.StepMetaInterface;

/**
 * Copy, move or delete file *
 *
 * @author Samatar
 * @since 03-Juin-2008
 *
 */

public class ProcessFiles extends BaseStep implements StepInterface {
    private static Class<?> PKG = ProcessFilesMeta.class; // for i18n purposes, needed by Translator2!!

    private ProcessFilesMeta meta;
    private ProcessFilesData data;

    public ProcessFiles(StepMeta stepMeta, StepDataInterface stepDataInterface, int copyNr, TransMeta transMeta,
            Trans trans) {
        super(stepMeta, stepDataInterface, copyNr, transMeta, trans);
    }

    public boolean processRow(StepMetaInterface smi, StepDataInterface sdi) throws KettleException {
        meta = (ProcessFilesMeta) smi;
        data = (ProcessFilesData) sdi;

        Object[] r = getRow(); // Get row from input rowset & set row busy!
        if (r == null) { // no more input to be expected...

            setOutputDone();
            return false;
        }
        if (first) {
            first = false;
            // Check is source filename field is provided
            if (Const.isEmpty(meta.getDynamicSourceFileNameField())) {
                throw new KettleException(
                        BaseMessages.getString(PKG, "ProcessFiles.Error.SourceFilenameFieldMissing"));
            }
            // Check is target filename field is provided
            if (meta.getOperationType() != ProcessFilesMeta.OPERATION_TYPE_DELETE
                    && Const.isEmpty(meta.getDynamicTargetFileNameField())) {
                throw new KettleException(
                        BaseMessages.getString(PKG, "ProcessFiles.Error.TargetFilenameFieldMissing"));
            }

            // cache the position of the source filename field
            if (data.indexOfSourceFilename < 0) {
                data.indexOfSourceFilename = getInputRowMeta().indexOfValue(meta.getDynamicSourceFileNameField());
                if (data.indexOfSourceFilename < 0) {
                    // The field is unreachable !
                    throw new KettleException(BaseMessages.getString(PKG,
                            "ProcessFiles.Exception.CouldnotFindField", meta.getDynamicSourceFileNameField()));
                }
            }
            // cache the position of the source filename field
            if (meta.getOperationType() != ProcessFilesMeta.OPERATION_TYPE_DELETE
                    && data.indexOfTargetFilename < 0) {
                data.indexOfTargetFilename = getInputRowMeta().indexOfValue(meta.getDynamicTargetFileNameField());
                if (data.indexOfTargetFilename < 0) {
                    // The field is unreachable !
                    throw new KettleException(BaseMessages.getString(PKG,
                            "ProcessFiles.Exception.CouldnotFindField", meta.getDynamicTargetFileNameField()));
                }
            }

            if (meta.simulate) {
                if (log.isBasic()) {
                    logBasic(BaseMessages.getString(PKG, "ProcessFiles.Log.SimulationModeON"));
                }
            }
        } // End If first
        try {
            // get source filename
            String sourceFilename = getInputRowMeta().getString(r, data.indexOfSourceFilename);

            if (Const.isEmpty(sourceFilename)) {
                logError(BaseMessages.getString(PKG, "ProcessFiles.Error.SourceFileEmpty"));
                throw new KettleException(BaseMessages.getString(PKG, "ProcessFiles.Error.SourceFileEmpty"));
            }
            data.sourceFile = KettleVFS.getFileObject(sourceFilename, getTransMeta());

            if (!data.sourceFile.exists()) {
                logError(BaseMessages.getString(PKG, "ProcessFiles.Error.SourceFileNotExist", sourceFilename));
                throw new KettleException(
                        BaseMessages.getString(PKG, "ProcessFiles.Error.SourceFileNotExist", sourceFilename));
            }
            if (data.sourceFile.getType() != FileType.FILE) {
                logError(BaseMessages.getString(PKG, "ProcessFiles.Error.SourceFileNotFile", sourceFilename));
                throw new KettleException(
                        BaseMessages.getString(PKG, "ProcessFiles.Error.SourceFileNotFile", sourceFilename));
            }
            String targetFilename = null;
            if (meta.getOperationType() != ProcessFilesMeta.OPERATION_TYPE_DELETE) {
                // get value for target filename
                targetFilename = getInputRowMeta().getString(r, data.indexOfTargetFilename);

                if (Const.isEmpty(targetFilename)) {
                    logError(BaseMessages.getString(PKG, "ProcessFiles.Error.TargetFileEmpty"));
                    throw new KettleException(BaseMessages.getString(PKG, "ProcessFiles.Error.TargetFileEmpty"));
                }
                data.targetFile = KettleVFS.getFileObject(targetFilename, getTransMeta());
                if (data.targetFile.exists()) {
                    if (log.isDetailed()) {
                        logDetailed(
                                BaseMessages.getString(PKG, "ProcessFiles.Log.TargetFileExists", targetFilename));
                    }
                    // check if target is really a file otherwise it could overwrite a complete folder by copy or move operations
                    if (data.targetFile.getType() != FileType.FILE) {
                        logError(BaseMessages.getString(PKG, "ProcessFiles.Error.TargetFileNotFile",
                                targetFilename));
                        throw new KettleException(BaseMessages.getString(PKG,
                                "ProcessFiles.Error.TargetFileNotFile", targetFilename));
                    }

                } else {
                    // let's check parent folder
                    FileObject parentFolder = data.targetFile.getParent();
                    if (!parentFolder.exists()) {
                        if (!meta.isCreateParentFolder()) {
                            throw new KettleException(BaseMessages.getString(PKG,
                                    "ProcessFiles.Error.TargetParentFolderNotExists", parentFolder.toString()));
                        } else {
                            parentFolder.createFolder();
                        }
                    }
                    if (parentFolder != null) {
                        parentFolder.close();
                    }
                }
            }

            switch (meta.getOperationType()) {
            case ProcessFilesMeta.OPERATION_TYPE_COPY:
                if (((meta.isOverwriteTargetFile() && data.targetFile.exists()) || !data.targetFile.exists())
                        && !meta.simulate) {
                    data.targetFile.copyFrom(data.sourceFile, new TextOneToOneFileSelector());
                    if (log.isDetailed()) {
                        logDetailed(BaseMessages.getString(PKG, "ProcessFiles.Log.SourceFileCopied", sourceFilename,
                                targetFilename));
                    }
                } else {
                    if (log.isDetailed()) {
                        logDetailed(BaseMessages.getString(PKG, "ProcessFiles.Log.TargetNotOverwritten",
                                sourceFilename, targetFilename));
                    }
                }
                break;
            case ProcessFilesMeta.OPERATION_TYPE_MOVE:
                if (((meta.isOverwriteTargetFile() && data.targetFile.exists()) || !data.targetFile.exists())
                        && !meta.simulate) {
                    data.sourceFile.moveTo(KettleVFS.getFileObject(targetFilename, getTransMeta()));
                    if (log.isDetailed()) {
                        logDetailed(BaseMessages.getString(PKG, "ProcessFiles.Log.SourceFileMoved", sourceFilename,
                                targetFilename));
                    }
                } else {
                    if (log.isDetailed()) {
                        logDetailed(BaseMessages.getString(PKG, "ProcessFiles.Log.TargetNotOverwritten",
                                sourceFilename, targetFilename));
                    }
                }
                break;
            case ProcessFilesMeta.OPERATION_TYPE_DELETE:
                if (!meta.simulate) {
                    if (!data.sourceFile.delete()) {
                        throw new KettleException(BaseMessages.getString(PKG, "ProcessFiles.Error.CanNotDeleteFile",
                                data.sourceFile.toString()));
                    }
                }
                if (log.isDetailed()) {
                    logDetailed(BaseMessages.getString(PKG, "ProcessFiles.Log.SourceFileDeleted", sourceFilename));
                }
                break;
            default:

                break;
            }

            // add filename to result filenames?
            if (meta.isaddTargetFileNametoResult()
                    && meta.getOperationType() != ProcessFilesMeta.OPERATION_TYPE_DELETE
                    && data.sourceFile.getType() == FileType.FILE) {
                // Add this to the result file names...
                ResultFile resultFile = new ResultFile(ResultFile.FILE_TYPE_GENERAL, data.targetFile,
                        getTransMeta().getName(), getStepname());
                resultFile.setComment(BaseMessages.getString(PKG, "ProcessFiles.Log.FileAddedResult"));
                addResultFile(resultFile);

                if (log.isDetailed()) {
                    logDetailed(BaseMessages.getString(PKG, "ProcessFiles.Log.FilenameAddResult",
                            data.sourceFile.toString()));
                }
            }

            putRow(getInputRowMeta(), r); // copy row to possible alternate rowset(s).

            if (checkFeedback(getLinesRead())) {
                if (log.isBasic()) {
                    logBasic(BaseMessages.getString(PKG, "ProcessFiles.LineNumber") + getLinesRead());
                }
            }
        } catch (Exception e) {
            boolean sendToErrorRow = false;
            String errorMessage = null;

            if (getStepMeta().isDoingErrorHandling()) {
                sendToErrorRow = true;
                errorMessage = e.toString();
            } else {
                logError(BaseMessages.getString(PKG, "ProcessFiles.ErrorInStepRunning") + e.getMessage());
                setErrors(1);
                stopAll();
                setOutputDone(); // signal end to receiver(s)
                return false;
            }
            if (sendToErrorRow) {
                // Simply add this row to the error row
                putError(getInputRowMeta(), r, 1, errorMessage, null, "ProcessFiles001");
            }
        }

        return true;
    }

    private class TextOneToOneFileSelector implements FileSelector {
        public boolean includeFile(FileSelectInfo info) throws Exception {
            return true;
        }

        public boolean traverseDescendents(FileSelectInfo info) {
            return false;
        }
    }

    public boolean init(StepMetaInterface smi, StepDataInterface sdi) {
        meta = (ProcessFilesMeta) smi;
        data = (ProcessFilesData) sdi;

        if (super.init(smi, sdi)) {
            return true;
        }
        return false;
    }

    public void dispose(StepMetaInterface smi, StepDataInterface sdi) {
        meta = (ProcessFilesMeta) smi;
        data = (ProcessFilesData) sdi;
        if (data.sourceFile != null) {
            try {
                data.sourceFile.close();
                data.sourceFile = null;
            } catch (Exception e) {
                // Ignore errors
            }

        }
        if (data.targetFile != null) {
            try {
                data.targetFile.close();
                data.targetFile = null;
            } catch (Exception e) {
                // Ignore errors
            }

        }
        super.dispose(smi, sdi);
    }

}