org.apache.tez.mapreduce.processor.MRTask.java Source code


Introduction

Here is the source code for org.apache.tez.mapreduce.processor.MRTask.java, the abstract base class that Apache Tez uses to run MapReduce map and reduce tasks as logical I/O processors.

Source

/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.tez.mapreduce.processor;

import java.io.IOException;
import java.net.URI;
import java.text.NumberFormat;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;
import java.util.Map.Entry;
import java.util.concurrent.atomic.AtomicBoolean;

import javax.crypto.SecretKey;

import org.apache.commons.lang.StringUtils;
import org.apache.commons.lang.exception.ExceptionUtils;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.classification.InterfaceAudience.Private;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.FileSystem.Statistics;
import org.apache.hadoop.fs.LocalDirAllocator;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.DataInputBuffer;
import org.apache.hadoop.io.RawComparator;
import org.apache.hadoop.mapred.FileAlreadyExistsException;
import org.apache.hadoop.mapred.FileOutputCommitter;
import org.apache.hadoop.mapred.FileOutputFormat;
import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapred.JobContext;
import org.apache.hadoop.mapred.RawKeyValueIterator;
import org.apache.hadoop.mapred.TaskAttemptContext;
import org.apache.hadoop.mapred.TaskAttemptID;
import org.apache.hadoop.mapred.TaskID;
import org.apache.hadoop.mapreduce.OutputCommitter;
import org.apache.hadoop.mapreduce.TaskType;
import org.apache.hadoop.mapreduce.filecache.DistributedCache;
import org.apache.hadoop.mapreduce.lib.reduce.WrappedReducer;
import org.apache.hadoop.mapreduce.security.token.JobTokenSecretManager;
import org.apache.hadoop.mapreduce.task.ReduceContextImpl;
import org.apache.hadoop.security.Credentials;
import org.apache.hadoop.security.UserGroupInformation;
import org.apache.hadoop.security.token.Token;
import org.apache.hadoop.util.DiskChecker.DiskErrorException;
import org.apache.hadoop.util.Progress;
import org.apache.hadoop.yarn.api.ApplicationConstants.Environment;
import org.apache.tez.common.MRFrameworkConfigs;
import org.apache.tez.common.TezUtils;
import org.apache.tez.common.TezRuntimeFrameworkConfigs;
import org.apache.tez.common.counters.TezCounters;
import org.apache.tez.common.security.JobTokenIdentifier;
import org.apache.tez.common.security.TokenCache;
import org.apache.tez.dag.api.UserPayload;
import org.apache.tez.dag.records.TezDAGID;
import org.apache.tez.mapreduce.hadoop.DeprecatedKeys;
import org.apache.tez.mapreduce.hadoop.IDConverter;
import org.apache.tez.mapreduce.hadoop.MRConfig;
import org.apache.tez.mapreduce.hadoop.MRJobConfig;
import org.apache.tez.mapreduce.hadoop.mapred.TaskAttemptContextImpl;
import org.apache.tez.mapreduce.hadoop.mapreduce.JobContextImpl;
import org.apache.tez.mapreduce.output.MROutputLegacy;
import org.apache.tez.runtime.api.AbstractLogicalIOProcessor;
import org.apache.tez.runtime.api.LogicalInput;
import org.apache.tez.runtime.api.LogicalOutput;
import org.apache.tez.runtime.api.ProcessorContext;
import org.apache.tez.runtime.library.common.Constants;
import org.apache.tez.runtime.library.common.sort.impl.TezRawKeyValueIterator;

@SuppressWarnings("deprecation")
@Private
public abstract class MRTask extends AbstractLogicalIOProcessor {

    static final Log LOG = LogFactory.getLog(MRTask.class);

    protected JobConf jobConf;
    protected JobContext jobContext;
    protected TaskAttemptContext taskAttemptContext;
    protected OutputCommitter committer;

    // Current counters
    transient TezCounters counters;
    protected ProcessorContext processorContext;
    protected TaskAttemptID taskAttemptId;
    protected Progress progress = new Progress();
    protected SecretKey jobTokenSecret;

    LogicalInput input;
    LogicalOutput output;

    boolean isMap;

    /* flag to track whether task is done */
    AtomicBoolean taskDone = new AtomicBoolean(false);

    /** Construct output file names so that, when an output directory listing is
     * sorted lexicographically, positions correspond to output partitions.*/
    private static final NumberFormat NUMBER_FORMAT = NumberFormat.getInstance();
    static {
        NUMBER_FORMAT.setMinimumIntegerDigits(5);
        NUMBER_FORMAT.setGroupingUsed(false);
    }
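    // Illustration: with a minimum of 5 integer digits and grouping disabled,
    // partition 7 is formatted as "00007", so getOutputName() below yields
    // file names like "part-00007".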

    protected MRTaskReporter mrReporter;
    protected boolean useNewApi;

    public MRTask(ProcessorContext processorContext, boolean isMap) {
        super(processorContext);
        this.isMap = isMap;
    }

    // TODO how to update progress
    @Override
    public void initialize() throws IOException, InterruptedException {

        DeprecatedKeys.init();

        processorContext = getContext();
        counters = processorContext.getCounters();
        this.taskAttemptId = new TaskAttemptID(
                new TaskID(Long.toString(processorContext.getApplicationId().getClusterTimestamp()),
                        processorContext.getApplicationId().getId(), (isMap ? TaskType.MAP : TaskType.REDUCE),
                        processorContext.getTaskIndex()),
                processorContext.getTaskAttemptNumber());
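        // The resulting attempt id mirrors the MapReduce naming scheme and is
        // roughly of the form attempt_<clusterTimestamp>_<appId>_m_000000_0
        // (or _r_ for reduce tasks).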

        UserPayload userPayload = processorContext.getUserPayload();
        Configuration conf = TezUtils.createConfFromUserPayload(userPayload);
        if (conf instanceof JobConf) {
            this.jobConf = (JobConf) conf;
        } else {
            this.jobConf = new JobConf(conf);
        }
        jobConf.set(Constants.TEZ_RUNTIME_TASK_ATTEMPT_ID, taskAttemptId.toString());
        jobConf.set(MRJobConfig.TASK_ATTEMPT_ID, taskAttemptId.toString());
        jobConf.setInt(MRJobConfig.APPLICATION_ATTEMPT_ID, processorContext.getDAGAttemptNumber());

        LOG.info("MRTask.inited: taskAttemptId = " + taskAttemptId.toString());

        // TODO Post MRR
        // A single file per vertex will likely be a better solution. Does not
        // require translation - client can take care of this. Will work independent
        // of whether the configuration is for intermediate tasks or not. Has the
        // overhead of localizing multiple files per job - i.e. the client would
        // need to write these files to hdfs, add them as local resources per
        // vertex. A solution like this may be more practical once it's possible to
        // submit configuration parameters to the AM and effectively tasks via RPC.

        jobConf.set(MRJobConfig.VERTEX_NAME, processorContext.getTaskVertexName());

        if (LOG.isDebugEnabled() && userPayload != null) {
            Iterator<Entry<String, String>> iter = jobConf.iterator();
            String taskIdStr = taskAttemptId.getTaskID().toString();
            while (iter.hasNext()) {
                Entry<String, String> confEntry = iter.next();
                LOG.debug("TaskConf Entry" + ", taskId=" + taskIdStr + ", key=" + confEntry.getKey() + ", value="
                        + confEntry.getValue());
            }
        }

        configureMRTask();
    }

    private void configureMRTask() throws IOException, InterruptedException {

        Credentials credentials = UserGroupInformation.getCurrentUser().getCredentials();
        jobConf.setCredentials(credentials);
        // TODO Can this be avoided altogether? Have the MRTezOutputCommitter use
        // the Tez parameter.
        // TODO This could be fetched from the env if YARN is setting it for all
        // Containers.
        // Set it in conf, so that it can be used by the OutputCommitter.

        // Not needed. This is probably being set via the source/consumer meta
        Token<JobTokenIdentifier> jobToken = TokenCache.getSessionToken(credentials);
        if (jobToken != null) {
            // Will MR ever run without a job token?
            SecretKey sk = JobTokenSecretManager.createSecretKey(jobToken.getPassword());
            this.jobTokenSecret = sk;
        } else {
            LOG.warn("No job token set");
        }

        configureLocalDirs();

        // Set up the DistributedCache related configs
        setupDistributedCacheConfig(jobConf);
    }

    private void configureLocalDirs() throws IOException {
        // TODO NEWTEZ Is most of this functionality required ?
        jobConf.setStrings(TezRuntimeFrameworkConfigs.LOCAL_DIRS, processorContext.getWorkDirs());
        if (jobConf.get(MRFrameworkConfigs.TASK_LOCAL_RESOURCE_DIR) == null) {
            jobConf.set(MRFrameworkConfigs.TASK_LOCAL_RESOURCE_DIR, System.getenv(Environment.PWD.name()));
        }

        jobConf.setStrings(MRConfig.LOCAL_DIR, processorContext.getWorkDirs());

        LocalDirAllocator lDirAlloc = new LocalDirAllocator(TezRuntimeFrameworkConfigs.LOCAL_DIRS);
        Path workDir = null;
        // First, try to find the JOB_LOCAL_DIR on this host.
        try {
            workDir = lDirAlloc.getLocalPathToRead("work", jobConf);
        } catch (DiskErrorException e) {
            // DiskErrorException means dir not found. If not found, it will
            // be created below.
        }
        if (workDir == null) {
            // JOB_LOCAL_DIR doesn't exist on this host -- Create it.
            workDir = lDirAlloc.getLocalPathForWrite("work", jobConf);
            FileSystem lfs = FileSystem.getLocal(jobConf).getRaw();
            boolean madeDir = false;
            try {
                madeDir = lfs.mkdirs(workDir);
            } catch (FileAlreadyExistsException e) {
                // Since all tasks will be running in their own JVM, the race condition
                // exists where multiple tasks could be trying to create this directory
                // at the same time. If this task loses the race, it's okay because
                // the directory already exists.
                madeDir = true;
                workDir = lDirAlloc.getLocalPathToRead("work", jobConf);
            }
            if (!madeDir) {
                throw new IOException("Mkdirs failed to create " + workDir.toString());
            }
        }
        // TODO NEWTEZ Is this required ?
        jobConf.set(MRFrameworkConfigs.JOB_LOCAL_DIR, workDir.toString());
        jobConf.set(MRJobConfig.JOB_LOCAL_DIR, workDir.toString());
    }

    /**
     * Set up the DistributedCache related configs so that
     * {@link DistributedCache#getLocalCacheFiles(Configuration)} and
     * {@link DistributedCache#getLocalCacheArchives(Configuration)} work.
     *
     * @param job
     * @throws IOException
     */
    private static void setupDistributedCacheConfig(final JobConf job) throws IOException {

        // All symlinks are created in the current work-dir.
        String localWorkDir = job.get(MRFrameworkConfigs.TASK_LOCAL_RESOURCE_DIR);

        // Update the configuration object with localized archives.
        URI[] cacheArchives = DistributedCache.getCacheArchives(job);
        if (cacheArchives != null) {
            List<String> localArchives = new ArrayList<String>();
            for (int i = 0; i < cacheArchives.length; ++i) {
                URI u = cacheArchives[i];
                Path p = new Path(u);
                Path name = new Path((null == u.getFragment()) ? p.getName() : u.getFragment());
                String linkName = name.toUri().getPath();
                localArchives.add(new Path(localWorkDir, linkName).toUri().getPath());
            }
            if (!localArchives.isEmpty()) {
                job.set(MRJobConfig.CACHE_LOCALARCHIVES, StringUtils.join(localArchives, ','));
            }
        }

        // Update the configuration object with localized files.
        URI[] cacheFiles = DistributedCache.getCacheFiles(job);
        if (cacheFiles != null) {
            List<String> localFiles = new ArrayList<String>();
            for (int i = 0; i < cacheFiles.length; ++i) {
                URI u = cacheFiles[i];
                Path p = new Path(u);
                Path name = new Path((null == u.getFragment()) ? p.getName() : u.getFragment());
                String linkName = name.toUri().getPath();
                localFiles.add(new Path(localWorkDir, linkName).toUri().getPath());
            }
            if (!localFiles.isEmpty()) {
                job.set(MRJobConfig.CACHE_LOCALFILES, StringUtils.join(localFiles, ','));
            }
        }
    }
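    // Illustration (hypothetical URI): a cache file localized as
    // hdfs://nn/data/dict.txt#lookup is exposed under <localWorkDir>/lookup,
    // while one without a fragment is exposed under <localWorkDir>/dict.txt.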

    public ProcessorContext getUmbilical() {
        return this.processorContext;
    }

    public void initTask(LogicalOutput output) throws IOException, InterruptedException {
        // By this time output has been initialized
        this.output = output;
        if (output instanceof MROutputLegacy) {
            committer = ((MROutputLegacy) output).getOutputCommitter();
        }
        this.mrReporter = new MRTaskReporter(processorContext);
        this.useNewApi = jobConf.getUseNewMapper();
        TezDAGID dagId = IDConverter.fromMRTaskAttemptId(taskAttemptId).getTaskID().getVertexID().getDAGId();

        this.jobContext = new JobContextImpl(jobConf, dagId, mrReporter);
        this.taskAttemptContext = new TaskAttemptContextImpl(jobConf, taskAttemptId, mrReporter);

        localizeConfiguration(jobConf);
    }

    public MRTaskReporter getMRReporter() {
        return mrReporter;
    }

    public TezCounters getCounters() {
        return counters;
    }

    public void setConf(JobConf jobConf) {
        this.jobConf = jobConf;
    }

    public JobConf getConf() {
        return this.jobConf;
    }

    /**
     * Gets the Statistics instances registered for the scheme associated
     * with path.
     *
     * @param path the path.
     * @param conf the configuration to extract the scheme from if not part of
     *   the path.
     * @return the list of matching Statistics instances; empty if none is found
     *   for the scheme.
     * @throws IOException if the FileSystem for the path cannot be resolved.
     */
    @Private
    public static List<Statistics> getFsStatistics(Path path, Configuration conf) throws IOException {
        List<Statistics> matchedStats = new ArrayList<FileSystem.Statistics>();
        path = path.getFileSystem(conf).makeQualified(path);
        String scheme = path.toUri().getScheme();
        for (Statistics stats : FileSystem.getAllStatistics()) {
            if (stats.getScheme().equals(scheme)) {
                matchedStats.add(stats);
            }
        }
        return matchedStats;
    }

    @Private
    public synchronized String getOutputName() {
        return "part-" + NUMBER_FORMAT.format(taskAttemptId.getTaskID().getId());
    }

    public void waitBeforeCompletion(MRTaskReporter reporter) throws IOException, InterruptedException {
    }

    public void done() throws IOException, InterruptedException {

        LOG.info("Task:" + taskAttemptId + " is done." + " And is in the process of committing");
        // TODO change this to use the new context
        // TODO TEZ Interaction between Commit and OutputReady. Merge?
        if (output instanceof MROutputLegacy) {
            MROutputLegacy sOut = (MROutputLegacy) output;
            if (sOut.isCommitRequired()) {
                //wait for commit approval and commit
                // TODO EVENTUALLY - Commit is not required for map tasks.
                // skip a couple of RPCs before exiting.
                commit(sOut);
            }
        }
        taskDone.set(true);
        sendLastUpdate();
    }

    /**
     * Send a status update to the task tracker
     * @throws IOException
     */
    public void statusUpdate() throws IOException, InterruptedException {
        // TODO call progress update here if not being called within Map/Reduce
    }

    /**
     * Sends last status update before sending umbilical.done();
     */
    private void sendLastUpdate() throws IOException, InterruptedException {
        statusUpdate();
    }

    private void commit(MROutputLegacy output) throws IOException {
        int retries = 3;
        while (true) {
            // This will loop until the AM allows the commit or asks for the task
            // to be killed, as opposed to the AM sending a signal to the task to
            // kill itself gracefully.
            try {
                if (processorContext.canCommit()) {
                    break;
                }
                Thread.sleep(1000);
            } catch (InterruptedException ie) {
                //ignore
            } catch (IOException ie) {
                LOG.warn("Failure sending canCommit: " + ExceptionUtils.getStackTrace(ie));
                if (--retries == 0) {
                    throw ie;
                }
            }
        }

        // task can Commit now
        try {
            LOG.info("Task " + taskAttemptId + " is allowed to commit now");
            output.flush();
            if (output.isCommitRequired()) {
                output.commit();
            }
            return;
        } catch (IOException iee) {
            LOG.warn("Failure committing: " + ExceptionUtils.getStackTrace(iee));
            // if the commit did not succeed, delete the output
            discardOutput(output);
            throw iee;
        }
    }
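    // Net effect of commit(): poll canCommit() roughly once per second, giving
    // up after three failed canCommit calls; then flush and commit the output,
    // discarding it if the commit itself fails.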

    private void discardOutput(MROutputLegacy output) {
        try {
            output.abort();
        } catch (IOException ioe) {
            LOG.warn("Failure cleaning up: " + ExceptionUtils.getStackTrace(ioe));
        }
    }

    public static String normalizeStatus(String status, Configuration conf) {
        // Check to see if the status string is too long
        // and truncate it if needed.
        int progressStatusLength = conf.getInt(MRConfig.PROGRESS_STATUS_LEN_LIMIT_KEY,
                MRConfig.PROGRESS_STATUS_LEN_LIMIT_DEFAULT);
        if (status.length() > progressStatusLength) {
            LOG.warn("Task status: \"" + status + "\" truncated to max limit (" + progressStatusLength
                    + " characters)");
            status = status.substring(0, progressStatusLength);
        }
        return status;
    }
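    // Illustration: with a configured limit of 80, a 200-character status string
    // is logged as truncated and cut down to its first 80 characters.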

    protected static <INKEY, INVALUE, OUTKEY, OUTVALUE> org.apache.hadoop.mapreduce.Reducer<INKEY, INVALUE, OUTKEY, OUTVALUE>.Context createReduceContext(
            org.apache.hadoop.mapreduce.Reducer<INKEY, INVALUE, OUTKEY, OUTVALUE> reducer, Configuration job,
            TaskAttemptID taskId, final TezRawKeyValueIterator rIter,
            org.apache.hadoop.mapreduce.Counter inputKeyCounter,
            org.apache.hadoop.mapreduce.Counter inputValueCounter,
            org.apache.hadoop.mapreduce.RecordWriter<OUTKEY, OUTVALUE> output,
            org.apache.hadoop.mapreduce.OutputCommitter committer,
            org.apache.hadoop.mapreduce.StatusReporter reporter, RawComparator<INKEY> comparator,
            Class<INKEY> keyClass, Class<INVALUE> valueClass) throws IOException, InterruptedException {
        RawKeyValueIterator r = new RawKeyValueIterator() {

            @Override
            public boolean next() throws IOException {
                return rIter.next();
            }

            @Override
            public DataInputBuffer getValue() throws IOException {
                return rIter.getValue();
            }

            @Override
            public Progress getProgress() {
                return rIter.getProgress();
            }

            @Override
            public DataInputBuffer getKey() throws IOException {
                return rIter.getKey();
            }

            @Override
            public void close() throws IOException {
                rIter.close();
            }
        };
        org.apache.hadoop.mapreduce.ReduceContext<INKEY, INVALUE, OUTKEY, OUTVALUE> reduceContext = new ReduceContextImpl<INKEY, INVALUE, OUTKEY, OUTVALUE>(
                job, taskId, r, inputKeyCounter, inputValueCounter, output, committer, reporter, comparator,
                keyClass, valueClass);
        if (LOG.isDebugEnabled()) {
            LOG.debug("Using key class: " + keyClass + ", valueClass: " + valueClass);
        }

        org.apache.hadoop.mapreduce.Reducer<INKEY, INVALUE, OUTKEY, OUTVALUE>.Context reducerContext = new WrappedReducer<INKEY, INVALUE, OUTKEY, OUTVALUE>()
                .getReducerContext(reduceContext);

        return reducerContext;
    }

    public void taskCleanup() throws IOException, InterruptedException {
        // set phase for this task
        statusUpdate();
        LOG.info("Runnning cleanup for the task");
        // do the cleanup
        if (output instanceof MROutputLegacy) {
            ((MROutputLegacy) output).abort();
        }
    }

    public void localizeConfiguration(JobConf jobConf) throws IOException, InterruptedException {
        jobConf.set(JobContext.TASK_ID, taskAttemptId.getTaskID().toString());
        jobConf.set(JobContext.TASK_ATTEMPT_ID, taskAttemptId.toString());
        jobConf.setInt(JobContext.TASK_PARTITION, taskAttemptId.getTaskID().getId());
        jobConf.set(JobContext.ID, taskAttemptId.getJobID().toString());

        jobConf.setBoolean(MRJobConfig.TASK_ISMAP, isMap);

        Path outputPath = FileOutputFormat.getOutputPath(jobConf);
        if (outputPath != null) {
            if ((committer instanceof FileOutputCommitter)) {
                FileOutputFormat.setWorkOutputPath(jobConf,
                        ((FileOutputCommitter) committer).getTaskAttemptPath(taskAttemptContext));
            } else {
                FileOutputFormat.setWorkOutputPath(jobConf, outputPath);
            }
        }
    }

    public org.apache.hadoop.mapreduce.TaskAttemptContext getTaskAttemptContext() {
        return taskAttemptContext;
    }

    public JobContext getJobContext() {
        return jobContext;
    }

    public TaskAttemptID getTaskAttemptId() {
        return taskAttemptId;
    }

}
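
For orientation, below is a minimal, hypothetical sketch of how a concrete processor might extend MRTask. It is not part of the Tez codebase: the class name SketchMapProcessor and the body of run() are assumptions for illustration only; the overridden methods come from Tez's LogicalIOProcessor contract, which AbstractLogicalIOProcessor leaves abstract.

import java.util.List;
import java.util.Map;

import org.apache.tez.mapreduce.processor.MRTask;
import org.apache.tez.runtime.api.Event;
import org.apache.tez.runtime.api.LogicalInput;
import org.apache.tez.runtime.api.LogicalOutput;
import org.apache.tez.runtime.api.ProcessorContext;

// Hypothetical subclass, for illustration only.
public class SketchMapProcessor extends MRTask {

    public SketchMapProcessor(ProcessorContext context) {
        super(context, true /* isMap */);
    }

    @Override
    public void run(Map<String, LogicalInput> inputs,
            Map<String, LogicalOutput> outputs) throws Exception {
        // The framework calls initialize() before run(), so jobConf and
        // taskAttemptId are already populated at this point.
        LogicalOutput out = outputs.values().iterator().next();
        initTask(out); // sets up the committer, reporter and task/job contexts
        // ... consume the inputs and write key/value pairs to out ...
        done(); // waits for commit approval and commits the output if required
    }

    @Override
    public void handleEvents(List<Event> processorEvents) {
        // No custom event handling in this sketch.
    }

    @Override
    public void close() throws Exception {
        // Release any resources acquired in run().
    }
}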