Java tutorial
/* * Copyright 2003-2016 MarkLogic Corporation * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.marklogic.contentpump; import java.io.IOException; import org.apache.commons.logging.Log; import org.apache.commons.logging.LogFactory; import org.apache.hadoop.conf.Configurable; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.fs.FileStatus; import org.apache.hadoop.fs.FileSystem; import org.apache.hadoop.fs.Path; import org.apache.hadoop.fs.PathFilter; /** * The configured input file pattern applied to input file path. * @author ali * */ public class DocumentPathFilter implements PathFilter, Configurable { public static final Log LOG = LogFactory.getLog(DocumentPathFilter.class); private String pattern; private Configuration conf; private FileSystem fs; public String getPattern() { return pattern; } public void setPattern(String pattern) { this.pattern = pattern; } @Override public boolean accept(Path inPath) { String filename = inPath.getName(); if (filename.matches(pattern) == true) { return true; } // take care of the case when INPUT_FILE_PATH is a DIR try { FileStatus[] status = fs.globStatus(inPath); if (status == null) { throw new IOException("Path in input_file_path doesn't exist: " + inPath); } for (FileStatus s : status) { if (s.isDirectory()) { return true; } } } catch (IOException e) { e.printStackTrace(); } return false; } @Override public Configuration getConf() { return conf; } @Override public void setConf(Configuration conf) { this.conf = conf; pattern = conf.get(ConfigConstants.CONF_INPUT_FILE_PATTERN, ".*"); String inPath = conf.get(ConfigConstants.CONF_INPUT_DIRECTORY); if (LOG.isDebugEnabled()) { LOG.debug(ConfigConstants.CONF_INPUT_DIRECTORY + ": " + inPath); } Path path = new Path(inPath); try { fs = FileSystem.get(path.toUri(), conf); } catch (IOException e) { LOG.error("Please check path: " + inPath, e); } } }