* Copyright (c) 2007-2014 Concurrent, Inc. All Rights Reserved.
* Project and contact information: http://www.cascading.org/
* This file is part of the Cascading project.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
* http://www.apache.org/licenses/LICENSE-2.0
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
package cascading.tap.local;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.util.LinkedHashSet;
import java.util.Properties;
import java.util.Set;
import cascading.flow.FlowProcess;
import cascading.scheme.Scheme;
import cascading.tap.SinkMode;
import cascading.tap.Tap;
import cascading.tap.local.io.TapFileOutputStream;
import cascading.tap.type.FileType;
import cascading.tuple.TupleEntryCollector;
import cascading.tuple.TupleEntryIterator;
import cascading.tuple.TupleEntrySchemeCollector;
import cascading.tuple.TupleEntrySchemeIterator;
* Class FileTap is a {@link Tap} sub-class that allows for direct local file access.
* <p>
* FileTap must be used with the {@link cascading.flow.local.LocalFlowConnector} to create
* {@link cascading.flow.Flow} instances that run in "local" mode.
public class FileTap extends Tap<Properties, InputStream, OutputStream> implements FileType<Properties>
/** Path of the local file, as cleaned by {@link File#getPath()} when the instance is constructed. */
private final String path;
/**
 * Creates a new FileTap for the given {@link cascading.scheme.Scheme} and file {@code path},
 * delegating to the three-argument constructor with {@link SinkMode#KEEP}.
 *
 * @param scheme of type Scheme, bound to Properties, InputStream and OutputStream
 * @param path   of type String, the local file path
 */
public FileTap( Scheme<Properties, InputStream, OutputStream, ?, ?> scheme, String path )
{
  this( scheme, path, SinkMode.KEEP );
}
* Constructor FileTap creates a new FileTap instance using the given {@link cascading.scheme.Scheme},
* file {@code path}, and {@code SinkMode}.
* @param scheme of type LocalScheme
* @param path of type String
* @param sinkMode of type SinkMode
public FileTap( Scheme<Properties, InputStream, OutputStream, ?, ?> scheme, String path, SinkMode sinkMode )
super( scheme, sinkMode );
this.path = new File( path ).getPath(); // cleans path information
public String getIdentifier()
return path;
public String getFullIdentifier( Properties conf )
return fullyQualifyIdentifier( getIdentifier() );
private String fullyQualifyIdentifier( String identifier )
return new File( identifier ).getAbsoluteFile().toURI().toString();
public TupleEntryIterator openForRead( FlowProcess<? extends Properties> flowProcess, InputStream input ) throws IOException
if( input == null )
input = new FileInputStream( getIdentifier() );
return new TupleEntrySchemeIterator<Properties, InputStream>( flowProcess, getScheme(), input, getIdentifier() );
public TupleEntryCollector openForWrite( FlowProcess<? extends Properties> flowProcess, OutputStream output ) throws IOException
if( output == null )
output = new TapFileOutputStream( getIdentifier(), isUpdate() ); // append if we are in update mode
return new TupleEntrySchemeCollector<Properties, OutputStream>( flowProcess, getScheme(), output, getIdentifier() );
public long getSize( Properties conf ) throws IOException
File file = new File( getIdentifier() );
if( file.isDirectory() )
return 0;
return file.length();
public boolean createResource( Properties conf ) throws IOException
File parentFile = new File( getIdentifier() ).getParentFile();
return parentFile.exists() || parentFile.mkdirs();
public boolean deleteResource( Properties conf ) throws IOException
return new File( getIdentifier() ).delete();
public boolean commitResource( Properties conf ) throws IOException
return true;
public boolean resourceExists( Properties conf ) throws IOException
return new File( getIdentifier() ).exists();
public long getModifiedTime( Properties conf ) throws IOException
return new File( getIdentifier() ).lastModified();
public boolean isDirectory( Properties conf ) throws IOException
return new File( getIdentifier() ).isDirectory();
public String[] getChildIdentifiers( Properties conf ) throws IOException
return getChildIdentifiers( conf, 1, false );
public String[] getChildIdentifiers( Properties conf, int depth, boolean fullyQualified ) throws IOException
if( !resourceExists( conf ) )
return new String[ 0 ];
Set<String> results = new LinkedHashSet<String>();
getChildPaths( results, getIdentifier(), depth );
String[] allPaths = results.toArray( new String[ results.size() ] );
if( !fullyQualified )
return allPaths;
for( int i = 0; i < allPaths.length; i++ )
allPaths[ i ] = fullyQualifyIdentifier( allPaths[ i ] );
return allPaths;
private boolean getChildPaths( Set<String> results, String identifier, int depth )
File file = new File( identifier );
if( depth == 0 || file.isFile() )
results.add( identifier );
return true;
String[] paths = file.list();
if( paths == null )
return false;
boolean result = false;
for( String path : paths )
result |= getChildPaths( results, new File( file, path ).getPath(), depth - 1 );
return result;