// (i.e. we should do the same as above for avro files).
throw new IllegalArgumentException(
"--input-file-reader-schema must be specified when using --input-file-format=avroParquet");
}
Schema schema = opts.inputFileReaderSchema;
Source source = new AvroParquetFileSource(filePaths, Avros.generics(schema), opts.inputFileProjectionSchema);
return pipeline.read(source);
} else if (opts.inputFileFormat.isAssignableFrom(TextInputFormat.class)) {
Source source = From.textFile(filePaths);
return pipeline.read(source);
} else {
// FIXME drop support for this stuff? (doesn't seem to work with spark)
// TODO: intentionally restrict to only allow org.apache.hadoop.mapreduce.lib.input.TextInputFormat ?
TableSource source = new FileTableSourceImpl(