/*
* $Id: ExtractAttachments.java 45 2007-05-15 22:02:53Z chammer $
* Copyright (c) 2005-2007 Paulo Soares, Bruno Lowagie, Carsten Hammer
*
* Permission is hereby granted, free of charge, to any person
* obtaining a copy of this software and associated documentation
* files (the "Software"), to deal in the Software without
* restriction, including without limitation the rights to use,
* copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following
* conditions:
*
* The above copyright notice and this permission notice shall be
* included in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
* OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
* HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
* WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
* OTHER DEALINGS IN THE SOFTWARE.
*/
/*
* This class was originally published under the MPL by Bruno Lowagie
* Paulo Soares and Carsten Hammer.
* It was a part of iText, a Java-PDF library. You can now use it under
* the MIT License; for backward compatibility you can also use it under
* the MPL version 1.1: http://www.mozilla.org/MPL/
* A copy of the MPL license is bundled with the source code FYI.
*/
package com.lowagie.tools.plugins;
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.util.HashMap;
import java.util.Iterator;
import javax.swing.JInternalFrame;
import com.lowagie.text.pdf.PRStream;
import com.lowagie.text.pdf.PdfArray;
import com.lowagie.text.pdf.PdfDictionary;
import com.lowagie.text.pdf.PdfName;
import com.lowagie.text.pdf.PdfNameTree;
import com.lowagie.text.pdf.PdfObject;
import com.lowagie.text.pdf.PdfReader;
import com.lowagie.text.pdf.PdfString;
import com.lowagie.tools.AbstractTool;
import com.lowagie.tools.arguments.FileArgument;
import com.lowagie.tools.arguments.StringArgument;
import com.lowagie.tools.arguments.filters.PdfFilter;
import com.lowagie.tools.swing.PdfInformationPanel;
/**
* This tool lets you extract the attachments of a PDF.
*/
public class ExtractAttachments extends AbstractTool {
static {
addVersion("$Id: ExtractAttachments.java 45 2007-05-15 22:02:53Z chammer $");
}
/**
* Constructs a ExtractAttachements object.
*/
public ExtractAttachments() {
FileArgument f = new FileArgument(this, "srcfile",
"The file you want to operate on", false, new PdfFilter());
f.setLabel(new PdfInformationPanel());
arguments.add(f);
}
/**
* @see com.lowagie.tools.AbstractTool#createFrame()
*/
protected void createFrame() {
internalFrame = new JInternalFrame("ExtractAttachments", true, false,
true);
internalFrame.setSize(300, 80);
internalFrame.setJMenuBar(getMenubar());
System.out.println("=== ExtractAttachments OPENED ===");
}
/**
* @see com.lowagie.tools.AbstractTool#execute()
*/
public void execute() {
try {
if (getValue("srcfile") == null)
throw new InstantiationException(
"You need to choose a sourcefile");
File src = (File) getValue("srcfile");
// we create a reader for a certain document
PdfReader reader = new PdfReader(src.getAbsolutePath());
final File parentFile = src.getParentFile();
final String outPath;
if (parentFile != null) {
outPath = parentFile.getAbsolutePath();
} else {
outPath = "";
}
PdfDictionary catalog = reader.getCatalog();
PdfDictionary names = (PdfDictionary) PdfReader
.getPdfObject(catalog.get(PdfName.NAMES));
if (names != null) {
PdfDictionary embFiles = (PdfDictionary) PdfReader
.getPdfObject(names.get(new PdfName("EmbeddedFiles")));
if (embFiles != null) {
HashMap embMap = PdfNameTree.readTree(embFiles);
for (Iterator i = embMap.values().iterator(); i.hasNext();) {
PdfDictionary filespec = (PdfDictionary) PdfReader
.getPdfObject((PdfObject) i.next());
unpackFile(reader, filespec, outPath);
}
}
}
for (int k = 1; k <= reader.getNumberOfPages(); ++k) {
PdfArray annots = (PdfArray) PdfReader.getPdfObject(reader
.getPageN(k).get(PdfName.ANNOTS));
if (annots == null)
continue;
for (Iterator i = annots.listIterator(); i.hasNext();) {
PdfDictionary annot = (PdfDictionary) PdfReader
.getPdfObject((PdfObject) i.next());
PdfName subType = (PdfName) PdfReader.getPdfObject(annot
.get(PdfName.SUBTYPE));
if (!PdfName.FILEATTACHMENT.equals(subType))
continue;
PdfDictionary filespec = (PdfDictionary) PdfReader
.getPdfObject(annot.get(PdfName.FS));
unpackFile(reader, filespec, outPath);
}
}
} catch (Exception e) {
e.printStackTrace();
}
}
/**
*
* @see com.lowagie.tools.AbstractTool#valueHasChanged(com.lowagie.tools.arguments.StringArgument)
* @param arg StringArgument
*/
public void valueHasChanged(StringArgument arg) {
if (internalFrame == null) {
// if the internal frame is null, the tool was called from the
// commandline
return;
}
// represent the changes of the argument in the internal frame
}
/**
* Extract the attachements of a PDF.
*
* @param args String[]
*/
public static void main(String[] args) {
ExtractAttachments tool = new ExtractAttachments();
if (args.length < 1) {
System.err.println(tool.getUsage());
}
tool.setMainArguments(args);
tool.execute();
}
/**
*
* @see com.lowagie.tools.AbstractTool#getDestPathPDF()
* @throws InstantiationException
* @return File
*/
protected File getDestPathPDF() throws InstantiationException {
throw new InstantiationException("There is more than one destfile.");
}
/**
* Unpacks a file attachment.
*
* @param reader
* The object that reads the PDF document
* @param filespec
* The dictonary containing the file specifications
* @param outPath
* The path where the attachment has to be written
* @throws IOException
*/
public static void unpackFile(PdfReader reader, PdfDictionary filespec,
String outPath) throws IOException {
if (filespec == null)
return;
PdfName type = (PdfName) PdfReader.getPdfObject(filespec
.get(PdfName.TYPE));
if (!PdfName.F.equals(type) && !PdfName.FILESPEC.equals(type))
return;
PdfDictionary ef = (PdfDictionary) PdfReader.getPdfObject(filespec
.get(PdfName.EF));
if (ef == null)
return;
PdfString fn = (PdfString) PdfReader.getPdfObject(filespec
.get(PdfName.F));
System.out.println("Unpacking file '" + fn + "' to " + outPath);
if (fn == null)
return;
File fLast = new File(fn.toUnicodeString());
File fullPath = new File(outPath, fLast.getName());
if (fullPath.exists())
return;
PRStream prs = (PRStream) PdfReader.getPdfObject(ef.get(PdfName.F));
if (prs == null)
return;
byte b[] = PdfReader.getStreamBytes(prs);
FileOutputStream fout = new FileOutputStream(fullPath);
fout.write(b);
fout.close();
}
}