Package com.enterprisedt.net.ftp

Source Code of com.enterprisedt.net.ftp.UnixFileParser

/**
*
*  edtFTPj
*
*  Copyright (C) 2000-2004 Enterprise Distributed Technologies Ltd
*
*  www.enterprisedt.com
*
*  This library is free software; you can redistribute it and/or
*  modify it under the terms of the GNU Lesser General Public
*  License as published by the Free Software Foundation; either
*  version 2.1 of the License, or (at your option) any later version.
*
*  This library is distributed in the hope that it will be useful,
*  but WITHOUT ANY WARRANTY; without even the implied warranty of
*  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
*  Lesser General Public License for more details.
*
*  You should have received a copy of the GNU Lesser General Public
*  License along with this library; if not, write to the Free Software
*  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
*
*  Bug fixes, suggestions and comments should be should posted on
*  http://www.enterprisedt.com/forums/index.php
*
*  Change Log:
*
*    $Log: UnixFileParser.java,v $
*    Revision 1.25  2010-12-21 00:19:28  bruceb
*    length checks
*
*    Revision 1.24  2010-11-04 01:07:46  bruceb
*    tweaking for new formats
*
*    Revision 1.23  2009-01-15 03:36:26  bruceb
*    added isNumeric
*
*    Revision 1.22  2009-01-15 00:16:58  hans
*    Removed unused local variable.
*
*    Revision 1.21  2008-07-29 02:58:44  bruceb
*    Connect:Enterprise tweaks
*
*    Revision 1.20  2008-07-15 05:41:33  bruceb
*    refactor parsing code
*
*    Revision 1.19  2007-12-18 07:52:53  bruceb
*    trimStart() changes
*
*    Revision 1.18  2007-10-12 05:20:44  bruceb
*    permit ignoring date parser errors
*
*    Revision 1.17  2007-06-15 08:15:30  bruceb
*    Connect:Enterprise fix
*
*    Revision 1.16  2007/03/28 06:04:15  bruceb
*    support reverse MMM/dd formats
*
*    Revision 1.15  2007/03/19 22:10:57  bruceb
*    when testing for future, set future date 2 days ahead to account for time zones
*
*    Revision 1.14  2006/10/11 08:57:40  hans
*    Removed usage of deprecated FTPFile constructor and made cvsId final
*
*    Revision 1.13  2006/05/23 04:10:17  bruceb
*    support Unix listing starting with 'p'
*
*    Revision 1.12  2005/06/03 11:26:25  bruceb
*    comment change
*
*    Revision 1.11  2005/04/01 13:57:15  bruceb
*    minor tweak re groups
*
*    Revision 1.10  2004/10/19 16:15:49  bruceb
*    minor restructuring
*
*    Revision 1.9  2004/10/18 15:58:15  bruceb
*    setLocale
*
*    Revision 1.8  2004/09/20 21:36:13  bruceb
*    tweak to skip invalid lines
*
*    Revision 1.7  2004/09/17 14:56:54  bruceb
*    parse fixes including wrong year
*
*    Revision 1.6  2004/07/23 08:32:36  bruceb
*    made cvsId public
*
*    Revision 1.5  2004/06/11 10:19:59  bruceb
*    fixed bug re filename same as user
*
*    Revision 1.4  2004/05/20 19:47:00  bruceb
*    blanks in names fix
*
*    Revision 1.3  2004/05/05 20:27:41  bruceb
*    US locale for date formats
*
*    Revision 1.2  2004/05/01 11:44:21  bruceb
*    modified for server returning "total 3943" as first line
*
*    Revision 1.1  2004/04/17 23:42:07  bruceb
*    file parsing part II
*
*    Revision 1.1  2004/04/17 18:37:23  bruceb
*    new parse functionality
*
*/
package com.enterprisedt.net.ftp;

import java.text.ParseException;
import java.text.SimpleDateFormat;
import java.util.ArrayList;
import java.util.Calendar;
import java.util.Date;
import java.util.Iterator;
import java.util.List;
import java.util.Locale;

import com.enterprisedt.util.debug.Logger;

/**
*  Represents a remote Unix file parser
*
@author      Bruce Blackshaw
@version     $Revision: 1.25 $
*/
public class UnixFileParser extends FTPFileParser {

    /**
     *  Revision control id
     */
  final public static String cvsId = "@(#)$Id: UnixFileParser.java,v 1.25 2010-12-21 00:19:28 bruceb Exp $";
 
  /**
     * Logging object
     */
    private static Logger log = Logger.getLogger("UnixFileParser");

    /**
     * Symbolic link symbol
     */
    private final static String SYMLINK_ARROW = "->";
   
    /**
     * Indicates symbolic link
     */
    private final static char SYMLINK_CHAR = 'l';
       
    /**
     * These chars indicates ordinary files
     */
    private final static char[] FILE_CHARS = {'-', 'p'};
   
    /**
     * Indicates directory
     */
    private final static char DIRECTORY_CHAR = 'd';
   
    /**
     * Date formatter 1 with no HH:mm
     */
    private SimpleDateFormat noHHmmFormatter1;
   
    /**
     * Date formatter 2  with no HH:mm
     */
    private SimpleDateFormat noHHmmFormatter2;
   
    /**
     * Date formatter with no HH:mm
     */
    private SimpleDateFormat noHHmmFormatter;   
   
   
    /**
     * Date formatter with HH:mm
     */
    private SimpleDateFormat hhmmFormatter;
   
    /**
     * List of formatters
     */
    private List hhmmFormatters;
       
    /**
     * Minimum number of expected fields
     */
    private final static int MIN_FIELD_COUNT = 7;
   
    /**
     * Constructor
     */
    public UnixFileParser() {
        setLocale(Locale.getDefault());
    }
   
    /**
     * Set the locale for date parsing of listings
     *
     * @param locale    locale to set
     */
    public void setLocale(Locale locale) {
        noHHmmFormatter1 = new SimpleDateFormat("MMM-dd-yyyy", locale);
        noHHmmFormatter2 = new SimpleDateFormat("dd-MMM-yyyy", locale);
        noHHmmFormatter = noHHmmFormatter1;
       
        hhmmFormatters = new ArrayList();
        hhmmFormatters.add(new SimpleDateFormat("MMM-d-yyyy-HH:mm", locale));
        hhmmFormatters.add(new SimpleDateFormat("MMM-dd-yyyy-HH:mm", locale));
        hhmmFormatters.add(new SimpleDateFormat("MMM-d-yyyy-H:mm", locale));
        hhmmFormatters.add(new SimpleDateFormat("MMM-dd-yyyy-H:mm", locale));
        hhmmFormatters.add(new SimpleDateFormat("MMM-dd-yyyy-H.mm", locale));
        hhmmFormatters.add(new SimpleDateFormat("dd-MMM-yyyy-HH:mm", locale));
   
   
    public String toString() {
        return "UNIX";
    }
   
   
    /**
     * Valid format for this parser
     *
     * @param listing
     * @return true if valid
     */
    public boolean isValidFormat(String[] listing) {
        int count = Math.min(listing.length, 10);
       
        boolean perms1 = false;
        boolean perms2 = false;

        for (int i = 0; i < count; i++) {
            if (listing[i].trim().length() == 0)
                continue;
            String[] fields = split(listing[i]);
            if (fields.length < MIN_FIELD_COUNT)
                continue;
            // check perms
            char ch00 = fields[0].charAt(0);
            if (ch00 == '-' || ch00 == 'l' || ch00 == 'd')
                perms1 = true;
           
            if (fields[0].length() > 1) {
                char ch01 = fields[0].charAt(1);
                if (ch01 == 'r' || ch01 == '-')
                    perms2 = true;  
            }
           
             // last chance - Connect:Enterprise has -ART------TCP
            if (!perms2 && fields[0].length() > 2 && fields[0].indexOf('-', 2) > 0)
                perms2 = true;
        }
        if (perms1 && perms2)
            return true;
        log.debug("Not in UNIX format");
        return false;
    }
   
    /**
     * Is this a Unix format listing?
     *
     * @param raw   raw listing line
     * @return true if Unix, false otherwise
     */
    public static boolean isUnix(String raw) {
        char ch = raw.charAt(0);
        if (ch == DIRECTORY_CHAR || ch == SYMLINK_CHAR)
            return true;
        for (int i = 0; i < FILE_CHARS.length; i++)
          if (ch == FILE_CHARS[i])
            return true;
        return false;
    }
   
    private boolean isNumeric(String field)
    {
        for (int i = 0; i < field.length(); i++)
        {
            if (!Character.isDigit(field.charAt(i)))
                return false;
        }
        return true;
    }
   
    /**
     * Parse server supplied string, e.g.:
     *
     * lrwxrwxrwx   1 wuftpd   wuftpd         14 Jul 22  2002 MIRRORS -> README-MIRRORS
     * -rw-r--r--   1 b173771  users         431 Mar 31 20:04 .htaccess
     *
     * @param raw   raw string to parse
     */
    public FTPFile parse(String raw) throws ParseException {
       
        // test it is a valid line, e.g. "total 342522" is invalid
        if (!isUnix(raw))
            return null;
       
        String[] fields = split(raw);
        
        if (fields.length < MIN_FIELD_COUNT) {
            StringBuffer msg = new StringBuffer("Unexpected number of fields in listing '");
            msg.append(raw).append("' - expected minimum ").append(MIN_FIELD_COUNT).
                    append(" fields but found ").append(fields.length).append(" fields");
            log.warn(msg.toString());
            return null;
        }
       
        // field pos
        int index = 0;
       
        // first field is perms
        char ch = raw.charAt(0);
        String permissions = fields[index++];
        ch = permissions.charAt(0);
        boolean isDir = false;
        boolean isLink = false;
        if (ch == DIRECTORY_CHAR)
            isDir = true;
        else if (ch == SYMLINK_CHAR)
            isLink = true;
       
        // some servers don't supply the link count
        int linkCount = 0;
        if (Character.isDigit(fields[index].charAt(0))) {
            try {
                linkCount = Integer.parseInt(fields[index++]);
            }
            catch (NumberFormatException ignore) {}
        }
        else if (fields[index].charAt(0) == '-') { // IPXOS Treck FTP server
            index++;
        }
       
        // owner and group
        String owner = "";
        String group = "";
        // if 2 fields ahead is numeric and there's enough fields beyond (4) for
        // the date, then the next two fields should be the owner & group
        if (isNumeric(fields[index+2]) &&  fields.length-(index+2) > 4) {
            owner = fields[index++];
            group = fields[index++];
        }
        // no owner
        else if (isNumeric(fields[index + 1]) && fields.length - (index + 1) > 4) {
            group = fields[index++];
        }
       
        // size
        long size = 0L;
        String sizeStr = fields[index++].replace(".", ""); // get rid of .'s in size   
        try {
            size = Long.parseLong(sizeStr);
        }
        catch (NumberFormatException ex) {
            log.warn("Failed to parse size: " + sizeStr);
        }
       
        // next 3 are the date time
       
        // we expect the month first on Unix.
        // Connect:Enterprise UNIX has a weird extra numeric field here - we test if the
        // next field is numeric and if so, we skip it (except we check for a BSD variant
        // that means it is the day of the month)
        int dayOfMonth = -1;
        if (isNumeric(fields[index])) {
            // this just might be the day of month - BSD variant
            // we check it is <= 31 AND that the next field starts
            // with a letter AND the next has a ':' within it
            try
            {
                String str = fields[index];
                while (str.startsWith("0"))
                    str = str.substring(1);
                dayOfMonth = Integer.parseInt(str);
                if (dayOfMonth > 31) // can't be day of month
                    dayOfMonth = -1;
                if (!(Character.isLetter(fields[index + 1].charAt(0))))
                    dayOfMonth = -1;
                if (fields[index + 2].indexOf(':') <= 0)
                    dayOfMonth = -1;
            }
            catch (NumberFormatException ex) {}
            index++;
        }
       
        int dateTimePos = index;
        Date lastModified = null;
        StringBuffer stamp = new StringBuffer(fields[index++]);
        stamp.append('-');
        if (dayOfMonth > 0)
            stamp.append(dayOfMonth);
        else
            stamp.append(fields[index++]);
        stamp.append('-');
       
        String field = fields[index++];
        if (field.indexOf(':') < 0 && field.indexOf('.') < 0) {
            stamp.append(field); // year
            try {
                lastModified = noHHmmFormatter.parse(stamp.toString());
            }
            catch (ParseException ignore) {
                noHHmmFormatter = (noHHmmFormatter == noHHmmFormatter1 ? noHHmmFormatter2 : noHHmmFormatter1);
                try {
                    lastModified = noHHmmFormatter.parse(stamp.toString());
                }
                catch (ParseException ex) {
                    if (!ignoreDateParseErrors)
                        throw new DateParseException(ex.getMessage());
                }
            }
        }
        else { // add the year ourselves as not present
            Calendar cal = Calendar.getInstance();
            int year = cal.get(Calendar.YEAR);
            stamp.append(year).append('-').append(field);
            lastModified = parseTimestamp(stamp.toString());
           
            // can't be in the future - must be the previous year
            // add 2 days just to allow for different time zones
            cal.add(Calendar.DATE, 2);
            if (lastModified != null && lastModified.after(cal.getTime())) {
                cal.setTime(lastModified);
                cal.add(Calendar.YEAR, -1);
                lastModified = cal.getTime();
            }
        }
           
        // name of file or dir. Extract symlink if possible
        String name = null;
        String linkedname = null;
       
        // we've got to find the starting point of the name. We
        // do this by finding the pos of all the date/time fields, then
        // the name - to ensure we don't get tricked up by a userid the
        // same as the filename,for example
        int pos = 0;
        boolean ok = true;
        int dateFieldCount = dayOfMonth > 0 ? 2 : 3; // only 2 fields left if we had a leading day of month
        for (int i = dateTimePos; i < dateTimePos + dateFieldCount; i++) {
            pos = raw.indexOf(fields[i], pos);
            if (pos < 0) {
                ok = false;
                break;
            }
            else { // move on the length of the field
                pos += fields[i].length();
            }
        }
        if (ok) {
            String remainder = trimStart(raw.substring(pos));
            if (!isLink)
                name = remainder;
            else { // symlink, try to extract it
                pos = remainder.indexOf(SYMLINK_ARROW);
                if (pos <= 0) { // couldn't find symlink, give up & just assign as name
                    name = remainder;
                }
                else {
                    int len = SYMLINK_ARROW.length();
                    name = remainder.substring(0, pos).trim();
                    if (pos+len < remainder.length())
                        linkedname = remainder.substring(pos+len);
                }
            }
        }
        else {
            log.warn("Failed to retrieve name: " + raw)
        }
       
        FTPFile file = new FTPFile(raw, name, size, isDir, lastModified);
        file.setGroup(group);
        file.setOwner(owner);
        file.setLink(isLink);
        file.setLinkCount(linkCount);
        file.setLinkedName(linkedname);
        file.setPermissions(permissions);
        return file;
    }
   
   
    private Date parseTimestamp(String ts) throws DateParseException {
        if (hhmmFormatter != null) {
            try {
                return hhmmFormatter.parse(ts);
            }
            catch (ParseException ex) {
                if (!ignoreDateParseErrors)
                    throw new DateParseException(ex.getMessage());
            }
            return null;
        }
        else {
            Iterator i = hhmmFormatters.iterator();
            ParseException ex = null;
            while (i.hasNext()) {
                try {
                    hhmmFormatter = (SimpleDateFormat)i.next();
                    return hhmmFormatter.parse(ts);
                }
                catch (ParseException ignore) {
                    ex = ignore; // record last one
                }
            }
            if (!ignoreDateParseErrors)
                throw new DateParseException(ex.getMessage());
            hhmmFormatter = null; // none of them worked
            return null;
        }
    }
}
TOP

Related Classes of com.enterprisedt.net.ftp.UnixFileParser

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.