Package org.jwat.warc

Source Code of org.jwat.warc.TestWarcReader

/**
* Java Web Archive Toolkit - Software to read and validate ARC, WARC
* and GZip files. (http://jwat.org/)
* Copyright 2011-2012 Netarkivet.dk (http://netarkivet.dk/)
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.jwat.warc;

import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.Iterator;
import java.util.NoSuchElementException;

import org.junit.Assert;
import org.junit.Test;
import org.junit.runner.RunWith;
import org.junit.runners.JUnit4;
import org.jwat.common.Diagnosis;
import org.jwat.common.DiagnosisType;

@RunWith(JUnit4.class)
public class TestWarcReader {

    @Test
    public void test_arcreader_iterator_exceptions() {
        WarcReader reader = new WarcReader() {
            @Override
            public boolean isCompressed() {
                return false;
            }
            @Override
            public void close() {
            }
            @Override
            protected void recordClosed() {
            }
            @Override
            public long getStartOffset() {
                return 0;
            }
            @Override
            public long getOffset() {
                return 0;
            }
            @Override
            public long getConsumed() {
                return 0;
            }
            @Override
            public WarcRecord getNextRecord() throws IOException {
                throw new IOException();
            }
            @Override
            public WarcRecord getNextRecordFrom(InputStream in,
                    long offset) throws IOException {
                return null;
            }
            @Override
            public WarcRecord getNextRecordFrom(InputStream in,
                    long offset, int buffer_size) throws IOException {
                return null;
            }
        };
        Iterator<WarcRecord> iter = reader.iterator();

        Assert.assertNull(reader.iteratorExceptionThrown);
        iter.hasNext();
        Assert.assertNotNull(reader.iteratorExceptionThrown);
        try {
            iter.next();
            Assert.fail("Exception expected!");
        } catch (NoSuchElementException e) {
        }
        Assert.assertNotNull(reader.iteratorExceptionThrown);

        Assert.assertTrue(reader.bIsCompliant);
        Assert.assertEquals(0, reader.consumed);
        Assert.assertEquals(0, reader.records);
        Assert.assertEquals(0, reader.errors);
        Assert.assertEquals(0, reader.warnings);

        reader.bIsCompliant = false;
        reader.consumed = 1;
        reader.records = 2;
        reader.errors = 3;
        reader.warnings = 4;

        Assert.assertFalse(reader.bIsCompliant);
        Assert.assertEquals(1, reader.consumed);
        Assert.assertEquals(2, reader.records);
        Assert.assertEquals(3, reader.errors);
        Assert.assertEquals(4, reader.warnings);

        reader.reset();

        Assert.assertTrue(reader.bIsCompliant);
        Assert.assertEquals(0, reader.consumed);
        Assert.assertEquals(0, reader.records);
        Assert.assertEquals(0, reader.errors);
        Assert.assertEquals(0, reader.warnings);
    }

    @Test
    public void test_empty_warcfile() {
        ByteArrayInputStream in = new ByteArrayInputStream(new byte[0]);
        Diagnosis d;
        try {
            WarcReader reader = WarcReaderFactory.getReaderUncompressed(in);
            WarcRecord record = reader.getNextRecord();
            Assert.assertNull(record);
            Assert.assertFalse(reader.isCompliant());
            Assert.assertEquals(1, reader.diagnostics.getErrors().size());
            Assert.assertEquals(0, reader.diagnostics.getWarnings().size());

            d = reader.diagnostics.getErrors().get(0);
            Assert.assertEquals(DiagnosisType.ERROR_EXPECTED, d.type);
            Assert.assertEquals("WARC file", d.entity);
            Assert.assertEquals(1, d.information.length);
        }
        catch (IOException e) {
            e.printStackTrace();
            Assert.fail("Unexpected exception!");
        }
    }

}
TOP

Related Classes of org.jwat.warc.TestWarcReader

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.