Package org.encog.bot.browse

Source Code of org.encog.bot.browse.TestWebPageData

/*
* Encog(tm) Core v3.3 - Java Version
* http://www.heatonresearch.com/encog/
* https://github.com/encog/encog-java-core
* Copyright 2008-2014 Heaton Research, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*  
* For more information on Heaton Research copyrights, licenses
* and trademarks visit:
* http://www.heatonresearch.com/copyright
*/
package org.encog.bot.browse;

import junit.framework.TestCase;

import org.encog.bot.browse.range.DocumentRange;
import org.encog.bot.browse.range.Link;
import org.encog.bot.dataunit.TagDataUnit;
import org.encog.bot.dataunit.TextDataUnit;
import org.encog.parse.tags.Tag;
import org.junit.Assert;
import org.junit.Test;

public class TestWebPageData extends TestCase {

  @Test
  public void testSimple() throws Throwable
  {
    LoadWebPage load = new LoadWebPage(null);
    WebPage page = load.load("a<b>b</b>c");
    TestCase.assertEquals(5,page.getData().size());
   
    TextDataUnit textDU;
    TagDataUnit tagDU;
   
    // Index 0 (text)
    textDU = (TextDataUnit)page.getDataUnit(0);
    Assert.assertEquals("a", textDU.toString());
    // Index 1 (tag)
    tagDU = (TagDataUnit)page.getDataUnit(1);
    Assert.assertEquals("b", tagDU.getTag().getName());
    Assert.assertEquals("<b>", tagDU.toString());
    Assert.assertEquals(Tag.Type.BEGIN, tagDU.getTag().getType());
    // Index 2 (text)
    textDU = (TextDataUnit)page.getDataUnit(2);
    Assert.assertEquals("b", textDU.toString());
    // Index 3 (tag)
    tagDU = (TagDataUnit)page.getDataUnit(3);
    Assert.assertEquals("b", tagDU.getTag().getName());
    Assert.assertEquals(Tag.Type.END, tagDU.getTag().getType());
    // Index 4 (text)
    textDU = (TextDataUnit)page.getDataUnit(4);
    Assert.assertEquals("c", textDU.toString());   
  }
 
  @Test
  public void testLink() throws Throwable
  {
    LoadWebPage load = new LoadWebPage(null);
    WebPage page = load.load("<a href=\"index.html\">Link <b>1</b></a>");
    Assert.assertEquals(1,page.getContents().size());
   
    DocumentRange span = page.getContents().get(0);
    Assert.assertEquals(0, span.getBegin());
    Assert.assertEquals(5, span.getEnd());
    Assert.assertTrue(span instanceof Link);
    Link link = (Link)span;
    Assert.assertEquals("index.html",link.getTarget().getOriginal().toString());
    Address address = link.getTarget();
    Assert.assertNotNull(address.toString());
   
  }
 
}
TOP

Related Classes of org.encog.bot.browse.TestWebPageData

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.