anl.aida.reader
Class ScraperTests

java.lang.Object
  extended by anl.aida.reader.ScraperTests

public class ScraperTests
extends java.lang.Object

Tests of the web scrapers.


Nested Class Summary
private static class ScraperTests.RRProcessor
           
 
Field Summary
private static java.lang.String AAContent_1
           
private static java.lang.String AAContent_2
           
(package private)  java.util.Calendar cal
           
private  org.apache.uima.cas.CAS cas
           
private static java.lang.String NTARC_CONTENT
           
private static java.lang.String NTARC2_CONTENT
           
private static java.lang.String NYTIMES_CONTENT_A
           
private  org.apache.uima.collection.CollectionReader reader
           
private static java.lang.String TRIB_CONTENT_A
           
private static java.lang.String TRIB_CONTENT_B
           
 
Constructor Summary
ScraperTests()
           
 
Method Summary
 org.apache.uima.resource.metadata.ConfigurationParameterSettings setUpCAS(java.lang.String compsFile, java.lang.String indexKey, java.lang.String indexValue)
           
 void tearDownCAS()
           
 void testAllAfricaHTMLReader()
           
 void testCTReader()
           
 void testLineParser()
           
 void testNTARCHTML()
           
 void testNTARCHTML2()
           
 void testNTARCReader()
           
 void testNY()
           
 void testNYTArchiveReader()
           
 void testNYTimesHTML()
           
 void testNYTReader()
           
 void testTRIBArchiveReader()
           
 void testTribHTML()
           
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 

Field Detail

cal

java.util.Calendar cal

NTARC_CONTENT

private static java.lang.String NTARC_CONTENT

NTARC2_CONTENT

private static java.lang.String NTARC2_CONTENT

TRIB_CONTENT_A

private static java.lang.String TRIB_CONTENT_A

TRIB_CONTENT_B

private static java.lang.String TRIB_CONTENT_B

cas

private org.apache.uima.cas.CAS cas

reader

private org.apache.uima.collection.CollectionReader reader

NYTIMES_CONTENT_A

private static java.lang.String NYTIMES_CONTENT_A

AAContent_1

private static java.lang.String AAContent_1

AAContent_2

private static java.lang.String AAContent_2

Constructor Detail

ScraperTests

public ScraperTests()

Method Detail

testNTARCHTML

public void testNTARCHTML()
                   throws java.io.IOException
Throws:
java.io.IOException

testNTARCHTML2

public void testNTARCHTML2()
                    throws java.io.IOException
Throws:
java.io.IOException

testTribHTML

public void testTribHTML()
                  throws java.io.IOException
Throws:
java.io.IOException

testNYTimesHTML

public void testNYTimesHTML()
                     throws java.io.IOException
Throws:
java.io.IOException

testNY

public void testNY()
            throws java.io.IOException
Throws:
java.io.IOException

testAllAfricaHTMLReader

public void testAllAfricaHTMLReader()
                             throws java.io.IOException
Throws:
java.io.IOException

testLineParser

public void testLineParser()

testNYTArchiveReader

public void testNYTArchiveReader()
                          throws java.io.IOException,
                                 java.text.ParseException,
                                 AIDAException
Throws:
java.io.IOException
java.text.ParseException
AIDAException

testTRIBArchiveReader

public void testTRIBArchiveReader()
                           throws java.io.IOException,
                                  java.text.ParseException,
                                  AIDAException
Throws:
java.io.IOException
java.text.ParseException
AIDAException

setUpCAS

public org.apache.uima.resource.metadata.ConfigurationParameterSettings setUpCAS(java.lang.String compsFile,
                                                                                 java.lang.String indexKey,
                                                                                 java.lang.String indexValue)
                                                                          throws java.io.IOException,
                                                                                 org.apache.uima.util.InvalidXMLException,
                                                                                 org.apache.uima.resource.ResourceInitializationException,
                                                                                 org.apache.uima.analysis_engine.AnalysisEngineProcessException
Throws:
java.io.IOException
org.apache.uima.util.InvalidXMLException
org.apache.uima.resource.ResourceInitializationException
org.apache.uima.analysis_engine.AnalysisEngineProcessException

tearDownCAS

public void tearDownCAS()

testNTARCReader

public void testNTARCReader()
                     throws java.io.IOException,
                            java.text.ParseException,
                            org.apache.uima.analysis_engine.AnalysisEngineProcessException,
                            org.apache.uima.util.InvalidXMLException,
                            org.apache.uima.resource.ResourceInitializationException,
                            org.apache.uima.collection.CollectionException
Throws:
java.io.IOException
java.text.ParseException
org.apache.uima.analysis_engine.AnalysisEngineProcessException
org.apache.uima.util.InvalidXMLException
org.apache.uima.resource.ResourceInitializationException
org.apache.uima.collection.CollectionException

testNYTReader

public void testNYTReader()
                   throws java.io.IOException,
                          java.text.ParseException,
                          org.apache.uima.analysis_engine.AnalysisEngineProcessException,
                          org.apache.uima.util.InvalidXMLException,
                          org.apache.uima.resource.ResourceInitializationException,
                          org.apache.uima.collection.CollectionException
Throws:
java.io.IOException
java.text.ParseException
org.apache.uima.analysis_engine.AnalysisEngineProcessException
org.apache.uima.util.InvalidXMLException
org.apache.uima.resource.ResourceInitializationException
org.apache.uima.collection.CollectionException

testCTReader

public void testCTReader()
                  throws java.io.IOException,
                         java.text.ParseException,
                         org.apache.uima.analysis_engine.AnalysisEngineProcessException,
                         org.apache.uima.util.InvalidXMLException,
                         org.apache.uima.resource.ResourceInitializationException,
                         org.apache.uima.collection.CollectionException
Throws:
java.io.IOException
java.text.ParseException
org.apache.uima.analysis_engine.AnalysisEngineProcessException
org.apache.uima.util.InvalidXMLException
org.apache.uima.resource.ResourceInitializationException
org.apache.uima.collection.CollectionException