org.apache.nutch.quality.dynamic
Class PageDescription

java.lang.Object
  extended by org.apache.nutch.quality.dynamic.PageDescription
All Implemented Interfaces:
PageDescriptionConstants

public class PageDescription
extends Object
implements PageDescriptionConstants

PageDescription gives the URL and the textual description for a target page. It reads in a Sherlock plugin file.

Author:
Mike Cafarella

Field Summary
 Token jj_nt
           
 Token token
           
 PageDescriptionTokenManager token_source
           
 
Fields inherited from interface org.apache.nutch.quality.dynamic.PageDescriptionConstants
AFTER_EQUALS, DEFAULT, EOF, EQUALS, KEYWORD, QUOTED_VALUE, tokenImage, UNQUOTED_VALUE
 
Constructor Summary
PageDescription(InputStream stream)
           
PageDescription(PageDescriptionTokenManager tm)
           
PageDescription(Reader stream)
           
 
Method Summary
 void disable_tracing()
           
 void element()
           
 void enable_tracing()
           
 ParseException generateParseException()
           
 ArrayList getInputs()
           
 ArrayList getInterprets()
           
 Token getNextToken()
           
 Token getToken(int index)
           
 HashMap getValues()
           
 void inputItem(HashMap input)
           
static void main(String[] argv)
          Tests out Sherlock parsing.
 void matchItem(HashMap interpret)
           
 void param()
           
 void parse()
           
 void ReInit(InputStream stream)
           
 void ReInit(PageDescriptionTokenManager tm)
           
 void ReInit(Reader stream)
           
 String value()
           
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 

Field Detail

token_source

public PageDescriptionTokenManager token_source

token

public Token token

jj_nt

public Token jj_nt
Constructor Detail

PageDescription

public PageDescription(InputStream stream)

PageDescription

public PageDescription(Reader stream)

PageDescription

public PageDescription(PageDescriptionTokenManager tm)
Method Detail

getValues

public HashMap getValues()

getInputs

public ArrayList getInputs()

getInterprets

public ArrayList getInterprets()

main

public static void main(String[] argv)
                 throws IOException,
                        ParseException
Tests out Sherlock parsing.

Throws:
IOException
ParseException

parse

public final void parse()
                 throws ParseException
Throws:
ParseException

param

public final void param()
                 throws ParseException
Throws:
ParseException

element

public final void element()
                   throws ParseException
Throws:
ParseException

inputItem

public final void inputItem(HashMap input)
                     throws ParseException
Throws:
ParseException

matchItem

public final void matchItem(HashMap interpret)
                     throws ParseException
Throws:
ParseException

value

public final String value()
                   throws ParseException
Throws:
ParseException

ReInit

public void ReInit(InputStream stream)

ReInit

public void ReInit(Reader stream)

ReInit

public void ReInit(PageDescriptionTokenManager tm)

getNextToken

public final Token getNextToken()

getToken

public final Token getToken(int index)

generateParseException

public ParseException generateParseException()

enable_tracing

public final void enable_tracing()

disable_tracing

public final void disable_tracing()


Copyright © 2006 The Apache Software Foundation