websphinx.workbench
Class ExtractAction

java.lang.Object
  |
  +--websphinx.workbench.ExtractAction
All Implemented Interfaces:
Action, CrawlListener, java.io.Serializable

public class ExtractAction
extends java.lang.Object
implements Action, CrawlListener

See Also:
Serialized Form

Field Summary
(package private)  java.io.File file
           
(package private)  java.lang.String filename
           
(package private)  boolean noFields
           
(package private)  Pattern pattern
           
(package private)  RecordTransformer records
           
(package private)  boolean textOnly
           
(package private)  boolean useBrowser
           
 
Constructor Summary
ExtractAction(Pattern pattern, boolean useBrowser, java.lang.String filename, boolean textOnly)
           
 
Method Summary
 void cleared(CrawlEvent event)
          Notify that the crawler's state was cleared.
 void connected(Crawler crawler)
           
 void disconnected(Crawler crawler)
           
 boolean equals(java.lang.Object object)
           
 java.lang.String getFilename()
           
 Pattern getPattern()
           
 boolean getTextOnly()
           
 boolean getUseBrowser()
           
private  java.lang.String makeTableHeader(java.lang.String[] fieldNames)
           
 void paused(CrawlEvent event)
          Notify that the crawler is paused.
private  boolean same(java.lang.String s1, java.lang.String s2)
           
private  void showit()
           
 void started(CrawlEvent event)
          Notify that the crawler started.
 void stopped(CrawlEvent event)
          Notify that the crawler ran out of links to crawl.
 void timedOut(CrawlEvent event)
          Notify that the crawler timed out.
 void visit(Page page)
           
 
Methods inherited from class java.lang.Object
clone, finalize, getClass, hashCode, notify, notifyAll, registerNatives, toString, wait, wait, wait
 

Field Detail

pattern

Pattern pattern

filename

java.lang.String filename

useBrowser

boolean useBrowser

textOnly

boolean textOnly

file

transient java.io.File file

records

transient RecordTransformer records

noFields

transient boolean noFields
Constructor Detail

ExtractAction

public ExtractAction(Pattern pattern,
                     boolean useBrowser,
                     java.lang.String filename,
                     boolean textOnly)
Method Detail

equals

public boolean equals(java.lang.Object object)
Overrides:
equals in class java.lang.Object

same

private boolean same(java.lang.String s1,
                     java.lang.String s2)

getPattern

public Pattern getPattern()

getUseBrowser

public boolean getUseBrowser()

getFilename

public java.lang.String getFilename()

getTextOnly

public boolean getTextOnly()

connected

public void connected(Crawler crawler)
Specified by:
connected in interface Action

disconnected

public void disconnected(Crawler crawler)
Specified by:
disconnected in interface Action

showit

private void showit()

visit

public void visit(Page page)
Specified by:
visit in interface Action

started

public void started(CrawlEvent event)
Notify that the crawler started.
Specified by:
started in interface CrawlListener

makeTableHeader

private java.lang.String makeTableHeader(java.lang.String[] fieldNames)

stopped

public void stopped(CrawlEvent event)
Notify that the crawler ran out of links to crawl.
Specified by:
stopped in interface CrawlListener

cleared

public void cleared(CrawlEvent event)
Notify that the crawler's state was cleared.
Specified by:
cleared in interface CrawlListener

timedOut

public void timedOut(CrawlEvent event)
Notify that the crawler timed out.
Specified by:
timedOut in interface CrawlListener

paused

public void paused(CrawlEvent event)
Notify that the crawler is paused.
Specified by:
paused in interface CrawlListener