|
|||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | ||||||||
java.lang.Object
org.apache.manifoldcf.crawler.system.SeedingActivity
public class SeedingActivity
This class represents the things you can do with the framework while seeding.
| Field Summary | |
|---|---|
static java.lang.String |
_rcsid
|
protected IRepositoryConnection |
connection
|
protected java.lang.String |
connectionName
|
protected IRepositoryConnector |
connector
|
protected IRepositoryConnectionManager |
connManager
|
protected int |
documentCount
|
protected java.lang.String[] |
documentHashList
|
protected java.lang.String[] |
documentList
|
protected java.lang.String[][] |
documentPrereqList
|
protected int |
hopcountMethod
|
protected java.lang.Long |
jobID
|
protected IJobManager |
jobManager
|
protected java.lang.String[] |
legalLinkTypes
|
protected static int |
MAX_COUNT
|
protected boolean |
overrideSchedule
|
protected QueueTracker |
queueTracker
|
protected int |
remainingDocumentCount
|
protected java.lang.String[] |
remainingDocumentHashList
|
| Constructor Summary | |
|---|---|
SeedingActivity(java.lang.String connectionName,
IRepositoryConnectionManager connManager,
IJobManager jobManager,
QueueTracker queueTracker,
IRepositoryConnection connection,
IRepositoryConnector connector,
java.lang.Long jobID,
java.lang.String[] legalLinkTypes,
boolean overrideSchedule,
int hopcountMethod)
Constructor. |
|
| Method Summary | |
|---|---|
void |
addSeedDocument(java.lang.String documentIdentifier)
Record a "seed" document identifier. |
void |
addSeedDocument(java.lang.String documentIdentifier,
java.lang.String[] prereqEventNames)
Record a "seed" document identifier. |
void |
addUnqueuedSeedDocument(java.lang.String documentIdentifier)
This method receives document identifiers that should be considered part of the seeds, but do not need to be queued for processing at this time. |
void |
checkJobStillActive()
Check whether current job is still active. |
java.lang.String |
createConnectionSpecificString(java.lang.String simpleString)
Create a connection-specific string from a simple string. |
java.lang.String |
createGlobalString(java.lang.String simpleString)
Create a global string from a simple string. |
java.lang.String |
createJobSpecificString(java.lang.String simpleString)
Create a job-based string from a simple string. |
void |
doneSeeding(boolean isPartial)
Finish a seeding pass. |
void |
recordActivity(java.lang.Long startTime,
java.lang.String activityType,
java.lang.Long dataSize,
java.lang.String entityIdentifier,
java.lang.String resultCode,
java.lang.String resultDescription,
java.lang.String[] childIdentifiers)
Record time-stamped information about the activity of the connector. |
protected void |
writeSeedDocuments(java.lang.String[] docIDHashes,
java.lang.String[] docIDs,
java.lang.String[][] prereqEventNames)
Write specified documents after calculating their priorities. |
| Methods inherited from class java.lang.Object |
|---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
| Field Detail |
|---|
public static final java.lang.String _rcsid
protected static final int MAX_COUNT
protected java.lang.String connectionName
protected IRepositoryConnectionManager connManager
protected IJobManager jobManager
protected QueueTracker queueTracker
protected IRepositoryConnection connection
protected IRepositoryConnector connector
protected java.lang.Long jobID
protected java.lang.String[] legalLinkTypes
protected boolean overrideSchedule
protected int hopcountMethod
protected java.lang.String[] documentHashList
protected java.lang.String[] documentList
protected java.lang.String[][] documentPrereqList
protected int documentCount
protected java.lang.String[] remainingDocumentHashList
protected int remainingDocumentCount
| Constructor Detail |
|---|
public SeedingActivity(java.lang.String connectionName,
IRepositoryConnectionManager connManager,
IJobManager jobManager,
QueueTracker queueTracker,
IRepositoryConnection connection,
IRepositoryConnector connector,
java.lang.Long jobID,
java.lang.String[] legalLinkTypes,
boolean overrideSchedule,
int hopcountMethod)
| Method Detail |
|---|
public void addSeedDocument(java.lang.String documentIdentifier,
java.lang.String[] prereqEventNames)
throws ManifoldCFException
addSeedDocument in interface ISeedingActivity
documentIdentifier - is the identifier of the document to add to the "pending" queue.
prereqEventNames - is the list of prerequisite events required for this document, or null if none.
ManifoldCFException
public void addSeedDocument(java.lang.String documentIdentifier)
throws ManifoldCFException
addSeedDocument in interface ISeedingActivity
documentIdentifier - is the identifier of the document to add to the "pending" queue.
ManifoldCFException
public void addUnqueuedSeedDocument(java.lang.String documentIdentifier)
throws ManifoldCFException
addUnqueuedSeedDocument in interface ISeedingActivity
documentIdentifier - is the identifier of the document to consider as a seed, but not to put in the
"pending" queue.
ManifoldCFException
public void doneSeeding(boolean isPartial)
throws ManifoldCFException
ManifoldCFException
public void recordActivity(java.lang.Long startTime,
java.lang.String activityType,
java.lang.Long dataSize,
java.lang.String entityIdentifier,
java.lang.String resultCode,
java.lang.String resultDescription,
java.lang.String[] childIdentifiers)
throws ManifoldCFException
recordActivity in interface IHistoryActivity
startTime - is either null or the time since the start of epoch in milliseconds (Jan 1, 1970). Every
activity has an associated time; the startTime field records when the activity began. A null value
indicates that the start time and the finishing time are the same.
activityType - is a string which is fully interpretable only in the context of the connector involved, which is
used to categorize what kind of activity is being recorded. For example, a web connector might record a
"fetch document" activity. Cannot be null.
dataSize - is the number of bytes of data involved in the activity, or null if not applicable.
entityIdentifier - is a (possibly long) string which identifies the object involved in the history record.
The interpretation of this field will differ from connector to connector. May be null.
resultCode - contains a terse description of the result of the activity. The description is limited in
size to 255 characters, and can be interpreted only in the context of the current connector. May be null.
resultDescription - is a (possibly long) human-readable string which adds detail, if required, to the result
described in the resultCode field. This field is not meant to be queried on. May be null.
childIdentifiers - is a set of child entity identifiers associated with this activity. May be null.
ManifoldCFException
protected void writeSeedDocuments(java.lang.String[] docIDHashes,
java.lang.String[] docIDs,
java.lang.String[][] prereqEventNames)
throws ManifoldCFException
ManifoldCFException
public void checkJobStillActive()
throws ManifoldCFException,
ServiceInterruption
checkJobStillActive in interface IAbortActivity
ManifoldCFException
ServiceInterruption
public java.lang.String createGlobalString(java.lang.String simpleString)
createGlobalString in interface INamingActivity
simpleString - is the simple string.
public java.lang.String createConnectionSpecificString(java.lang.String simpleString)
createConnectionSpecificString in interface INamingActivity
simpleString - is the simple string.
public java.lang.String createJobSpecificString(java.lang.String simpleString)
createJobSpecificString in interface INamingActivity
simpleString - is the simple string.
|
|||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | ||||||||