org.archive.crawler.deciderules
Class NotExceedsDocumentLengthTresholdDecideRule

java.lang.Object
  extended by javax.management.Attribute
      extended by org.archive.crawler.settings.Type
          extended by org.archive.crawler.settings.ComplexType
              extended by org.archive.crawler.settings.ModuleType
                  extended by org.archive.crawler.deciderules.DecideRule
                      extended by org.archive.crawler.deciderules.ConfiguredDecideRule
                          extended by org.archive.crawler.deciderules.PredicatedDecideRule
                              extended by org.archive.crawler.deciderules.NotExceedsDocumentLengthTresholdDecideRule
All Implemented Interfaces:
java.io.Serializable, javax.management.DynamicMBean, CoreAttributeConstants
Direct Known Subclasses:
ExceedsDocumentLengthTresholdDecideRule

public class NotExceedsDocumentLengthTresholdDecideRule
extends PredicatedDecideRule
implements CoreAttributeConstants

See Also:
Serialized Form

Nested Class Summary
 
Nested classes/interfaces inherited from class org.archive.crawler.settings.ComplexType
ComplexType.MBeanAttributeInfoIterator
 
Field Summary
static java.lang.String ATTR_CONTENT_LENGTH_TRESHOLD
           
static java.lang.String ATTR_USE_AS_MIDFETCH
           
(package private) static java.lang.Integer DEFAULT_CONTENT_LENGTH_TRESHOLD
           
(package private) static java.lang.Boolean DEFAULT_USE_AS_MIDFETCH
           
static int HEADER_PREDICTS_MISSING
           
 
Fields inherited from class org.archive.crawler.deciderules.ConfiguredDecideRule
ALLOWED_TYPES, ATTR_DECISION
 
Fields inherited from class org.archive.crawler.deciderules.DecideRule
ACCEPT, PASS, REJECT
 
Fields inherited from class org.archive.crawler.settings.ComplexType
definition, definitionMap
 
Fields inherited from interface org.archive.crawler.datamodel.CoreAttributeConstants
A_ANNOTATIONS, A_CONTENT_DIGEST, A_CONTENT_TYPE, A_CREDENTIAL_AVATARS_KEY, A_DELAY_FACTOR, A_DISTANCE_FROM_SEED, A_DNS_FETCH_TIME, A_DNS_SERVER_IP_LABEL, A_ETAG_HEADER, A_FETCH_BEGAN_TIME, A_FETCH_COMPLETED_TIME, A_FETCH_HISTORY, A_FORCE_RETIRE, A_FTP_CONTROL_CONVERSATION, A_FTP_FETCH_STATUS, A_HERITABLE_KEYS, A_HTML_BASE, A_HTTP_BIND_ADDRESS, A_HTTP_PROXY_HOST, A_HTTP_PROXY_PORT, A_HTTP_TRANSACTION, A_LAST_MODIFIED_HEADER, A_LOCALIZED_ERRORS, A_META_ROBOTS, A_MINIMUM_DELAY, A_MIRROR_PATH, A_PREREQUISITE_URI, A_REFERENCE_LENGTH, A_RETRY_DELAY, A_RRECORD_SET_LABEL, A_RUNTIME_EXCEPTION, A_SOURCE_TAG, A_STATUS, A_WRITTEN_TO_WARC, HEADER_TRUNC, LENGTH_TRUNC, TIMER_TRUNC, TRUNC_SUFFIX
 
Constructor Summary
NotExceedsDocumentLengthTresholdDecideRule(java.lang.String name)
           
 
Method Summary
protected  boolean evaluate(java.lang.Object object)
           
protected  int getContentLengthTreshold(java.lang.Object obj)
           
protected  java.lang.Boolean makeDecision(int contentLength, java.lang.Object obj)
           
 
Methods inherited from class org.archive.crawler.deciderules.PredicatedDecideRule
decisionFor
 
Methods inherited from class org.archive.crawler.deciderules.ConfiguredDecideRule
singlePossibleNonPassDecision
 
Methods inherited from class org.archive.crawler.deciderules.DecideRule
getController, kickUpdate
 
Methods inherited from class org.archive.crawler.settings.ModuleType
addElement, listUsedFiles
 
Methods inherited from class org.archive.crawler.settings.ComplexType
addElementToDefinition, checkValue, earlyInitialize, getAbsoluteName, getAttribute, getAttribute, getAttribute, getAttributeInfo, getAttributeInfo, getAttributeInfoIterator, getAttributes, getDataContainerRecursive, getDataContainerRecursive, getDefaultValue, getDescription, getElementFromDefinition, getLegalValues, getLocalAttribute, getMBeanInfo, getMBeanInfo, getParent, getPreservedFields, getSettingsHandler, getUncheckedAttribute, getValue, globalSettings, invoke, isInitialized, isOverridden, iterator, removeElementFromDefinition, setAsOrder, setAttribute, setAttribute, setAttributes, setDescription, setPreservedFields, toString, unsetAttribute
 
Methods inherited from class org.archive.crawler.settings.Type
addConstraint, equals, getConstraints, getLegalValueType, isExpertSetting, isOverrideable, isTransient, setExpertSetting, setLegalValueType, setOverrideable, setTransient
 
Methods inherited from class javax.management.Attribute
getName, hashCode
 
Methods inherited from class java.lang.Object
clone, finalize, getClass, notify, notifyAll, wait, wait, wait
 

Field Detail

ATTR_CONTENT_LENGTH_TRESHOLD

public static final java.lang.String ATTR_CONTENT_LENGTH_TRESHOLD
See Also:
Constant Field Values

DEFAULT_CONTENT_LENGTH_TRESHOLD

static final java.lang.Integer DEFAULT_CONTENT_LENGTH_TRESHOLD

ATTR_USE_AS_MIDFETCH

public static final java.lang.String ATTR_USE_AS_MIDFETCH
See Also:
Constant Field Values

DEFAULT_USE_AS_MIDFETCH

static final java.lang.Boolean DEFAULT_USE_AS_MIDFETCH

HEADER_PREDICTS_MISSING

public static final int HEADER_PREDICTS_MISSING
See Also:
Constant Field Values
Constructor Detail

NotExceedsDocumentLengthTresholdDecideRule

public NotExceedsDocumentLengthTresholdDecideRule(java.lang.String name)
Method Detail

evaluate

protected boolean evaluate(java.lang.Object object)
Specified by:
evaluate in class PredicatedDecideRule

makeDecision

protected java.lang.Boolean makeDecision(int contentLength,
                                         java.lang.Object obj)
Parameters:
contentLength - content length to check against the threshold
obj - Context object.
Returns:
whether contentLength does not exceed the threshold

getContentLengthTreshold

protected int getContentLengthTreshold(java.lang.Object obj)
Parameters:
obj - Context object.
Returns:
content length threshold


Copyright © 2003-2011 Internet Archive. All Rights Reserved.